xref: /onnv-gate/usr/src/uts/common/os/contract.c (revision 6196:87d174d915a0)
10Sstevel@tonic-gate /*
20Sstevel@tonic-gate  * CDDL HEADER START
30Sstevel@tonic-gate  *
40Sstevel@tonic-gate  * The contents of this file are subject to the terms of the
54845Svikram  * Common Development and Distribution License (the "License").
64845Svikram  * You may not use this file except in compliance with the License.
70Sstevel@tonic-gate  *
80Sstevel@tonic-gate  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
90Sstevel@tonic-gate  * or http://www.opensolaris.org/os/licensing.
100Sstevel@tonic-gate  * See the License for the specific language governing permissions
110Sstevel@tonic-gate  * and limitations under the License.
120Sstevel@tonic-gate  *
130Sstevel@tonic-gate  * When distributing Covered Code, include this CDDL HEADER in each
140Sstevel@tonic-gate  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
150Sstevel@tonic-gate  * If applicable, add the following below this CDDL HEADER, with the
160Sstevel@tonic-gate  * fields enclosed by brackets "[]" replaced with your own identifying
170Sstevel@tonic-gate  * information: Portions Copyright [yyyy] [name of copyright owner]
180Sstevel@tonic-gate  *
190Sstevel@tonic-gate  * CDDL HEADER END
200Sstevel@tonic-gate  */
210Sstevel@tonic-gate /*
226073Sacruz  * Copyright 2008 Sun Microsystems, Inc.  All rights reserved.
230Sstevel@tonic-gate  * Use is subject to license terms.
240Sstevel@tonic-gate  */
250Sstevel@tonic-gate 
260Sstevel@tonic-gate #pragma ident	"%Z%%M%	%I%	%E% SMI"
270Sstevel@tonic-gate 
280Sstevel@tonic-gate /*
290Sstevel@tonic-gate  * Contracts
300Sstevel@tonic-gate  * ---------
310Sstevel@tonic-gate  *
320Sstevel@tonic-gate  * Contracts are a primitive which enrich the relationships between
330Sstevel@tonic-gate  * processes and system resources.  The primary purpose of contracts is
340Sstevel@tonic-gate  * to provide a means for the system to negotiate the departure from a
350Sstevel@tonic-gate  * binding relationship (e.g. pages locked in memory or a thread bound
360Sstevel@tonic-gate  * to processor), but they can also be used as a purely asynchronous
370Sstevel@tonic-gate  * error reporting mechanism as they are with process contracts.
380Sstevel@tonic-gate  *
390Sstevel@tonic-gate  * More information on how one interfaces with contracts and what
400Sstevel@tonic-gate  * contracts can do for you can be found in:
410Sstevel@tonic-gate  *   PSARC 2003/193 Solaris Contracts
420Sstevel@tonic-gate  *   PSARC 2004/460 Contracts addendum
430Sstevel@tonic-gate  *
440Sstevel@tonic-gate  * This file contains the core contracts framework.  By itself it is
450Sstevel@tonic-gate  * useless: it depends on the contracts filesystem (ctfs) to provide an
460Sstevel@tonic-gate  * interface to user processes and individual contract types to
470Sstevel@tonic-gate  * implement the process/resource relationships.
480Sstevel@tonic-gate  *
490Sstevel@tonic-gate  * Data structure overview
500Sstevel@tonic-gate  * -----------------------
510Sstevel@tonic-gate  *
520Sstevel@tonic-gate  * A contract is represented by a contract_t, which itself points to an
530Sstevel@tonic-gate  * encapsulating contract-type specific contract object.  A contract_t
540Sstevel@tonic-gate  * contains the contract's static identity (including its terms), its
550Sstevel@tonic-gate  * linkage to various bookkeeping structures, the contract-specific
560Sstevel@tonic-gate  * event queue, and a reference count.
570Sstevel@tonic-gate  *
580Sstevel@tonic-gate  * A contract template is represented by a ct_template_t, which, like a
590Sstevel@tonic-gate  * contract, points to an encapsulating contract-type specific template
600Sstevel@tonic-gate  * object.  A ct_template_t contains the template's terms.
610Sstevel@tonic-gate  *
620Sstevel@tonic-gate  * An event queue is represented by a ct_equeue_t, and consists of a
630Sstevel@tonic-gate  * list of events, a list of listeners, and a list of listeners who are
640Sstevel@tonic-gate  * waiting for new events (affectionately referred to as "tail
650Sstevel@tonic-gate  * listeners").  There are three queue types, defined by ct_listnum_t
660Sstevel@tonic-gate  * (an enum).  An event may be on one of each type of queue
670Sstevel@tonic-gate  * simultaneously; the list linkage used by a queue is determined by
680Sstevel@tonic-gate  * its type.
690Sstevel@tonic-gate  *
700Sstevel@tonic-gate  * An event is represented by a ct_kevent_t, which contains mostly
710Sstevel@tonic-gate  * static event data (e.g. id, payload).  It also has an array of
720Sstevel@tonic-gate  * ct_member_t structures, each of which contains a list_node_t and
730Sstevel@tonic-gate  * represents the event's linkage in a specific event queue.
740Sstevel@tonic-gate  *
750Sstevel@tonic-gate  * Each open of an event endpoint results in the creation of a new
760Sstevel@tonic-gate  * listener, represented by a ct_listener_t.  In addition to linkage
770Sstevel@tonic-gate  * into the aforementioned lists in the event_queue, a ct_listener_t
780Sstevel@tonic-gate  * contains a pointer to the ct_kevent_t it is currently positioned at
790Sstevel@tonic-gate  * as well as a set of status flags and other administrative data.
800Sstevel@tonic-gate  *
810Sstevel@tonic-gate  * Each process has a list of contracts it owns, p_ct_held; a pointer
820Sstevel@tonic-gate  * to the process contract it is a member of, p_ct_process; the linkage
830Sstevel@tonic-gate  * for that membership, p_ct_member; and an array of event queue
840Sstevel@tonic-gate  * structures representing the process bundle queues.
850Sstevel@tonic-gate  *
860Sstevel@tonic-gate  * Each LWP has an array of its active templates, lwp_ct_active; and
870Sstevel@tonic-gate  * the most recently created contracts, lwp_ct_latest.
880Sstevel@tonic-gate  *
890Sstevel@tonic-gate  * A process contract has a list of member processes and a list of
900Sstevel@tonic-gate  * inherited contracts.
910Sstevel@tonic-gate  *
920Sstevel@tonic-gate  * There is a system-wide list of all contracts, as well as per-type
930Sstevel@tonic-gate  * lists of contracts.
940Sstevel@tonic-gate  *
950Sstevel@tonic-gate  * Lock ordering overview
960Sstevel@tonic-gate  * ----------------------
970Sstevel@tonic-gate  *
980Sstevel@tonic-gate  * Locks at the top are taken first:
990Sstevel@tonic-gate  *
1000Sstevel@tonic-gate  *                   ct_evtlock
1010Sstevel@tonic-gate  *                   regent ct_lock
1020Sstevel@tonic-gate  *                   member ct_lock
1030Sstevel@tonic-gate  *                   pidlock
1040Sstevel@tonic-gate  *                   p_lock
1050Sstevel@tonic-gate  *    contract ctq_lock         contract_lock
1060Sstevel@tonic-gate  *    pbundle ctq_lock
1070Sstevel@tonic-gate  *    cte_lock
1080Sstevel@tonic-gate  *                   ct_reflock
1090Sstevel@tonic-gate  *
1100Sstevel@tonic-gate  * contract_lock and ctq_lock/cte_lock are not currently taken at the
1110Sstevel@tonic-gate  * same time.
1120Sstevel@tonic-gate  *
1130Sstevel@tonic-gate  * Reference counting and locking
1140Sstevel@tonic-gate  * ------------------------------
1150Sstevel@tonic-gate  *
1160Sstevel@tonic-gate  * A contract has a reference count, protected by ct_reflock.
1170Sstevel@tonic-gate  * (ct_reflock is also used in a couple other places where atomic
1180Sstevel@tonic-gate  * access to a variable is needed in an innermost context).  A process
1190Sstevel@tonic-gate  * maintains a hold on each contract it owns.  A process contract has a
1200Sstevel@tonic-gate  * hold on each contract it has inherited.  Each event has a hold on
1210Sstevel@tonic-gate  * the contract which generated it.  Process contract templates have
1220Sstevel@tonic-gate  * holds on the contracts referred to by their transfer terms.  CTFS
1230Sstevel@tonic-gate  * contract directory nodes have holds on contracts.  Lastly, various
1240Sstevel@tonic-gate  * code paths may temporarily take holds on contracts to prevent them
1250Sstevel@tonic-gate  * from disappearing while other processing is going on.  It is
1260Sstevel@tonic-gate  * important to note that the global contract lists do not hold
1270Sstevel@tonic-gate  * references on contracts; a contract is removed from these structures
1280Sstevel@tonic-gate  * atomically with the release of its last reference.
1290Sstevel@tonic-gate  *
1300Sstevel@tonic-gate  * At a given point in time, a contract can either be owned by a
1310Sstevel@tonic-gate  * process, inherited by a regent process contract, or orphaned.  A
1320Sstevel@tonic-gate  * contract_t's  owner and regent pointers, ct_owner and ct_regent, are
1330Sstevel@tonic-gate  * protected by its ct_lock.  The linkage in the holder's (holder =
1340Sstevel@tonic-gate  * owner or regent) list of contracts, ct_ctlist, is protected by
1350Sstevel@tonic-gate  * whatever lock protects the holder's data structure.  In order for
1360Sstevel@tonic-gate  * these two directions to remain consistent, changing the holder of a
1370Sstevel@tonic-gate  * contract requires that both locks be held.
1380Sstevel@tonic-gate  *
1390Sstevel@tonic-gate  * Events also have reference counts.  There is one hold on an event
1400Sstevel@tonic-gate  * per queue it is present on, in addition to those needed for the
1410Sstevel@tonic-gate  * usual sundry reasons.  Individual listeners are associated with
1420Sstevel@tonic-gate  * specific queues, and increase a queue-specific reference count
1430Sstevel@tonic-gate  * stored in the ct_member_t structure.
1440Sstevel@tonic-gate  *
1450Sstevel@tonic-gate  * The dynamic contents of an event (reference count and flags) are
1460Sstevel@tonic-gate  * protected by its cte_lock, while the contents of the embedded
1470Sstevel@tonic-gate  * ct_member_t structures are protected by the locks of the queues they
1480Sstevel@tonic-gate  * are linked into.  A ct_listener_t's contents are also protected by
1490Sstevel@tonic-gate  * its event queue's ctq_lock.
1500Sstevel@tonic-gate  *
1510Sstevel@tonic-gate  * Resource controls
1520Sstevel@tonic-gate  * -----------------
1530Sstevel@tonic-gate  *
1540Sstevel@tonic-gate  * Control:      project.max-contracts (rc_project_contract)
1550Sstevel@tonic-gate  * Description:  Maximum number of contracts allowed a project.
1560Sstevel@tonic-gate  *
1570Sstevel@tonic-gate  *   When a contract is created, the project's allocation is tested and
1580Sstevel@tonic-gate  *   (assuming success) increased.  When the last reference to a
1590Sstevel@tonic-gate  *   contract is released, the creating project's allocation is
1600Sstevel@tonic-gate  *   decreased.
1610Sstevel@tonic-gate  */
1620Sstevel@tonic-gate 
1630Sstevel@tonic-gate #include <sys/mutex.h>
1640Sstevel@tonic-gate #include <sys/debug.h>
1650Sstevel@tonic-gate #include <sys/types.h>
1660Sstevel@tonic-gate #include <sys/param.h>
1670Sstevel@tonic-gate #include <sys/kmem.h>
1680Sstevel@tonic-gate #include <sys/thread.h>
1690Sstevel@tonic-gate #include <sys/id_space.h>
1700Sstevel@tonic-gate #include <sys/avl.h>
1710Sstevel@tonic-gate #include <sys/list.h>
1720Sstevel@tonic-gate #include <sys/sysmacros.h>
1730Sstevel@tonic-gate #include <sys/proc.h>
1740Sstevel@tonic-gate #include <sys/contract_impl.h>
1750Sstevel@tonic-gate #include <sys/contract/process_impl.h>
1764845Svikram #include <sys/dditypes.h>
1774845Svikram #include <sys/contract/device_impl.h>
1780Sstevel@tonic-gate #include <sys/systm.h>
1790Sstevel@tonic-gate #include <sys/atomic.h>
1800Sstevel@tonic-gate #include <sys/cmn_err.h>
1810Sstevel@tonic-gate #include <sys/model.h>
1820Sstevel@tonic-gate #include <sys/policy.h>
1830Sstevel@tonic-gate #include <sys/zone.h>
1840Sstevel@tonic-gate #include <sys/task.h>
1854845Svikram #include <sys/ddi.h>
1864845Svikram #include <sys/sunddi.h>
1870Sstevel@tonic-gate 
1880Sstevel@tonic-gate extern rctl_hndl_t rc_project_contract;
1890Sstevel@tonic-gate 
1900Sstevel@tonic-gate static id_space_t	*contract_ids;
1910Sstevel@tonic-gate static avl_tree_t	contract_avl;
1920Sstevel@tonic-gate static kmutex_t		contract_lock;
1930Sstevel@tonic-gate 
1940Sstevel@tonic-gate int			ct_ntypes = CTT_MAXTYPE;
1950Sstevel@tonic-gate static ct_type_t	*ct_types_static[CTT_MAXTYPE];
1960Sstevel@tonic-gate ct_type_t		**ct_types = ct_types_static;
1974845Svikram int			ct_debug;
1980Sstevel@tonic-gate 
1990Sstevel@tonic-gate static void cte_queue_create(ct_equeue_t *, ct_listnum_t, int, int);
2000Sstevel@tonic-gate static void cte_queue_destroy(ct_equeue_t *);
2010Sstevel@tonic-gate static void cte_queue_drain(ct_equeue_t *, int);
2020Sstevel@tonic-gate static void cte_trim(ct_equeue_t *, contract_t *);
2030Sstevel@tonic-gate static void cte_copy(ct_equeue_t *, ct_equeue_t *);
2040Sstevel@tonic-gate 
2050Sstevel@tonic-gate /*
2060Sstevel@tonic-gate  * contract_compar
2070Sstevel@tonic-gate  *
2080Sstevel@tonic-gate  * A contract comparator which sorts on contract ID.
2090Sstevel@tonic-gate  */
2100Sstevel@tonic-gate int
2110Sstevel@tonic-gate contract_compar(const void *x, const void *y)
2120Sstevel@tonic-gate {
2130Sstevel@tonic-gate 	const contract_t *ct1 = x;
2140Sstevel@tonic-gate 	const contract_t *ct2 = y;
2150Sstevel@tonic-gate 
2160Sstevel@tonic-gate 	if (ct1->ct_id < ct2->ct_id)
2170Sstevel@tonic-gate 		return (-1);
2180Sstevel@tonic-gate 	if (ct1->ct_id > ct2->ct_id)
2190Sstevel@tonic-gate 		return (1);
2200Sstevel@tonic-gate 	return (0);
2210Sstevel@tonic-gate }
2220Sstevel@tonic-gate 
2230Sstevel@tonic-gate /*
2240Sstevel@tonic-gate  * contract_init
2250Sstevel@tonic-gate  *
2260Sstevel@tonic-gate  * Initializes the contract subsystem, the specific contract types, and
2270Sstevel@tonic-gate  * process 0.
2280Sstevel@tonic-gate  */
2290Sstevel@tonic-gate void
2300Sstevel@tonic-gate contract_init(void)
2310Sstevel@tonic-gate {
2320Sstevel@tonic-gate 	/*
2330Sstevel@tonic-gate 	 * Initialize contract subsystem.
2340Sstevel@tonic-gate 	 */
2350Sstevel@tonic-gate 	contract_ids = id_space_create("contracts", 1, INT_MAX);
2360Sstevel@tonic-gate 	avl_create(&contract_avl, contract_compar, sizeof (contract_t),
2370Sstevel@tonic-gate 	    offsetof(contract_t, ct_ctavl));
2380Sstevel@tonic-gate 	mutex_init(&contract_lock, NULL, MUTEX_DEFAULT, NULL);
2390Sstevel@tonic-gate 
2400Sstevel@tonic-gate 	/*
2410Sstevel@tonic-gate 	 * Initialize contract types.
2420Sstevel@tonic-gate 	 */
2430Sstevel@tonic-gate 	contract_process_init();
2444845Svikram 	contract_device_init();
2450Sstevel@tonic-gate 
2460Sstevel@tonic-gate 	/*
2470Sstevel@tonic-gate 	 * Initialize p0/lwp0 contract state.
2480Sstevel@tonic-gate 	 */
2490Sstevel@tonic-gate 	avl_create(&p0.p_ct_held, contract_compar, sizeof (contract_t),
2500Sstevel@tonic-gate 	    offsetof(contract_t, ct_ctlist));
2510Sstevel@tonic-gate }
2520Sstevel@tonic-gate 
2530Sstevel@tonic-gate /*
2540Sstevel@tonic-gate  * contract_dtor
2550Sstevel@tonic-gate  *
2560Sstevel@tonic-gate  * Performs basic destruction of the common portions of a contract.
2570Sstevel@tonic-gate  * Called from the failure path of contract_ctor and from
2580Sstevel@tonic-gate  * contract_rele.
2590Sstevel@tonic-gate  */
2600Sstevel@tonic-gate static void
2610Sstevel@tonic-gate contract_dtor(contract_t *ct)
2620Sstevel@tonic-gate {
2630Sstevel@tonic-gate 	cte_queue_destroy(&ct->ct_events);
2640Sstevel@tonic-gate 	list_destroy(&ct->ct_vnodes);
2650Sstevel@tonic-gate 	mutex_destroy(&ct->ct_reflock);
2660Sstevel@tonic-gate 	mutex_destroy(&ct->ct_lock);
2670Sstevel@tonic-gate 	mutex_destroy(&ct->ct_evtlock);
2680Sstevel@tonic-gate }
2690Sstevel@tonic-gate 
2700Sstevel@tonic-gate /*
2710Sstevel@tonic-gate  * contract_ctor
2720Sstevel@tonic-gate  *
2730Sstevel@tonic-gate  * Called by a contract type to initialize a contract.  Fails if the
2740Sstevel@tonic-gate  * max-contract resource control would have been exceeded.  After a
2750Sstevel@tonic-gate  * successful call to contract_ctor, the contract is unlocked and
2760Sstevel@tonic-gate  * visible in all namespaces; any type-specific initialization should
2770Sstevel@tonic-gate  * be completed before calling contract_ctor.  Returns 0 on success.
2780Sstevel@tonic-gate  *
2790Sstevel@tonic-gate  * Because not all callers can tolerate failure, a 0 value for canfail
2800Sstevel@tonic-gate  * instructs contract_ctor to ignore the project.max-contracts resource
2810Sstevel@tonic-gate  * control.  Obviously, this "out" should only be employed by callers
2820Sstevel@tonic-gate  * who are sufficiently constrained in other ways (e.g. newproc).
2830Sstevel@tonic-gate  */
2840Sstevel@tonic-gate int
2850Sstevel@tonic-gate contract_ctor(contract_t *ct, ct_type_t *type, ct_template_t *tmpl, void *data,
2860Sstevel@tonic-gate     ctflags_t flags, proc_t *author, int canfail)
2870Sstevel@tonic-gate {
2880Sstevel@tonic-gate 	avl_index_t where;
2890Sstevel@tonic-gate 	klwp_t *curlwp = ttolwp(curthread);
2900Sstevel@tonic-gate 
2910Sstevel@tonic-gate 	ASSERT(author == curproc);
2920Sstevel@tonic-gate 
2930Sstevel@tonic-gate 	mutex_init(&ct->ct_lock, NULL, MUTEX_DEFAULT, NULL);
2940Sstevel@tonic-gate 	mutex_init(&ct->ct_reflock, NULL, MUTEX_DEFAULT, NULL);
2950Sstevel@tonic-gate 	mutex_init(&ct->ct_evtlock, NULL, MUTEX_DEFAULT, NULL);
2960Sstevel@tonic-gate 	ct->ct_id = id_alloc(contract_ids);
2970Sstevel@tonic-gate 
2980Sstevel@tonic-gate 	cte_queue_create(&ct->ct_events, CTEL_CONTRACT, 20, 0);
2990Sstevel@tonic-gate 	list_create(&ct->ct_vnodes, sizeof (contract_vnode_t),
3000Sstevel@tonic-gate 	    offsetof(contract_vnode_t, ctv_node));
3010Sstevel@tonic-gate 
3020Sstevel@tonic-gate 	/*
3030Sstevel@tonic-gate 	 * Instance data
3040Sstevel@tonic-gate 	 */
3050Sstevel@tonic-gate 	ct->ct_ref = 2;		/* one for the holder, one for "latest" */
3060Sstevel@tonic-gate 	ct->ct_cuid = crgetuid(CRED());
3070Sstevel@tonic-gate 	ct->ct_type = type;
3080Sstevel@tonic-gate 	ct->ct_data = data;
3090Sstevel@tonic-gate 	gethrestime(&ct->ct_ctime);
3100Sstevel@tonic-gate 	ct->ct_state = CTS_OWNED;
3110Sstevel@tonic-gate 	ct->ct_flags = flags;
3120Sstevel@tonic-gate 	ct->ct_regent = author->p_ct_process ?
3130Sstevel@tonic-gate 	    &author->p_ct_process->conp_contract : NULL;
3140Sstevel@tonic-gate 	ct->ct_ev_info = tmpl->ctmpl_ev_info;
3150Sstevel@tonic-gate 	ct->ct_ev_crit = tmpl->ctmpl_ev_crit;
3160Sstevel@tonic-gate 	ct->ct_cookie = tmpl->ctmpl_cookie;
3170Sstevel@tonic-gate 	ct->ct_owner = author;
3184845Svikram 	ct->ct_ntime.ctm_total = -1;
3194845Svikram 	ct->ct_qtime.ctm_total = -1;
3204845Svikram 	ct->ct_nevent = NULL;
3210Sstevel@tonic-gate 
3220Sstevel@tonic-gate 	/*
3230Sstevel@tonic-gate 	 * Test project.max-contracts.
3240Sstevel@tonic-gate 	 */
3250Sstevel@tonic-gate 	mutex_enter(&author->p_lock);
3260Sstevel@tonic-gate 	mutex_enter(&contract_lock);
3270Sstevel@tonic-gate 	if (canfail && rctl_test(rc_project_contract,
3280Sstevel@tonic-gate 	    author->p_task->tk_proj->kpj_rctls, author, 1,
3290Sstevel@tonic-gate 	    RCA_SAFE) & RCT_DENY) {
3300Sstevel@tonic-gate 		id_free(contract_ids, ct->ct_id);
3310Sstevel@tonic-gate 		mutex_exit(&contract_lock);
3320Sstevel@tonic-gate 		mutex_exit(&author->p_lock);
3330Sstevel@tonic-gate 		ct->ct_events.ctq_flags |= CTQ_DEAD;
3340Sstevel@tonic-gate 		contract_dtor(ct);
3350Sstevel@tonic-gate 		return (1);
3360Sstevel@tonic-gate 	}
3370Sstevel@tonic-gate 	ct->ct_proj = author->p_task->tk_proj;
3380Sstevel@tonic-gate 	ct->ct_proj->kpj_data.kpd_contract++;
3390Sstevel@tonic-gate 	(void) project_hold(ct->ct_proj);
3400Sstevel@tonic-gate 	mutex_exit(&contract_lock);
3410Sstevel@tonic-gate 
3420Sstevel@tonic-gate 	/*
3430Sstevel@tonic-gate 	 * Insert into holder's avl of contracts.
3440Sstevel@tonic-gate 	 * We use an avl not because order is important, but because
3450Sstevel@tonic-gate 	 * readdir of /proc/contracts requires we be able to use a
3460Sstevel@tonic-gate 	 * scalar as an index into the process's list of contracts
3470Sstevel@tonic-gate 	 */
3480Sstevel@tonic-gate 	ct->ct_zoneid = author->p_zone->zone_id;
3490Sstevel@tonic-gate 	ct->ct_czuniqid = ct->ct_mzuniqid = author->p_zone->zone_uniqid;
3500Sstevel@tonic-gate 	VERIFY(avl_find(&author->p_ct_held, ct, &where) == NULL);
3510Sstevel@tonic-gate 	avl_insert(&author->p_ct_held, ct, where);
3520Sstevel@tonic-gate 	mutex_exit(&author->p_lock);
3530Sstevel@tonic-gate 
3540Sstevel@tonic-gate 	/*
3550Sstevel@tonic-gate 	 * Insert into global contract AVL
3560Sstevel@tonic-gate 	 */
3570Sstevel@tonic-gate 	mutex_enter(&contract_lock);
3580Sstevel@tonic-gate 	VERIFY(avl_find(&contract_avl, ct, &where) == NULL);
3590Sstevel@tonic-gate 	avl_insert(&contract_avl, ct, where);
3600Sstevel@tonic-gate 	mutex_exit(&contract_lock);
3610Sstevel@tonic-gate 
3620Sstevel@tonic-gate 	/*
3630Sstevel@tonic-gate 	 * Insert into type AVL
3640Sstevel@tonic-gate 	 */
3650Sstevel@tonic-gate 	mutex_enter(&type->ct_type_lock);
3660Sstevel@tonic-gate 	VERIFY(avl_find(&type->ct_type_avl, ct, &where) == NULL);
3670Sstevel@tonic-gate 	avl_insert(&type->ct_type_avl, ct, where);
3680Sstevel@tonic-gate 	type->ct_type_timestruc = ct->ct_ctime;
3690Sstevel@tonic-gate 	mutex_exit(&type->ct_type_lock);
3700Sstevel@tonic-gate 
3710Sstevel@tonic-gate 	if (curlwp->lwp_ct_latest[type->ct_type_index])
3720Sstevel@tonic-gate 		contract_rele(curlwp->lwp_ct_latest[type->ct_type_index]);
3730Sstevel@tonic-gate 	curlwp->lwp_ct_latest[type->ct_type_index] = ct;
3740Sstevel@tonic-gate 
3750Sstevel@tonic-gate 	return (0);
3760Sstevel@tonic-gate }
3770Sstevel@tonic-gate 
3780Sstevel@tonic-gate /*
3790Sstevel@tonic-gate  * contract_rele
3800Sstevel@tonic-gate  *
3810Sstevel@tonic-gate  * Releases a reference to a contract.  If the caller had the last
3820Sstevel@tonic-gate  * reference, the contract is removed from all namespaces, its
3830Sstevel@tonic-gate  * allocation against the max-contracts resource control is released,
3840Sstevel@tonic-gate  * and the contract type's free entry point is invoked for any
3850Sstevel@tonic-gate  * type-specific deconstruction and to (presumably) free the object.
3860Sstevel@tonic-gate  */
3870Sstevel@tonic-gate void
3880Sstevel@tonic-gate contract_rele(contract_t *ct)
3890Sstevel@tonic-gate {
3900Sstevel@tonic-gate 	uint64_t nref;
3910Sstevel@tonic-gate 
3920Sstevel@tonic-gate 	mutex_enter(&ct->ct_reflock);
3930Sstevel@tonic-gate 	ASSERT(ct->ct_ref > 0);
3940Sstevel@tonic-gate 	nref = --ct->ct_ref;
3950Sstevel@tonic-gate 	mutex_exit(&ct->ct_reflock);
3960Sstevel@tonic-gate 	if (nref == 0) {
3970Sstevel@tonic-gate 		/*
3980Sstevel@tonic-gate 		 * ct_owner is cleared when it drops its reference.
3990Sstevel@tonic-gate 		 */
4000Sstevel@tonic-gate 		ASSERT(ct->ct_owner == NULL);
4010Sstevel@tonic-gate 		ASSERT(ct->ct_evcnt == 0);
4020Sstevel@tonic-gate 
4030Sstevel@tonic-gate 		/*
4040Sstevel@tonic-gate 		 * Remove from global contract AVL
4050Sstevel@tonic-gate 		 */
4060Sstevel@tonic-gate 		mutex_enter(&contract_lock);
4070Sstevel@tonic-gate 		avl_remove(&contract_avl, ct);
4080Sstevel@tonic-gate 		mutex_exit(&contract_lock);
4090Sstevel@tonic-gate 
4100Sstevel@tonic-gate 		/*
4110Sstevel@tonic-gate 		 * Remove from type AVL
4120Sstevel@tonic-gate 		 */
4130Sstevel@tonic-gate 		mutex_enter(&ct->ct_type->ct_type_lock);
4140Sstevel@tonic-gate 		avl_remove(&ct->ct_type->ct_type_avl, ct);
4150Sstevel@tonic-gate 		mutex_exit(&ct->ct_type->ct_type_lock);
4160Sstevel@tonic-gate 
4170Sstevel@tonic-gate 		/*
4180Sstevel@tonic-gate 		 * Release the contract's ID
4190Sstevel@tonic-gate 		 */
4200Sstevel@tonic-gate 		id_free(contract_ids, ct->ct_id);
4210Sstevel@tonic-gate 
4220Sstevel@tonic-gate 		/*
4230Sstevel@tonic-gate 		 * Release project hold
4240Sstevel@tonic-gate 		 */
4250Sstevel@tonic-gate 		mutex_enter(&contract_lock);
4260Sstevel@tonic-gate 		ct->ct_proj->kpj_data.kpd_contract--;
4270Sstevel@tonic-gate 		project_rele(ct->ct_proj);
4280Sstevel@tonic-gate 		mutex_exit(&contract_lock);
4290Sstevel@tonic-gate 
4300Sstevel@tonic-gate 		/*
4310Sstevel@tonic-gate 		 * Free the contract
4320Sstevel@tonic-gate 		 */
4330Sstevel@tonic-gate 		contract_dtor(ct);
4340Sstevel@tonic-gate 		ct->ct_type->ct_type_ops->contop_free(ct);
4350Sstevel@tonic-gate 	}
4360Sstevel@tonic-gate }
4370Sstevel@tonic-gate 
4380Sstevel@tonic-gate /*
4390Sstevel@tonic-gate  * contract_hold
4400Sstevel@tonic-gate  *
4410Sstevel@tonic-gate  * Adds a reference to a contract
4420Sstevel@tonic-gate  */
4430Sstevel@tonic-gate void
4440Sstevel@tonic-gate contract_hold(contract_t *ct)
4450Sstevel@tonic-gate {
4460Sstevel@tonic-gate 	mutex_enter(&ct->ct_reflock);
4470Sstevel@tonic-gate 	ASSERT(ct->ct_ref < UINT64_MAX);
4480Sstevel@tonic-gate 	ct->ct_ref++;
4490Sstevel@tonic-gate 	mutex_exit(&ct->ct_reflock);
4500Sstevel@tonic-gate }
4510Sstevel@tonic-gate 
4520Sstevel@tonic-gate /*
4530Sstevel@tonic-gate  * contract_getzuniqid
4540Sstevel@tonic-gate  *
4550Sstevel@tonic-gate  * Get a contract's zone unique ID.  Needed because 64-bit reads and
4560Sstevel@tonic-gate  * writes aren't atomic on x86.  Since there are contexts where we are
4570Sstevel@tonic-gate  * unable to take ct_lock, we instead use ct_reflock; in actuality any
4580Sstevel@tonic-gate  * lock would do.
4590Sstevel@tonic-gate  */
4600Sstevel@tonic-gate uint64_t
4610Sstevel@tonic-gate contract_getzuniqid(contract_t *ct)
4620Sstevel@tonic-gate {
4630Sstevel@tonic-gate 	uint64_t zuniqid;
4640Sstevel@tonic-gate 
4650Sstevel@tonic-gate 	mutex_enter(&ct->ct_reflock);
4660Sstevel@tonic-gate 	zuniqid = ct->ct_mzuniqid;
4670Sstevel@tonic-gate 	mutex_exit(&ct->ct_reflock);
4680Sstevel@tonic-gate 
4690Sstevel@tonic-gate 	return (zuniqid);
4700Sstevel@tonic-gate }
4710Sstevel@tonic-gate 
4720Sstevel@tonic-gate /*
4730Sstevel@tonic-gate  * contract_setzuniqid
4740Sstevel@tonic-gate  *
4750Sstevel@tonic-gate  * Sets a contract's zone unique ID.   See contract_getzuniqid.
4760Sstevel@tonic-gate  */
4770Sstevel@tonic-gate void
4780Sstevel@tonic-gate contract_setzuniqid(contract_t *ct, uint64_t zuniqid)
4790Sstevel@tonic-gate {
4800Sstevel@tonic-gate 	mutex_enter(&ct->ct_reflock);
4810Sstevel@tonic-gate 	ct->ct_mzuniqid = zuniqid;
4820Sstevel@tonic-gate 	mutex_exit(&ct->ct_reflock);
4830Sstevel@tonic-gate }
4840Sstevel@tonic-gate 
4850Sstevel@tonic-gate /*
4860Sstevel@tonic-gate  * contract_abandon
4870Sstevel@tonic-gate  *
4880Sstevel@tonic-gate  * Abandons the specified contract.  If "explicit" is clear, the
4890Sstevel@tonic-gate  * contract was implicitly abandoned (by process exit) and should be
4900Sstevel@tonic-gate  * inherited if its terms allow it and its owner was a member of a
4910Sstevel@tonic-gate  * regent contract.  Otherwise, the contract type's abandon entry point
4920Sstevel@tonic-gate  * is invoked to either destroy or orphan the contract.
4930Sstevel@tonic-gate  */
4940Sstevel@tonic-gate int
4950Sstevel@tonic-gate contract_abandon(contract_t *ct, proc_t *p, int explicit)
4960Sstevel@tonic-gate {
4970Sstevel@tonic-gate 	ct_equeue_t *q = NULL;
4980Sstevel@tonic-gate 	contract_t *parent = &p->p_ct_process->conp_contract;
4990Sstevel@tonic-gate 	int inherit = 0;
5000Sstevel@tonic-gate 
5010Sstevel@tonic-gate 	ASSERT(p == curproc);
5020Sstevel@tonic-gate 
5030Sstevel@tonic-gate 	mutex_enter(&ct->ct_lock);
5040Sstevel@tonic-gate 
5050Sstevel@tonic-gate 	/*
5060Sstevel@tonic-gate 	 * Multiple contract locks are taken contract -> subcontract.
5070Sstevel@tonic-gate 	 * Check if the contract will be inherited so we can acquire
5080Sstevel@tonic-gate 	 * all the necessary locks before making sensitive changes.
5090Sstevel@tonic-gate 	 */
5100Sstevel@tonic-gate 	if (!explicit && (ct->ct_flags & CTF_INHERIT) &&
5110Sstevel@tonic-gate 	    contract_process_accept(parent)) {
5120Sstevel@tonic-gate 		mutex_exit(&ct->ct_lock);
5130Sstevel@tonic-gate 		mutex_enter(&parent->ct_lock);
5140Sstevel@tonic-gate 		mutex_enter(&ct->ct_lock);
5150Sstevel@tonic-gate 		inherit = 1;
5160Sstevel@tonic-gate 	}
5170Sstevel@tonic-gate 
5180Sstevel@tonic-gate 	if (ct->ct_owner != p) {
5190Sstevel@tonic-gate 		mutex_exit(&ct->ct_lock);
5200Sstevel@tonic-gate 		if (inherit)
5210Sstevel@tonic-gate 			mutex_exit(&parent->ct_lock);
5220Sstevel@tonic-gate 		return (EINVAL);
5230Sstevel@tonic-gate 	}
5240Sstevel@tonic-gate 
5250Sstevel@tonic-gate 	mutex_enter(&p->p_lock);
5260Sstevel@tonic-gate 	if (explicit)
5270Sstevel@tonic-gate 		avl_remove(&p->p_ct_held, ct);
5280Sstevel@tonic-gate 	ct->ct_owner = NULL;
5290Sstevel@tonic-gate 	mutex_exit(&p->p_lock);
5300Sstevel@tonic-gate 
5310Sstevel@tonic-gate 	/*
5320Sstevel@tonic-gate 	 * Since we can't call cte_trim with the contract lock held,
5330Sstevel@tonic-gate 	 * we grab the queue pointer here.
5340Sstevel@tonic-gate 	 */
5350Sstevel@tonic-gate 	if (p->p_ct_equeue)
5360Sstevel@tonic-gate 		q = p->p_ct_equeue[ct->ct_type->ct_type_index];
5370Sstevel@tonic-gate 
5380Sstevel@tonic-gate 	/*
5390Sstevel@tonic-gate 	 * contop_abandon may destroy the contract so we rely on it to
5400Sstevel@tonic-gate 	 * drop ct_lock.  We retain a reference on the contract so that
5410Sstevel@tonic-gate 	 * the cte_trim which follows functions properly.  Even though
5420Sstevel@tonic-gate 	 * cte_trim doesn't dereference the contract pointer, it is
5430Sstevel@tonic-gate 	 * still necessary to retain a reference to the contract so
5440Sstevel@tonic-gate 	 * that we don't trim events which are sent by a subsequently
5450Sstevel@tonic-gate 	 * allocated contract infortuitously located at the same address.
5460Sstevel@tonic-gate 	 */
5470Sstevel@tonic-gate 	contract_hold(ct);
5480Sstevel@tonic-gate 
5490Sstevel@tonic-gate 	if (inherit) {
5500Sstevel@tonic-gate 		ct->ct_state = CTS_INHERITED;
5510Sstevel@tonic-gate 		ASSERT(ct->ct_regent == parent);
5520Sstevel@tonic-gate 		contract_process_take(parent, ct);
5530Sstevel@tonic-gate 
5540Sstevel@tonic-gate 		/*
5550Sstevel@tonic-gate 		 * We are handing off the process's reference to the
5560Sstevel@tonic-gate 		 * parent contract.  For this reason, the order in
5570Sstevel@tonic-gate 		 * which we drop the contract locks is also important.
5580Sstevel@tonic-gate 		 */
5590Sstevel@tonic-gate 		mutex_exit(&ct->ct_lock);
5600Sstevel@tonic-gate 		mutex_exit(&parent->ct_lock);
5610Sstevel@tonic-gate 	} else {
5620Sstevel@tonic-gate 		ct->ct_regent = NULL;
5630Sstevel@tonic-gate 		ct->ct_type->ct_type_ops->contop_abandon(ct);
5640Sstevel@tonic-gate 	}
5650Sstevel@tonic-gate 
5660Sstevel@tonic-gate 	/*
5670Sstevel@tonic-gate 	 * ct_lock has been dropped; we can safely trim the event
5680Sstevel@tonic-gate 	 * queue now.
5690Sstevel@tonic-gate 	 */
5700Sstevel@tonic-gate 	if (q) {
5710Sstevel@tonic-gate 		mutex_enter(&q->ctq_lock);
5720Sstevel@tonic-gate 		cte_trim(q, ct);
5730Sstevel@tonic-gate 		mutex_exit(&q->ctq_lock);
5740Sstevel@tonic-gate 	}
5750Sstevel@tonic-gate 
5760Sstevel@tonic-gate 	contract_rele(ct);
5770Sstevel@tonic-gate 
5780Sstevel@tonic-gate 	return (0);
5790Sstevel@tonic-gate }
5800Sstevel@tonic-gate 
5814845Svikram int
5824845Svikram contract_newct(contract_t *ct)
5834845Svikram {
5844845Svikram 	return (ct->ct_type->ct_type_ops->contop_newct(ct));
5854845Svikram }
5864845Svikram 
5870Sstevel@tonic-gate /*
5880Sstevel@tonic-gate  * contract_adopt
5890Sstevel@tonic-gate  *
5900Sstevel@tonic-gate  * Adopts a contract.  After a successful call to this routine, the
5910Sstevel@tonic-gate  * previously inherited contract will belong to the calling process,
5920Sstevel@tonic-gate  * and its events will have been appended to its new owner's process
5930Sstevel@tonic-gate  * bundle queue.
5940Sstevel@tonic-gate  */
5950Sstevel@tonic-gate int
5960Sstevel@tonic-gate contract_adopt(contract_t *ct, proc_t *p)
5970Sstevel@tonic-gate {
5980Sstevel@tonic-gate 	avl_index_t where;
5990Sstevel@tonic-gate 	ct_equeue_t *q;
6000Sstevel@tonic-gate 	contract_t *parent;
6010Sstevel@tonic-gate 
6020Sstevel@tonic-gate 	ASSERT(p == curproc);
6030Sstevel@tonic-gate 
6040Sstevel@tonic-gate 	/*
6050Sstevel@tonic-gate 	 * Ensure the process has an event queue.  Checked by ASSERTs
6060Sstevel@tonic-gate 	 * below.
6070Sstevel@tonic-gate 	 */
6080Sstevel@tonic-gate 	(void) contract_type_pbundle(ct->ct_type, p);
6090Sstevel@tonic-gate 
6100Sstevel@tonic-gate 	mutex_enter(&ct->ct_lock);
6110Sstevel@tonic-gate 	parent = ct->ct_regent;
6120Sstevel@tonic-gate 	if (ct->ct_state != CTS_INHERITED ||
6130Sstevel@tonic-gate 	    &p->p_ct_process->conp_contract != parent ||
6140Sstevel@tonic-gate 	    p->p_zone->zone_uniqid != ct->ct_czuniqid) {
6150Sstevel@tonic-gate 		mutex_exit(&ct->ct_lock);
6160Sstevel@tonic-gate 		return (EINVAL);
6170Sstevel@tonic-gate 	}
6180Sstevel@tonic-gate 
6190Sstevel@tonic-gate 	/*
6200Sstevel@tonic-gate 	 * Multiple contract locks are taken contract -> subcontract.
6210Sstevel@tonic-gate 	 */
6220Sstevel@tonic-gate 	mutex_exit(&ct->ct_lock);
6230Sstevel@tonic-gate 	mutex_enter(&parent->ct_lock);
6240Sstevel@tonic-gate 	mutex_enter(&ct->ct_lock);
6250Sstevel@tonic-gate 
6260Sstevel@tonic-gate 	/*
6270Sstevel@tonic-gate 	 * It is possible that the contract was adopted by someone else
6280Sstevel@tonic-gate 	 * while its lock was dropped.  It isn't possible for the
6290Sstevel@tonic-gate 	 * contract to have been inherited by a different regent
6300Sstevel@tonic-gate 	 * contract.
6310Sstevel@tonic-gate 	 */
6320Sstevel@tonic-gate 	if (ct->ct_state != CTS_INHERITED) {
6330Sstevel@tonic-gate 		mutex_exit(&parent->ct_lock);
6340Sstevel@tonic-gate 		mutex_exit(&ct->ct_lock);
6350Sstevel@tonic-gate 		return (EBUSY);
6360Sstevel@tonic-gate 	}
6370Sstevel@tonic-gate 	ASSERT(ct->ct_regent == parent);
6380Sstevel@tonic-gate 
6390Sstevel@tonic-gate 	ct->ct_state = CTS_OWNED;
6400Sstevel@tonic-gate 
6410Sstevel@tonic-gate 	contract_process_adopt(ct, p);
6420Sstevel@tonic-gate 
6430Sstevel@tonic-gate 	mutex_enter(&p->p_lock);
6440Sstevel@tonic-gate 	ct->ct_owner = p;
6450Sstevel@tonic-gate 	VERIFY(avl_find(&p->p_ct_held, ct, &where) == NULL);
6460Sstevel@tonic-gate 	avl_insert(&p->p_ct_held, ct, where);
6470Sstevel@tonic-gate 	mutex_exit(&p->p_lock);
6480Sstevel@tonic-gate 
6490Sstevel@tonic-gate 	ASSERT(ct->ct_owner->p_ct_equeue);
6500Sstevel@tonic-gate 	ASSERT(ct->ct_owner->p_ct_equeue[ct->ct_type->ct_type_index]);
6510Sstevel@tonic-gate 	q = ct->ct_owner->p_ct_equeue[ct->ct_type->ct_type_index];
6520Sstevel@tonic-gate 	cte_copy(&ct->ct_events, q);
6530Sstevel@tonic-gate 	mutex_exit(&ct->ct_lock);
6540Sstevel@tonic-gate 
6550Sstevel@tonic-gate 	return (0);
6560Sstevel@tonic-gate }
6570Sstevel@tonic-gate 
6580Sstevel@tonic-gate /*
6590Sstevel@tonic-gate  * contract_ack
6600Sstevel@tonic-gate  *
6610Sstevel@tonic-gate  * Acknowledges receipt of a critical event.
6620Sstevel@tonic-gate  */
6630Sstevel@tonic-gate int
6644845Svikram contract_ack(contract_t *ct, uint64_t evid, int ack)
6650Sstevel@tonic-gate {
6660Sstevel@tonic-gate 	ct_kevent_t *ev;
6670Sstevel@tonic-gate 	list_t *queue = &ct->ct_events.ctq_events;
6680Sstevel@tonic-gate 	int error = ESRCH;
6694845Svikram 	int nego = 0;
6704845Svikram 	uint_t evtype;
6714845Svikram 
6724845Svikram 	ASSERT(ack == CT_ACK || ack == CT_NACK);
6730Sstevel@tonic-gate 
6740Sstevel@tonic-gate 	mutex_enter(&ct->ct_lock);
6750Sstevel@tonic-gate 	mutex_enter(&ct->ct_events.ctq_lock);
6760Sstevel@tonic-gate 	/*
6770Sstevel@tonic-gate 	 * We are probably ACKing something near the head of the queue.
6780Sstevel@tonic-gate 	 */
6790Sstevel@tonic-gate 	for (ev = list_head(queue); ev; ev = list_next(queue, ev)) {
6800Sstevel@tonic-gate 		if (ev->cte_id == evid) {
6814845Svikram 			if (ev->cte_flags & CTE_NEG)
6824845Svikram 				nego = 1;
6834845Svikram 			else if (ack == CT_NACK)
6844845Svikram 				break;
6850Sstevel@tonic-gate 			if ((ev->cte_flags & (CTE_INFO | CTE_ACK)) == 0) {
6860Sstevel@tonic-gate 				ev->cte_flags |= CTE_ACK;
6870Sstevel@tonic-gate 				ct->ct_evcnt--;
6884845Svikram 				evtype = ev->cte_type;
6890Sstevel@tonic-gate 				error = 0;
6900Sstevel@tonic-gate 			}
6910Sstevel@tonic-gate 			break;
6920Sstevel@tonic-gate 		}
6930Sstevel@tonic-gate 	}
6940Sstevel@tonic-gate 	mutex_exit(&ct->ct_events.ctq_lock);
6950Sstevel@tonic-gate 	mutex_exit(&ct->ct_lock);
6960Sstevel@tonic-gate 
6974845Svikram 	/*
6984845Svikram 	 * Not all critical events are negotiation events, however
6994845Svikram 	 * every negotiation event is a critical event. NEGEND events
7004845Svikram 	 * are critical events but are not negotiation events
7014845Svikram 	 */
7024845Svikram 	if (error || !nego)
7034845Svikram 		return (error);
7044845Svikram 
7054845Svikram 	if (ack == CT_ACK)
7064845Svikram 		error = ct->ct_type->ct_type_ops->contop_ack(ct, evtype, evid);
7074845Svikram 	else
7084845Svikram 		error = ct->ct_type->ct_type_ops->contop_nack(ct, evtype, evid);
7094845Svikram 
7100Sstevel@tonic-gate 	return (error);
7110Sstevel@tonic-gate }
7120Sstevel@tonic-gate 
7134845Svikram /*ARGSUSED*/
7144845Svikram int
7154845Svikram contract_ack_inval(contract_t *ct, uint_t evtype, uint64_t evid)
7164845Svikram {
7174845Svikram 	cmn_err(CE_PANIC, "contract_ack_inval: unsupported call: ctid: %u",
7184845Svikram 	    ct->ct_id);
7194845Svikram 	return (ENOSYS);
7204845Svikram }
7214845Svikram 
7224845Svikram /*ARGSUSED*/
7234845Svikram int
7244845Svikram contract_qack_inval(contract_t *ct, uint_t evtype, uint64_t evid)
7254845Svikram {
7264845Svikram 	cmn_err(CE_PANIC, "contract_ack_inval: unsupported call: ctid: %u",
7274845Svikram 	    ct->ct_id);
7284845Svikram 	return (ENOSYS);
7294845Svikram }
7304845Svikram 
7314845Svikram /*ARGSUSED*/
7324845Svikram int
7334845Svikram contract_qack_notsup(contract_t *ct, uint_t evtype, uint64_t evid)
7344845Svikram {
7354845Svikram 	return (ERANGE);
7364845Svikram }
7374845Svikram 
7384845Svikram /*
7394845Svikram  * contract_qack
7404845Svikram  *
7414845Svikram  * Asks that negotiations be extended by another time quantum
7424845Svikram  */
7434845Svikram int
7444845Svikram contract_qack(contract_t *ct, uint64_t evid)
7454845Svikram {
7464845Svikram 	ct_kevent_t *ev;
7474845Svikram 	list_t *queue = &ct->ct_events.ctq_events;
7484845Svikram 	int nego = 0;
7494845Svikram 	uint_t evtype;
7504845Svikram 
7514845Svikram 	mutex_enter(&ct->ct_lock);
7524845Svikram 	mutex_enter(&ct->ct_events.ctq_lock);
7534845Svikram 
7544845Svikram 	for (ev = list_head(queue); ev; ev = list_next(queue, ev)) {
7554845Svikram 		if (ev->cte_id == evid) {
7564845Svikram 			if ((ev->cte_flags & (CTE_NEG | CTE_ACK)) == CTE_NEG) {
7574845Svikram 				evtype = ev->cte_type;
7584845Svikram 				nego = 1;
7594845Svikram 			}
7604845Svikram 			break;
7614845Svikram 		}
7624845Svikram 	}
7634845Svikram 	mutex_exit(&ct->ct_events.ctq_lock);
7644845Svikram 	mutex_exit(&ct->ct_lock);
7654845Svikram 
7664845Svikram 	/*
7674845Svikram 	 * Only a negotiated event (which is by definition also a critical
7684845Svikram 	 * event) which has not yet been acknowledged can provide
7694845Svikram 	 * time quanta to a negotiating owner process.
7704845Svikram 	 */
7714845Svikram 	if (!nego)
7724845Svikram 		return (ESRCH);
7734845Svikram 
7744845Svikram 	return (ct->ct_type->ct_type_ops->contop_qack(ct, evtype, evid));
7754845Svikram }
7764845Svikram 
7770Sstevel@tonic-gate /*
7780Sstevel@tonic-gate  * contract_orphan
7790Sstevel@tonic-gate  *
7800Sstevel@tonic-gate  * Icky-poo.  This is a process-contract special, used to ACK all
7810Sstevel@tonic-gate  * critical messages when a contract is orphaned.
7820Sstevel@tonic-gate  */
7830Sstevel@tonic-gate void
7840Sstevel@tonic-gate contract_orphan(contract_t *ct)
7850Sstevel@tonic-gate {
7860Sstevel@tonic-gate 	ct_kevent_t *ev;
7870Sstevel@tonic-gate 	list_t *queue = &ct->ct_events.ctq_events;
7880Sstevel@tonic-gate 
7890Sstevel@tonic-gate 	ASSERT(MUTEX_HELD(&ct->ct_lock));
7900Sstevel@tonic-gate 	ASSERT(ct->ct_state != CTS_ORPHAN);
7910Sstevel@tonic-gate 
7920Sstevel@tonic-gate 	mutex_enter(&ct->ct_events.ctq_lock);
7930Sstevel@tonic-gate 	ct->ct_state = CTS_ORPHAN;
7940Sstevel@tonic-gate 	for (ev = list_head(queue); ev; ev = list_next(queue, ev)) {
7950Sstevel@tonic-gate 		if ((ev->cte_flags & (CTE_INFO | CTE_ACK)) == 0) {
7960Sstevel@tonic-gate 			ev->cte_flags |= CTE_ACK;
7970Sstevel@tonic-gate 			ct->ct_evcnt--;
7980Sstevel@tonic-gate 		}
7990Sstevel@tonic-gate 	}
8000Sstevel@tonic-gate 	mutex_exit(&ct->ct_events.ctq_lock);
8010Sstevel@tonic-gate 
8020Sstevel@tonic-gate 	ASSERT(ct->ct_evcnt == 0);
8030Sstevel@tonic-gate }
8040Sstevel@tonic-gate 
8050Sstevel@tonic-gate /*
8060Sstevel@tonic-gate  * contract_destroy
8070Sstevel@tonic-gate  *
8080Sstevel@tonic-gate  * Explicit contract destruction.  Called when contract is empty.
8090Sstevel@tonic-gate  * The contract will actually stick around until all of its events are
8100Sstevel@tonic-gate  * removed from the bundle and and process bundle queues, and all fds
8110Sstevel@tonic-gate  * which refer to it are closed.  See contract_dtor if you are looking
8120Sstevel@tonic-gate  * for what destroys the contract structure.
8130Sstevel@tonic-gate  */
8140Sstevel@tonic-gate void
8150Sstevel@tonic-gate contract_destroy(contract_t *ct)
8160Sstevel@tonic-gate {
8170Sstevel@tonic-gate 	ASSERT(MUTEX_HELD(&ct->ct_lock));
8180Sstevel@tonic-gate 	ASSERT(ct->ct_state != CTS_DEAD);
8190Sstevel@tonic-gate 	ASSERT(ct->ct_owner == NULL);
8200Sstevel@tonic-gate 
8210Sstevel@tonic-gate 	ct->ct_state = CTS_DEAD;
8220Sstevel@tonic-gate 	cte_queue_drain(&ct->ct_events, 1);
8230Sstevel@tonic-gate 	mutex_exit(&ct->ct_lock);
8240Sstevel@tonic-gate 	mutex_enter(&ct->ct_type->ct_type_events.ctq_lock);
8250Sstevel@tonic-gate 	cte_trim(&ct->ct_type->ct_type_events, ct);
8260Sstevel@tonic-gate 	mutex_exit(&ct->ct_type->ct_type_events.ctq_lock);
8270Sstevel@tonic-gate 	mutex_enter(&ct->ct_lock);
8280Sstevel@tonic-gate 	ct->ct_type->ct_type_ops->contop_destroy(ct);
8290Sstevel@tonic-gate 	mutex_exit(&ct->ct_lock);
8300Sstevel@tonic-gate 	contract_rele(ct);
8310Sstevel@tonic-gate }
8320Sstevel@tonic-gate 
8330Sstevel@tonic-gate /*
8340Sstevel@tonic-gate  * contract_vnode_get
8350Sstevel@tonic-gate  *
8360Sstevel@tonic-gate  * Obtains the contract directory vnode for this contract, if there is
8370Sstevel@tonic-gate  * one.  The caller must VN_RELE the vnode when they are through using
8380Sstevel@tonic-gate  * it.
8390Sstevel@tonic-gate  */
8400Sstevel@tonic-gate vnode_t *
8410Sstevel@tonic-gate contract_vnode_get(contract_t *ct, vfs_t *vfsp)
8420Sstevel@tonic-gate {
8430Sstevel@tonic-gate 	contract_vnode_t *ctv;
8440Sstevel@tonic-gate 	vnode_t *vp = NULL;
8450Sstevel@tonic-gate 
8460Sstevel@tonic-gate 	mutex_enter(&ct->ct_lock);
8470Sstevel@tonic-gate 	for (ctv = list_head(&ct->ct_vnodes); ctv != NULL;
8480Sstevel@tonic-gate 	    ctv = list_next(&ct->ct_vnodes, ctv))
8490Sstevel@tonic-gate 		if (ctv->ctv_vnode->v_vfsp == vfsp) {
8500Sstevel@tonic-gate 			vp = ctv->ctv_vnode;
8510Sstevel@tonic-gate 			VN_HOLD(vp);
8520Sstevel@tonic-gate 			break;
8530Sstevel@tonic-gate 		}
8540Sstevel@tonic-gate 	mutex_exit(&ct->ct_lock);
8550Sstevel@tonic-gate 	return (vp);
8560Sstevel@tonic-gate }
8570Sstevel@tonic-gate 
8580Sstevel@tonic-gate /*
8590Sstevel@tonic-gate  * contract_vnode_set
8600Sstevel@tonic-gate  *
8610Sstevel@tonic-gate  * Sets the contract directory vnode for this contract.  We don't hold
8620Sstevel@tonic-gate  * a reference on the vnode because we don't want to prevent it from
8630Sstevel@tonic-gate  * being freed.  The vnode's inactive entry point will take care of
8640Sstevel@tonic-gate  * notifying us when it should be removed.
8650Sstevel@tonic-gate  */
8660Sstevel@tonic-gate void
8670Sstevel@tonic-gate contract_vnode_set(contract_t *ct, contract_vnode_t *ctv, vnode_t *vnode)
8680Sstevel@tonic-gate {
8690Sstevel@tonic-gate 	mutex_enter(&ct->ct_lock);
8700Sstevel@tonic-gate 	ctv->ctv_vnode = vnode;
8710Sstevel@tonic-gate 	list_insert_head(&ct->ct_vnodes, ctv);
8720Sstevel@tonic-gate 	mutex_exit(&ct->ct_lock);
8730Sstevel@tonic-gate }
8740Sstevel@tonic-gate 
8750Sstevel@tonic-gate /*
8760Sstevel@tonic-gate  * contract_vnode_clear
8770Sstevel@tonic-gate  *
8780Sstevel@tonic-gate  * Removes this vnode as the contract directory vnode for this
8790Sstevel@tonic-gate  * contract.  Called from a contract directory's inactive entry point,
8800Sstevel@tonic-gate  * this may return 0 indicating that the vnode gained another reference
8810Sstevel@tonic-gate  * because of a simultaneous call to contract_vnode_get.
8820Sstevel@tonic-gate  */
8830Sstevel@tonic-gate int
8840Sstevel@tonic-gate contract_vnode_clear(contract_t *ct, contract_vnode_t *ctv)
8850Sstevel@tonic-gate {
8860Sstevel@tonic-gate 	vnode_t *vp = ctv->ctv_vnode;
8870Sstevel@tonic-gate 	int result;
8880Sstevel@tonic-gate 
8890Sstevel@tonic-gate 	mutex_enter(&ct->ct_lock);
8900Sstevel@tonic-gate 	mutex_enter(&vp->v_lock);
8910Sstevel@tonic-gate 	if (vp->v_count == 1) {
8920Sstevel@tonic-gate 		list_remove(&ct->ct_vnodes, ctv);
8930Sstevel@tonic-gate 		result = 1;
8940Sstevel@tonic-gate 	} else {
8950Sstevel@tonic-gate 		vp->v_count--;
8960Sstevel@tonic-gate 		result = 0;
8970Sstevel@tonic-gate 	}
8980Sstevel@tonic-gate 	mutex_exit(&vp->v_lock);
8990Sstevel@tonic-gate 	mutex_exit(&ct->ct_lock);
9000Sstevel@tonic-gate 
9010Sstevel@tonic-gate 	return (result);
9020Sstevel@tonic-gate }
9030Sstevel@tonic-gate 
9040Sstevel@tonic-gate /*
9050Sstevel@tonic-gate  * contract_exit
9060Sstevel@tonic-gate  *
9070Sstevel@tonic-gate  * Abandons all contracts held by process p, and drains process p's
9080Sstevel@tonic-gate  * bundle queues.  Called on process exit.
9090Sstevel@tonic-gate  */
9100Sstevel@tonic-gate void
9110Sstevel@tonic-gate contract_exit(proc_t *p)
9120Sstevel@tonic-gate {
9130Sstevel@tonic-gate 	contract_t *ct;
9140Sstevel@tonic-gate 	void *cookie = NULL;
9150Sstevel@tonic-gate 	int i;
9160Sstevel@tonic-gate 
9170Sstevel@tonic-gate 	ASSERT(p == curproc);
9180Sstevel@tonic-gate 
9190Sstevel@tonic-gate 	/*
9200Sstevel@tonic-gate 	 * Abandon held contracts.  contract_abandon knows enough not
9210Sstevel@tonic-gate 	 * to remove the contract from the list a second time.  We are
9220Sstevel@tonic-gate 	 * exiting, so no locks are needed here.  But because
9230Sstevel@tonic-gate 	 * contract_abandon will take p_lock, we need to make sure we
9240Sstevel@tonic-gate 	 * aren't holding it.
9250Sstevel@tonic-gate 	 */
9260Sstevel@tonic-gate 	ASSERT(MUTEX_NOT_HELD(&p->p_lock));
9270Sstevel@tonic-gate 	while ((ct = avl_destroy_nodes(&p->p_ct_held, &cookie)) != NULL)
9280Sstevel@tonic-gate 		VERIFY(contract_abandon(ct, p, 0) == 0);
9290Sstevel@tonic-gate 
9300Sstevel@tonic-gate 	/*
9310Sstevel@tonic-gate 	 * Drain pbundles.  Because a process bundle queue could have
9320Sstevel@tonic-gate 	 * been passed to another process, they may not be freed right
9330Sstevel@tonic-gate 	 * away.
9340Sstevel@tonic-gate 	 */
9350Sstevel@tonic-gate 	if (p->p_ct_equeue) {
9360Sstevel@tonic-gate 		for (i = 0; i < CTT_MAXTYPE; i++)
9370Sstevel@tonic-gate 			if (p->p_ct_equeue[i])
9380Sstevel@tonic-gate 				cte_queue_drain(p->p_ct_equeue[i], 0);
9390Sstevel@tonic-gate 		kmem_free(p->p_ct_equeue, CTT_MAXTYPE * sizeof (ct_equeue_t *));
9400Sstevel@tonic-gate 	}
9410Sstevel@tonic-gate }
9420Sstevel@tonic-gate 
9434845Svikram static int
9444845Svikram get_time_left(struct ct_time *t)
9454845Svikram {
9464845Svikram 	clock_t ticks_elapsed;
9474845Svikram 	int secs_elapsed;
9484845Svikram 
9494845Svikram 	if (t->ctm_total == -1)
9504845Svikram 		return (-1);
9514845Svikram 
9524845Svikram 	ticks_elapsed = ddi_get_lbolt() - t->ctm_start;
9534845Svikram 	secs_elapsed = t->ctm_total - (drv_hztousec(ticks_elapsed)/MICROSEC);
9544845Svikram 	return (secs_elapsed > 0 ? secs_elapsed : 0);
9554845Svikram }
9564845Svikram 
9570Sstevel@tonic-gate /*
9580Sstevel@tonic-gate  * contract_status_common
9590Sstevel@tonic-gate  *
9600Sstevel@tonic-gate  * Populates a ct_status structure.  Used by contract types in their
9610Sstevel@tonic-gate  * status entry points and ctfs when only common information is
9620Sstevel@tonic-gate  * requested.
9630Sstevel@tonic-gate  */
9640Sstevel@tonic-gate void
9650Sstevel@tonic-gate contract_status_common(contract_t *ct, zone_t *zone, void *status,
9660Sstevel@tonic-gate     model_t model)
9670Sstevel@tonic-gate {
9680Sstevel@tonic-gate 	STRUCT_HANDLE(ct_status, lstatus);
9690Sstevel@tonic-gate 
9700Sstevel@tonic-gate 	STRUCT_SET_HANDLE(lstatus, model, status);
9710Sstevel@tonic-gate 	ASSERT(MUTEX_HELD(&ct->ct_lock));
9720Sstevel@tonic-gate 	if (zone->zone_uniqid == GLOBAL_ZONEUNIQID ||
9730Sstevel@tonic-gate 	    zone->zone_uniqid == ct->ct_czuniqid) {
9740Sstevel@tonic-gate 		zone_t *czone;
9750Sstevel@tonic-gate 		zoneid_t zoneid = -1;
9760Sstevel@tonic-gate 
9770Sstevel@tonic-gate 		/*
9780Sstevel@tonic-gate 		 * Contracts don't have holds on the zones they were
9790Sstevel@tonic-gate 		 * created by.  If the contract's zone no longer
9800Sstevel@tonic-gate 		 * exists, we say its zoneid is -1.
9810Sstevel@tonic-gate 		 */
9820Sstevel@tonic-gate 		if (zone->zone_uniqid == ct->ct_czuniqid ||
9830Sstevel@tonic-gate 		    ct->ct_czuniqid == GLOBAL_ZONEUNIQID) {
9840Sstevel@tonic-gate 			zoneid = ct->ct_zoneid;
9850Sstevel@tonic-gate 		} else if ((czone = zone_find_by_id(ct->ct_zoneid)) != NULL) {
9860Sstevel@tonic-gate 			if (czone->zone_uniqid == ct->ct_mzuniqid)
9870Sstevel@tonic-gate 				zoneid = ct->ct_zoneid;
9880Sstevel@tonic-gate 			zone_rele(czone);
9890Sstevel@tonic-gate 		}
9900Sstevel@tonic-gate 
9910Sstevel@tonic-gate 		STRUCT_FSET(lstatus, ctst_zoneid, zoneid);
9920Sstevel@tonic-gate 		STRUCT_FSET(lstatus, ctst_holder,
9930Sstevel@tonic-gate 		    (ct->ct_state == CTS_OWNED) ? ct->ct_owner->p_pid :
9940Sstevel@tonic-gate 		    (ct->ct_state == CTS_INHERITED) ? ct->ct_regent->ct_id : 0);
9950Sstevel@tonic-gate 		STRUCT_FSET(lstatus, ctst_state, ct->ct_state);
9960Sstevel@tonic-gate 	} else {
9970Sstevel@tonic-gate 		/*
9980Sstevel@tonic-gate 		 * We are looking at a contract which was created by a
9990Sstevel@tonic-gate 		 * process outside of our zone.  We provide fake zone,
10000Sstevel@tonic-gate 		 * holder, and state information.
10010Sstevel@tonic-gate 		 */
10020Sstevel@tonic-gate 
10030Sstevel@tonic-gate 		STRUCT_FSET(lstatus, ctst_zoneid, zone->zone_id);
10040Sstevel@tonic-gate 		/*
10050Sstevel@tonic-gate 		 * Since "zone" can't disappear until the calling ctfs
10060Sstevel@tonic-gate 		 * is unmounted, zone_zsched must be valid.
10070Sstevel@tonic-gate 		 */
10080Sstevel@tonic-gate 		STRUCT_FSET(lstatus, ctst_holder, (ct->ct_state < CTS_ORPHAN) ?
10090Sstevel@tonic-gate 		    zone->zone_zsched->p_pid : 0);
10100Sstevel@tonic-gate 		STRUCT_FSET(lstatus, ctst_state, (ct->ct_state < CTS_ORPHAN) ?
10110Sstevel@tonic-gate 		    CTS_OWNED : ct->ct_state);
10120Sstevel@tonic-gate 	}
10130Sstevel@tonic-gate 	STRUCT_FSET(lstatus, ctst_nevents, ct->ct_evcnt);
10144845Svikram 	STRUCT_FSET(lstatus, ctst_ntime, get_time_left(&ct->ct_ntime));
10154845Svikram 	STRUCT_FSET(lstatus, ctst_qtime, get_time_left(&ct->ct_qtime));
10160Sstevel@tonic-gate 	STRUCT_FSET(lstatus, ctst_nevid,
10170Sstevel@tonic-gate 	    ct->ct_nevent ? ct->ct_nevent->cte_id : 0);
10180Sstevel@tonic-gate 	STRUCT_FSET(lstatus, ctst_critical, ct->ct_ev_crit);
10190Sstevel@tonic-gate 	STRUCT_FSET(lstatus, ctst_informative, ct->ct_ev_info);
10200Sstevel@tonic-gate 	STRUCT_FSET(lstatus, ctst_cookie, ct->ct_cookie);
10210Sstevel@tonic-gate 	STRUCT_FSET(lstatus, ctst_type, ct->ct_type->ct_type_index);
10220Sstevel@tonic-gate 	STRUCT_FSET(lstatus, ctst_id, ct->ct_id);
10230Sstevel@tonic-gate }
10240Sstevel@tonic-gate 
10250Sstevel@tonic-gate /*
10260Sstevel@tonic-gate  * contract_checkcred
10270Sstevel@tonic-gate  *
10280Sstevel@tonic-gate  * Determines if the specified contract is owned by a process with the
10290Sstevel@tonic-gate  * same effective uid as the specified credential.  The caller must
10300Sstevel@tonic-gate  * ensure that the uid spaces are the same.  Returns 1 on success.
10310Sstevel@tonic-gate  */
10320Sstevel@tonic-gate static int
10330Sstevel@tonic-gate contract_checkcred(contract_t *ct, const cred_t *cr)
10340Sstevel@tonic-gate {
10350Sstevel@tonic-gate 	proc_t *p;
10360Sstevel@tonic-gate 	int fail = 1;
10370Sstevel@tonic-gate 
10380Sstevel@tonic-gate 	mutex_enter(&ct->ct_lock);
10390Sstevel@tonic-gate 	if ((p = ct->ct_owner) != NULL) {
10400Sstevel@tonic-gate 		mutex_enter(&p->p_crlock);
10410Sstevel@tonic-gate 		fail = crgetuid(cr) != crgetuid(p->p_cred);
10420Sstevel@tonic-gate 		mutex_exit(&p->p_crlock);
10430Sstevel@tonic-gate 	}
10440Sstevel@tonic-gate 	mutex_exit(&ct->ct_lock);
10450Sstevel@tonic-gate 
10460Sstevel@tonic-gate 	return (!fail);
10470Sstevel@tonic-gate }
10480Sstevel@tonic-gate 
10490Sstevel@tonic-gate /*
10500Sstevel@tonic-gate  * contract_owned
10510Sstevel@tonic-gate  *
10520Sstevel@tonic-gate  * Determines if the specified credential can view an event generated
10530Sstevel@tonic-gate  * by the specified contract.  If locked is set, the contract's ct_lock
10540Sstevel@tonic-gate  * is held and the caller will need to do additional work to determine
10550Sstevel@tonic-gate  * if they truly can see the event.  Returns 1 on success.
10560Sstevel@tonic-gate  */
10570Sstevel@tonic-gate int
10580Sstevel@tonic-gate contract_owned(contract_t *ct, const cred_t *cr, int locked)
10590Sstevel@tonic-gate {
10600Sstevel@tonic-gate 	int owner, cmatch, zmatch;
10610Sstevel@tonic-gate 	uint64_t zuniqid, mzuniqid;
10620Sstevel@tonic-gate 	uid_t euid;
10630Sstevel@tonic-gate 
10640Sstevel@tonic-gate 	ASSERT(locked || MUTEX_NOT_HELD(&ct->ct_lock));
10650Sstevel@tonic-gate 
10660Sstevel@tonic-gate 	zuniqid = curproc->p_zone->zone_uniqid;
10670Sstevel@tonic-gate 	mzuniqid = contract_getzuniqid(ct);
10680Sstevel@tonic-gate 	euid = crgetuid(cr);
10690Sstevel@tonic-gate 
10700Sstevel@tonic-gate 	/*
10710Sstevel@tonic-gate 	 * owner: we own the contract
10720Sstevel@tonic-gate 	 * cmatch: we are in the creator's (and holder's) zone and our
10730Sstevel@tonic-gate 	 *   uid matches the creator's or holder's
10740Sstevel@tonic-gate 	 * zmatch: we are in the effective zone of a contract created
10750Sstevel@tonic-gate 	 *   in the global zone, and our uid matches that of the
10760Sstevel@tonic-gate 	 *   virtualized holder's (zsched/kcred)
10770Sstevel@tonic-gate 	 */
10780Sstevel@tonic-gate 	owner = (ct->ct_owner == curproc);
10790Sstevel@tonic-gate 	cmatch = (zuniqid == ct->ct_czuniqid) &&
10800Sstevel@tonic-gate 	    ((ct->ct_cuid == euid) || (!locked && contract_checkcred(ct, cr)));
10810Sstevel@tonic-gate 	zmatch = (ct->ct_czuniqid != mzuniqid) && (zuniqid == mzuniqid) &&
10820Sstevel@tonic-gate 	    (crgetuid(kcred) == euid);
10830Sstevel@tonic-gate 
10840Sstevel@tonic-gate 	return (owner || cmatch || zmatch);
10850Sstevel@tonic-gate }
10860Sstevel@tonic-gate 
10870Sstevel@tonic-gate 
10880Sstevel@tonic-gate /*
10890Sstevel@tonic-gate  * contract_type_init
10900Sstevel@tonic-gate  *
10910Sstevel@tonic-gate  * Called by contract types to register themselves with the contracts
10920Sstevel@tonic-gate  * framework.
10930Sstevel@tonic-gate  */
10940Sstevel@tonic-gate ct_type_t *
10950Sstevel@tonic-gate contract_type_init(ct_typeid_t type, const char *name, contops_t *ops,
10960Sstevel@tonic-gate     ct_f_default_t *dfault)
10970Sstevel@tonic-gate {
10980Sstevel@tonic-gate 	ct_type_t *result;
10990Sstevel@tonic-gate 
11000Sstevel@tonic-gate 	ASSERT(type < CTT_MAXTYPE);
11010Sstevel@tonic-gate 
11020Sstevel@tonic-gate 	result = kmem_alloc(sizeof (ct_type_t), KM_SLEEP);
11030Sstevel@tonic-gate 
11040Sstevel@tonic-gate 	mutex_init(&result->ct_type_lock, NULL, MUTEX_DEFAULT, NULL);
11050Sstevel@tonic-gate 	avl_create(&result->ct_type_avl, contract_compar, sizeof (contract_t),
11060Sstevel@tonic-gate 	    offsetof(contract_t, ct_cttavl));
11070Sstevel@tonic-gate 	cte_queue_create(&result->ct_type_events, CTEL_BUNDLE, 20, 0);
11080Sstevel@tonic-gate 	result->ct_type_name = name;
11090Sstevel@tonic-gate 	result->ct_type_ops = ops;
11100Sstevel@tonic-gate 	result->ct_type_default = dfault;
11110Sstevel@tonic-gate 	result->ct_type_evid = 0;
11120Sstevel@tonic-gate 	gethrestime(&result->ct_type_timestruc);
11130Sstevel@tonic-gate 	result->ct_type_index = type;
11140Sstevel@tonic-gate 
11150Sstevel@tonic-gate 	ct_types[type] = result;
11160Sstevel@tonic-gate 
11170Sstevel@tonic-gate 	return (result);
11180Sstevel@tonic-gate }
11190Sstevel@tonic-gate 
11200Sstevel@tonic-gate /*
11210Sstevel@tonic-gate  * contract_type_count
11220Sstevel@tonic-gate  *
11230Sstevel@tonic-gate  * Obtains the number of contracts of a particular type.
11240Sstevel@tonic-gate  */
11250Sstevel@tonic-gate int
11260Sstevel@tonic-gate contract_type_count(ct_type_t *type)
11270Sstevel@tonic-gate {
11280Sstevel@tonic-gate 	ulong_t count;
11290Sstevel@tonic-gate 
11300Sstevel@tonic-gate 	mutex_enter(&type->ct_type_lock);
11310Sstevel@tonic-gate 	count = avl_numnodes(&type->ct_type_avl);
11320Sstevel@tonic-gate 	mutex_exit(&type->ct_type_lock);
11330Sstevel@tonic-gate 
11340Sstevel@tonic-gate 	return (count);
11350Sstevel@tonic-gate }
11360Sstevel@tonic-gate 
11370Sstevel@tonic-gate /*
11380Sstevel@tonic-gate  * contract_type_max
11390Sstevel@tonic-gate  *
11400Sstevel@tonic-gate  * Obtains the maximum contract id of of a particular type.
11410Sstevel@tonic-gate  */
11420Sstevel@tonic-gate ctid_t
11430Sstevel@tonic-gate contract_type_max(ct_type_t *type)
11440Sstevel@tonic-gate {
11450Sstevel@tonic-gate 	contract_t *ct;
11460Sstevel@tonic-gate 	ctid_t res;
11470Sstevel@tonic-gate 
11480Sstevel@tonic-gate 	mutex_enter(&type->ct_type_lock);
11490Sstevel@tonic-gate 	ct = avl_last(&type->ct_type_avl);
11500Sstevel@tonic-gate 	res = ct ? ct->ct_id : -1;
11510Sstevel@tonic-gate 	mutex_exit(&type->ct_type_lock);
11520Sstevel@tonic-gate 
11530Sstevel@tonic-gate 	return (res);
11540Sstevel@tonic-gate }
11550Sstevel@tonic-gate 
11560Sstevel@tonic-gate /*
11570Sstevel@tonic-gate  * contract_max
11580Sstevel@tonic-gate  *
11590Sstevel@tonic-gate  * Obtains the maximum contract id.
11600Sstevel@tonic-gate  */
11610Sstevel@tonic-gate ctid_t
11620Sstevel@tonic-gate contract_max(void)
11630Sstevel@tonic-gate {
11640Sstevel@tonic-gate 	contract_t *ct;
11650Sstevel@tonic-gate 	ctid_t res;
11660Sstevel@tonic-gate 
11670Sstevel@tonic-gate 	mutex_enter(&contract_lock);
11680Sstevel@tonic-gate 	ct = avl_last(&contract_avl);
11690Sstevel@tonic-gate 	res = ct ? ct->ct_id : -1;
11700Sstevel@tonic-gate 	mutex_exit(&contract_lock);
11710Sstevel@tonic-gate 
11720Sstevel@tonic-gate 	return (res);
11730Sstevel@tonic-gate }
11740Sstevel@tonic-gate 
11750Sstevel@tonic-gate /*
11760Sstevel@tonic-gate  * contract_lookup_common
11770Sstevel@tonic-gate  *
11780Sstevel@tonic-gate  * Common code for contract_lookup and contract_type_lookup.  Takes a
11790Sstevel@tonic-gate  * pointer to an AVL tree to search in.  Should be called with the
11800Sstevel@tonic-gate  * appropriate tree-protecting lock held (unfortunately unassertable).
11810Sstevel@tonic-gate  */
11820Sstevel@tonic-gate static ctid_t
11830Sstevel@tonic-gate contract_lookup_common(avl_tree_t *tree, uint64_t zuniqid, ctid_t current)
11840Sstevel@tonic-gate {
11850Sstevel@tonic-gate 	contract_t template, *ct;
11860Sstevel@tonic-gate 	avl_index_t where;
11870Sstevel@tonic-gate 	ctid_t res;
11880Sstevel@tonic-gate 
11890Sstevel@tonic-gate 	template.ct_id = current;
11900Sstevel@tonic-gate 	ct = avl_find(tree, &template, &where);
11910Sstevel@tonic-gate 	if (ct == NULL)
11920Sstevel@tonic-gate 		ct = avl_nearest(tree, where, AVL_AFTER);
11930Sstevel@tonic-gate 	if (zuniqid != GLOBAL_ZONEUNIQID)
11940Sstevel@tonic-gate 		while (ct && (contract_getzuniqid(ct) != zuniqid))
11950Sstevel@tonic-gate 			ct = AVL_NEXT(tree, ct);
11960Sstevel@tonic-gate 	res = ct ? ct->ct_id : -1;
11970Sstevel@tonic-gate 
11980Sstevel@tonic-gate 	return (res);
11990Sstevel@tonic-gate }
12000Sstevel@tonic-gate 
12010Sstevel@tonic-gate /*
12020Sstevel@tonic-gate  * contract_type_lookup
12030Sstevel@tonic-gate  *
12040Sstevel@tonic-gate  * Returns the next type contract after the specified id, visible from
12050Sstevel@tonic-gate  * the specified zone.
12060Sstevel@tonic-gate  */
12070Sstevel@tonic-gate ctid_t
12080Sstevel@tonic-gate contract_type_lookup(ct_type_t *type, uint64_t zuniqid, ctid_t current)
12090Sstevel@tonic-gate {
12100Sstevel@tonic-gate 	ctid_t res;
12110Sstevel@tonic-gate 
12120Sstevel@tonic-gate 	mutex_enter(&type->ct_type_lock);
12130Sstevel@tonic-gate 	res = contract_lookup_common(&type->ct_type_avl, zuniqid, current);
12140Sstevel@tonic-gate 	mutex_exit(&type->ct_type_lock);
12150Sstevel@tonic-gate 
12160Sstevel@tonic-gate 	return (res);
12170Sstevel@tonic-gate }
12180Sstevel@tonic-gate 
12190Sstevel@tonic-gate /*
12200Sstevel@tonic-gate  * contract_lookup
12210Sstevel@tonic-gate  *
12220Sstevel@tonic-gate  * Returns the next contract after the specified id, visible from the
12230Sstevel@tonic-gate  * specified zone.
12240Sstevel@tonic-gate  */
12250Sstevel@tonic-gate ctid_t
12260Sstevel@tonic-gate contract_lookup(uint64_t zuniqid, ctid_t current)
12270Sstevel@tonic-gate {
12280Sstevel@tonic-gate 	ctid_t res;
12290Sstevel@tonic-gate 
12300Sstevel@tonic-gate 	mutex_enter(&contract_lock);
12310Sstevel@tonic-gate 	res = contract_lookup_common(&contract_avl, zuniqid, current);
12320Sstevel@tonic-gate 	mutex_exit(&contract_lock);
12330Sstevel@tonic-gate 
12340Sstevel@tonic-gate 	return (res);
12350Sstevel@tonic-gate }
12360Sstevel@tonic-gate 
12370Sstevel@tonic-gate /*
12380Sstevel@tonic-gate  * contract_plookup
12390Sstevel@tonic-gate  *
12400Sstevel@tonic-gate  * Returns the next contract held by process p after the specified id,
12410Sstevel@tonic-gate  * visible from the specified zone.  Made complicated by the fact that
12420Sstevel@tonic-gate  * contracts visible in a zone but held by processes outside of the
12430Sstevel@tonic-gate  * zone need to appear as being held by zsched to zone members.
12440Sstevel@tonic-gate  */
12450Sstevel@tonic-gate ctid_t
12460Sstevel@tonic-gate contract_plookup(proc_t *p, ctid_t current, uint64_t zuniqid)
12470Sstevel@tonic-gate {
12480Sstevel@tonic-gate 	contract_t template, *ct;
12490Sstevel@tonic-gate 	avl_index_t where;
12500Sstevel@tonic-gate 	ctid_t res;
12510Sstevel@tonic-gate 
12520Sstevel@tonic-gate 	template.ct_id = current;
12530Sstevel@tonic-gate 	if (zuniqid != GLOBAL_ZONEUNIQID &&
12540Sstevel@tonic-gate 	    (p->p_flag & (SSYS|SZONETOP)) == (SSYS|SZONETOP)) {
12550Sstevel@tonic-gate 		/* This is inelegant. */
12560Sstevel@tonic-gate 		mutex_enter(&contract_lock);
12570Sstevel@tonic-gate 		ct = avl_find(&contract_avl, &template, &where);
12580Sstevel@tonic-gate 		if (ct == NULL)
12590Sstevel@tonic-gate 			ct = avl_nearest(&contract_avl, where, AVL_AFTER);
12600Sstevel@tonic-gate 		while (ct && !(ct->ct_state < CTS_ORPHAN &&
12610Sstevel@tonic-gate 		    contract_getzuniqid(ct) == zuniqid &&
12620Sstevel@tonic-gate 		    ct->ct_czuniqid == GLOBAL_ZONEUNIQID))
12630Sstevel@tonic-gate 			ct = AVL_NEXT(&contract_avl, ct);
12640Sstevel@tonic-gate 		res = ct ? ct->ct_id : -1;
12650Sstevel@tonic-gate 		mutex_exit(&contract_lock);
12660Sstevel@tonic-gate 	} else {
12670Sstevel@tonic-gate 		mutex_enter(&p->p_lock);
12680Sstevel@tonic-gate 		ct = avl_find(&p->p_ct_held, &template, &where);
12690Sstevel@tonic-gate 		if (ct == NULL)
12700Sstevel@tonic-gate 			ct = avl_nearest(&p->p_ct_held, where, AVL_AFTER);
12710Sstevel@tonic-gate 		res = ct ? ct->ct_id : -1;
12720Sstevel@tonic-gate 		mutex_exit(&p->p_lock);
12730Sstevel@tonic-gate 	}
12740Sstevel@tonic-gate 
12750Sstevel@tonic-gate 	return (res);
12760Sstevel@tonic-gate }
12770Sstevel@tonic-gate 
12780Sstevel@tonic-gate /*
12790Sstevel@tonic-gate  * contract_ptr_common
12800Sstevel@tonic-gate  *
12810Sstevel@tonic-gate  * Common code for contract_ptr and contract_type_ptr.  Takes a pointer
12820Sstevel@tonic-gate  * to an AVL tree to search in.  Should be called with the appropriate
12830Sstevel@tonic-gate  * tree-protecting lock held (unfortunately unassertable).
12840Sstevel@tonic-gate  */
12850Sstevel@tonic-gate static contract_t *
12860Sstevel@tonic-gate contract_ptr_common(avl_tree_t *tree, ctid_t id, uint64_t zuniqid)
12870Sstevel@tonic-gate {
12880Sstevel@tonic-gate 	contract_t template, *ct;
12890Sstevel@tonic-gate 
12900Sstevel@tonic-gate 	template.ct_id = id;
12910Sstevel@tonic-gate 	ct = avl_find(tree, &template, NULL);
12920Sstevel@tonic-gate 	if (ct == NULL || (zuniqid != GLOBAL_ZONEUNIQID &&
12930Sstevel@tonic-gate 	    contract_getzuniqid(ct) != zuniqid)) {
12940Sstevel@tonic-gate 		return (NULL);
12950Sstevel@tonic-gate 	}
12960Sstevel@tonic-gate 
12970Sstevel@tonic-gate 	/*
12980Sstevel@tonic-gate 	 * Check to see if a thread is in the window in contract_rele
12990Sstevel@tonic-gate 	 * between dropping the reference count and removing the
13000Sstevel@tonic-gate 	 * contract from the type AVL.
13010Sstevel@tonic-gate 	 */
13020Sstevel@tonic-gate 	mutex_enter(&ct->ct_reflock);
13030Sstevel@tonic-gate 	if (ct->ct_ref) {
13040Sstevel@tonic-gate 		ct->ct_ref++;
13050Sstevel@tonic-gate 		mutex_exit(&ct->ct_reflock);
13060Sstevel@tonic-gate 	} else {
13070Sstevel@tonic-gate 		mutex_exit(&ct->ct_reflock);
13080Sstevel@tonic-gate 		ct = NULL;
13090Sstevel@tonic-gate 	}
13100Sstevel@tonic-gate 
13110Sstevel@tonic-gate 	return (ct);
13120Sstevel@tonic-gate }
13130Sstevel@tonic-gate 
13140Sstevel@tonic-gate /*
13150Sstevel@tonic-gate  * contract_type_ptr
13160Sstevel@tonic-gate  *
13170Sstevel@tonic-gate  * Returns a pointer to the contract with the specified id.  The
13180Sstevel@tonic-gate  * contract is held, so the caller needs to release the reference when
13190Sstevel@tonic-gate  * it is through with the contract.
13200Sstevel@tonic-gate  */
13210Sstevel@tonic-gate contract_t *
13220Sstevel@tonic-gate contract_type_ptr(ct_type_t *type, ctid_t id, uint64_t zuniqid)
13230Sstevel@tonic-gate {
13240Sstevel@tonic-gate 	contract_t *ct;
13250Sstevel@tonic-gate 
13260Sstevel@tonic-gate 	mutex_enter(&type->ct_type_lock);
13270Sstevel@tonic-gate 	ct = contract_ptr_common(&type->ct_type_avl, id, zuniqid);
13280Sstevel@tonic-gate 	mutex_exit(&type->ct_type_lock);
13290Sstevel@tonic-gate 
13300Sstevel@tonic-gate 	return (ct);
13310Sstevel@tonic-gate }
13320Sstevel@tonic-gate 
13330Sstevel@tonic-gate /*
13340Sstevel@tonic-gate  * contract_ptr
13350Sstevel@tonic-gate  *
13360Sstevel@tonic-gate  * Returns a pointer to the contract with the specified id.  The
13370Sstevel@tonic-gate  * contract is held, so the caller needs to release the reference when
13380Sstevel@tonic-gate  * it is through with the contract.
13390Sstevel@tonic-gate  */
13400Sstevel@tonic-gate contract_t *
13410Sstevel@tonic-gate contract_ptr(ctid_t id, uint64_t zuniqid)
13420Sstevel@tonic-gate {
13430Sstevel@tonic-gate 	contract_t *ct;
13440Sstevel@tonic-gate 
13450Sstevel@tonic-gate 	mutex_enter(&contract_lock);
13460Sstevel@tonic-gate 	ct = contract_ptr_common(&contract_avl, id, zuniqid);
13470Sstevel@tonic-gate 	mutex_exit(&contract_lock);
13480Sstevel@tonic-gate 
13490Sstevel@tonic-gate 	return (ct);
13500Sstevel@tonic-gate }
13510Sstevel@tonic-gate 
13520Sstevel@tonic-gate /*
13530Sstevel@tonic-gate  * contract_type_time
13540Sstevel@tonic-gate  *
13550Sstevel@tonic-gate  * Obtains the last time a contract of a particular type was created.
13560Sstevel@tonic-gate  */
13570Sstevel@tonic-gate void
13580Sstevel@tonic-gate contract_type_time(ct_type_t *type, timestruc_t *time)
13590Sstevel@tonic-gate {
13600Sstevel@tonic-gate 	mutex_enter(&type->ct_type_lock);
13610Sstevel@tonic-gate 	*time = type->ct_type_timestruc;
13620Sstevel@tonic-gate 	mutex_exit(&type->ct_type_lock);
13630Sstevel@tonic-gate }
13640Sstevel@tonic-gate 
13650Sstevel@tonic-gate /*
13660Sstevel@tonic-gate  * contract_type_bundle
13670Sstevel@tonic-gate  *
13680Sstevel@tonic-gate  * Obtains a type's bundle queue.
13690Sstevel@tonic-gate  */
13700Sstevel@tonic-gate ct_equeue_t *
13710Sstevel@tonic-gate contract_type_bundle(ct_type_t *type)
13720Sstevel@tonic-gate {
13730Sstevel@tonic-gate 	return (&type->ct_type_events);
13740Sstevel@tonic-gate }
13750Sstevel@tonic-gate 
13760Sstevel@tonic-gate /*
13770Sstevel@tonic-gate  * contract_type_pbundle
13780Sstevel@tonic-gate  *
13790Sstevel@tonic-gate  * Obtain's a process's bundle queue.  If one doesn't exist, one is
13800Sstevel@tonic-gate  * created.  Often used simply to ensure that a bundle queue is
13810Sstevel@tonic-gate  * allocated.
13820Sstevel@tonic-gate  */
13830Sstevel@tonic-gate ct_equeue_t *
13840Sstevel@tonic-gate contract_type_pbundle(ct_type_t *type, proc_t *pp)
13850Sstevel@tonic-gate {
13860Sstevel@tonic-gate 	/*
13870Sstevel@tonic-gate 	 * If there isn't an array of bundle queues, allocate one.
13880Sstevel@tonic-gate 	 */
13890Sstevel@tonic-gate 	if (pp->p_ct_equeue == NULL) {
13900Sstevel@tonic-gate 		size_t size = CTT_MAXTYPE * sizeof (ct_equeue_t *);
13910Sstevel@tonic-gate 		ct_equeue_t **qa = kmem_zalloc(size, KM_SLEEP);
13920Sstevel@tonic-gate 
13930Sstevel@tonic-gate 		mutex_enter(&pp->p_lock);
13940Sstevel@tonic-gate 		if (pp->p_ct_equeue)
13950Sstevel@tonic-gate 			kmem_free(qa, size);
13960Sstevel@tonic-gate 		else
13970Sstevel@tonic-gate 			pp->p_ct_equeue = qa;
13980Sstevel@tonic-gate 		mutex_exit(&pp->p_lock);
13990Sstevel@tonic-gate 	}
14000Sstevel@tonic-gate 
14010Sstevel@tonic-gate 	/*
14020Sstevel@tonic-gate 	 * If there isn't a bundle queue of the required type, allocate
14030Sstevel@tonic-gate 	 * one.
14040Sstevel@tonic-gate 	 */
14050Sstevel@tonic-gate 	if (pp->p_ct_equeue[type->ct_type_index] == NULL) {
14060Sstevel@tonic-gate 		ct_equeue_t *q = kmem_zalloc(sizeof (ct_equeue_t), KM_SLEEP);
14070Sstevel@tonic-gate 		cte_queue_create(q, CTEL_PBUNDLE, 20, 1);
14080Sstevel@tonic-gate 
14090Sstevel@tonic-gate 		mutex_enter(&pp->p_lock);
14100Sstevel@tonic-gate 		if (pp->p_ct_equeue[type->ct_type_index])
14110Sstevel@tonic-gate 			cte_queue_drain(q, 0);
14120Sstevel@tonic-gate 		else
14130Sstevel@tonic-gate 			pp->p_ct_equeue[type->ct_type_index] = q;
14140Sstevel@tonic-gate 		mutex_exit(&pp->p_lock);
14150Sstevel@tonic-gate 	}
14160Sstevel@tonic-gate 
14170Sstevel@tonic-gate 	return (pp->p_ct_equeue[type->ct_type_index]);
14180Sstevel@tonic-gate }
14190Sstevel@tonic-gate 
14200Sstevel@tonic-gate /*
14210Sstevel@tonic-gate  * ctmpl_free
14220Sstevel@tonic-gate  *
14230Sstevel@tonic-gate  * Frees a template.
14240Sstevel@tonic-gate  */
14250Sstevel@tonic-gate void
14260Sstevel@tonic-gate ctmpl_free(ct_template_t *template)
14270Sstevel@tonic-gate {
14280Sstevel@tonic-gate 	mutex_destroy(&template->ctmpl_lock);
14290Sstevel@tonic-gate 	template->ctmpl_ops->ctop_free(template);
14300Sstevel@tonic-gate }
14310Sstevel@tonic-gate 
14320Sstevel@tonic-gate /*
14330Sstevel@tonic-gate  * ctmpl_dup
14340Sstevel@tonic-gate  *
14350Sstevel@tonic-gate  * Creates a copy of a template.
14360Sstevel@tonic-gate  */
14370Sstevel@tonic-gate ct_template_t *
14380Sstevel@tonic-gate ctmpl_dup(ct_template_t *template)
14390Sstevel@tonic-gate {
14400Sstevel@tonic-gate 	ct_template_t *new;
14410Sstevel@tonic-gate 
14420Sstevel@tonic-gate 	if (template == NULL)
14430Sstevel@tonic-gate 		return (NULL);
14440Sstevel@tonic-gate 
14450Sstevel@tonic-gate 	new = template->ctmpl_ops->ctop_dup(template);
14460Sstevel@tonic-gate 	/*
14470Sstevel@tonic-gate 	 * ctmpl_lock was taken by ctop_dup's call to ctmpl_copy and
14480Sstevel@tonic-gate 	 * should have remain held until now.
14490Sstevel@tonic-gate 	 */
14500Sstevel@tonic-gate 	mutex_exit(&template->ctmpl_lock);
14510Sstevel@tonic-gate 
14520Sstevel@tonic-gate 	return (new);
14530Sstevel@tonic-gate }
14540Sstevel@tonic-gate 
14550Sstevel@tonic-gate /*
14560Sstevel@tonic-gate  * ctmpl_set
14570Sstevel@tonic-gate  *
14580Sstevel@tonic-gate  * Sets the requested terms of a template.
14590Sstevel@tonic-gate  */
14600Sstevel@tonic-gate int
14610Sstevel@tonic-gate ctmpl_set(ct_template_t *template, ct_param_t *param, const cred_t *cr)
14620Sstevel@tonic-gate {
14630Sstevel@tonic-gate 	int result = 0;
1464*6196Sacruz 	uint64_t param_value;
1465*6196Sacruz 
1466*6196Sacruz 	if (param->ctpm_id == CTP_COOKIE ||
1467*6196Sacruz 	    param->ctpm_id == CTP_EV_INFO ||
1468*6196Sacruz 	    param->ctpm_id == CTP_EV_CRITICAL) {
1469*6196Sacruz 		if (param->ctpm_size < sizeof (uint64_t)) {
1470*6196Sacruz 			return (EINVAL);
1471*6196Sacruz 		} else {
1472*6196Sacruz 			param_value = *(uint64_t *)param->ctpm_value;
1473*6196Sacruz 		}
1474*6196Sacruz 	}
14750Sstevel@tonic-gate 
14760Sstevel@tonic-gate 	mutex_enter(&template->ctmpl_lock);
14770Sstevel@tonic-gate 	switch (param->ctpm_id) {
14780Sstevel@tonic-gate 	case CTP_COOKIE:
14796073Sacruz 		template->ctmpl_cookie = param_value;
14800Sstevel@tonic-gate 		break;
14810Sstevel@tonic-gate 	case CTP_EV_INFO:
14826073Sacruz 		if (param_value & ~(uint64_t)template->ctmpl_ops->allevents)
14830Sstevel@tonic-gate 			result = EINVAL;
14840Sstevel@tonic-gate 		else
14856073Sacruz 			template->ctmpl_ev_info = param_value;
14860Sstevel@tonic-gate 		break;
14870Sstevel@tonic-gate 	case CTP_EV_CRITICAL:
14886073Sacruz 		if (param_value & ~(uint64_t)template->ctmpl_ops->allevents) {
14890Sstevel@tonic-gate 			result = EINVAL;
14900Sstevel@tonic-gate 			break;
14916073Sacruz 		} else if ((~template->ctmpl_ev_crit & param_value) == 0) {
14920Sstevel@tonic-gate 			/*
14930Sstevel@tonic-gate 			 * Assume that a pure reduction of the critical
14940Sstevel@tonic-gate 			 * set is allowed by the contract type.
14950Sstevel@tonic-gate 			 */
14966073Sacruz 			template->ctmpl_ev_crit = param_value;
14970Sstevel@tonic-gate 			break;
14980Sstevel@tonic-gate 		}
14990Sstevel@tonic-gate 		/*
15000Sstevel@tonic-gate 		 * There may be restrictions on what we can make
15010Sstevel@tonic-gate 		 * critical, so we defer to the judgement of the
15020Sstevel@tonic-gate 		 * contract type.
15030Sstevel@tonic-gate 		 */
15040Sstevel@tonic-gate 		/* FALLTHROUGH */
15050Sstevel@tonic-gate 	default:
15060Sstevel@tonic-gate 		result = template->ctmpl_ops->ctop_set(template, param, cr);
15070Sstevel@tonic-gate 	}
15080Sstevel@tonic-gate 	mutex_exit(&template->ctmpl_lock);
15090Sstevel@tonic-gate 
15100Sstevel@tonic-gate 	return (result);
15110Sstevel@tonic-gate }
15120Sstevel@tonic-gate 
15130Sstevel@tonic-gate /*
15140Sstevel@tonic-gate  * ctmpl_get
15150Sstevel@tonic-gate  *
15160Sstevel@tonic-gate  * Obtains the requested terms from a template.
1517*6196Sacruz  *
1518*6196Sacruz  * If the term requested is a variable-sized term and the buffer
1519*6196Sacruz  * provided is too small for the data, we truncate the data and return
1520*6196Sacruz  * the buffer size necessary to fit the term in param->ctpm_size. If the
1521*6196Sacruz  * term requested is fix-sized (uint64_t) and the buffer provided is too
1522*6196Sacruz  * small, we return EINVAL.  This should never happen if you're using
1523*6196Sacruz  * libcontract(3LIB), only if you call ioctl with a hand constructed
1524*6196Sacruz  * ct_param_t argument.
1525*6196Sacruz  *
1526*6196Sacruz  * Currently, only contract specific parameters have variable-sized
1527*6196Sacruz  * parameters.
15280Sstevel@tonic-gate  */
15290Sstevel@tonic-gate int
15300Sstevel@tonic-gate ctmpl_get(ct_template_t *template, ct_param_t *param)
15310Sstevel@tonic-gate {
15320Sstevel@tonic-gate 	int result = 0;
1533*6196Sacruz 	uint64_t *param_value;
1534*6196Sacruz 
1535*6196Sacruz 	if (param->ctpm_id == CTP_COOKIE ||
1536*6196Sacruz 	    param->ctpm_id == CTP_EV_INFO ||
1537*6196Sacruz 	    param->ctpm_id == CTP_EV_CRITICAL) {
1538*6196Sacruz 		if (param->ctpm_size < sizeof (uint64_t)) {
1539*6196Sacruz 			return (EINVAL);
1540*6196Sacruz 		} else {
1541*6196Sacruz 			param_value = param->ctpm_value;
1542*6196Sacruz 			param->ctpm_size = sizeof (uint64_t);
1543*6196Sacruz 		}
1544*6196Sacruz 	}
15450Sstevel@tonic-gate 
15460Sstevel@tonic-gate 	mutex_enter(&template->ctmpl_lock);
15470Sstevel@tonic-gate 	switch (param->ctpm_id) {
15480Sstevel@tonic-gate 	case CTP_COOKIE:
15496073Sacruz 		*param_value = template->ctmpl_cookie;
15500Sstevel@tonic-gate 		break;
15510Sstevel@tonic-gate 	case CTP_EV_INFO:
15526073Sacruz 		*param_value = template->ctmpl_ev_info;
15530Sstevel@tonic-gate 		break;
15540Sstevel@tonic-gate 	case CTP_EV_CRITICAL:
15556073Sacruz 		*param_value = template->ctmpl_ev_crit;
15560Sstevel@tonic-gate 		break;
15570Sstevel@tonic-gate 	default:
15580Sstevel@tonic-gate 		result = template->ctmpl_ops->ctop_get(template, param);
15590Sstevel@tonic-gate 	}
15600Sstevel@tonic-gate 	mutex_exit(&template->ctmpl_lock);
15610Sstevel@tonic-gate 
15620Sstevel@tonic-gate 	return (result);
15630Sstevel@tonic-gate }
15640Sstevel@tonic-gate 
15650Sstevel@tonic-gate /*
15660Sstevel@tonic-gate  * ctmpl_makecurrent
15670Sstevel@tonic-gate  *
15680Sstevel@tonic-gate  * Used by ctmpl_activate and ctmpl_clear to set the current thread's
15690Sstevel@tonic-gate  * active template.  Frees the old active template, if there was one.
15700Sstevel@tonic-gate  */
15710Sstevel@tonic-gate static void
15720Sstevel@tonic-gate ctmpl_makecurrent(ct_template_t *template, ct_template_t *new)
15730Sstevel@tonic-gate {
15740Sstevel@tonic-gate 	klwp_t *curlwp = ttolwp(curthread);
15750Sstevel@tonic-gate 	proc_t *p = curproc;
15760Sstevel@tonic-gate 	ct_template_t *old;
15770Sstevel@tonic-gate 
15780Sstevel@tonic-gate 	mutex_enter(&p->p_lock);
15790Sstevel@tonic-gate 	old = curlwp->lwp_ct_active[template->ctmpl_type->ct_type_index];
15800Sstevel@tonic-gate 	curlwp->lwp_ct_active[template->ctmpl_type->ct_type_index] = new;
15810Sstevel@tonic-gate 	mutex_exit(&p->p_lock);
15820Sstevel@tonic-gate 
15830Sstevel@tonic-gate 	if (old)
15840Sstevel@tonic-gate 		ctmpl_free(old);
15850Sstevel@tonic-gate }
15860Sstevel@tonic-gate 
15870Sstevel@tonic-gate /*
15880Sstevel@tonic-gate  * ctmpl_activate
15890Sstevel@tonic-gate  *
15900Sstevel@tonic-gate  * Copy the specified template as the current thread's activate
15910Sstevel@tonic-gate  * template of that type.
15920Sstevel@tonic-gate  */
15930Sstevel@tonic-gate void
15940Sstevel@tonic-gate ctmpl_activate(ct_template_t *template)
15950Sstevel@tonic-gate {
15960Sstevel@tonic-gate 	ctmpl_makecurrent(template, ctmpl_dup(template));
15970Sstevel@tonic-gate }
15980Sstevel@tonic-gate 
15990Sstevel@tonic-gate /*
16000Sstevel@tonic-gate  * ctmpl_clear
16010Sstevel@tonic-gate  *
16020Sstevel@tonic-gate  * Clears the current thread's activate template of the same type as
16030Sstevel@tonic-gate  * the specified template.
16040Sstevel@tonic-gate  */
16050Sstevel@tonic-gate void
16060Sstevel@tonic-gate ctmpl_clear(ct_template_t *template)
16070Sstevel@tonic-gate {
16080Sstevel@tonic-gate 	ctmpl_makecurrent(template, NULL);
16090Sstevel@tonic-gate }
16100Sstevel@tonic-gate 
16110Sstevel@tonic-gate /*
16120Sstevel@tonic-gate  * ctmpl_create
16130Sstevel@tonic-gate  *
16140Sstevel@tonic-gate  * Creates a new contract using the specified template.
16150Sstevel@tonic-gate  */
16160Sstevel@tonic-gate int
16174845Svikram ctmpl_create(ct_template_t *template, ctid_t *ctidp)
16180Sstevel@tonic-gate {
16194845Svikram 	return (template->ctmpl_ops->ctop_create(template, ctidp));
16200Sstevel@tonic-gate }
16210Sstevel@tonic-gate 
16220Sstevel@tonic-gate /*
16230Sstevel@tonic-gate  * ctmpl_init
16240Sstevel@tonic-gate  *
16250Sstevel@tonic-gate  * Initializes the common portion of a new contract template.
16260Sstevel@tonic-gate  */
16270Sstevel@tonic-gate void
16280Sstevel@tonic-gate ctmpl_init(ct_template_t *new, ctmplops_t *ops, ct_type_t *type, void *data)
16290Sstevel@tonic-gate {
16300Sstevel@tonic-gate 	mutex_init(&new->ctmpl_lock, NULL, MUTEX_DEFAULT, NULL);
16310Sstevel@tonic-gate 	new->ctmpl_ops = ops;
16320Sstevel@tonic-gate 	new->ctmpl_type = type;
16330Sstevel@tonic-gate 	new->ctmpl_data = data;
16340Sstevel@tonic-gate 	new->ctmpl_ev_info = new->ctmpl_ev_crit = 0;
16350Sstevel@tonic-gate 	new->ctmpl_cookie = 0;
16360Sstevel@tonic-gate }
16370Sstevel@tonic-gate 
16380Sstevel@tonic-gate /*
16390Sstevel@tonic-gate  * ctmpl_copy
16400Sstevel@tonic-gate  *
16410Sstevel@tonic-gate  * Copies the common portions of a contract template.  Intended for use
16420Sstevel@tonic-gate  * by a contract type's ctop_dup template op.  Returns with the old
16430Sstevel@tonic-gate  * template's lock held, which will should remain held until the
16440Sstevel@tonic-gate  * template op returns (it is dropped by ctmpl_dup).
16450Sstevel@tonic-gate  */
16460Sstevel@tonic-gate void
16470Sstevel@tonic-gate ctmpl_copy(ct_template_t *new, ct_template_t *old)
16480Sstevel@tonic-gate {
16490Sstevel@tonic-gate 	mutex_init(&new->ctmpl_lock, NULL, MUTEX_DEFAULT, NULL);
16500Sstevel@tonic-gate 	mutex_enter(&old->ctmpl_lock);
16510Sstevel@tonic-gate 	new->ctmpl_ops = old->ctmpl_ops;
16520Sstevel@tonic-gate 	new->ctmpl_type = old->ctmpl_type;
16530Sstevel@tonic-gate 	new->ctmpl_ev_crit = old->ctmpl_ev_crit;
16540Sstevel@tonic-gate 	new->ctmpl_ev_info = old->ctmpl_ev_info;
16550Sstevel@tonic-gate 	new->ctmpl_cookie = old->ctmpl_cookie;
16560Sstevel@tonic-gate }
16570Sstevel@tonic-gate 
16580Sstevel@tonic-gate /*
16590Sstevel@tonic-gate  * ctmpl_create_inval
16600Sstevel@tonic-gate  *
16610Sstevel@tonic-gate  * Returns EINVAL.  Provided for the convenience of those contract
16620Sstevel@tonic-gate  * types which don't support ct_tmpl_create(3contract) and would
16630Sstevel@tonic-gate  * otherwise need to create their own stub for the ctop_create template
16640Sstevel@tonic-gate  * op.
16650Sstevel@tonic-gate  */
16660Sstevel@tonic-gate /*ARGSUSED*/
16670Sstevel@tonic-gate int
16684845Svikram ctmpl_create_inval(ct_template_t *template, ctid_t *ctidp)
16690Sstevel@tonic-gate {
16700Sstevel@tonic-gate 	return (EINVAL);
16710Sstevel@tonic-gate }
16720Sstevel@tonic-gate 
16730Sstevel@tonic-gate 
16740Sstevel@tonic-gate /*
16750Sstevel@tonic-gate  * cte_queue_create
16760Sstevel@tonic-gate  *
16770Sstevel@tonic-gate  * Initializes a queue of a particular type.  If dynamic is set, the
16780Sstevel@tonic-gate  * queue is to be freed when its last listener is removed after being
16790Sstevel@tonic-gate  * drained.
16800Sstevel@tonic-gate  */
16810Sstevel@tonic-gate static void
16820Sstevel@tonic-gate cte_queue_create(ct_equeue_t *q, ct_listnum_t list, int maxinf, int dynamic)
16830Sstevel@tonic-gate {
16840Sstevel@tonic-gate 	mutex_init(&q->ctq_lock, NULL, MUTEX_DEFAULT, NULL);
16850Sstevel@tonic-gate 	q->ctq_listno = list;
16860Sstevel@tonic-gate 	list_create(&q->ctq_events, sizeof (ct_kevent_t),
16870Sstevel@tonic-gate 	    offsetof(ct_kevent_t, cte_nodes[list].ctm_node));
16880Sstevel@tonic-gate 	list_create(&q->ctq_listeners, sizeof (ct_listener_t),
16890Sstevel@tonic-gate 	    offsetof(ct_listener_t, ctl_allnode));
16900Sstevel@tonic-gate 	list_create(&q->ctq_tail, sizeof (ct_listener_t),
16910Sstevel@tonic-gate 	    offsetof(ct_listener_t, ctl_tailnode));
16920Sstevel@tonic-gate 	gethrestime(&q->ctq_atime);
16930Sstevel@tonic-gate 	q->ctq_nlisteners = 0;
16940Sstevel@tonic-gate 	q->ctq_nreliable = 0;
16950Sstevel@tonic-gate 	q->ctq_ninf = 0;
16960Sstevel@tonic-gate 	q->ctq_max = maxinf;
16970Sstevel@tonic-gate 
16980Sstevel@tonic-gate 	/*
16990Sstevel@tonic-gate 	 * Bundle queues and contract queues are embedded in other
17000Sstevel@tonic-gate 	 * structures and are implicitly referenced counted by virtue
17010Sstevel@tonic-gate 	 * of their vnodes' indirect hold on their contracts.  Process
17020Sstevel@tonic-gate 	 * bundle queues are dynamically allocated and may persist
17030Sstevel@tonic-gate 	 * after the death of the process, so they must be explicitly
17040Sstevel@tonic-gate 	 * reference counted.
17050Sstevel@tonic-gate 	 */
17060Sstevel@tonic-gate 	q->ctq_flags = dynamic ? CTQ_REFFED : 0;
17070Sstevel@tonic-gate }
17080Sstevel@tonic-gate 
17090Sstevel@tonic-gate /*
17100Sstevel@tonic-gate  * cte_queue_destroy
17110Sstevel@tonic-gate  *
17120Sstevel@tonic-gate  * Destroys the specified queue.  The queue is freed if referenced
17130Sstevel@tonic-gate  * counted.
17140Sstevel@tonic-gate  */
17150Sstevel@tonic-gate static void
17160Sstevel@tonic-gate cte_queue_destroy(ct_equeue_t *q)
17170Sstevel@tonic-gate {
17180Sstevel@tonic-gate 	ASSERT(q->ctq_flags & CTQ_DEAD);
17190Sstevel@tonic-gate 	ASSERT(q->ctq_nlisteners == 0);
17200Sstevel@tonic-gate 	ASSERT(q->ctq_nreliable == 0);
17210Sstevel@tonic-gate 	list_destroy(&q->ctq_events);
17220Sstevel@tonic-gate 	list_destroy(&q->ctq_listeners);
17230Sstevel@tonic-gate 	list_destroy(&q->ctq_tail);
17240Sstevel@tonic-gate 	mutex_destroy(&q->ctq_lock);
17250Sstevel@tonic-gate 	if (q->ctq_flags & CTQ_REFFED)
17260Sstevel@tonic-gate 		kmem_free(q, sizeof (ct_equeue_t));
17270Sstevel@tonic-gate }
17280Sstevel@tonic-gate 
17290Sstevel@tonic-gate /*
17300Sstevel@tonic-gate  * cte_hold
17310Sstevel@tonic-gate  *
17320Sstevel@tonic-gate  * Takes a hold on the specified event.
17330Sstevel@tonic-gate  */
17340Sstevel@tonic-gate static void
17350Sstevel@tonic-gate cte_hold(ct_kevent_t *e)
17360Sstevel@tonic-gate {
17370Sstevel@tonic-gate 	mutex_enter(&e->cte_lock);
17380Sstevel@tonic-gate 	ASSERT(e->cte_refs > 0);
17390Sstevel@tonic-gate 	e->cte_refs++;
17400Sstevel@tonic-gate 	mutex_exit(&e->cte_lock);
17410Sstevel@tonic-gate }
17420Sstevel@tonic-gate 
17430Sstevel@tonic-gate /*
17440Sstevel@tonic-gate  * cte_rele
17450Sstevel@tonic-gate  *
17460Sstevel@tonic-gate  * Releases a hold on the specified event.  If the caller had the last
17470Sstevel@tonic-gate  * reference, frees the event and releases its hold on the contract
17480Sstevel@tonic-gate  * that generated it.
17490Sstevel@tonic-gate  */
17500Sstevel@tonic-gate static void
17510Sstevel@tonic-gate cte_rele(ct_kevent_t *e)
17520Sstevel@tonic-gate {
17530Sstevel@tonic-gate 	mutex_enter(&e->cte_lock);
17540Sstevel@tonic-gate 	ASSERT(e->cte_refs > 0);
17550Sstevel@tonic-gate 	if (--e->cte_refs) {
17560Sstevel@tonic-gate 		mutex_exit(&e->cte_lock);
17570Sstevel@tonic-gate 		return;
17580Sstevel@tonic-gate 	}
17590Sstevel@tonic-gate 
17600Sstevel@tonic-gate 	contract_rele(e->cte_contract);
17610Sstevel@tonic-gate 
17620Sstevel@tonic-gate 	mutex_destroy(&e->cte_lock);
17630Sstevel@tonic-gate 	if (e->cte_data)
17640Sstevel@tonic-gate 		nvlist_free(e->cte_data);
17650Sstevel@tonic-gate 	if (e->cte_gdata)
17660Sstevel@tonic-gate 		nvlist_free(e->cte_gdata);
17670Sstevel@tonic-gate 	kmem_free(e, sizeof (ct_kevent_t));
17680Sstevel@tonic-gate }
17690Sstevel@tonic-gate 
17700Sstevel@tonic-gate /*
17710Sstevel@tonic-gate  * cte_qrele
17720Sstevel@tonic-gate  *
17730Sstevel@tonic-gate  * Remove this listener's hold on the specified event, removing and
17740Sstevel@tonic-gate  * releasing the queue's hold on the event if appropriate.
17750Sstevel@tonic-gate  */
17760Sstevel@tonic-gate static void
17770Sstevel@tonic-gate cte_qrele(ct_equeue_t *q, ct_listener_t *l, ct_kevent_t *e)
17780Sstevel@tonic-gate {
17790Sstevel@tonic-gate 	ct_member_t *member = &e->cte_nodes[q->ctq_listno];
17800Sstevel@tonic-gate 
17810Sstevel@tonic-gate 	ASSERT(MUTEX_HELD(&q->ctq_lock));
17820Sstevel@tonic-gate 
17830Sstevel@tonic-gate 	if (l->ctl_flags & CTLF_RELIABLE)
17840Sstevel@tonic-gate 		member->ctm_nreliable--;
17850Sstevel@tonic-gate 	if ((--member->ctm_refs == 0) && member->ctm_trimmed) {
17860Sstevel@tonic-gate 		member->ctm_trimmed = 0;
17870Sstevel@tonic-gate 		list_remove(&q->ctq_events, e);
17880Sstevel@tonic-gate 		cte_rele(e);
17890Sstevel@tonic-gate 	}
17900Sstevel@tonic-gate }
17910Sstevel@tonic-gate 
17920Sstevel@tonic-gate /*
17930Sstevel@tonic-gate  * cte_qmove
17940Sstevel@tonic-gate  *
17950Sstevel@tonic-gate  * Move this listener to the specified event in the queue.
17960Sstevel@tonic-gate  */
17970Sstevel@tonic-gate static ct_kevent_t *
17980Sstevel@tonic-gate cte_qmove(ct_equeue_t *q, ct_listener_t *l, ct_kevent_t *e)
17990Sstevel@tonic-gate {
18000Sstevel@tonic-gate 	ct_kevent_t *olde;
18010Sstevel@tonic-gate 
18020Sstevel@tonic-gate 	ASSERT(MUTEX_HELD(&q->ctq_lock));
18030Sstevel@tonic-gate 	ASSERT(l->ctl_equeue == q);
18040Sstevel@tonic-gate 
18050Sstevel@tonic-gate 	if ((olde = l->ctl_position) == NULL)
18060Sstevel@tonic-gate 		list_remove(&q->ctq_tail, l);
18070Sstevel@tonic-gate 
18080Sstevel@tonic-gate 	while (e != NULL && e->cte_nodes[q->ctq_listno].ctm_trimmed)
18090Sstevel@tonic-gate 		e = list_next(&q->ctq_events, e);
18100Sstevel@tonic-gate 
18110Sstevel@tonic-gate 	if (e != NULL) {
18120Sstevel@tonic-gate 		e->cte_nodes[q->ctq_listno].ctm_refs++;
18130Sstevel@tonic-gate 		if (l->ctl_flags & CTLF_RELIABLE)
18140Sstevel@tonic-gate 			e->cte_nodes[q->ctq_listno].ctm_nreliable++;
18150Sstevel@tonic-gate 	} else {
18160Sstevel@tonic-gate 		list_insert_tail(&q->ctq_tail, l);
18170Sstevel@tonic-gate 	}
18180Sstevel@tonic-gate 
18190Sstevel@tonic-gate 	l->ctl_position = e;
18200Sstevel@tonic-gate 	if (olde)
18210Sstevel@tonic-gate 		cte_qrele(q, l, olde);
18220Sstevel@tonic-gate 
18230Sstevel@tonic-gate 	return (e);
18240Sstevel@tonic-gate }
18250Sstevel@tonic-gate 
18260Sstevel@tonic-gate /*
18270Sstevel@tonic-gate  * cte_checkcred
18280Sstevel@tonic-gate  *
18290Sstevel@tonic-gate  * Determines if the specified event's contract is owned by a process
18300Sstevel@tonic-gate  * with the same effective uid as the specified credential.  Called
18310Sstevel@tonic-gate  * after a failed call to contract_owned with locked set.  Because it
18320Sstevel@tonic-gate  * drops the queue lock, its caller (cte_qreadable) needs to make sure
18330Sstevel@tonic-gate  * we're still in the same place after we return.  Returns 1 on
18340Sstevel@tonic-gate  * success.
18350Sstevel@tonic-gate  */
18360Sstevel@tonic-gate static int
18370Sstevel@tonic-gate cte_checkcred(ct_equeue_t *q, ct_kevent_t *e, const cred_t *cr)
18380Sstevel@tonic-gate {
18390Sstevel@tonic-gate 	int result;
18400Sstevel@tonic-gate 	contract_t *ct = e->cte_contract;
18410Sstevel@tonic-gate 
18420Sstevel@tonic-gate 	cte_hold(e);
18430Sstevel@tonic-gate 	mutex_exit(&q->ctq_lock);
18440Sstevel@tonic-gate 	result = curproc->p_zone->zone_uniqid == ct->ct_czuniqid &&
18450Sstevel@tonic-gate 	    contract_checkcred(ct, cr);
18460Sstevel@tonic-gate 	mutex_enter(&q->ctq_lock);
18470Sstevel@tonic-gate 	cte_rele(e);
18480Sstevel@tonic-gate 
18490Sstevel@tonic-gate 	return (result);
18500Sstevel@tonic-gate }
18510Sstevel@tonic-gate 
18520Sstevel@tonic-gate /*
18530Sstevel@tonic-gate  * cte_qreadable
18540Sstevel@tonic-gate  *
18550Sstevel@tonic-gate  * Ensures that the listener is pointing to a valid event that the
18560Sstevel@tonic-gate  * caller has the credentials to read.  Returns 0 if we can read the
18570Sstevel@tonic-gate  * event we're pointing to.
18580Sstevel@tonic-gate  */
18590Sstevel@tonic-gate static int
18600Sstevel@tonic-gate cte_qreadable(ct_equeue_t *q, ct_listener_t *l, const cred_t *cr,
18610Sstevel@tonic-gate     uint64_t zuniqid, int crit)
18620Sstevel@tonic-gate {
18630Sstevel@tonic-gate 	ct_kevent_t *e, *next;
18640Sstevel@tonic-gate 	contract_t *ct;
18650Sstevel@tonic-gate 
18660Sstevel@tonic-gate 	ASSERT(MUTEX_HELD(&q->ctq_lock));
18670Sstevel@tonic-gate 	ASSERT(l->ctl_equeue == q);
18680Sstevel@tonic-gate 
18690Sstevel@tonic-gate 	if (l->ctl_flags & CTLF_COPYOUT)
18700Sstevel@tonic-gate 		return (1);
18710Sstevel@tonic-gate 
18720Sstevel@tonic-gate 	next = l->ctl_position;
18730Sstevel@tonic-gate 	while (e = cte_qmove(q, l, next)) {
18740Sstevel@tonic-gate 		ct = e->cte_contract;
18750Sstevel@tonic-gate 		/*
18760Sstevel@tonic-gate 		 * Check obvious things first.  If we are looking for a
18770Sstevel@tonic-gate 		 * critical message, is this one?  If we aren't in the
18780Sstevel@tonic-gate 		 * global zone, is this message meant for us?
18790Sstevel@tonic-gate 		 */
18800Sstevel@tonic-gate 		if ((crit && (e->cte_flags & (CTE_INFO | CTE_ACK))) ||
18810Sstevel@tonic-gate 		    (cr != NULL && zuniqid != GLOBAL_ZONEUNIQID &&
18820Sstevel@tonic-gate 		    zuniqid != contract_getzuniqid(ct))) {
18830Sstevel@tonic-gate 
18840Sstevel@tonic-gate 			next = list_next(&q->ctq_events, e);
18850Sstevel@tonic-gate 
18860Sstevel@tonic-gate 		/*
18870Sstevel@tonic-gate 		 * Next, see if our effective uid equals that of owner
18880Sstevel@tonic-gate 		 * or author of the contract.  Since we are holding the
18890Sstevel@tonic-gate 		 * queue lock, contract_owned can't always check if we
18900Sstevel@tonic-gate 		 * have the same effective uid as the contract's
18910Sstevel@tonic-gate 		 * owner.  If it comes to that, it fails and we take
18920Sstevel@tonic-gate 		 * the slow(er) path.
18930Sstevel@tonic-gate 		 */
18940Sstevel@tonic-gate 		} else if (cr != NULL && !contract_owned(ct, cr, B_TRUE)) {
18950Sstevel@tonic-gate 
18960Sstevel@tonic-gate 			/*
18970Sstevel@tonic-gate 			 * At this point we either don't have any claim
18980Sstevel@tonic-gate 			 * to this contract or we match the effective
18990Sstevel@tonic-gate 			 * uid of the owner but couldn't tell.  We
19000Sstevel@tonic-gate 			 * first test for a NULL holder so that events
19010Sstevel@tonic-gate 			 * from orphans and inherited contracts avoid
19020Sstevel@tonic-gate 			 * the penalty phase.
19030Sstevel@tonic-gate 			 */
19040Sstevel@tonic-gate 			if (e->cte_contract->ct_owner == NULL &&
19050Sstevel@tonic-gate 			    !secpolicy_contract_observer_choice(cr))
19060Sstevel@tonic-gate 				next = list_next(&q->ctq_events, e);
19070Sstevel@tonic-gate 
19080Sstevel@tonic-gate 			/*
19090Sstevel@tonic-gate 			 * cte_checkcred will juggle locks to see if we
19100Sstevel@tonic-gate 			 * have the same uid as the event's contract's
19110Sstevel@tonic-gate 			 * current owner.  If it succeeds, we have to
19120Sstevel@tonic-gate 			 * make sure we are in the same point in the
19130Sstevel@tonic-gate 			 * queue.
19140Sstevel@tonic-gate 			 */
19150Sstevel@tonic-gate 			else if (cte_checkcred(q, e, cr) &&
19160Sstevel@tonic-gate 			    l->ctl_position == e)
19170Sstevel@tonic-gate 				break;
19180Sstevel@tonic-gate 
19190Sstevel@tonic-gate 			/*
19200Sstevel@tonic-gate 			 * cte_checkcred failed; see if we're in the
19210Sstevel@tonic-gate 			 * same place.
19220Sstevel@tonic-gate 			 */
19230Sstevel@tonic-gate 			else if (l->ctl_position == e)
19240Sstevel@tonic-gate 				if (secpolicy_contract_observer_choice(cr))
19250Sstevel@tonic-gate 					break;
19260Sstevel@tonic-gate 				else
19270Sstevel@tonic-gate 					next = list_next(&q->ctq_events, e);
19280Sstevel@tonic-gate 
19290Sstevel@tonic-gate 			/*
19300Sstevel@tonic-gate 			 * cte_checkcred failed, and our position was
19310Sstevel@tonic-gate 			 * changed.  Start from there.
19320Sstevel@tonic-gate 			 */
19330Sstevel@tonic-gate 			else
19340Sstevel@tonic-gate 				next = l->ctl_position;
19350Sstevel@tonic-gate 		} else {
19360Sstevel@tonic-gate 			break;
19370Sstevel@tonic-gate 		}
19380Sstevel@tonic-gate 	}
19390Sstevel@tonic-gate 
19400Sstevel@tonic-gate 	/*
19410Sstevel@tonic-gate 	 * We check for CTLF_COPYOUT again in case we dropped the queue
19420Sstevel@tonic-gate 	 * lock in cte_checkcred.
19430Sstevel@tonic-gate 	 */
19440Sstevel@tonic-gate 	return ((l->ctl_flags & CTLF_COPYOUT) || (l->ctl_position == NULL));
19450Sstevel@tonic-gate }
19460Sstevel@tonic-gate 
19470Sstevel@tonic-gate /*
19480Sstevel@tonic-gate  * cte_qwakeup
19490Sstevel@tonic-gate  *
19500Sstevel@tonic-gate  * Wakes up any waiting listeners and points them at the specified event.
19510Sstevel@tonic-gate  */
19520Sstevel@tonic-gate static void
19530Sstevel@tonic-gate cte_qwakeup(ct_equeue_t *q, ct_kevent_t *e)
19540Sstevel@tonic-gate {
19550Sstevel@tonic-gate 	ct_listener_t *l;
19560Sstevel@tonic-gate 
19570Sstevel@tonic-gate 	ASSERT(MUTEX_HELD(&q->ctq_lock));
19580Sstevel@tonic-gate 
19590Sstevel@tonic-gate 	while (l = list_head(&q->ctq_tail)) {
19600Sstevel@tonic-gate 		list_remove(&q->ctq_tail, l);
19610Sstevel@tonic-gate 		e->cte_nodes[q->ctq_listno].ctm_refs++;
19620Sstevel@tonic-gate 		if (l->ctl_flags & CTLF_RELIABLE)
19630Sstevel@tonic-gate 			e->cte_nodes[q->ctq_listno].ctm_nreliable++;
19640Sstevel@tonic-gate 		l->ctl_position = e;
19650Sstevel@tonic-gate 		cv_signal(&l->ctl_cv);
19660Sstevel@tonic-gate 		pollwakeup(&l->ctl_pollhead, POLLIN);
19670Sstevel@tonic-gate 	}
19680Sstevel@tonic-gate }
19690Sstevel@tonic-gate 
19700Sstevel@tonic-gate /*
19710Sstevel@tonic-gate  * cte_copy
19720Sstevel@tonic-gate  *
19730Sstevel@tonic-gate  * Copies events from the specified contract event queue to the
19740Sstevel@tonic-gate  * end of the specified process bundle queue.  Only called from
19750Sstevel@tonic-gate  * contract_adopt.
19760Sstevel@tonic-gate  *
19770Sstevel@tonic-gate  * We copy to the end of the target queue instead of mixing the events
19780Sstevel@tonic-gate  * in their proper order because otherwise the act of adopting a
19790Sstevel@tonic-gate  * contract would require a process to reset all process bundle
19800Sstevel@tonic-gate  * listeners it needed to see the new events.  This would, in turn,
19810Sstevel@tonic-gate  * require the process to keep track of which preexisting events had
19820Sstevel@tonic-gate  * already been processed.
19830Sstevel@tonic-gate  */
19840Sstevel@tonic-gate static void
19850Sstevel@tonic-gate cte_copy(ct_equeue_t *q, ct_equeue_t *newq)
19860Sstevel@tonic-gate {
19870Sstevel@tonic-gate 	ct_kevent_t *e, *first = NULL;
19880Sstevel@tonic-gate 
19890Sstevel@tonic-gate 	ASSERT(q->ctq_listno == CTEL_CONTRACT);
19900Sstevel@tonic-gate 	ASSERT(newq->ctq_listno == CTEL_PBUNDLE);
19910Sstevel@tonic-gate 
19920Sstevel@tonic-gate 	mutex_enter(&q->ctq_lock);
19930Sstevel@tonic-gate 	mutex_enter(&newq->ctq_lock);
19940Sstevel@tonic-gate 
19950Sstevel@tonic-gate 	/*
19960Sstevel@tonic-gate 	 * For now, only copy critical events.
19970Sstevel@tonic-gate 	 */
19980Sstevel@tonic-gate 	for (e = list_head(&q->ctq_events); e != NULL;
19990Sstevel@tonic-gate 	    e = list_next(&q->ctq_events, e)) {
20000Sstevel@tonic-gate 		if ((e->cte_flags & (CTE_INFO | CTE_ACK)) == 0) {
20010Sstevel@tonic-gate 			if (first == NULL)
20020Sstevel@tonic-gate 				first = e;
20030Sstevel@tonic-gate 			list_insert_tail(&newq->ctq_events, e);
20040Sstevel@tonic-gate 			cte_hold(e);
20050Sstevel@tonic-gate 		}
20060Sstevel@tonic-gate 	}
20070Sstevel@tonic-gate 
20080Sstevel@tonic-gate 	mutex_exit(&q->ctq_lock);
20090Sstevel@tonic-gate 
20100Sstevel@tonic-gate 	if (first)
20110Sstevel@tonic-gate 		cte_qwakeup(newq, first);
20120Sstevel@tonic-gate 
20130Sstevel@tonic-gate 	mutex_exit(&newq->ctq_lock);
20140Sstevel@tonic-gate }
20150Sstevel@tonic-gate 
20160Sstevel@tonic-gate /*
20170Sstevel@tonic-gate  * cte_trim
20180Sstevel@tonic-gate  *
20190Sstevel@tonic-gate  * Trims unneeded events from an event queue.  Algorithm works as
20200Sstevel@tonic-gate  * follows:
20210Sstevel@tonic-gate  *
20220Sstevel@tonic-gate  *   Removes all informative and acknowledged critical events until the
20230Sstevel@tonic-gate  *   first referenced event is found.
20240Sstevel@tonic-gate  *
20250Sstevel@tonic-gate  *   If a contract is specified, removes all events (regardless of
20260Sstevel@tonic-gate  *   acknowledgement) generated by that contract until the first event
20270Sstevel@tonic-gate  *   referenced by a reliable listener is found.  Reference events are
20280Sstevel@tonic-gate  *   removed by marking them "trimmed".  Such events will be removed
20290Sstevel@tonic-gate  *   when the last reference is dropped and will be skipped by future
20300Sstevel@tonic-gate  *   listeners.
20310Sstevel@tonic-gate  *
20320Sstevel@tonic-gate  * This is pretty basic.  Ideally this should remove from the middle of
20330Sstevel@tonic-gate  * the list (i.e. beyond the first referenced event), and even
20340Sstevel@tonic-gate  * referenced events.
20350Sstevel@tonic-gate  */
20360Sstevel@tonic-gate static void
20370Sstevel@tonic-gate cte_trim(ct_equeue_t *q, contract_t *ct)
20380Sstevel@tonic-gate {
20390Sstevel@tonic-gate 	ct_kevent_t *e, *next;
20400Sstevel@tonic-gate 	int flags, stopper;
20410Sstevel@tonic-gate 	int start = 1;
20420Sstevel@tonic-gate 
20430Sstevel@tonic-gate 	ASSERT(MUTEX_HELD(&q->ctq_lock));
20440Sstevel@tonic-gate 
20450Sstevel@tonic-gate 	for (e = list_head(&q->ctq_events); e != NULL; e = next) {
20460Sstevel@tonic-gate 		next = list_next(&q->ctq_events, e);
20470Sstevel@tonic-gate 		flags = e->cte_flags;
20480Sstevel@tonic-gate 		stopper = (q->ctq_listno != CTEL_PBUNDLE) &&
20490Sstevel@tonic-gate 		    (e->cte_nodes[q->ctq_listno].ctm_nreliable > 0);
20500Sstevel@tonic-gate 		if (e->cte_nodes[q->ctq_listno].ctm_refs == 0) {
20510Sstevel@tonic-gate 			if ((start && (flags & (CTE_INFO | CTE_ACK))) ||
20520Sstevel@tonic-gate 			    (e->cte_contract == ct)) {
20530Sstevel@tonic-gate 				/*
20540Sstevel@tonic-gate 				 * Toss informative and ACKed critical messages.
20550Sstevel@tonic-gate 				 */
20560Sstevel@tonic-gate 				list_remove(&q->ctq_events, e);
20570Sstevel@tonic-gate 				cte_rele(e);
20580Sstevel@tonic-gate 			}
20590Sstevel@tonic-gate 		} else if ((e->cte_contract == ct) && !stopper) {
20600Sstevel@tonic-gate 			ASSERT(q->ctq_nlisteners != 0);
20610Sstevel@tonic-gate 			e->cte_nodes[q->ctq_listno].ctm_trimmed = 1;
20620Sstevel@tonic-gate 		} else if (ct && !stopper) {
20630Sstevel@tonic-gate 			start = 0;
20640Sstevel@tonic-gate 		} else {
20650Sstevel@tonic-gate 			/*
20660Sstevel@tonic-gate 			 * Don't free messages past the first reader.
20670Sstevel@tonic-gate 			 */
20680Sstevel@tonic-gate 			break;
20690Sstevel@tonic-gate 		}
20700Sstevel@tonic-gate 	}
20710Sstevel@tonic-gate }
20720Sstevel@tonic-gate 
20730Sstevel@tonic-gate /*
20740Sstevel@tonic-gate  * cte_queue_drain
20750Sstevel@tonic-gate  *
20760Sstevel@tonic-gate  * Drain all events from the specified queue, and mark it dead.  If
20770Sstevel@tonic-gate  * "ack" is set, acknowledge any critical events we find along the
20780Sstevel@tonic-gate  * way.
20790Sstevel@tonic-gate  */
20800Sstevel@tonic-gate static void
20810Sstevel@tonic-gate cte_queue_drain(ct_equeue_t *q, int ack)
20820Sstevel@tonic-gate {
20830Sstevel@tonic-gate 	ct_kevent_t *e, *next;
20840Sstevel@tonic-gate 	ct_listener_t *l;
20850Sstevel@tonic-gate 
20860Sstevel@tonic-gate 	mutex_enter(&q->ctq_lock);
20870Sstevel@tonic-gate 
20880Sstevel@tonic-gate 	for (e = list_head(&q->ctq_events); e != NULL; e = next) {
20890Sstevel@tonic-gate 		next = list_next(&q->ctq_events, e);
20900Sstevel@tonic-gate 		if (ack && ((e->cte_flags & (CTE_INFO | CTE_ACK)) == 0)) {
20910Sstevel@tonic-gate 			/*
20920Sstevel@tonic-gate 			 * Make sure critical messages are eventually
20930Sstevel@tonic-gate 			 * removed from the bundle queues.
20940Sstevel@tonic-gate 			 */
20950Sstevel@tonic-gate 			mutex_enter(&e->cte_lock);
20960Sstevel@tonic-gate 			e->cte_flags |= CTE_ACK;
20970Sstevel@tonic-gate 			mutex_exit(&e->cte_lock);
20980Sstevel@tonic-gate 			ASSERT(MUTEX_HELD(&e->cte_contract->ct_lock));
20990Sstevel@tonic-gate 			e->cte_contract->ct_evcnt--;
21000Sstevel@tonic-gate 		}
21010Sstevel@tonic-gate 		list_remove(&q->ctq_events, e);
21020Sstevel@tonic-gate 		e->cte_nodes[q->ctq_listno].ctm_refs = 0;
21030Sstevel@tonic-gate 		e->cte_nodes[q->ctq_listno].ctm_nreliable = 0;
21040Sstevel@tonic-gate 		e->cte_nodes[q->ctq_listno].ctm_trimmed = 0;
21050Sstevel@tonic-gate 		cte_rele(e);
21060Sstevel@tonic-gate 	}
21070Sstevel@tonic-gate 
21080Sstevel@tonic-gate 	/*
21090Sstevel@tonic-gate 	 * This is necessary only because of CTEL_PBUNDLE listeners;
21100Sstevel@tonic-gate 	 * the events they point to can move from one pbundle to
21110Sstevel@tonic-gate 	 * another.  Fortunately, this only happens if the contract is
21120Sstevel@tonic-gate 	 * inherited, which (in turn) only happens if the process
21130Sstevel@tonic-gate 	 * exits, which means it's an all-or-nothing deal.  If this
21140Sstevel@tonic-gate 	 * wasn't the case, we would instead need to keep track of
21150Sstevel@tonic-gate 	 * listeners on a per-event basis, not just a per-queue basis.
21160Sstevel@tonic-gate 	 * This would have the side benefit of letting us clean up
21170Sstevel@tonic-gate 	 * trimmed events sooner (i.e. immediately), but would
21180Sstevel@tonic-gate 	 * unfortunately make events even bigger than they already
21190Sstevel@tonic-gate 	 * are.
21200Sstevel@tonic-gate 	 */
21210Sstevel@tonic-gate 	for (l = list_head(&q->ctq_listeners); l;
21220Sstevel@tonic-gate 	    l = list_next(&q->ctq_listeners, l)) {
21230Sstevel@tonic-gate 		l->ctl_flags |= CTLF_DEAD;
21240Sstevel@tonic-gate 		if (l->ctl_position) {
21250Sstevel@tonic-gate 			l->ctl_position = NULL;
21260Sstevel@tonic-gate 			list_insert_tail(&q->ctq_tail, l);
21270Sstevel@tonic-gate 		}
21280Sstevel@tonic-gate 		cv_broadcast(&l->ctl_cv);
21290Sstevel@tonic-gate 	}
21300Sstevel@tonic-gate 
21310Sstevel@tonic-gate 	/*
21320Sstevel@tonic-gate 	 * Disallow events.
21330Sstevel@tonic-gate 	 */
21340Sstevel@tonic-gate 	q->ctq_flags |= CTQ_DEAD;
21350Sstevel@tonic-gate 
21360Sstevel@tonic-gate 	/*
21370Sstevel@tonic-gate 	 * If we represent the last reference to a reference counted
21380Sstevel@tonic-gate 	 * process bundle queue, free it.
21390Sstevel@tonic-gate 	 */
21400Sstevel@tonic-gate 	if ((q->ctq_flags & CTQ_REFFED) && (q->ctq_nlisteners == 0))
21410Sstevel@tonic-gate 		cte_queue_destroy(q);
21420Sstevel@tonic-gate 	else
21430Sstevel@tonic-gate 		mutex_exit(&q->ctq_lock);
21440Sstevel@tonic-gate }
21450Sstevel@tonic-gate 
21460Sstevel@tonic-gate /*
21470Sstevel@tonic-gate  * cte_publish
21480Sstevel@tonic-gate  *
21490Sstevel@tonic-gate  * Publishes an event to a specific queue.  Only called by
21500Sstevel@tonic-gate  * cte_publish_all.
21510Sstevel@tonic-gate  */
21520Sstevel@tonic-gate static void
21530Sstevel@tonic-gate cte_publish(ct_equeue_t *q, ct_kevent_t *e, timespec_t *tsp)
21540Sstevel@tonic-gate {
21550Sstevel@tonic-gate 	ASSERT(MUTEX_HELD(&q->ctq_lock));
21560Sstevel@tonic-gate 
21570Sstevel@tonic-gate 	q->ctq_atime = *tsp;
21580Sstevel@tonic-gate 
21590Sstevel@tonic-gate 	/*
21600Sstevel@tonic-gate 	 * Don't publish if the event is informative and there aren't
21610Sstevel@tonic-gate 	 * any listeners, or if the queue has been shut down.
21620Sstevel@tonic-gate 	 */
21630Sstevel@tonic-gate 	if (((q->ctq_nlisteners == 0) && (e->cte_flags & (CTE_INFO|CTE_ACK))) ||
21640Sstevel@tonic-gate 	    (q->ctq_flags & CTQ_DEAD)) {
21650Sstevel@tonic-gate 		mutex_exit(&q->ctq_lock);
21660Sstevel@tonic-gate 		cte_rele(e);
21670Sstevel@tonic-gate 		return;
21680Sstevel@tonic-gate 	}
21690Sstevel@tonic-gate 
21700Sstevel@tonic-gate 	/*
21710Sstevel@tonic-gate 	 * Enqueue event
21720Sstevel@tonic-gate 	 */
21730Sstevel@tonic-gate 	list_insert_tail(&q->ctq_events, e);
21740Sstevel@tonic-gate 
21750Sstevel@tonic-gate 	/*
21760Sstevel@tonic-gate 	 * Check for waiting listeners
21770Sstevel@tonic-gate 	 */
21780Sstevel@tonic-gate 	cte_qwakeup(q, e);
21790Sstevel@tonic-gate 
21800Sstevel@tonic-gate 	/*
21810Sstevel@tonic-gate 	 * Trim unnecessary events from the queue.
21820Sstevel@tonic-gate 	 */
21830Sstevel@tonic-gate 	cte_trim(q, NULL);
21840Sstevel@tonic-gate 	mutex_exit(&q->ctq_lock);
21850Sstevel@tonic-gate }
21860Sstevel@tonic-gate 
21870Sstevel@tonic-gate /*
21880Sstevel@tonic-gate  * cte_publish_all
21890Sstevel@tonic-gate  *
21900Sstevel@tonic-gate  * Publish an event to all necessary event queues.  The event, e, must
21910Sstevel@tonic-gate  * be zallocated by the caller, and the event's flags and type must be
21920Sstevel@tonic-gate  * set.  The rest of the event's fields are initialized here.
21930Sstevel@tonic-gate  */
21944845Svikram uint64_t
21950Sstevel@tonic-gate cte_publish_all(contract_t *ct, ct_kevent_t *e, nvlist_t *data, nvlist_t *gdata)
21960Sstevel@tonic-gate {
21970Sstevel@tonic-gate 	ct_equeue_t *q;
21980Sstevel@tonic-gate 	timespec_t ts;
21994845Svikram 	uint64_t evid;
22004845Svikram 	ct_kevent_t *negev;
22014845Svikram 	int negend;
22020Sstevel@tonic-gate 
22030Sstevel@tonic-gate 	e->cte_contract = ct;
22040Sstevel@tonic-gate 	e->cte_data = data;
22050Sstevel@tonic-gate 	e->cte_gdata = gdata;
22060Sstevel@tonic-gate 	e->cte_refs = 3;
22074845Svikram 	evid = e->cte_id = atomic_add_64_nv(&ct->ct_type->ct_type_evid, 1);
22080Sstevel@tonic-gate 	contract_hold(ct);
22090Sstevel@tonic-gate 
22104845Svikram 	/*
22114845Svikram 	 * For a negotiation event we set the ct->ct_nevent field of the
22124845Svikram 	 * contract for the duration of the negotiation
22134845Svikram 	 */
22144845Svikram 	negend = 0;
22154845Svikram 	if (e->cte_flags & CTE_NEG) {
22164845Svikram 		cte_hold(e);
22174845Svikram 		ct->ct_nevent = e;
22184845Svikram 	} else if (e->cte_type == CT_EV_NEGEND) {
22194845Svikram 		negend = 1;
22204845Svikram 	}
22214845Svikram 
22220Sstevel@tonic-gate 	gethrestime(&ts);
22230Sstevel@tonic-gate 
22240Sstevel@tonic-gate 	/*
22250Sstevel@tonic-gate 	 * ct_evtlock simply (and only) ensures that two events sent
22260Sstevel@tonic-gate 	 * from the same contract are delivered to all queues in the
22270Sstevel@tonic-gate 	 * same order.
22280Sstevel@tonic-gate 	 */
22290Sstevel@tonic-gate 	mutex_enter(&ct->ct_evtlock);
22300Sstevel@tonic-gate 
22310Sstevel@tonic-gate 	/*
22320Sstevel@tonic-gate 	 * CTEL_CONTRACT - First deliver to the contract queue, acking
22330Sstevel@tonic-gate 	 * the event if the contract has been orphaned.
22340Sstevel@tonic-gate 	 */
22350Sstevel@tonic-gate 	mutex_enter(&ct->ct_lock);
22360Sstevel@tonic-gate 	mutex_enter(&ct->ct_events.ctq_lock);
22370Sstevel@tonic-gate 	if ((e->cte_flags & CTE_INFO) == 0) {
22380Sstevel@tonic-gate 		if (ct->ct_state >= CTS_ORPHAN)
22390Sstevel@tonic-gate 			e->cte_flags |= CTE_ACK;
22400Sstevel@tonic-gate 		else
22410Sstevel@tonic-gate 			ct->ct_evcnt++;
22420Sstevel@tonic-gate 	}
22430Sstevel@tonic-gate 	mutex_exit(&ct->ct_lock);
22440Sstevel@tonic-gate 	cte_publish(&ct->ct_events, e, &ts);
22450Sstevel@tonic-gate 
22460Sstevel@tonic-gate 	/*
22470Sstevel@tonic-gate 	 * CTEL_BUNDLE - Next deliver to the contract type's bundle
22480Sstevel@tonic-gate 	 * queue.
22490Sstevel@tonic-gate 	 */
22500Sstevel@tonic-gate 	mutex_enter(&ct->ct_type->ct_type_events.ctq_lock);
22510Sstevel@tonic-gate 	cte_publish(&ct->ct_type->ct_type_events, e, &ts);
22520Sstevel@tonic-gate 
22530Sstevel@tonic-gate 	/*
22540Sstevel@tonic-gate 	 * CTEL_PBUNDLE - Finally, if the contract has an owner,
22550Sstevel@tonic-gate 	 * deliver to the owner's process bundle queue.
22560Sstevel@tonic-gate 	 */
22570Sstevel@tonic-gate 	mutex_enter(&ct->ct_lock);
22580Sstevel@tonic-gate 	if (ct->ct_owner) {
22590Sstevel@tonic-gate 		/*
22600Sstevel@tonic-gate 		 * proc_exit doesn't free event queues until it has
22610Sstevel@tonic-gate 		 * abandoned all contracts.
22620Sstevel@tonic-gate 		 */
22630Sstevel@tonic-gate 		ASSERT(ct->ct_owner->p_ct_equeue);
22640Sstevel@tonic-gate 		ASSERT(ct->ct_owner->p_ct_equeue[ct->ct_type->ct_type_index]);
22650Sstevel@tonic-gate 		q = ct->ct_owner->p_ct_equeue[ct->ct_type->ct_type_index];
22660Sstevel@tonic-gate 		mutex_enter(&q->ctq_lock);
22670Sstevel@tonic-gate 		mutex_exit(&ct->ct_lock);
22680Sstevel@tonic-gate 		cte_publish(q, e, &ts);
22690Sstevel@tonic-gate 	} else {
22700Sstevel@tonic-gate 		mutex_exit(&ct->ct_lock);
22710Sstevel@tonic-gate 		cte_rele(e);
22720Sstevel@tonic-gate 	}
22730Sstevel@tonic-gate 
22744845Svikram 	if (negend) {
22754845Svikram 		mutex_enter(&ct->ct_lock);
22764845Svikram 		negev = ct->ct_nevent;
22774845Svikram 		ct->ct_nevent = NULL;
22784845Svikram 		cte_rele(negev);
22794845Svikram 		mutex_exit(&ct->ct_lock);
22804845Svikram 	}
22814845Svikram 
22820Sstevel@tonic-gate 	mutex_exit(&ct->ct_evtlock);
22834845Svikram 
22844845Svikram 	return (evid);
22850Sstevel@tonic-gate }
22860Sstevel@tonic-gate 
22870Sstevel@tonic-gate /*
22880Sstevel@tonic-gate  * cte_add_listener
22890Sstevel@tonic-gate  *
22900Sstevel@tonic-gate  * Add a new listener to an event queue.
22910Sstevel@tonic-gate  */
22920Sstevel@tonic-gate void
22930Sstevel@tonic-gate cte_add_listener(ct_equeue_t *q, ct_listener_t *l)
22940Sstevel@tonic-gate {
22950Sstevel@tonic-gate 	cv_init(&l->ctl_cv, NULL, CV_DEFAULT, NULL);
22960Sstevel@tonic-gate 	l->ctl_equeue = q;
22970Sstevel@tonic-gate 	l->ctl_position = NULL;
22980Sstevel@tonic-gate 	l->ctl_flags = 0;
22990Sstevel@tonic-gate 
23000Sstevel@tonic-gate 	mutex_enter(&q->ctq_lock);
23010Sstevel@tonic-gate 	list_insert_head(&q->ctq_tail, l);
23020Sstevel@tonic-gate 	list_insert_head(&q->ctq_listeners, l);
23030Sstevel@tonic-gate 	q->ctq_nlisteners++;
23040Sstevel@tonic-gate 	mutex_exit(&q->ctq_lock);
23050Sstevel@tonic-gate }
23060Sstevel@tonic-gate 
23070Sstevel@tonic-gate /*
23080Sstevel@tonic-gate  * cte_remove_listener
23090Sstevel@tonic-gate  *
23100Sstevel@tonic-gate  * Remove a listener from an event queue.  No other queue activities
23110Sstevel@tonic-gate  * (e.g. cte_get event) may be in progress at this endpoint when this
23120Sstevel@tonic-gate  * is called.
23130Sstevel@tonic-gate  */
23140Sstevel@tonic-gate void
23150Sstevel@tonic-gate cte_remove_listener(ct_listener_t *l)
23160Sstevel@tonic-gate {
23170Sstevel@tonic-gate 	ct_equeue_t *q = l->ctl_equeue;
23180Sstevel@tonic-gate 	ct_kevent_t *e;
23190Sstevel@tonic-gate 
23200Sstevel@tonic-gate 	mutex_enter(&q->ctq_lock);
23210Sstevel@tonic-gate 
23220Sstevel@tonic-gate 	ASSERT((l->ctl_flags & (CTLF_COPYOUT|CTLF_RESET)) == 0);
23230Sstevel@tonic-gate 
23240Sstevel@tonic-gate 	if ((e = l->ctl_position) != NULL)
23250Sstevel@tonic-gate 		cte_qrele(q, l, e);
23260Sstevel@tonic-gate 	else
23270Sstevel@tonic-gate 		list_remove(&q->ctq_tail, l);
23280Sstevel@tonic-gate 	l->ctl_position = NULL;
23290Sstevel@tonic-gate 
23300Sstevel@tonic-gate 	q->ctq_nlisteners--;
23310Sstevel@tonic-gate 	list_remove(&q->ctq_listeners, l);
23320Sstevel@tonic-gate 
23330Sstevel@tonic-gate 	if (l->ctl_flags & CTLF_RELIABLE)
23340Sstevel@tonic-gate 		q->ctq_nreliable--;
23350Sstevel@tonic-gate 
23360Sstevel@tonic-gate 	/*
23370Sstevel@tonic-gate 	 * If we are a the last listener of a dead reference counted
23380Sstevel@tonic-gate 	 * queue (i.e. a process bundle) we free it.  Otherwise we just
23390Sstevel@tonic-gate 	 * trim any events which may have been kept around for our
23400Sstevel@tonic-gate 	 * benefit.
23410Sstevel@tonic-gate 	 */
23420Sstevel@tonic-gate 	if ((q->ctq_flags & CTQ_REFFED) && (q->ctq_flags & CTQ_DEAD) &&
23430Sstevel@tonic-gate 	    (q->ctq_nlisteners == 0)) {
23440Sstevel@tonic-gate 		cte_queue_destroy(q);
23450Sstevel@tonic-gate 	} else {
23460Sstevel@tonic-gate 		cte_trim(q, NULL);
23470Sstevel@tonic-gate 		mutex_exit(&q->ctq_lock);
23480Sstevel@tonic-gate 	}
23490Sstevel@tonic-gate }
23500Sstevel@tonic-gate 
23510Sstevel@tonic-gate /*
23520Sstevel@tonic-gate  * cte_reset_listener
23530Sstevel@tonic-gate  *
23540Sstevel@tonic-gate  * Moves a listener's queue pointer to the beginning of the queue.
23550Sstevel@tonic-gate  */
23560Sstevel@tonic-gate void
23570Sstevel@tonic-gate cte_reset_listener(ct_listener_t *l)
23580Sstevel@tonic-gate {
23590Sstevel@tonic-gate 	ct_equeue_t *q = l->ctl_equeue;
23600Sstevel@tonic-gate 
23610Sstevel@tonic-gate 	mutex_enter(&q->ctq_lock);
23620Sstevel@tonic-gate 
23630Sstevel@tonic-gate 	/*
23640Sstevel@tonic-gate 	 * We allow an asynchronous reset because it doesn't make a
23650Sstevel@tonic-gate 	 * whole lot of sense to make reset block or fail.  We already
23660Sstevel@tonic-gate 	 * have most of the mechanism needed thanks to queue trimming,
23670Sstevel@tonic-gate 	 * so implementing it isn't a big deal.
23680Sstevel@tonic-gate 	 */
23690Sstevel@tonic-gate 	if (l->ctl_flags & CTLF_COPYOUT)
23700Sstevel@tonic-gate 		l->ctl_flags |= CTLF_RESET;
23710Sstevel@tonic-gate 
23720Sstevel@tonic-gate 	(void) cte_qmove(q, l, list_head(&q->ctq_events));
23730Sstevel@tonic-gate 
23740Sstevel@tonic-gate 	/*
23750Sstevel@tonic-gate 	 * Inform blocked readers.
23760Sstevel@tonic-gate 	 */
23770Sstevel@tonic-gate 	cv_broadcast(&l->ctl_cv);
23780Sstevel@tonic-gate 	pollwakeup(&l->ctl_pollhead, POLLIN);
23790Sstevel@tonic-gate 	mutex_exit(&q->ctq_lock);
23800Sstevel@tonic-gate }
23810Sstevel@tonic-gate 
23820Sstevel@tonic-gate /*
23830Sstevel@tonic-gate  * cte_next_event
23840Sstevel@tonic-gate  *
23850Sstevel@tonic-gate  * Moves the event pointer for the specified listener to the next event
23860Sstevel@tonic-gate  * on the queue.  To avoid races, this movement only occurs if the
23870Sstevel@tonic-gate  * specified event id matches that of the current event.  This is used
23880Sstevel@tonic-gate  * primarily to skip events that have been read but whose extended data
23890Sstevel@tonic-gate  * haven't been copied out.
23900Sstevel@tonic-gate  */
23910Sstevel@tonic-gate int
23920Sstevel@tonic-gate cte_next_event(ct_listener_t *l, uint64_t id)
23930Sstevel@tonic-gate {
23940Sstevel@tonic-gate 	ct_equeue_t *q = l->ctl_equeue;
23950Sstevel@tonic-gate 	ct_kevent_t *old;
23960Sstevel@tonic-gate 
23970Sstevel@tonic-gate 	mutex_enter(&q->ctq_lock);
23980Sstevel@tonic-gate 
23990Sstevel@tonic-gate 	if (l->ctl_flags & CTLF_COPYOUT)
24000Sstevel@tonic-gate 		l->ctl_flags |= CTLF_RESET;
24010Sstevel@tonic-gate 
24020Sstevel@tonic-gate 	if (((old = l->ctl_position) != NULL) && (old->cte_id == id))
24030Sstevel@tonic-gate 		(void) cte_qmove(q, l, list_next(&q->ctq_events, old));
24040Sstevel@tonic-gate 
24050Sstevel@tonic-gate 	mutex_exit(&q->ctq_lock);
24060Sstevel@tonic-gate 
24070Sstevel@tonic-gate 	return (0);
24080Sstevel@tonic-gate }
24090Sstevel@tonic-gate 
24100Sstevel@tonic-gate /*
24110Sstevel@tonic-gate  * cte_get_event
24120Sstevel@tonic-gate  *
24130Sstevel@tonic-gate  * Reads an event from an event endpoint.  If "nonblock" is clear, we
24140Sstevel@tonic-gate  * block until a suitable event is ready.  If "crit" is set, we only
24150Sstevel@tonic-gate  * read critical events.  Note that while "cr" is the caller's cred,
24160Sstevel@tonic-gate  * "zuniqid" is the unique id of the zone the calling contract
24170Sstevel@tonic-gate  * filesystem was mounted in.
24180Sstevel@tonic-gate  */
24190Sstevel@tonic-gate int
24200Sstevel@tonic-gate cte_get_event(ct_listener_t *l, int nonblock, void *uaddr, const cred_t *cr,
24210Sstevel@tonic-gate     uint64_t zuniqid, int crit)
24220Sstevel@tonic-gate {
24230Sstevel@tonic-gate 	ct_equeue_t *q = l->ctl_equeue;
24240Sstevel@tonic-gate 	ct_kevent_t *temp;
24250Sstevel@tonic-gate 	int result = 0;
24260Sstevel@tonic-gate 	int partial = 0;
24270Sstevel@tonic-gate 	size_t size, gsize, len;
24280Sstevel@tonic-gate 	model_t mdl = get_udatamodel();
24290Sstevel@tonic-gate 	STRUCT_DECL(ct_event, ev);
24300Sstevel@tonic-gate 	STRUCT_INIT(ev, mdl);
24310Sstevel@tonic-gate 
24320Sstevel@tonic-gate 	/*
24330Sstevel@tonic-gate 	 * cte_qreadable checks for CTLF_COPYOUT as well as ensures
24340Sstevel@tonic-gate 	 * that there exists, and we are pointing to, an appropriate
24350Sstevel@tonic-gate 	 * event.  It may temporarily drop ctq_lock, but that doesn't
24360Sstevel@tonic-gate 	 * really matter to us.
24370Sstevel@tonic-gate 	 */
24380Sstevel@tonic-gate 	mutex_enter(&q->ctq_lock);
24390Sstevel@tonic-gate 	while (cte_qreadable(q, l, cr, zuniqid, crit)) {
24400Sstevel@tonic-gate 		if (nonblock) {
24410Sstevel@tonic-gate 			result = EAGAIN;
24420Sstevel@tonic-gate 			goto error;
24430Sstevel@tonic-gate 		}
24440Sstevel@tonic-gate 		if (q->ctq_flags & CTQ_DEAD) {
24450Sstevel@tonic-gate 			result = EIDRM;
24460Sstevel@tonic-gate 			goto error;
24470Sstevel@tonic-gate 		}
24480Sstevel@tonic-gate 		result = cv_wait_sig(&l->ctl_cv, &q->ctq_lock);
24490Sstevel@tonic-gate 		if (result == 0) {
24500Sstevel@tonic-gate 			result = EINTR;
24510Sstevel@tonic-gate 			goto error;
24520Sstevel@tonic-gate 		}
24530Sstevel@tonic-gate 	}
24540Sstevel@tonic-gate 	temp = l->ctl_position;
24550Sstevel@tonic-gate 	cte_hold(temp);
24560Sstevel@tonic-gate 	l->ctl_flags |= CTLF_COPYOUT;
24570Sstevel@tonic-gate 	mutex_exit(&q->ctq_lock);
24580Sstevel@tonic-gate 
24590Sstevel@tonic-gate 	/*
24600Sstevel@tonic-gate 	 * We now have an event.  Copy in the user event structure to
24610Sstevel@tonic-gate 	 * see how much space we have to work with.
24620Sstevel@tonic-gate 	 */
24630Sstevel@tonic-gate 	result = copyin(uaddr, STRUCT_BUF(ev), STRUCT_SIZE(ev));
24640Sstevel@tonic-gate 	if (result)
24650Sstevel@tonic-gate 		goto copyerr;
24660Sstevel@tonic-gate 
24670Sstevel@tonic-gate 	/*
24680Sstevel@tonic-gate 	 * Determine what data we have and what the user should be
24690Sstevel@tonic-gate 	 * allowed to see.
24700Sstevel@tonic-gate 	 */
24710Sstevel@tonic-gate 	size = gsize = 0;
24720Sstevel@tonic-gate 	if (temp->cte_data) {
24730Sstevel@tonic-gate 		VERIFY(nvlist_size(temp->cte_data, &size,
24740Sstevel@tonic-gate 		    NV_ENCODE_NATIVE) == 0);
24750Sstevel@tonic-gate 		ASSERT(size != 0);
24760Sstevel@tonic-gate 	}
24770Sstevel@tonic-gate 	if (zuniqid == GLOBAL_ZONEUNIQID && temp->cte_gdata) {
24780Sstevel@tonic-gate 		VERIFY(nvlist_size(temp->cte_gdata, &gsize,
24790Sstevel@tonic-gate 		    NV_ENCODE_NATIVE) == 0);
24800Sstevel@tonic-gate 		ASSERT(gsize != 0);
24810Sstevel@tonic-gate 	}
24820Sstevel@tonic-gate 
24830Sstevel@tonic-gate 	/*
24840Sstevel@tonic-gate 	 * If we have enough space, copy out the extended event data.
24850Sstevel@tonic-gate 	 */
24860Sstevel@tonic-gate 	len = size + gsize;
24870Sstevel@tonic-gate 	if (len) {
24880Sstevel@tonic-gate 		if (STRUCT_FGET(ev, ctev_nbytes) >= len) {
24890Sstevel@tonic-gate 			char *buf = kmem_alloc(len, KM_SLEEP);
24900Sstevel@tonic-gate 
24910Sstevel@tonic-gate 			if (size)
24920Sstevel@tonic-gate 				VERIFY(nvlist_pack(temp->cte_data, &buf, &size,
24930Sstevel@tonic-gate 				    NV_ENCODE_NATIVE, KM_SLEEP) == 0);
24940Sstevel@tonic-gate 			if (gsize) {
24950Sstevel@tonic-gate 				char *tmp = buf + size;
24960Sstevel@tonic-gate 
24970Sstevel@tonic-gate 				VERIFY(nvlist_pack(temp->cte_gdata, &tmp,
24980Sstevel@tonic-gate 				    &gsize, NV_ENCODE_NATIVE, KM_SLEEP) == 0);
24990Sstevel@tonic-gate 			}
25000Sstevel@tonic-gate 
25010Sstevel@tonic-gate 			/* This shouldn't have changed */
25020Sstevel@tonic-gate 			ASSERT(size + gsize == len);
25030Sstevel@tonic-gate 			result = copyout(buf, STRUCT_FGETP(ev, ctev_buffer),
25040Sstevel@tonic-gate 			    len);
25050Sstevel@tonic-gate 			kmem_free(buf, len);
25060Sstevel@tonic-gate 			if (result)
25070Sstevel@tonic-gate 				goto copyerr;
25080Sstevel@tonic-gate 		} else {
25090Sstevel@tonic-gate 			partial = 1;
25100Sstevel@tonic-gate 		}
25110Sstevel@tonic-gate 	}
25120Sstevel@tonic-gate 
25130Sstevel@tonic-gate 	/*
25140Sstevel@tonic-gate 	 * Copy out the common event data.
25150Sstevel@tonic-gate 	 */
25160Sstevel@tonic-gate 	STRUCT_FSET(ev, ctev_id, temp->cte_contract->ct_id);
25170Sstevel@tonic-gate 	STRUCT_FSET(ev, ctev_evid, temp->cte_id);
25180Sstevel@tonic-gate 	STRUCT_FSET(ev, ctev_cttype,
25190Sstevel@tonic-gate 	    temp->cte_contract->ct_type->ct_type_index);
25204845Svikram 	STRUCT_FSET(ev, ctev_flags, temp->cte_flags &
25214845Svikram 	    (CTE_ACK|CTE_INFO|CTE_NEG));
25220Sstevel@tonic-gate 	STRUCT_FSET(ev, ctev_type, temp->cte_type);
25230Sstevel@tonic-gate 	STRUCT_FSET(ev, ctev_nbytes, len);
25240Sstevel@tonic-gate 	STRUCT_FSET(ev, ctev_goffset, size);
25250Sstevel@tonic-gate 	result = copyout(STRUCT_BUF(ev), uaddr, STRUCT_SIZE(ev));
25260Sstevel@tonic-gate 
25270Sstevel@tonic-gate copyerr:
25280Sstevel@tonic-gate 	/*
25290Sstevel@tonic-gate 	 * Only move our location in the queue if all copyouts were
25300Sstevel@tonic-gate 	 * successful, the caller provided enough space for the entire
25310Sstevel@tonic-gate 	 * event, and our endpoint wasn't reset or otherwise moved by
25320Sstevel@tonic-gate 	 * another thread.
25330Sstevel@tonic-gate 	 */
25340Sstevel@tonic-gate 	mutex_enter(&q->ctq_lock);
25350Sstevel@tonic-gate 	if (result)
25360Sstevel@tonic-gate 		result = EFAULT;
25370Sstevel@tonic-gate 	else if (!partial && ((l->ctl_flags & CTLF_RESET) == 0) &&
25380Sstevel@tonic-gate 	    (l->ctl_position == temp))
25390Sstevel@tonic-gate 		(void) cte_qmove(q, l, list_next(&q->ctq_events, temp));
25400Sstevel@tonic-gate 	l->ctl_flags &= ~(CTLF_COPYOUT|CTLF_RESET);
25410Sstevel@tonic-gate 	/*
25420Sstevel@tonic-gate 	 * Signal any readers blocked on our CTLF_COPYOUT.
25430Sstevel@tonic-gate 	 */
25440Sstevel@tonic-gate 	cv_signal(&l->ctl_cv);
25450Sstevel@tonic-gate 	cte_rele(temp);
25460Sstevel@tonic-gate 
25470Sstevel@tonic-gate error:
25480Sstevel@tonic-gate 	mutex_exit(&q->ctq_lock);
25490Sstevel@tonic-gate 	return (result);
25500Sstevel@tonic-gate }
25510Sstevel@tonic-gate 
25520Sstevel@tonic-gate /*
25530Sstevel@tonic-gate  * cte_set_reliable
25540Sstevel@tonic-gate  *
25550Sstevel@tonic-gate  * Requests that events be reliably delivered to an event endpoint.
25560Sstevel@tonic-gate  * Unread informative and acknowledged critical events will not be
25570Sstevel@tonic-gate  * removed from the queue until this listener reads or skips them.
25580Sstevel@tonic-gate  * Because a listener could maliciously request reliable delivery and
25590Sstevel@tonic-gate  * then do nothing, this requires that PRIV_CONTRACT_EVENT be in the
25600Sstevel@tonic-gate  * caller's effective set.
25610Sstevel@tonic-gate  */
25620Sstevel@tonic-gate int
25630Sstevel@tonic-gate cte_set_reliable(ct_listener_t *l, const cred_t *cr)
25640Sstevel@tonic-gate {
25650Sstevel@tonic-gate 	ct_equeue_t *q = l->ctl_equeue;
25660Sstevel@tonic-gate 	int error;
25670Sstevel@tonic-gate 
25680Sstevel@tonic-gate 	if ((error = secpolicy_contract_event(cr)) != 0)
25690Sstevel@tonic-gate 		return (error);
25700Sstevel@tonic-gate 
25710Sstevel@tonic-gate 	mutex_enter(&q->ctq_lock);
25720Sstevel@tonic-gate 	if ((l->ctl_flags & CTLF_RELIABLE) == 0) {
25730Sstevel@tonic-gate 		l->ctl_flags |= CTLF_RELIABLE;
25740Sstevel@tonic-gate 		q->ctq_nreliable++;
25750Sstevel@tonic-gate 		if (l->ctl_position != NULL)
25760Sstevel@tonic-gate 			l->ctl_position->cte_nodes[q->ctq_listno].
25770Sstevel@tonic-gate 			    ctm_nreliable++;
25780Sstevel@tonic-gate 	}
25790Sstevel@tonic-gate 	mutex_exit(&q->ctq_lock);
25800Sstevel@tonic-gate 
25810Sstevel@tonic-gate 	return (0);
25820Sstevel@tonic-gate }
2583