sun4/os/intr.c

*0Sstevel@tonic-gate/*
*0Sstevel@tonic-gate * CDDL HEADER START
*0Sstevel@tonic-gate *
*0Sstevel@tonic-gate * The contents of this file are subject to the terms of the
*0Sstevel@tonic-gate * Common Development and Distribution License, Version 1.0 only
*0Sstevel@tonic-gate * (the "License").  You may not use this file except in compliance
*0Sstevel@tonic-gate * with the License.
*0Sstevel@tonic-gate *
*0Sstevel@tonic-gate * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
*0Sstevel@tonic-gate * or http://www.opensolaris.org/os/licensing.
*0Sstevel@tonic-gate * See the License for the specific language governing permissions
*0Sstevel@tonic-gate * and limitations under the License.
*0Sstevel@tonic-gate *
*0Sstevel@tonic-gate * When distributing Covered Code, include this CDDL HEADER in each
*0Sstevel@tonic-gate * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
*0Sstevel@tonic-gate * If applicable, add the following below this CDDL HEADER, with the
*0Sstevel@tonic-gate * fields enclosed by brackets "[]" replaced with your own identifying
*0Sstevel@tonic-gate * information: Portions Copyright [yyyy] [name of copyright owner]
*0Sstevel@tonic-gate *
*0Sstevel@tonic-gate * CDDL HEADER END
*0Sstevel@tonic-gate */
*0Sstevel@tonic-gate/*
*0Sstevel@tonic-gate * Copyright 2005 Sun Microsystems, Inc.  All rights reserved.
*0Sstevel@tonic-gate * Use is subject to license terms.
*0Sstevel@tonic-gate */
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate#pragma ident	"%Z%%M%	%I%	%E% SMI"
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate#include <sys/sysmacros.h>
*0Sstevel@tonic-gate#include <sys/stack.h>
*0Sstevel@tonic-gate#include <sys/cpuvar.h>
*0Sstevel@tonic-gate#include <sys/ivintr.h>
*0Sstevel@tonic-gate#include <sys/intreg.h>
*0Sstevel@tonic-gate#include <sys/membar.h>
*0Sstevel@tonic-gate#include <sys/kmem.h>
*0Sstevel@tonic-gate#include <sys/intr.h>
*0Sstevel@tonic-gate#include <sys/sunndi.h>
*0Sstevel@tonic-gate#include <sys/cmn_err.h>
*0Sstevel@tonic-gate#include <sys/privregs.h>
*0Sstevel@tonic-gate#include <sys/systm.h>
*0Sstevel@tonic-gate#include <sys/archsystm.h>
*0Sstevel@tonic-gate#include <sys/machsystm.h>
*0Sstevel@tonic-gate#include <sys/x_call.h>
*0Sstevel@tonic-gate#include <vm/seg_kp.h>
*0Sstevel@tonic-gate#include <sys/debug.h>
*0Sstevel@tonic-gate#include <sys/cyclic.h>
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate#include <sys/cpu_sgnblk_defs.h>
*0Sstevel@tonic-gate
*0Sstevel@tonic-gatekmutex_t soft_iv_lock;	/* protect software interrupt vector table */
*0Sstevel@tonic-gate/* Global locks which protect the interrupt distribution lists */
*0Sstevel@tonic-gatestatic kmutex_t intr_dist_lock;
*0Sstevel@tonic-gatestatic kmutex_t intr_dist_cpu_lock;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate/* Head of the interrupt distribution lists */
*0Sstevel@tonic-gatestatic struct intr_dist *intr_dist_head = NULL;
*0Sstevel@tonic-gatestatic struct intr_dist *intr_dist_whead = NULL;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gateuint_t swinum_base;
*0Sstevel@tonic-gateuint_t maxswinum;
*0Sstevel@tonic-gateuint_t siron_inum;
*0Sstevel@tonic-gateuint_t poke_cpu_inum;
*0Sstevel@tonic-gateint siron_pending;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gateint intr_policy = INTR_WEIGHTED_DIST;	/* interrupt distribution policy */
*0Sstevel@tonic-gateint intr_dist_debug = 0;
*0Sstevel@tonic-gateint32_t intr_dist_weight_max = 1;
*0Sstevel@tonic-gateint32_t intr_dist_weight_maxmax = 1000;
*0Sstevel@tonic-gateint intr_dist_weight_maxfactor = 2;
*0Sstevel@tonic-gate#define	INTR_DEBUG(args) if (intr_dist_debug) cmn_err args
*0Sstevel@tonic-gate
*0Sstevel@tonic-gatestatic void sw_ivintr_init(cpu_t *);
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate/*
*0Sstevel@tonic-gate * intr_init() - interrupt initialization
*0Sstevel@tonic-gate *	Initialize the system's software interrupt vector table and
*0Sstevel@tonic-gate *	CPU's interrupt free list
*0Sstevel@tonic-gate */
*0Sstevel@tonic-gatevoid
*0Sstevel@tonic-gateintr_init(cpu_t *cp)
*0Sstevel@tonic-gate{
*0Sstevel@tonic-gate	init_ivintr();
*0Sstevel@tonic-gate	sw_ivintr_init(cp);
*0Sstevel@tonic-gate	init_intr_pool(cp);
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	mutex_init(&intr_dist_lock, NULL, MUTEX_DEFAULT, NULL);
*0Sstevel@tonic-gate	mutex_init(&intr_dist_cpu_lock, NULL, MUTEX_DEFAULT, NULL);
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	/*
*0Sstevel@tonic-gate	 * A soft interrupt may have been requested prior to the initialization
*0Sstevel@tonic-gate	 * of soft interrupts.  Soft interrupts can't be dispatched until after
*0Sstevel@tonic-gate	 * init_intr_pool, so we have to wait until now before we can dispatch
*0Sstevel@tonic-gate	 * the pending soft interrupt (if any).
*0Sstevel@tonic-gate	 */
*0Sstevel@tonic-gate	if (siron_pending)
*0Sstevel@tonic-gate		setsoftint(siron_inum);
*0Sstevel@tonic-gate}
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate/*
*0Sstevel@tonic-gate * poke_cpu_intr - fall through when poke_cpu calls
*0Sstevel@tonic-gate */
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate/* ARGSUSED */
*0Sstevel@tonic-gateuint_t
*0Sstevel@tonic-gatepoke_cpu_intr(caddr_t arg1, caddr_t arg2)
*0Sstevel@tonic-gate{
*0Sstevel@tonic-gate	CPU->cpu_m.poke_cpu_outstanding = B_FALSE;
*0Sstevel@tonic-gate	membar_stld_stst();
*0Sstevel@tonic-gate	return (1);
*0Sstevel@tonic-gate}
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate/*
*0Sstevel@tonic-gate * sw_ivintr_init() - software interrupt vector initialization
*0Sstevel@tonic-gate *	called after CPU is active
*0Sstevel@tonic-gate *	the software interrupt vector table is part of the intr_vector[]
*0Sstevel@tonic-gate */
*0Sstevel@tonic-gatestatic void
*0Sstevel@tonic-gatesw_ivintr_init(cpu_t *cp)
*0Sstevel@tonic-gate{
*0Sstevel@tonic-gate	extern uint_t softlevel1();
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	mutex_init(&soft_iv_lock, NULL, MUTEX_DEFAULT, NULL);
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	swinum_base = SOFTIVNUM;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	/*
*0Sstevel@tonic-gate	 * the maximum software interrupt == MAX_SOFT_INO
*0Sstevel@tonic-gate	 */
*0Sstevel@tonic-gate	maxswinum = swinum_base + MAX_SOFT_INO;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	REGISTER_BBUS_INTR();
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	siron_inum = add_softintr(PIL_1, softlevel1, 0);
*0Sstevel@tonic-gate	poke_cpu_inum = add_softintr(PIL_13, poke_cpu_intr, 0);
*0Sstevel@tonic-gate	cp->cpu_m.poke_cpu_outstanding = B_FALSE;
*0Sstevel@tonic-gate}
*0Sstevel@tonic-gate
*0Sstevel@tonic-gatecpuset_t intr_add_pools_inuse;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate/*
*0Sstevel@tonic-gate * cleanup_intr_pool()
*0Sstevel@tonic-gate *	Free up the extra intr request pool for this cpu.
*0Sstevel@tonic-gate */
*0Sstevel@tonic-gatevoid
*0Sstevel@tonic-gatecleanup_intr_pool(cpu_t *cp)
*0Sstevel@tonic-gate{
*0Sstevel@tonic-gate	extern struct intr_req *intr_add_head;
*0Sstevel@tonic-gate	int poolno;
*0Sstevel@tonic-gate	struct intr_req *pool;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	poolno = cp->cpu_m.intr_pool_added;
*0Sstevel@tonic-gate	if (poolno >= 0) {
*0Sstevel@tonic-gate		cp->cpu_m.intr_pool_added = -1;
*0Sstevel@tonic-gate		pool = (poolno * INTR_PENDING_MAX * intr_add_pools) +
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate			intr_add_head;	/* not byte arithmetic */
*0Sstevel@tonic-gate		bzero(pool, INTR_PENDING_MAX * intr_add_pools *
*0Sstevel@tonic-gate		    sizeof (struct intr_req));
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate		CPUSET_DEL(intr_add_pools_inuse, poolno);
*0Sstevel@tonic-gate	}
*0Sstevel@tonic-gate}
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate/*
*0Sstevel@tonic-gate * init_intr_pool()
*0Sstevel@tonic-gate *	initialize the intr request pool for the cpu
*0Sstevel@tonic-gate * 	should be called for each cpu
*0Sstevel@tonic-gate */
*0Sstevel@tonic-gatevoid
*0Sstevel@tonic-gateinit_intr_pool(cpu_t *cp)
*0Sstevel@tonic-gate{
*0Sstevel@tonic-gate	extern struct intr_req *intr_add_head;
*0Sstevel@tonic-gate#ifdef	DEBUG
*0Sstevel@tonic-gate	extern struct intr_req *intr_add_tail;
*0Sstevel@tonic-gate#endif	/* DEBUG */
*0Sstevel@tonic-gate	int i, pool;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	cp->cpu_m.intr_pool_added = -1;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	for (i = 0; i < INTR_PENDING_MAX-1; i++) {
*0Sstevel@tonic-gate		cp->cpu_m.intr_pool[i].intr_next =
*0Sstevel@tonic-gate		    &cp->cpu_m.intr_pool[i+1];
*0Sstevel@tonic-gate	}
*0Sstevel@tonic-gate	cp->cpu_m.intr_pool[INTR_PENDING_MAX-1].intr_next = NULL;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	cp->cpu_m.intr_head[0] = &cp->cpu_m.intr_pool[0];
*0Sstevel@tonic-gate	cp->cpu_m.intr_tail[0] = &cp->cpu_m.intr_pool[INTR_PENDING_MAX-1];
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	if (intr_add_pools != 0) {
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate		/*
*0Sstevel@tonic-gate		 * If additional interrupt pools have been allocated,
*0Sstevel@tonic-gate		 * initialize those too and add them to the free list.
*0Sstevel@tonic-gate		 */
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate		struct intr_req *trace;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate		for (pool = 0; pool < max_ncpus; pool++) {
*0Sstevel@tonic-gate			if (!(CPU_IN_SET(intr_add_pools_inuse, pool)))
*0Sstevel@tonic-gate			    break;
*0Sstevel@tonic-gate		}
*0Sstevel@tonic-gate		if (pool >= max_ncpus) {
*0Sstevel@tonic-gate			/*
*0Sstevel@tonic-gate			 * XXX - intr pools are alloc'd, just not as
*0Sstevel@tonic-gate			 * much as we would like.
*0Sstevel@tonic-gate			 */
*0Sstevel@tonic-gate			cmn_err(CE_WARN, "Failed to alloc all requested intr "
*0Sstevel@tonic-gate			    "pools for cpu%d", cp->cpu_id);
*0Sstevel@tonic-gate			return;
*0Sstevel@tonic-gate		}
*0Sstevel@tonic-gate		CPUSET_ADD(intr_add_pools_inuse, pool);
*0Sstevel@tonic-gate		cp->cpu_m.intr_pool_added = pool;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate		trace = (pool * INTR_PENDING_MAX * intr_add_pools) +
*0Sstevel@tonic-gate			intr_add_head;	/* not byte arithmetic */
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate		cp->cpu_m.intr_pool[INTR_PENDING_MAX-1].intr_next = trace;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate		for (i = 1; i < intr_add_pools * INTR_PENDING_MAX; i++, trace++)
*0Sstevel@tonic-gate			trace->intr_next = trace + 1;
*0Sstevel@tonic-gate		trace->intr_next = NULL;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate		ASSERT(trace >= intr_add_head && trace <= intr_add_tail);
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate		cp->cpu_m.intr_tail[0] = trace;
*0Sstevel@tonic-gate	}
*0Sstevel@tonic-gate}
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate/*
*0Sstevel@tonic-gate * siron - primitive for sun/os/softint.c
*0Sstevel@tonic-gate */
*0Sstevel@tonic-gatevoid
*0Sstevel@tonic-gatesiron(void)
*0Sstevel@tonic-gate{
*0Sstevel@tonic-gate	if (!siron_pending) {
*0Sstevel@tonic-gate		siron_pending = 1;
*0Sstevel@tonic-gate		if (siron_inum != 0)
*0Sstevel@tonic-gate			setsoftint(siron_inum);
*0Sstevel@tonic-gate	}
*0Sstevel@tonic-gate}
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate/*
*0Sstevel@tonic-gate * no_ivintr()
*0Sstevel@tonic-gate * 	called by vec_interrupt() through sys_trap()
*0Sstevel@tonic-gate *	vector interrupt received but not valid or not
*0Sstevel@tonic-gate *	registered in intr_vector[]
*0Sstevel@tonic-gate *	considered as a spurious mondo interrupt
*0Sstevel@tonic-gate */
*0Sstevel@tonic-gate/* ARGSUSED */
*0Sstevel@tonic-gatevoid
*0Sstevel@tonic-gateno_ivintr(struct regs *rp, int inum, int pil)
*0Sstevel@tonic-gate{
*0Sstevel@tonic-gate	cmn_err(CE_WARN, "invalid vector intr: number 0x%x, pil 0x%x",
*0Sstevel@tonic-gate	    inum, pil);
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate#ifdef DEBUG_VEC_INTR
*0Sstevel@tonic-gate	prom_enter_mon();
*0Sstevel@tonic-gate#endif /* DEBUG_VEC_INTR */
*0Sstevel@tonic-gate}
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate/*
*0Sstevel@tonic-gate * no_intr_pool()
*0Sstevel@tonic-gate * 	called by vec_interrupt() through sys_trap()
*0Sstevel@tonic-gate *	vector interrupt received but no intr_req entries
*0Sstevel@tonic-gate */
*0Sstevel@tonic-gate/* ARGSUSED */
*0Sstevel@tonic-gatevoid
*0Sstevel@tonic-gateno_intr_pool(struct regs *rp, int inum, int pil)
*0Sstevel@tonic-gate{
*0Sstevel@tonic-gate#ifdef DEBUG_VEC_INTR
*0Sstevel@tonic-gate	cmn_err(CE_WARN, "intr_req pool empty: num 0x%x, pil 0x%x",
*0Sstevel@tonic-gate		inum, pil);
*0Sstevel@tonic-gate	prom_enter_mon();
*0Sstevel@tonic-gate#else
*0Sstevel@tonic-gate	cmn_err(CE_PANIC, "intr_req pool empty: num 0x%x, pil 0x%x",
*0Sstevel@tonic-gate		inum, pil);
*0Sstevel@tonic-gate#endif /* DEBUG_VEC_INTR */
*0Sstevel@tonic-gate}
*0Sstevel@tonic-gate
*0Sstevel@tonic-gatevoid
*0Sstevel@tonic-gateintr_dequeue_req(uint_t pil, uint32_t inum)
*0Sstevel@tonic-gate{
*0Sstevel@tonic-gate	struct intr_req *ir, *prev;
*0Sstevel@tonic-gate	struct machcpu *mcpu;
*0Sstevel@tonic-gate	uint32_t clr;
*0Sstevel@tonic-gate	extern uint_t getpstate(void);
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	ASSERT((getpstate() & PSTATE_IE) == 0);
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	mcpu = &CPU->cpu_m;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	/* Find a matching entry in the list */
*0Sstevel@tonic-gate	prev = NULL;
*0Sstevel@tonic-gate	ir = mcpu->intr_head[pil];
*0Sstevel@tonic-gate	while (ir != NULL) {
*0Sstevel@tonic-gate		if (ir->intr_number == inum)
*0Sstevel@tonic-gate			break;
*0Sstevel@tonic-gate		prev = ir;
*0Sstevel@tonic-gate		ir = ir->intr_next;
*0Sstevel@tonic-gate	}
*0Sstevel@tonic-gate	if (ir != NULL) {
*0Sstevel@tonic-gate		/*
*0Sstevel@tonic-gate		 * Remove entry from list
*0Sstevel@tonic-gate		 */
*0Sstevel@tonic-gate		if (prev != NULL)
*0Sstevel@tonic-gate			prev->intr_next = ir->intr_next;	/* non-head */
*0Sstevel@tonic-gate		else
*0Sstevel@tonic-gate			mcpu->intr_head[pil] = ir->intr_next;	/* head */
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate		if (ir->intr_next == NULL)
*0Sstevel@tonic-gate			mcpu->intr_tail[pil] = prev;		/* tail */
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate		/*
*0Sstevel@tonic-gate		 * Place on free list
*0Sstevel@tonic-gate		 */
*0Sstevel@tonic-gate		ir->intr_next = mcpu->intr_head[0];
*0Sstevel@tonic-gate		mcpu->intr_head[0] = ir;
*0Sstevel@tonic-gate	}
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	/*
*0Sstevel@tonic-gate	 * clear pending interrupts at this level if the list is empty
*0Sstevel@tonic-gate	 */
*0Sstevel@tonic-gate	if (mcpu->intr_head[pil] == NULL) {
*0Sstevel@tonic-gate		clr = 1 << pil;
*0Sstevel@tonic-gate		if (pil == PIL_14)
*0Sstevel@tonic-gate			clr |= (TICK_INT_MASK | STICK_INT_MASK);
*0Sstevel@tonic-gate		wr_clr_softint(clr);
*0Sstevel@tonic-gate	}
*0Sstevel@tonic-gate}
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate/*
*0Sstevel@tonic-gate * Send a directed interrupt of specified interrupt number id to a cpu.
*0Sstevel@tonic-gate */
*0Sstevel@tonic-gatevoid
*0Sstevel@tonic-gatesend_dirint(
*0Sstevel@tonic-gate	int cpuix,		/* cpu to be interrupted */
*0Sstevel@tonic-gate	int intr_id)		/* interrupt number id */
*0Sstevel@tonic-gate{
*0Sstevel@tonic-gate	xt_one(cpuix, setsoftint_tl1, intr_id, 0);
*0Sstevel@tonic-gate}
*0Sstevel@tonic-gate
*0Sstevel@tonic-gatevoid
*0Sstevel@tonic-gateinit_intr_threads(struct cpu *cp)
*0Sstevel@tonic-gate{
*0Sstevel@tonic-gate	int i;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	for (i = 0; i < NINTR_THREADS; i++)
*0Sstevel@tonic-gate		thread_create_intr(cp);
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	cp->cpu_intr_stack = (caddr_t)segkp_get(segkp, INTR_STACK_SIZE,
*0Sstevel@tonic-gate		KPD_HASREDZONE | KPD_NO_ANON | KPD_LOCKED) +
*0Sstevel@tonic-gate		INTR_STACK_SIZE - SA(MINFRAME);
*0Sstevel@tonic-gate}
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate/*
*0Sstevel@tonic-gate * Take the specified CPU out of participation in interrupts.
*0Sstevel@tonic-gate *	Called by p_online(2) when a processor is being taken off-line.
*0Sstevel@tonic-gate *	This allows interrupt threads being handled on the processor to
*0Sstevel@tonic-gate *	complete before the processor is idled.
*0Sstevel@tonic-gate */
*0Sstevel@tonic-gateint
*0Sstevel@tonic-gatecpu_disable_intr(struct cpu *cp)
*0Sstevel@tonic-gate{
*0Sstevel@tonic-gate	ASSERT(MUTEX_HELD(&cpu_lock));
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	/*
*0Sstevel@tonic-gate	 * Turn off the CPU_ENABLE flag before calling the redistribution
*0Sstevel@tonic-gate	 * function, since it checks for this in the cpu flags.
*0Sstevel@tonic-gate	 */
*0Sstevel@tonic-gate	cp->cpu_flags &= ~CPU_ENABLE;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	intr_redist_all_cpus();
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	return (0);
*0Sstevel@tonic-gate}
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate/*
*0Sstevel@tonic-gate * Allow the specified CPU to participate in interrupts.
*0Sstevel@tonic-gate *	Called by p_online(2) if a processor could not be taken off-line
*0Sstevel@tonic-gate *	because of bound threads, in order to resume processing interrupts.
*0Sstevel@tonic-gate *	Also called after starting a processor.
*0Sstevel@tonic-gate */
*0Sstevel@tonic-gatevoid
*0Sstevel@tonic-gatecpu_enable_intr(struct cpu *cp)
*0Sstevel@tonic-gate{
*0Sstevel@tonic-gate	ASSERT(MUTEX_HELD(&cpu_lock));
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	cp->cpu_flags |= CPU_ENABLE;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	intr_redist_all_cpus();
*0Sstevel@tonic-gate}
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate/*
*0Sstevel@tonic-gate * Add function to callback list for intr_redist_all_cpus.  We keep two lists,
*0Sstevel@tonic-gate * one for weighted callbacks and one for normal callbacks. Weighted callbacks
*0Sstevel@tonic-gate * are issued to redirect interrupts of a specified weight, from heavy to
*0Sstevel@tonic-gate * light.  This allows all the interrupts of a given weight to be redistributed
*0Sstevel@tonic-gate * for all weighted nexus drivers prior to those of less weight.
*0Sstevel@tonic-gate */
*0Sstevel@tonic-gatestatic void
*0Sstevel@tonic-gateintr_dist_add_list(struct intr_dist **phead, void (*func)(void *), void *arg)
*0Sstevel@tonic-gate{
*0Sstevel@tonic-gate	struct intr_dist *new = kmem_alloc(sizeof (*new), KM_SLEEP);
*0Sstevel@tonic-gate	struct intr_dist *iptr;
*0Sstevel@tonic-gate	struct intr_dist **pptr;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	ASSERT(func);
*0Sstevel@tonic-gate	new->func = func;
*0Sstevel@tonic-gate	new->arg = arg;
*0Sstevel@tonic-gate	new->next = NULL;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	/* Add to tail so that redistribution occurs in original order. */
*0Sstevel@tonic-gate	mutex_enter(&intr_dist_lock);
*0Sstevel@tonic-gate	for (iptr = *phead, pptr = phead; iptr != NULL;
*0Sstevel@tonic-gate	    pptr = &iptr->next, iptr = iptr->next) {
*0Sstevel@tonic-gate		/* check for problems as we locate the tail */
*0Sstevel@tonic-gate		if ((iptr->func == func) && (iptr->arg == arg)) {
*0Sstevel@tonic-gate			cmn_err(CE_PANIC, "intr_dist_add_list(): duplicate");
*0Sstevel@tonic-gate			/*NOTREACHED*/
*0Sstevel@tonic-gate		}
*0Sstevel@tonic-gate	}
*0Sstevel@tonic-gate	*pptr = new;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	mutex_exit(&intr_dist_lock);
*0Sstevel@tonic-gate}
*0Sstevel@tonic-gate
*0Sstevel@tonic-gatevoid
*0Sstevel@tonic-gateintr_dist_add(void (*func)(void *), void *arg)
*0Sstevel@tonic-gate{
*0Sstevel@tonic-gate	intr_dist_add_list(&intr_dist_head, (void (*)(void *))func, arg);
*0Sstevel@tonic-gate}
*0Sstevel@tonic-gate
*0Sstevel@tonic-gatevoid
*0Sstevel@tonic-gateintr_dist_add_weighted(void (*func)(void *, int32_t, int32_t), void *arg)
*0Sstevel@tonic-gate{
*0Sstevel@tonic-gate	intr_dist_add_list(&intr_dist_whead, (void (*)(void *))func, arg);
*0Sstevel@tonic-gate}
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate/*
*0Sstevel@tonic-gate * Search for the interrupt distribution structure with the specified
*0Sstevel@tonic-gate * mondo vec reg in the interrupt distribution list. If a match is found,
*0Sstevel@tonic-gate * then delete the entry from the list. The caller is responsible for
*0Sstevel@tonic-gate * modifying the mondo vector registers.
*0Sstevel@tonic-gate */
*0Sstevel@tonic-gatestatic void
*0Sstevel@tonic-gateintr_dist_rem_list(struct intr_dist **headp, void (*func)(void *), void *arg)
*0Sstevel@tonic-gate{
*0Sstevel@tonic-gate	struct intr_dist *iptr;
*0Sstevel@tonic-gate	struct intr_dist **vect;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	mutex_enter(&intr_dist_lock);
*0Sstevel@tonic-gate	for (iptr = *headp, vect = headp;
*0Sstevel@tonic-gate	    iptr != NULL; vect = &iptr->next, iptr = iptr->next) {
*0Sstevel@tonic-gate		if ((iptr->func == func) && (iptr->arg == arg)) {
*0Sstevel@tonic-gate			*vect = iptr->next;
*0Sstevel@tonic-gate			kmem_free(iptr, sizeof (struct intr_dist));
*0Sstevel@tonic-gate			mutex_exit(&intr_dist_lock);
*0Sstevel@tonic-gate			return;
*0Sstevel@tonic-gate		}
*0Sstevel@tonic-gate	}
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	if (!panicstr)
*0Sstevel@tonic-gate		cmn_err(CE_PANIC, "intr_dist_rem_list: not found");
*0Sstevel@tonic-gate	mutex_exit(&intr_dist_lock);
*0Sstevel@tonic-gate}
*0Sstevel@tonic-gate
*0Sstevel@tonic-gatevoid
*0Sstevel@tonic-gateintr_dist_rem(void (*func)(void *), void *arg)
*0Sstevel@tonic-gate{
*0Sstevel@tonic-gate	intr_dist_rem_list(&intr_dist_head, (void (*)(void *))func, arg);
*0Sstevel@tonic-gate}
*0Sstevel@tonic-gate
*0Sstevel@tonic-gatevoid
*0Sstevel@tonic-gateintr_dist_rem_weighted(void (*func)(void *, int32_t, int32_t), void *arg)
*0Sstevel@tonic-gate{
*0Sstevel@tonic-gate	intr_dist_rem_list(&intr_dist_whead, (void (*)(void *))func, arg);
*0Sstevel@tonic-gate}
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate/*
*0Sstevel@tonic-gate * Initiate interrupt redistribution.  Redistribution improves the isolation
*0Sstevel@tonic-gate * associated with interrupt weights by ordering operations from heavy weight
*0Sstevel@tonic-gate * to light weight.  When a CPU's orientation changes relative to interrupts,
*0Sstevel@tonic-gate * there is *always* a redistribution to accommodate this change (call to
*0Sstevel@tonic-gate * intr_redist_all_cpus()).  As devices (not CPUs) attach/detach it is possible
*0Sstevel@tonic-gate * that a redistribution could improve the quality of an initialization. For
*0Sstevel@tonic-gate * example, if you are not using a NIC it may not be attached with s10 (devfs).
*0Sstevel@tonic-gate * If you then configure the NIC (ifconfig), this may cause the NIC to attach
*0Sstevel@tonic-gate * and plumb interrupts.  The CPU assignment for the NIC's interrupts is
*0Sstevel@tonic-gate * occurring late, so optimal "isolation" relative to weight is not occurring.
*0Sstevel@tonic-gate * The same applies to detach, although in this case doing the redistribution
*0Sstevel@tonic-gate * might improve "spread" for medium weight devices since the "isolation" of
*0Sstevel@tonic-gate * a higher weight device may no longer be present.
*0Sstevel@tonic-gate *
*0Sstevel@tonic-gate * NB: We should provide a utility to trigger redistribution (ala "intradm -r").
*0Sstevel@tonic-gate *
*0Sstevel@tonic-gate * NB: There is risk associated with automatically triggering execution of the
*0Sstevel@tonic-gate * redistribution code at arbitrary times. The risk comes from the fact that
*0Sstevel@tonic-gate * there is a lot of low-level hardware interaction associated with a
*0Sstevel@tonic-gate * redistribution.  At some point we may want this code to perform automatic
*0Sstevel@tonic-gate * redistribution (redistribution thread; trigger timeout when add/remove
*0Sstevel@tonic-gate * weight delta is large enough, and call cv_signal from timeout - causing
*0Sstevel@tonic-gate * thread to call i_ddi_intr_redist_all_cpus()) but this is considered too
*0Sstevel@tonic-gate * risky at this time.
*0Sstevel@tonic-gate */
*0Sstevel@tonic-gatevoid
*0Sstevel@tonic-gatei_ddi_intr_redist_all_cpus()
*0Sstevel@tonic-gate{
*0Sstevel@tonic-gate	mutex_enter(&cpu_lock);
*0Sstevel@tonic-gate	INTR_DEBUG((CE_CONT, "intr_dist: i_ddi_intr_redist_all_cpus\n"));
*0Sstevel@tonic-gate	intr_redist_all_cpus();
*0Sstevel@tonic-gate	mutex_exit(&cpu_lock);
*0Sstevel@tonic-gate}
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate/*
*0Sstevel@tonic-gate * Redistribute all interrupts
*0Sstevel@tonic-gate *
*0Sstevel@tonic-gate * This function redistributes all interrupting devices, running the
*0Sstevel@tonic-gate * parent callback functions for each node.
*0Sstevel@tonic-gate */
*0Sstevel@tonic-gatevoid
*0Sstevel@tonic-gateintr_redist_all_cpus(void)
*0Sstevel@tonic-gate{
*0Sstevel@tonic-gate	struct cpu *cp;
*0Sstevel@tonic-gate	struct intr_dist *iptr;
*0Sstevel@tonic-gate	int32_t weight, max_weight;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	ASSERT(MUTEX_HELD(&cpu_lock));
*0Sstevel@tonic-gate	mutex_enter(&intr_dist_lock);
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	/*
*0Sstevel@tonic-gate	 * zero cpu_intr_weight on all cpus - it is safe to traverse
*0Sstevel@tonic-gate	 * cpu_list since we hold cpu_lock.
*0Sstevel@tonic-gate	 */
*0Sstevel@tonic-gate	cp = cpu_list;
*0Sstevel@tonic-gate	do {
*0Sstevel@tonic-gate		cp->cpu_intr_weight = 0;
*0Sstevel@tonic-gate	} while ((cp = cp->cpu_next) != cpu_list);
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	/*
*0Sstevel@tonic-gate	 * Assume that this redistribution may encounter a device weight
*0Sstevel@tonic-gate	 * via driver.conf tuning of "ddi-intr-weight" that is at most
*0Sstevel@tonic-gate	 * intr_dist_weight_maxfactor times larger.
*0Sstevel@tonic-gate	 */
*0Sstevel@tonic-gate	max_weight = intr_dist_weight_max * intr_dist_weight_maxfactor;
*0Sstevel@tonic-gate	if (max_weight > intr_dist_weight_maxmax)
*0Sstevel@tonic-gate		max_weight = intr_dist_weight_maxmax;
*0Sstevel@tonic-gate	intr_dist_weight_max = 1;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	INTR_DEBUG((CE_CONT, "intr_dist: "
*0Sstevel@tonic-gate	    "intr_redist_all_cpus: %d-0\n", max_weight));
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	/*
*0Sstevel@tonic-gate	 * Redistribute weighted, from heavy to light.  The callback that
*0Sstevel@tonic-gate	 * specifies a weight equal to weight_max should redirect all
*0Sstevel@tonic-gate	 * interrupts of weight weight_max or greater [weight_max, inf.).
*0Sstevel@tonic-gate	 * Interrupts of lesser weight should be processed on the call with
*0Sstevel@tonic-gate	 * the matching weight. This allows all the heaver weight interrupts
*0Sstevel@tonic-gate	 * on all weighted busses (multiple pci busses) to be redirected prior
*0Sstevel@tonic-gate	 * to any lesser weight interrupts.
*0Sstevel@tonic-gate	 */
*0Sstevel@tonic-gate	for (weight = max_weight; weight >= 0; weight--)
*0Sstevel@tonic-gate		for (iptr = intr_dist_whead; iptr != NULL; iptr = iptr->next)
*0Sstevel@tonic-gate			((void (*)(void *, int32_t, int32_t))iptr->func)
*0Sstevel@tonic-gate			    (iptr->arg, max_weight, weight);
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	/* redistribute normal (non-weighted) interrupts */
*0Sstevel@tonic-gate	for (iptr = intr_dist_head; iptr != NULL; iptr = iptr->next)
*0Sstevel@tonic-gate		((void (*)(void *))iptr->func)(iptr->arg);
*0Sstevel@tonic-gate	mutex_exit(&intr_dist_lock);
*0Sstevel@tonic-gate}
*0Sstevel@tonic-gate
*0Sstevel@tonic-gatevoid
*0Sstevel@tonic-gateintr_redist_all_cpus_shutdown(void)
*0Sstevel@tonic-gate{
*0Sstevel@tonic-gate	intr_policy = INTR_CURRENT_CPU;
*0Sstevel@tonic-gate	intr_redist_all_cpus();
*0Sstevel@tonic-gate}
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate/*
*0Sstevel@tonic-gate * Determine what CPU to target, based on interrupt policy.
*0Sstevel@tonic-gate *
*0Sstevel@tonic-gate * INTR_FLAT_DIST: hold a current CPU pointer in a static variable and
*0Sstevel@tonic-gate *	advance through interrupt enabled cpus (round-robin).
*0Sstevel@tonic-gate *
*0Sstevel@tonic-gate * INTR_WEIGHTED_DIST: search for an enabled CPU with the lowest
*0Sstevel@tonic-gate *	cpu_intr_weight, round robin when all equal.
*0Sstevel@tonic-gate *
*0Sstevel@tonic-gate *	Weighted interrupt distribution provides two things: "spread" of weight
*0Sstevel@tonic-gate *	(associated with algorithm itself) and "isolation" (associated with a
*0Sstevel@tonic-gate *	particular device weight). A redistribution is what provides optimal
*0Sstevel@tonic-gate *	"isolation" of heavy weight interrupts, optimal "spread" of weight
*0Sstevel@tonic-gate *	(relative to what came before) is always occurring.
*0Sstevel@tonic-gate *
*0Sstevel@tonic-gate *	An interrupt weight is a subjective number that represents the
*0Sstevel@tonic-gate *	percentage of a CPU required to service a device's interrupts: the
*0Sstevel@tonic-gate *	default weight is 0% (however the algorithm still maintains
*0Sstevel@tonic-gate *	round-robin), a network interface controller (NIC) may have a large
*0Sstevel@tonic-gate *	weight (35%). Interrupt weight only has meaning relative to the
*0Sstevel@tonic-gate *	interrupt weight of other devices: a CPU can be weighted more than
*0Sstevel@tonic-gate *	100%, and a single device might consume more than 100% of a CPU.
*0Sstevel@tonic-gate *
*0Sstevel@tonic-gate *	A coarse interrupt weight can be defined by the parent nexus driver
*0Sstevel@tonic-gate *	based on bus specific information, like pci class codes. A nexus
*0Sstevel@tonic-gate *	driver that supports device interrupt weighting for its children
*0Sstevel@tonic-gate *	should call intr_dist_cpuid_add/rem_device_weight(), which adds
*0Sstevel@tonic-gate *	and removes the weight of a device from the CPU that an interrupt
*0Sstevel@tonic-gate *	is directed at.  The quality of initialization improves when the
*0Sstevel@tonic-gate *	device interrupt weights more accurately reflect actual run-time
*0Sstevel@tonic-gate *	weights, and as the assignments are ordered from heavy to light.
*0Sstevel@tonic-gate *
*0Sstevel@tonic-gate *	The implementation also supports interrupt weight being specified in
*0Sstevel@tonic-gate *	driver.conf files via the property "ddi-intr-weight", which takes
*0Sstevel@tonic-gate *	precedence over the nexus supplied weight.  This support is added to
*0Sstevel@tonic-gate *	permit possible tweaking in the product in response to customer
*0Sstevel@tonic-gate *	problems. This is not a formal or committed interface.
*0Sstevel@tonic-gate *
*0Sstevel@tonic-gate *	While a weighted approach chooses the CPU providing the best spread
*0Sstevel@tonic-gate *	given past weights, less than optimal isolation can result in cases
*0Sstevel@tonic-gate *	where heavy weight devices show up last. The nexus driver's interrupt
*0Sstevel@tonic-gate *	redistribution logic should use intr_dist_add/rem_weighted so that
*0Sstevel@tonic-gate *	interrupts can be redistributed heavy first for optimal isolation.
*0Sstevel@tonic-gate */
*0Sstevel@tonic-gateuint32_t
*0Sstevel@tonic-gateintr_dist_cpuid(void)
*0Sstevel@tonic-gate{
*0Sstevel@tonic-gate	static struct cpu	*curr_cpu;
*0Sstevel@tonic-gate	struct cpu		*start_cpu;
*0Sstevel@tonic-gate	struct cpu		*new_cpu;
*0Sstevel@tonic-gate	struct cpu		*cp;
*0Sstevel@tonic-gate	int			cpuid = -1;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	/* Establish exclusion for curr_cpu and cpu_intr_weight manipulation */
*0Sstevel@tonic-gate	mutex_enter(&intr_dist_cpu_lock);
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	switch (intr_policy) {
*0Sstevel@tonic-gate	case INTR_CURRENT_CPU:
*0Sstevel@tonic-gate		cpuid = CPU->cpu_id;
*0Sstevel@tonic-gate		break;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	case INTR_BOOT_CPU:
*0Sstevel@tonic-gate		panic("INTR_BOOT_CPU no longer supported.");
*0Sstevel@tonic-gate		/*NOTREACHED*/
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	case INTR_FLAT_DIST:
*0Sstevel@tonic-gate	case INTR_WEIGHTED_DIST:
*0Sstevel@tonic-gate	default:
*0Sstevel@tonic-gate		/*
*0Sstevel@tonic-gate		 * Ensure that curr_cpu is valid - cpu_next will be NULL if
*0Sstevel@tonic-gate		 * the cpu has been deleted (cpu structs are never freed).
*0Sstevel@tonic-gate		 */
*0Sstevel@tonic-gate		if (curr_cpu == NULL || curr_cpu->cpu_next == NULL)
*0Sstevel@tonic-gate			curr_cpu = CPU;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate		/*
*0Sstevel@tonic-gate		 * Advance to online CPU after curr_cpu (round-robin). For
*0Sstevel@tonic-gate		 * INTR_WEIGHTED_DIST we choose the cpu with the lightest
*0Sstevel@tonic-gate		 * weight.  For a nexus that does not support weight the
*0Sstevel@tonic-gate		 * default weight of zero is used. We degrade to round-robin
*0Sstevel@tonic-gate		 * behavior among equal weightes.  The default weight is zero
*0Sstevel@tonic-gate		 * and round-robin behavior continues.
*0Sstevel@tonic-gate		 *
*0Sstevel@tonic-gate		 * Disable preemption while traversing cpu_next_onln to
*0Sstevel@tonic-gate		 * ensure the list does not change.  This works because
*0Sstevel@tonic-gate		 * modifiers of this list and other lists in a struct cpu
*0Sstevel@tonic-gate		 * call pause_cpus() before making changes.
*0Sstevel@tonic-gate		 */
*0Sstevel@tonic-gate		kpreempt_disable();
*0Sstevel@tonic-gate		cp = start_cpu = curr_cpu->cpu_next_onln;
*0Sstevel@tonic-gate		new_cpu = NULL;
*0Sstevel@tonic-gate		do {
*0Sstevel@tonic-gate			/* Skip CPUs with interrupts disabled */
*0Sstevel@tonic-gate			if ((cp->cpu_flags & CPU_ENABLE) == 0)
*0Sstevel@tonic-gate				continue;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate			if (intr_policy == INTR_FLAT_DIST) {
*0Sstevel@tonic-gate				/* select CPU */
*0Sstevel@tonic-gate				new_cpu = cp;
*0Sstevel@tonic-gate				break;
*0Sstevel@tonic-gate			} else if ((new_cpu == NULL) ||
*0Sstevel@tonic-gate			    (cp->cpu_intr_weight < new_cpu->cpu_intr_weight)) {
*0Sstevel@tonic-gate				/* Choose if lighter weight */
*0Sstevel@tonic-gate				new_cpu = cp;
*0Sstevel@tonic-gate			}
*0Sstevel@tonic-gate		} while ((cp = cp->cpu_next_onln) != start_cpu);
*0Sstevel@tonic-gate		ASSERT(new_cpu);
*0Sstevel@tonic-gate		cpuid = new_cpu->cpu_id;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate		INTR_DEBUG((CE_CONT, "intr_dist: cpu %2d weight %3d: "
*0Sstevel@tonic-gate		    "targeted\n", cpuid, new_cpu->cpu_intr_weight));
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate		/* update static pointer for next round-robin */
*0Sstevel@tonic-gate		curr_cpu = new_cpu;
*0Sstevel@tonic-gate		kpreempt_enable();
*0Sstevel@tonic-gate		break;
*0Sstevel@tonic-gate	}
*0Sstevel@tonic-gate	mutex_exit(&intr_dist_cpu_lock);
*0Sstevel@tonic-gate	return (cpuid);
*0Sstevel@tonic-gate}
*0Sstevel@tonic-gate
/*
 * Add or remove the weight of a device from a CPU's interrupt weight.
 *
 * We expect nexus drivers to call intr_dist_cpuid_add/rem_device_weight for
 * their children to improve the overall quality of interrupt initialization.
 *
 * If a nexus shares the CPU returned by a single intr_dist_cpuid() call
 * among multiple devices (sharing ino) then the nexus should call
 * intr_dist_cpuid_add/rem_device_weight for each device separately. Devices
 * that share must specify the same cpuid.
 *
 * If a nexus driver is unable to determine the cpu at remove_intr time
 * for some of its interrupts, then it should not call add_device_weight -
 * intr_dist_cpuid will still provide round-robin.
 *
 * An established device weight (from dev_info node) takes precedence over
 * the weight passed in.  If a device weight is not already established
 * then the passed in nexus weight is established.
 */
*0Sstevel@tonic-gatevoid
*0Sstevel@tonic-gateintr_dist_cpuid_add_device_weight(uint32_t cpuid,
*0Sstevel@tonic-gate    dev_info_t *dip, int32_t nweight)
*0Sstevel@tonic-gate{
*0Sstevel@tonic-gate	int32_t		eweight;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	/*
*0Sstevel@tonic-gate	 * For non-weighted policy everything has weight of zero (and we get
*0Sstevel@tonic-gate	 * round-robin distribution from intr_dist_cpuid).
*0Sstevel@tonic-gate	 * NB: intr_policy is limited to this file. A weighted nexus driver is
*0Sstevel@tonic-gate	 * calls this rouitne even if intr_policy has been patched to
*0Sstevel@tonic-gate	 * INTR_FLAG_DIST.
*0Sstevel@tonic-gate	 */
*0Sstevel@tonic-gate	ASSERT(dip);
*0Sstevel@tonic-gate	if (intr_policy != INTR_WEIGHTED_DIST)
*0Sstevel@tonic-gate		return;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	eweight = i_ddi_get_intr_weight(dip);
*0Sstevel@tonic-gate	INTR_DEBUG((CE_CONT, "intr_dist: cpu %2d weight %3d: +%2d/%2d for "
*0Sstevel@tonic-gate	    "%s#%d/%s#%d\n", cpuid, cpu[cpuid]->cpu_intr_weight,
*0Sstevel@tonic-gate	    nweight, eweight, ddi_driver_name(ddi_get_parent(dip)),
*0Sstevel@tonic-gate	    ddi_get_instance(ddi_get_parent(dip)),
*0Sstevel@tonic-gate	    ddi_driver_name(dip), ddi_get_instance(dip)));
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	/* if no establish weight, establish nexus weight */
*0Sstevel@tonic-gate	if (eweight < 0) {
*0Sstevel@tonic-gate		if (nweight > 0)
*0Sstevel@tonic-gate			(void) i_ddi_set_intr_weight(dip, nweight);
*0Sstevel@tonic-gate		else
*0Sstevel@tonic-gate			nweight = 0;
*0Sstevel@tonic-gate	} else
*0Sstevel@tonic-gate		nweight = eweight;	/* use established weight */
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	/* Establish exclusion for cpu_intr_weight manipulation */
*0Sstevel@tonic-gate	mutex_enter(&intr_dist_cpu_lock);
*0Sstevel@tonic-gate	cpu[cpuid]->cpu_intr_weight += nweight;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	/* update intr_dist_weight_max */
*0Sstevel@tonic-gate	if (nweight > intr_dist_weight_max)
*0Sstevel@tonic-gate		intr_dist_weight_max = nweight;
*0Sstevel@tonic-gate	mutex_exit(&intr_dist_cpu_lock);
*0Sstevel@tonic-gate}
*0Sstevel@tonic-gate
*0Sstevel@tonic-gatevoid
*0Sstevel@tonic-gateintr_dist_cpuid_rem_device_weight(uint32_t cpuid, dev_info_t *dip)
*0Sstevel@tonic-gate{
*0Sstevel@tonic-gate	struct cpu	*cp;
*0Sstevel@tonic-gate	int32_t		weight;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	ASSERT(dip);
*0Sstevel@tonic-gate	if (intr_policy != INTR_WEIGHTED_DIST)
*0Sstevel@tonic-gate		return;
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	/* remove weight of device from cpu */
*0Sstevel@tonic-gate	weight = i_ddi_get_intr_weight(dip);
*0Sstevel@tonic-gate	if (weight < 0)
*0Sstevel@tonic-gate		weight = 0;
*0Sstevel@tonic-gate	INTR_DEBUG((CE_CONT, "intr_dist: cpu %2d weight %3d: -%2d    for "
*0Sstevel@tonic-gate	    "%s#%d/%s#%d\n", cpuid, cpu[cpuid]->cpu_intr_weight, weight,
*0Sstevel@tonic-gate	    ddi_driver_name(ddi_get_parent(dip)),
*0Sstevel@tonic-gate	    ddi_get_instance(ddi_get_parent(dip)),
*0Sstevel@tonic-gate	    ddi_driver_name(dip), ddi_get_instance(dip)));
*0Sstevel@tonic-gate
*0Sstevel@tonic-gate	/* Establish exclusion for cpu_intr_weight manipulation */
*0Sstevel@tonic-gate	mutex_enter(&intr_dist_cpu_lock);
*0Sstevel@tonic-gate	cp = cpu[cpuid];
*0Sstevel@tonic-gate	cp->cpu_intr_weight -= weight;
*0Sstevel@tonic-gate	if (cp->cpu_intr_weight < 0)
*0Sstevel@tonic-gate		cp->cpu_intr_weight = 0;	/* sanity */
*0Sstevel@tonic-gate	mutex_exit(&intr_dist_cpu_lock);
*0Sstevel@tonic-gate}