xref: /onnv-gate/usr/src/uts/sun4/os/machdep.c (revision 2712)
10Sstevel@tonic-gate /*
20Sstevel@tonic-gate  * CDDL HEADER START
30Sstevel@tonic-gate  *
40Sstevel@tonic-gate  * The contents of this file are subject to the terms of the
52005Selowe  * Common Development and Distribution License (the "License").
62005Selowe  * You may not use this file except in compliance with the License.
70Sstevel@tonic-gate  *
80Sstevel@tonic-gate  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
90Sstevel@tonic-gate  * or http://www.opensolaris.org/os/licensing.
100Sstevel@tonic-gate  * See the License for the specific language governing permissions
110Sstevel@tonic-gate  * and limitations under the License.
120Sstevel@tonic-gate  *
130Sstevel@tonic-gate  * When distributing Covered Code, include this CDDL HEADER in each
140Sstevel@tonic-gate  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
150Sstevel@tonic-gate  * If applicable, add the following below this CDDL HEADER, with the
160Sstevel@tonic-gate  * fields enclosed by brackets "[]" replaced with your own identifying
170Sstevel@tonic-gate  * information: Portions Copyright [yyyy] [name of copyright owner]
180Sstevel@tonic-gate  *
190Sstevel@tonic-gate  * CDDL HEADER END
200Sstevel@tonic-gate  */
210Sstevel@tonic-gate /*
222005Selowe  * Copyright 2006 Sun Microsystems, Inc.  All rights reserved.
230Sstevel@tonic-gate  * Use is subject to license terms.
240Sstevel@tonic-gate  */
250Sstevel@tonic-gate 
260Sstevel@tonic-gate #pragma ident	"%Z%%M%	%I%	%E% SMI"
270Sstevel@tonic-gate 
280Sstevel@tonic-gate #include <sys/types.h>
290Sstevel@tonic-gate #include <sys/kstat.h>
300Sstevel@tonic-gate #include <sys/param.h>
310Sstevel@tonic-gate #include <sys/stack.h>
320Sstevel@tonic-gate #include <sys/regset.h>
330Sstevel@tonic-gate #include <sys/thread.h>
340Sstevel@tonic-gate #include <sys/proc.h>
350Sstevel@tonic-gate #include <sys/procfs_isa.h>
360Sstevel@tonic-gate #include <sys/kmem.h>
370Sstevel@tonic-gate #include <sys/cpuvar.h>
380Sstevel@tonic-gate #include <sys/systm.h>
390Sstevel@tonic-gate #include <sys/machpcb.h>
400Sstevel@tonic-gate #include <sys/machasi.h>
410Sstevel@tonic-gate #include <sys/vis.h>
420Sstevel@tonic-gate #include <sys/fpu/fpusystm.h>
430Sstevel@tonic-gate #include <sys/cpu_module.h>
440Sstevel@tonic-gate #include <sys/privregs.h>
450Sstevel@tonic-gate #include <sys/archsystm.h>
460Sstevel@tonic-gate #include <sys/atomic.h>
470Sstevel@tonic-gate #include <sys/cmn_err.h>
480Sstevel@tonic-gate #include <sys/time.h>
490Sstevel@tonic-gate #include <sys/clock.h>
500Sstevel@tonic-gate #include <sys/chip.h>
510Sstevel@tonic-gate #include <sys/cmp.h>
520Sstevel@tonic-gate #include <sys/platform_module.h>
530Sstevel@tonic-gate #include <sys/bl.h>
540Sstevel@tonic-gate #include <sys/nvpair.h>
550Sstevel@tonic-gate #include <sys/kdi_impl.h>
560Sstevel@tonic-gate #include <sys/machsystm.h>
570Sstevel@tonic-gate #include <sys/sysmacros.h>
580Sstevel@tonic-gate #include <sys/promif.h>
590Sstevel@tonic-gate #include <sys/pool_pset.h>
602005Selowe #include <vm/seg_kmem.h>
610Sstevel@tonic-gate 
620Sstevel@tonic-gate int maxphys = MMU_PAGESIZE * 16;	/* 128k */
630Sstevel@tonic-gate int klustsize = MMU_PAGESIZE * 16;	/* 128k */
640Sstevel@tonic-gate 
650Sstevel@tonic-gate /*
660Sstevel@tonic-gate  * Initialize kernel thread's stack.
670Sstevel@tonic-gate  */
680Sstevel@tonic-gate caddr_t
690Sstevel@tonic-gate thread_stk_init(caddr_t stk)
700Sstevel@tonic-gate {
710Sstevel@tonic-gate 	kfpu_t *fp;
720Sstevel@tonic-gate 	ulong_t align;
730Sstevel@tonic-gate 
740Sstevel@tonic-gate 	/* allocate extra space for floating point state */
750Sstevel@tonic-gate 	stk -= SA(sizeof (kfpu_t) + GSR_SIZE);
760Sstevel@tonic-gate 	align = (uintptr_t)stk & 0x3f;
770Sstevel@tonic-gate 	stk -= align;		/* force v9_fpu to be 16 byte aligned */
780Sstevel@tonic-gate 	fp = (kfpu_t *)stk;
790Sstevel@tonic-gate 	fp->fpu_fprs = 0;
800Sstevel@tonic-gate 
810Sstevel@tonic-gate 	stk -= SA(MINFRAME);
820Sstevel@tonic-gate 	return (stk);
830Sstevel@tonic-gate }
840Sstevel@tonic-gate 
852005Selowe #define	WIN32_SIZE	(MAXWIN * sizeof (struct rwindow32))
862005Selowe #define	WIN64_SIZE	(MAXWIN * sizeof (struct rwindow64))
872005Selowe 
882005Selowe kmem_cache_t	*wbuf32_cache;
892005Selowe kmem_cache_t	*wbuf64_cache;
902005Selowe 
912005Selowe void
922005Selowe lwp_stk_cache_init(void)
932005Selowe {
942224Selowe 	/*
952224Selowe 	 * Window buffers are allocated from the static arena
962224Selowe 	 * because they are accessed at TL>0. We also must use
972224Selowe 	 * KMC_NOHASH to prevent them from straddling page
982224Selowe 	 * boundaries as they are accessed by physical address.
992224Selowe 	 */
1002005Selowe 	wbuf32_cache = kmem_cache_create("wbuf32_cache", WIN32_SIZE,
1012224Selowe 	    0, NULL, NULL, NULL, NULL, static_arena, KMC_NOHASH);
1022005Selowe 	wbuf64_cache = kmem_cache_create("wbuf64_cache", WIN64_SIZE,
1032224Selowe 	    0, NULL, NULL, NULL, NULL, static_arena, KMC_NOHASH);
1042005Selowe }
1052005Selowe 
1060Sstevel@tonic-gate /*
1070Sstevel@tonic-gate  * Initialize lwp's kernel stack.
1080Sstevel@tonic-gate  * Note that now that the floating point register save area (kfpu_t)
1090Sstevel@tonic-gate  * has been broken out from machpcb and aligned on a 64 byte boundary so that
1100Sstevel@tonic-gate  * we can do block load/stores to/from it, there are a couple of potential
1110Sstevel@tonic-gate  * optimizations to save stack space. 1. The floating point register save
1120Sstevel@tonic-gate  * area could be aligned on a 16 byte boundary, and the floating point code
1130Sstevel@tonic-gate  * changed to (a) check the alignment and (b) use different save/restore
1140Sstevel@tonic-gate  * macros depending upon the alignment. 2. The lwp_stk_init code below
1150Sstevel@tonic-gate  * could be changed to calculate if less space would be wasted if machpcb
1160Sstevel@tonic-gate  * was first instead of second. However there is a REGOFF macro used in
1170Sstevel@tonic-gate  * locore, syscall_trap, machdep and mlsetup that assumes that the saved
1180Sstevel@tonic-gate  * register area is a fixed distance from the %sp, and would have to be
1190Sstevel@tonic-gate  * changed to a pointer or something...JJ said later.
1200Sstevel@tonic-gate  */
1210Sstevel@tonic-gate caddr_t
1220Sstevel@tonic-gate lwp_stk_init(klwp_t *lwp, caddr_t stk)
1230Sstevel@tonic-gate {
1240Sstevel@tonic-gate 	struct machpcb *mpcb;
1250Sstevel@tonic-gate 	kfpu_t *fp;
1260Sstevel@tonic-gate 	uintptr_t aln;
1270Sstevel@tonic-gate 
1280Sstevel@tonic-gate 	stk -= SA(sizeof (kfpu_t) + GSR_SIZE);
1290Sstevel@tonic-gate 	aln = (uintptr_t)stk & 0x3F;
1300Sstevel@tonic-gate 	stk -= aln;
1310Sstevel@tonic-gate 	fp = (kfpu_t *)stk;
1320Sstevel@tonic-gate 	stk -= SA(sizeof (struct machpcb));
1330Sstevel@tonic-gate 	mpcb = (struct machpcb *)stk;
1340Sstevel@tonic-gate 	bzero(mpcb, sizeof (struct machpcb));
1350Sstevel@tonic-gate 	bzero(fp, sizeof (kfpu_t) + GSR_SIZE);
1360Sstevel@tonic-gate 	lwp->lwp_regs = (void *)&mpcb->mpcb_regs;
1370Sstevel@tonic-gate 	lwp->lwp_fpu = (void *)fp;
1380Sstevel@tonic-gate 	mpcb->mpcb_fpu = fp;
1390Sstevel@tonic-gate 	mpcb->mpcb_fpu->fpu_q = mpcb->mpcb_fpu_q;
1400Sstevel@tonic-gate 	mpcb->mpcb_thread = lwp->lwp_thread;
1410Sstevel@tonic-gate 	mpcb->mpcb_wbcnt = 0;
1420Sstevel@tonic-gate 	if (lwp->lwp_procp->p_model == DATAMODEL_ILP32) {
1430Sstevel@tonic-gate 		mpcb->mpcb_wstate = WSTATE_USER32;
1442005Selowe 		mpcb->mpcb_wbuf = kmem_cache_alloc(wbuf32_cache, KM_SLEEP);
1450Sstevel@tonic-gate 	} else {
1460Sstevel@tonic-gate 		mpcb->mpcb_wstate = WSTATE_USER64;
1472005Selowe 		mpcb->mpcb_wbuf = kmem_cache_alloc(wbuf64_cache, KM_SLEEP);
1480Sstevel@tonic-gate 	}
1490Sstevel@tonic-gate 	ASSERT(((uintptr_t)mpcb->mpcb_wbuf & 7) == 0);
1500Sstevel@tonic-gate 	mpcb->mpcb_wbuf_pa = va_to_pa(mpcb->mpcb_wbuf);
1510Sstevel@tonic-gate 	mpcb->mpcb_pa = va_to_pa(mpcb);
1520Sstevel@tonic-gate 	return (stk);
1530Sstevel@tonic-gate }
1540Sstevel@tonic-gate 
1550Sstevel@tonic-gate void
1560Sstevel@tonic-gate lwp_stk_fini(klwp_t *lwp)
1570Sstevel@tonic-gate {
1580Sstevel@tonic-gate 	struct machpcb *mpcb = lwptompcb(lwp);
1590Sstevel@tonic-gate 
1600Sstevel@tonic-gate 	/*
1610Sstevel@tonic-gate 	 * there might be windows still in the wbuf due to unmapped
1620Sstevel@tonic-gate 	 * stack, misaligned stack pointer, etc.  We just free it.
1630Sstevel@tonic-gate 	 */
1640Sstevel@tonic-gate 	mpcb->mpcb_wbcnt = 0;
1650Sstevel@tonic-gate 	if (mpcb->mpcb_wstate == WSTATE_USER32)
1662005Selowe 		kmem_cache_free(wbuf32_cache, mpcb->mpcb_wbuf);
1670Sstevel@tonic-gate 	else
1682005Selowe 		kmem_cache_free(wbuf64_cache, mpcb->mpcb_wbuf);
1690Sstevel@tonic-gate 	mpcb->mpcb_wbuf = NULL;
1700Sstevel@tonic-gate 	mpcb->mpcb_wbuf_pa = -1;
1710Sstevel@tonic-gate }
1720Sstevel@tonic-gate 
1730Sstevel@tonic-gate 
1740Sstevel@tonic-gate /*
1750Sstevel@tonic-gate  * Copy regs from parent to child.
1760Sstevel@tonic-gate  */
1770Sstevel@tonic-gate void
1780Sstevel@tonic-gate lwp_forkregs(klwp_t *lwp, klwp_t *clwp)
1790Sstevel@tonic-gate {
1800Sstevel@tonic-gate 	kthread_t *t, *pt = lwptot(lwp);
1810Sstevel@tonic-gate 	struct machpcb *mpcb = lwptompcb(clwp);
1820Sstevel@tonic-gate 	struct machpcb *pmpcb = lwptompcb(lwp);
1830Sstevel@tonic-gate 	kfpu_t *fp, *pfp = lwptofpu(lwp);
1840Sstevel@tonic-gate 	caddr_t wbuf;
1850Sstevel@tonic-gate 	uint_t wstate;
1860Sstevel@tonic-gate 
1870Sstevel@tonic-gate 	t = mpcb->mpcb_thread;
1880Sstevel@tonic-gate 	/*
1890Sstevel@tonic-gate 	 * remember child's fp and wbuf since they will get erased during
1900Sstevel@tonic-gate 	 * the bcopy.
1910Sstevel@tonic-gate 	 */
1920Sstevel@tonic-gate 	fp = mpcb->mpcb_fpu;
1930Sstevel@tonic-gate 	wbuf = mpcb->mpcb_wbuf;
1940Sstevel@tonic-gate 	wstate = mpcb->mpcb_wstate;
1950Sstevel@tonic-gate 	/*
1960Sstevel@tonic-gate 	 * Don't copy mpcb_frame since we hand-crafted it
1970Sstevel@tonic-gate 	 * in thread_load().
1980Sstevel@tonic-gate 	 */
1990Sstevel@tonic-gate 	bcopy(lwp->lwp_regs, clwp->lwp_regs, sizeof (struct machpcb) - REGOFF);
2000Sstevel@tonic-gate 	mpcb->mpcb_thread = t;
2010Sstevel@tonic-gate 	mpcb->mpcb_fpu = fp;
2020Sstevel@tonic-gate 	fp->fpu_q = mpcb->mpcb_fpu_q;
2030Sstevel@tonic-gate 
2040Sstevel@tonic-gate 	/*
2050Sstevel@tonic-gate 	 * It is theoretically possibly for the lwp's wstate to
2060Sstevel@tonic-gate 	 * be different from its value assigned in lwp_stk_init,
2070Sstevel@tonic-gate 	 * since lwp_stk_init assumed the data model of the process.
2080Sstevel@tonic-gate 	 * Here, we took on the data model of the cloned lwp.
2090Sstevel@tonic-gate 	 */
2100Sstevel@tonic-gate 	if (mpcb->mpcb_wstate != wstate) {
2110Sstevel@tonic-gate 		if (wstate == WSTATE_USER32) {
2122005Selowe 			kmem_cache_free(wbuf32_cache, wbuf);
2132005Selowe 			wbuf = kmem_cache_alloc(wbuf64_cache, KM_SLEEP);
2140Sstevel@tonic-gate 			wstate = WSTATE_USER64;
2150Sstevel@tonic-gate 		} else {
2162005Selowe 			kmem_cache_free(wbuf64_cache, wbuf);
2172005Selowe 			wbuf = kmem_cache_alloc(wbuf32_cache, KM_SLEEP);
2180Sstevel@tonic-gate 			wstate = WSTATE_USER32;
2190Sstevel@tonic-gate 		}
2200Sstevel@tonic-gate 	}
2210Sstevel@tonic-gate 
2220Sstevel@tonic-gate 	mpcb->mpcb_pa = va_to_pa(mpcb);
2230Sstevel@tonic-gate 	mpcb->mpcb_wbuf = wbuf;
2240Sstevel@tonic-gate 	mpcb->mpcb_wbuf_pa = va_to_pa(wbuf);
2250Sstevel@tonic-gate 
2260Sstevel@tonic-gate 	ASSERT(mpcb->mpcb_wstate == wstate);
2270Sstevel@tonic-gate 
2280Sstevel@tonic-gate 	if (mpcb->mpcb_wbcnt != 0) {
2290Sstevel@tonic-gate 		bcopy(pmpcb->mpcb_wbuf, mpcb->mpcb_wbuf,
2300Sstevel@tonic-gate 		    mpcb->mpcb_wbcnt * ((mpcb->mpcb_wstate == WSTATE_USER32) ?
2310Sstevel@tonic-gate 		    sizeof (struct rwindow32) : sizeof (struct rwindow64)));
2320Sstevel@tonic-gate 	}
2330Sstevel@tonic-gate 
2340Sstevel@tonic-gate 	if (pt == curthread)
2350Sstevel@tonic-gate 		pfp->fpu_fprs = _fp_read_fprs();
2360Sstevel@tonic-gate 	if ((pfp->fpu_en) || (pfp->fpu_fprs & FPRS_FEF)) {
2370Sstevel@tonic-gate 		if (pt == curthread && fpu_exists) {
2380Sstevel@tonic-gate 			save_gsr(clwp->lwp_fpu);
2390Sstevel@tonic-gate 		} else {
2400Sstevel@tonic-gate 			uint64_t gsr;
2410Sstevel@tonic-gate 			gsr = get_gsr(lwp->lwp_fpu);
2420Sstevel@tonic-gate 			set_gsr(gsr, clwp->lwp_fpu);
2430Sstevel@tonic-gate 		}
2440Sstevel@tonic-gate 		fp_fork(lwp, clwp);
2450Sstevel@tonic-gate 	}
2460Sstevel@tonic-gate }
2470Sstevel@tonic-gate 
2480Sstevel@tonic-gate /*
2490Sstevel@tonic-gate  * Free lwp fpu regs.
2500Sstevel@tonic-gate  */
2510Sstevel@tonic-gate void
2520Sstevel@tonic-gate lwp_freeregs(klwp_t *lwp, int isexec)
2530Sstevel@tonic-gate {
2540Sstevel@tonic-gate 	kfpu_t *fp = lwptofpu(lwp);
2550Sstevel@tonic-gate 
2560Sstevel@tonic-gate 	if (lwptot(lwp) == curthread)
2570Sstevel@tonic-gate 		fp->fpu_fprs = _fp_read_fprs();
2580Sstevel@tonic-gate 	if ((fp->fpu_en) || (fp->fpu_fprs & FPRS_FEF))
2590Sstevel@tonic-gate 		fp_free(fp, isexec);
2600Sstevel@tonic-gate }
2610Sstevel@tonic-gate 
2620Sstevel@tonic-gate /*
263*2712Snn35248  * This function is currently unused on sparc.
264*2712Snn35248  */
265*2712Snn35248 /*ARGSUSED*/
266*2712Snn35248 void
267*2712Snn35248 lwp_attach_brand_hdlrs(klwp_t *lwp)
268*2712Snn35248 {}
269*2712Snn35248 
270*2712Snn35248 /*
2710Sstevel@tonic-gate  * fill in the extra register state area specified with the
2720Sstevel@tonic-gate  * specified lwp's platform-dependent non-floating-point extra
2730Sstevel@tonic-gate  * register state information
2740Sstevel@tonic-gate  */
2750Sstevel@tonic-gate /* ARGSUSED */
2760Sstevel@tonic-gate void
2770Sstevel@tonic-gate xregs_getgfiller(klwp_id_t lwp, caddr_t xrp)
2780Sstevel@tonic-gate {
2790Sstevel@tonic-gate 	/* for sun4u nothing to do here, added for symmetry */
2800Sstevel@tonic-gate }
2810Sstevel@tonic-gate 
2820Sstevel@tonic-gate /*
2830Sstevel@tonic-gate  * fill in the extra register state area specified with the specified lwp's
2840Sstevel@tonic-gate  * platform-dependent floating-point extra register state information.
2850Sstevel@tonic-gate  * NOTE:  'lwp' might not correspond to 'curthread' since this is
2860Sstevel@tonic-gate  * called from code in /proc to get the registers of another lwp.
2870Sstevel@tonic-gate  */
2880Sstevel@tonic-gate void
2890Sstevel@tonic-gate xregs_getfpfiller(klwp_id_t lwp, caddr_t xrp)
2900Sstevel@tonic-gate {
2910Sstevel@tonic-gate 	prxregset_t *xregs = (prxregset_t *)xrp;
2920Sstevel@tonic-gate 	kfpu_t *fp = lwptofpu(lwp);
2930Sstevel@tonic-gate 	uint32_t fprs = (FPRS_FEF|FPRS_DU|FPRS_DL);
2940Sstevel@tonic-gate 	uint64_t gsr;
2950Sstevel@tonic-gate 
2960Sstevel@tonic-gate 	/*
2970Sstevel@tonic-gate 	 * fp_fksave() does not flush the GSR register into
2980Sstevel@tonic-gate 	 * the lwp area, so do it now
2990Sstevel@tonic-gate 	 */
3000Sstevel@tonic-gate 	kpreempt_disable();
3010Sstevel@tonic-gate 	if (ttolwp(curthread) == lwp && fpu_exists) {
3020Sstevel@tonic-gate 		fp->fpu_fprs = _fp_read_fprs();
3030Sstevel@tonic-gate 		if ((fp->fpu_fprs & FPRS_FEF) != FPRS_FEF) {
3040Sstevel@tonic-gate 			_fp_write_fprs(fprs);
3050Sstevel@tonic-gate 			fp->fpu_fprs = (V9_FPU_FPRS_TYPE)fprs;
3060Sstevel@tonic-gate 		}
3070Sstevel@tonic-gate 		save_gsr(fp);
3080Sstevel@tonic-gate 	}
3090Sstevel@tonic-gate 	gsr = get_gsr(fp);
3100Sstevel@tonic-gate 	kpreempt_enable();
3110Sstevel@tonic-gate 	PRXREG_GSR(xregs) = gsr;
3120Sstevel@tonic-gate }
3130Sstevel@tonic-gate 
3140Sstevel@tonic-gate /*
3150Sstevel@tonic-gate  * set the specified lwp's platform-dependent non-floating-point
3160Sstevel@tonic-gate  * extra register state based on the specified input
3170Sstevel@tonic-gate  */
3180Sstevel@tonic-gate /* ARGSUSED */
3190Sstevel@tonic-gate void
3200Sstevel@tonic-gate xregs_setgfiller(klwp_id_t lwp, caddr_t xrp)
3210Sstevel@tonic-gate {
3220Sstevel@tonic-gate 	/* for sun4u nothing to do here, added for symmetry */
3230Sstevel@tonic-gate }
3240Sstevel@tonic-gate 
3250Sstevel@tonic-gate /*
3260Sstevel@tonic-gate  * set the specified lwp's platform-dependent floating-point
3270Sstevel@tonic-gate  * extra register state based on the specified input
3280Sstevel@tonic-gate  */
3290Sstevel@tonic-gate void
3300Sstevel@tonic-gate xregs_setfpfiller(klwp_id_t lwp, caddr_t xrp)
3310Sstevel@tonic-gate {
3320Sstevel@tonic-gate 	prxregset_t *xregs = (prxregset_t *)xrp;
3330Sstevel@tonic-gate 	kfpu_t *fp = lwptofpu(lwp);
3340Sstevel@tonic-gate 	uint32_t fprs = (FPRS_FEF|FPRS_DU|FPRS_DL);
3350Sstevel@tonic-gate 	uint64_t gsr = PRXREG_GSR(xregs);
3360Sstevel@tonic-gate 
3370Sstevel@tonic-gate 	kpreempt_disable();
3380Sstevel@tonic-gate 	set_gsr(gsr, lwptofpu(lwp));
3390Sstevel@tonic-gate 
3400Sstevel@tonic-gate 	if ((lwp == ttolwp(curthread)) && fpu_exists) {
3410Sstevel@tonic-gate 		fp->fpu_fprs = _fp_read_fprs();
3420Sstevel@tonic-gate 		if ((fp->fpu_fprs & FPRS_FEF) != FPRS_FEF) {
3430Sstevel@tonic-gate 			_fp_write_fprs(fprs);
3440Sstevel@tonic-gate 			fp->fpu_fprs = (V9_FPU_FPRS_TYPE)fprs;
3450Sstevel@tonic-gate 		}
3460Sstevel@tonic-gate 		restore_gsr(lwptofpu(lwp));
3470Sstevel@tonic-gate 	}
3480Sstevel@tonic-gate 	kpreempt_enable();
3490Sstevel@tonic-gate }
3500Sstevel@tonic-gate 
3510Sstevel@tonic-gate /*
3520Sstevel@tonic-gate  * fill in the sun4u asrs, ie, the lwp's platform-dependent
3530Sstevel@tonic-gate  * non-floating-point extra register state information
3540Sstevel@tonic-gate  */
3550Sstevel@tonic-gate /* ARGSUSED */
3560Sstevel@tonic-gate void
3570Sstevel@tonic-gate getasrs(klwp_t *lwp, asrset_t asr)
3580Sstevel@tonic-gate {
3590Sstevel@tonic-gate 	/* for sun4u nothing to do here, added for symmetry */
3600Sstevel@tonic-gate }
3610Sstevel@tonic-gate 
3620Sstevel@tonic-gate /*
3630Sstevel@tonic-gate  * fill in the sun4u asrs, ie, the lwp's platform-dependent
3640Sstevel@tonic-gate  * floating-point extra register state information
3650Sstevel@tonic-gate  */
3660Sstevel@tonic-gate void
3670Sstevel@tonic-gate getfpasrs(klwp_t *lwp, asrset_t asr)
3680Sstevel@tonic-gate {
3690Sstevel@tonic-gate 	kfpu_t *fp = lwptofpu(lwp);
3700Sstevel@tonic-gate 	uint32_t fprs = (FPRS_FEF|FPRS_DU|FPRS_DL);
3710Sstevel@tonic-gate 
3720Sstevel@tonic-gate 	kpreempt_disable();
3730Sstevel@tonic-gate 	if (ttolwp(curthread) == lwp)
3740Sstevel@tonic-gate 		fp->fpu_fprs = _fp_read_fprs();
3750Sstevel@tonic-gate 	if ((fp->fpu_en) || (fp->fpu_fprs & FPRS_FEF)) {
3760Sstevel@tonic-gate 		if (fpu_exists && ttolwp(curthread) == lwp) {
3770Sstevel@tonic-gate 			if ((fp->fpu_fprs & FPRS_FEF) != FPRS_FEF) {
3780Sstevel@tonic-gate 				_fp_write_fprs(fprs);
3790Sstevel@tonic-gate 				fp->fpu_fprs = (V9_FPU_FPRS_TYPE)fprs;
3800Sstevel@tonic-gate 			}
3810Sstevel@tonic-gate 			save_gsr(fp);
3820Sstevel@tonic-gate 		}
3830Sstevel@tonic-gate 		asr[ASR_GSR] = (int64_t)get_gsr(fp);
3840Sstevel@tonic-gate 	}
3850Sstevel@tonic-gate 	kpreempt_enable();
3860Sstevel@tonic-gate }
3870Sstevel@tonic-gate 
3880Sstevel@tonic-gate /*
3890Sstevel@tonic-gate  * set the sun4u asrs, ie, the lwp's platform-dependent
3900Sstevel@tonic-gate  * non-floating-point extra register state information
3910Sstevel@tonic-gate  */
3920Sstevel@tonic-gate /* ARGSUSED */
3930Sstevel@tonic-gate void
3940Sstevel@tonic-gate setasrs(klwp_t *lwp, asrset_t asr)
3950Sstevel@tonic-gate {
3960Sstevel@tonic-gate 	/* for sun4u nothing to do here, added for symmetry */
3970Sstevel@tonic-gate }
3980Sstevel@tonic-gate 
3990Sstevel@tonic-gate void
4000Sstevel@tonic-gate setfpasrs(klwp_t *lwp, asrset_t asr)
4010Sstevel@tonic-gate {
4020Sstevel@tonic-gate 	kfpu_t *fp = lwptofpu(lwp);
4030Sstevel@tonic-gate 	uint32_t fprs = (FPRS_FEF|FPRS_DU|FPRS_DL);
4040Sstevel@tonic-gate 
4050Sstevel@tonic-gate 	kpreempt_disable();
4060Sstevel@tonic-gate 	if (ttolwp(curthread) == lwp)
4070Sstevel@tonic-gate 		fp->fpu_fprs = _fp_read_fprs();
4080Sstevel@tonic-gate 	if ((fp->fpu_en) || (fp->fpu_fprs & FPRS_FEF)) {
4090Sstevel@tonic-gate 		set_gsr(asr[ASR_GSR], fp);
4100Sstevel@tonic-gate 		if (fpu_exists && ttolwp(curthread) == lwp) {
4110Sstevel@tonic-gate 			if ((fp->fpu_fprs & FPRS_FEF) != FPRS_FEF) {
4120Sstevel@tonic-gate 				_fp_write_fprs(fprs);
4130Sstevel@tonic-gate 				fp->fpu_fprs = (V9_FPU_FPRS_TYPE)fprs;
4140Sstevel@tonic-gate 			}
4150Sstevel@tonic-gate 			restore_gsr(fp);
4160Sstevel@tonic-gate 		}
4170Sstevel@tonic-gate 	}
4180Sstevel@tonic-gate 	kpreempt_enable();
4190Sstevel@tonic-gate }
4200Sstevel@tonic-gate 
4210Sstevel@tonic-gate /*
4220Sstevel@tonic-gate  * Create interrupt kstats for this CPU.
4230Sstevel@tonic-gate  */
4240Sstevel@tonic-gate void
4250Sstevel@tonic-gate cpu_create_intrstat(cpu_t *cp)
4260Sstevel@tonic-gate {
4270Sstevel@tonic-gate 	int		i;
4280Sstevel@tonic-gate 	kstat_t		*intr_ksp;
4290Sstevel@tonic-gate 	kstat_named_t	*knp;
4300Sstevel@tonic-gate 	char		name[KSTAT_STRLEN];
4310Sstevel@tonic-gate 	zoneid_t	zoneid;
4320Sstevel@tonic-gate 
4330Sstevel@tonic-gate 	ASSERT(MUTEX_HELD(&cpu_lock));
4340Sstevel@tonic-gate 
4350Sstevel@tonic-gate 	if (pool_pset_enabled())
4360Sstevel@tonic-gate 		zoneid = GLOBAL_ZONEID;
4370Sstevel@tonic-gate 	else
4380Sstevel@tonic-gate 		zoneid = ALL_ZONES;
4390Sstevel@tonic-gate 
4400Sstevel@tonic-gate 	intr_ksp = kstat_create_zone("cpu", cp->cpu_id, "intrstat", "misc",
4410Sstevel@tonic-gate 	    KSTAT_TYPE_NAMED, PIL_MAX * 2, NULL, zoneid);
4420Sstevel@tonic-gate 
4430Sstevel@tonic-gate 	/*
4440Sstevel@tonic-gate 	 * Initialize each PIL's named kstat
4450Sstevel@tonic-gate 	 */
4460Sstevel@tonic-gate 	if (intr_ksp != NULL) {
4470Sstevel@tonic-gate 		intr_ksp->ks_update = cpu_kstat_intrstat_update;
4480Sstevel@tonic-gate 		knp = (kstat_named_t *)intr_ksp->ks_data;
4490Sstevel@tonic-gate 		intr_ksp->ks_private = cp;
4500Sstevel@tonic-gate 		for (i = 0; i < PIL_MAX; i++) {
4510Sstevel@tonic-gate 			(void) snprintf(name, KSTAT_STRLEN, "level-%d-time",
4520Sstevel@tonic-gate 			    i + 1);
4530Sstevel@tonic-gate 			kstat_named_init(&knp[i * 2], name, KSTAT_DATA_UINT64);
4540Sstevel@tonic-gate 			(void) snprintf(name, KSTAT_STRLEN, "level-%d-count",
4550Sstevel@tonic-gate 			    i + 1);
4560Sstevel@tonic-gate 			kstat_named_init(&knp[(i * 2) + 1], name,
4570Sstevel@tonic-gate 			    KSTAT_DATA_UINT64);
4580Sstevel@tonic-gate 		}
4590Sstevel@tonic-gate 		kstat_install(intr_ksp);
4600Sstevel@tonic-gate 	}
4610Sstevel@tonic-gate }
4620Sstevel@tonic-gate 
4630Sstevel@tonic-gate /*
4640Sstevel@tonic-gate  * Delete interrupt kstats for this CPU.
4650Sstevel@tonic-gate  */
4660Sstevel@tonic-gate void
4670Sstevel@tonic-gate cpu_delete_intrstat(cpu_t *cp)
4680Sstevel@tonic-gate {
4690Sstevel@tonic-gate 	kstat_delete_byname_zone("cpu", cp->cpu_id, "intrstat", ALL_ZONES);
4700Sstevel@tonic-gate }
4710Sstevel@tonic-gate 
4720Sstevel@tonic-gate /*
4730Sstevel@tonic-gate  * Convert interrupt statistics from CPU ticks to nanoseconds and
4740Sstevel@tonic-gate  * update kstat.
4750Sstevel@tonic-gate  */
4760Sstevel@tonic-gate int
4770Sstevel@tonic-gate cpu_kstat_intrstat_update(kstat_t *ksp, int rw)
4780Sstevel@tonic-gate {
4790Sstevel@tonic-gate 	kstat_named_t	*knp = ksp->ks_data;
4800Sstevel@tonic-gate 	cpu_t		*cpup = (cpu_t *)ksp->ks_private;
4810Sstevel@tonic-gate 	int		i;
4820Sstevel@tonic-gate 
4830Sstevel@tonic-gate 	if (rw == KSTAT_WRITE)
4840Sstevel@tonic-gate 		return (EACCES);
4850Sstevel@tonic-gate 
4860Sstevel@tonic-gate 	/*
4870Sstevel@tonic-gate 	 * We use separate passes to copy and convert the statistics to
4880Sstevel@tonic-gate 	 * nanoseconds. This assures that the snapshot of the data is as
4890Sstevel@tonic-gate 	 * self-consistent as possible.
4900Sstevel@tonic-gate 	 */
4910Sstevel@tonic-gate 
4920Sstevel@tonic-gate 	for (i = 0; i < PIL_MAX; i++) {
4930Sstevel@tonic-gate 		knp[i * 2].value.ui64 = cpup->cpu_m.intrstat[i + 1][0];
4940Sstevel@tonic-gate 		knp[(i * 2) + 1].value.ui64 = cpup->cpu_stats.sys.intr[i];
4950Sstevel@tonic-gate 	}
4960Sstevel@tonic-gate 
4970Sstevel@tonic-gate 	for (i = 0; i < PIL_MAX; i++) {
4980Sstevel@tonic-gate 		knp[i * 2].value.ui64 =
4990Sstevel@tonic-gate 		    (uint64_t)tick2ns((hrtime_t)knp[i * 2].value.ui64,
5000Sstevel@tonic-gate 			cpup->cpu_id);
5010Sstevel@tonic-gate 	}
5020Sstevel@tonic-gate 
5030Sstevel@tonic-gate 	return (0);
5040Sstevel@tonic-gate }
5050Sstevel@tonic-gate 
5060Sstevel@tonic-gate /*
5070Sstevel@tonic-gate  * Called by common/os/cpu.c for psrinfo(1m) kstats
5080Sstevel@tonic-gate  */
5090Sstevel@tonic-gate char *
5100Sstevel@tonic-gate cpu_fru_fmri(cpu_t *cp)
5110Sstevel@tonic-gate {
5120Sstevel@tonic-gate 	return (cpunodes[cp->cpu_id].fru_fmri);
5130Sstevel@tonic-gate }
5140Sstevel@tonic-gate 
5150Sstevel@tonic-gate /*
5160Sstevel@tonic-gate  * An interrupt thread is ending a time slice, so compute the interval it
5170Sstevel@tonic-gate  * ran for and update the statistic for its PIL.
5180Sstevel@tonic-gate  */
5190Sstevel@tonic-gate void
5200Sstevel@tonic-gate cpu_intr_swtch_enter(kthread_id_t t)
5210Sstevel@tonic-gate {
5220Sstevel@tonic-gate 	uint64_t	interval;
5230Sstevel@tonic-gate 	uint64_t	start;
524590Sesolom 	cpu_t		*cpu;
5250Sstevel@tonic-gate 
5260Sstevel@tonic-gate 	ASSERT((t->t_flag & T_INTR_THREAD) != 0);
5270Sstevel@tonic-gate 	ASSERT(t->t_pil > 0 && t->t_pil <= LOCK_LEVEL);
5280Sstevel@tonic-gate 
5290Sstevel@tonic-gate 	/*
5300Sstevel@tonic-gate 	 * We could be here with a zero timestamp. This could happen if:
5310Sstevel@tonic-gate 	 * an interrupt thread which no longer has a pinned thread underneath
5320Sstevel@tonic-gate 	 * it (i.e. it blocked at some point in its past) has finished running
5330Sstevel@tonic-gate 	 * its handler. intr_thread() updated the interrupt statistic for its
5340Sstevel@tonic-gate 	 * PIL and zeroed its timestamp. Since there was no pinned thread to
5350Sstevel@tonic-gate 	 * return to, swtch() gets called and we end up here.
5360Sstevel@tonic-gate 	 *
5370Sstevel@tonic-gate 	 * It can also happen if an interrupt thread in intr_thread() calls
5380Sstevel@tonic-gate 	 * preempt. It will have already taken care of updating stats. In
5390Sstevel@tonic-gate 	 * this event, the interrupt thread will be runnable.
5400Sstevel@tonic-gate 	 */
5410Sstevel@tonic-gate 	if (t->t_intr_start) {
5420Sstevel@tonic-gate 		do {
5430Sstevel@tonic-gate 			start = t->t_intr_start;
5440Sstevel@tonic-gate 			interval = gettick_counter() - start;
5450Sstevel@tonic-gate 		} while (cas64(&t->t_intr_start, start, 0) != start);
546590Sesolom 		cpu = CPU;
547590Sesolom 		if (cpu->cpu_m.divisor > 1)
548590Sesolom 			interval *= cpu->cpu_m.divisor;
549590Sesolom 		cpu->cpu_m.intrstat[t->t_pil][0] += interval;
550590Sesolom 
551590Sesolom 		atomic_add_64((uint64_t *)&cpu->cpu_intracct[cpu->cpu_mstate],
552590Sesolom 		    interval);
5530Sstevel@tonic-gate 	} else
5540Sstevel@tonic-gate 		ASSERT(t->t_intr == NULL || t->t_state == TS_RUN);
5550Sstevel@tonic-gate }
5560Sstevel@tonic-gate 
5570Sstevel@tonic-gate 
5580Sstevel@tonic-gate /*
5590Sstevel@tonic-gate  * An interrupt thread is returning from swtch(). Place a starting timestamp
5600Sstevel@tonic-gate  * in its thread structure.
5610Sstevel@tonic-gate  */
5620Sstevel@tonic-gate void
5630Sstevel@tonic-gate cpu_intr_swtch_exit(kthread_id_t t)
5640Sstevel@tonic-gate {
5650Sstevel@tonic-gate 	uint64_t ts;
5660Sstevel@tonic-gate 
5670Sstevel@tonic-gate 	ASSERT((t->t_flag & T_INTR_THREAD) != 0);
5680Sstevel@tonic-gate 	ASSERT(t->t_pil > 0 && t->t_pil <= LOCK_LEVEL);
5690Sstevel@tonic-gate 
5700Sstevel@tonic-gate 	do {
5710Sstevel@tonic-gate 		ts = t->t_intr_start;
5720Sstevel@tonic-gate 	} while (cas64(&t->t_intr_start, ts, gettick_counter()) != ts);
5730Sstevel@tonic-gate }
5740Sstevel@tonic-gate 
5750Sstevel@tonic-gate 
5760Sstevel@tonic-gate int
5770Sstevel@tonic-gate blacklist(int cmd, const char *scheme, nvlist_t *fmri, const char *class)
5780Sstevel@tonic-gate {
5790Sstevel@tonic-gate 	if (&plat_blacklist)
5800Sstevel@tonic-gate 		return (plat_blacklist(cmd, scheme, fmri, class));
5810Sstevel@tonic-gate 
5820Sstevel@tonic-gate 	return (ENOTSUP);
5830Sstevel@tonic-gate }
5840Sstevel@tonic-gate 
5850Sstevel@tonic-gate int
5860Sstevel@tonic-gate kdi_pread(caddr_t buf, size_t nbytes, uint64_t addr, size_t *ncopiedp)
5870Sstevel@tonic-gate {
5880Sstevel@tonic-gate 	extern void kdi_flush_caches(void);
5890Sstevel@tonic-gate 	size_t nread = 0;
5900Sstevel@tonic-gate 	uint32_t word;
5910Sstevel@tonic-gate 	int slop, i;
5920Sstevel@tonic-gate 
5930Sstevel@tonic-gate 	kdi_flush_caches();
5940Sstevel@tonic-gate 	membar_enter();
5950Sstevel@tonic-gate 
5960Sstevel@tonic-gate 	/* We might not begin on a word boundary. */
5970Sstevel@tonic-gate 	if ((slop = addr & 3) != 0) {
5980Sstevel@tonic-gate 		word = ldphys(addr & ~3);
5990Sstevel@tonic-gate 		for (i = slop; i < 4 && nbytes > 0; i++, nbytes--, nread++)
6000Sstevel@tonic-gate 			*buf++ = ((uchar_t *)&word)[i];
6010Sstevel@tonic-gate 		addr = roundup(addr, 4);
6020Sstevel@tonic-gate 	}
6030Sstevel@tonic-gate 
6040Sstevel@tonic-gate 	while (nbytes > 0) {
6050Sstevel@tonic-gate 		word = ldphys(addr);
6060Sstevel@tonic-gate 		for (i = 0; i < 4 && nbytes > 0; i++, nbytes--, nread++, addr++)
6070Sstevel@tonic-gate 			*buf++ = ((uchar_t *)&word)[i];
6080Sstevel@tonic-gate 	}
6090Sstevel@tonic-gate 
6100Sstevel@tonic-gate 	kdi_flush_caches();
6110Sstevel@tonic-gate 
6120Sstevel@tonic-gate 	*ncopiedp = nread;
6130Sstevel@tonic-gate 	return (0);
6140Sstevel@tonic-gate }
6150Sstevel@tonic-gate 
6160Sstevel@tonic-gate int
6170Sstevel@tonic-gate kdi_pwrite(caddr_t buf, size_t nbytes, uint64_t addr, size_t *ncopiedp)
6180Sstevel@tonic-gate {
6190Sstevel@tonic-gate 	extern void kdi_flush_caches(void);
6200Sstevel@tonic-gate 	size_t nwritten = 0;
6210Sstevel@tonic-gate 	uint32_t word;
6220Sstevel@tonic-gate 	int slop, i;
6230Sstevel@tonic-gate 
6240Sstevel@tonic-gate 	kdi_flush_caches();
6250Sstevel@tonic-gate 
6260Sstevel@tonic-gate 	/* We might not begin on a word boundary. */
6270Sstevel@tonic-gate 	if ((slop = addr & 3) != 0) {
6280Sstevel@tonic-gate 		word = ldphys(addr & ~3);
6290Sstevel@tonic-gate 		for (i = slop; i < 4 && nbytes > 0; i++, nbytes--, nwritten++)
6300Sstevel@tonic-gate 			((uchar_t *)&word)[i] = *buf++;
6310Sstevel@tonic-gate 		stphys(addr & ~3, word);
6320Sstevel@tonic-gate 		addr = roundup(addr, 4);
6330Sstevel@tonic-gate 	}
6340Sstevel@tonic-gate 
6350Sstevel@tonic-gate 	while (nbytes > 3) {
6360Sstevel@tonic-gate 		for (word = 0, i = 0; i < 4; i++, nbytes--, nwritten++)
6370Sstevel@tonic-gate 			((uchar_t *)&word)[i] = *buf++;
6380Sstevel@tonic-gate 		stphys(addr, word);
6390Sstevel@tonic-gate 		addr += 4;
6400Sstevel@tonic-gate 	}
6410Sstevel@tonic-gate 
6420Sstevel@tonic-gate 	/* We might not end with a whole word. */
6430Sstevel@tonic-gate 	if (nbytes > 0) {
6440Sstevel@tonic-gate 		word = ldphys(addr);
6450Sstevel@tonic-gate 		for (i = 0; nbytes > 0; i++, nbytes--, nwritten++)
6460Sstevel@tonic-gate 			((uchar_t *)&word)[i] = *buf++;
6470Sstevel@tonic-gate 		stphys(addr, word);
6480Sstevel@tonic-gate 	}
6490Sstevel@tonic-gate 
6500Sstevel@tonic-gate 	membar_enter();
6510Sstevel@tonic-gate 	kdi_flush_caches();
6520Sstevel@tonic-gate 
6530Sstevel@tonic-gate 	*ncopiedp = nwritten;
6540Sstevel@tonic-gate 	return (0);
6550Sstevel@tonic-gate }
6560Sstevel@tonic-gate 
6570Sstevel@tonic-gate static void
6580Sstevel@tonic-gate kdi_kernpanic(struct regs *regs, uint_t tt)
6590Sstevel@tonic-gate {
6600Sstevel@tonic-gate 	sync_reg_buf = *regs;
6610Sstevel@tonic-gate 	sync_tt = tt;
6620Sstevel@tonic-gate 
6630Sstevel@tonic-gate 	sync_handler();
6640Sstevel@tonic-gate }
6650Sstevel@tonic-gate 
/*
 * Invoke `platfn' bracketed by prom_suspend_prepost() and
 * prom_resume_prepost().  A NULL `platfn' is ignored.
 */
static void
kdi_plat_call(void (*platfn)(void))
{
	if (platfn == NULL)
		return;

	prom_suspend_prepost();
	platfn();
	prom_resume_prepost();
}
6750Sstevel@tonic-gate 
6760Sstevel@tonic-gate void
6770Sstevel@tonic-gate mach_kdi_init(kdi_t *kdi)
6780Sstevel@tonic-gate {
6790Sstevel@tonic-gate 	kdi->kdi_plat_call = kdi_plat_call;
6800Sstevel@tonic-gate 	kdi->mkdi_cpu_index = kdi_cpu_index;
6810Sstevel@tonic-gate 	kdi->mkdi_trap_vatotte = kdi_trap_vatotte;
6820Sstevel@tonic-gate 	kdi->mkdi_kernpanic = kdi_kernpanic;
6830Sstevel@tonic-gate }
684590Sesolom 
685590Sesolom 
686590Sesolom /*
687590Sesolom  * get_cpu_mstate() is passed an array of timestamps, NCMSTATES
688590Sesolom  * long, and it fills in the array with the time spent on cpu in
689590Sesolom  * each of the mstates, where time is returned in nsec.
690590Sesolom  *
691590Sesolom  * No guarantee is made that the returned values in times[] will
692590Sesolom  * monotonically increase on sequential calls, although this will
693590Sesolom  * be true in the long run. Any such guarantee must be handled by
694590Sesolom  * the caller, if needed. This can happen if we fail to account
695590Sesolom  * for elapsed time due to a generation counter conflict, yet we
696590Sesolom  * did account for it on a prior call (see below).
697590Sesolom  *
698590Sesolom  * The complication is that the cpu in question may be updating
699590Sesolom  * its microstate at the same time that we are reading it.
700590Sesolom  * Because the microstate is only updated when the CPU's state
701590Sesolom  * changes, the values in cpu_intracct[] can be indefinitely out
702590Sesolom  * of date. To determine true current values, it is necessary to
703590Sesolom  * compare the current time with cpu_mstate_start, and add the
704590Sesolom  * difference to times[cpu_mstate].
705590Sesolom  *
706590Sesolom  * This can be a problem if those values are changing out from
707590Sesolom  * under us. Because the code path in new_cpu_mstate() is
708590Sesolom  * performance critical, we have not added a lock to it. Instead,
709590Sesolom  * we have added a generation counter. Before beginning
710590Sesolom  * modifications, the counter is set to 0. After modifications,
711590Sesolom  * it is set to the old value plus one.
712590Sesolom  *
713590Sesolom  * get_cpu_mstate() will not consider the values of cpu_mstate
714590Sesolom  * and cpu_mstate_start to be usable unless the value of
715590Sesolom  * cpu_mstate_gen is both non-zero and unchanged, both before and
716590Sesolom  * after reading the mstate information. Note that we must
717590Sesolom  * protect against out-of-order loads around accesses to the
718590Sesolom  * generation counter. Also, this is a best effort approach in
719590Sesolom  * that we do not retry should the counter be found to have
720590Sesolom  * changed.
721590Sesolom  *
722590Sesolom  * cpu_intracct[] is used to identify time spent in each CPU
723590Sesolom  * mstate while handling interrupts. Such time should be reported
724590Sesolom  * against system time, and so is subtracted out from its
725590Sesolom  * corresponding cpu_acct[] time and added to
726590Sesolom  * cpu_acct[CMS_SYSTEM]. Additionally, intracct time is stored in
727590Sesolom  * %ticks, but acct time may be stored as %sticks, thus requiring
728590Sesolom  * different conversions before they can be compared.
729590Sesolom  */
730590Sesolom 
731590Sesolom void
732590Sesolom get_cpu_mstate(cpu_t *cpu, hrtime_t *times)
733590Sesolom {
734590Sesolom 	int i;
735590Sesolom 	hrtime_t now, start;
736590Sesolom 	uint16_t gen;
737590Sesolom 	uint16_t state;
738590Sesolom 	hrtime_t intracct[NCMSTATES];
739590Sesolom 
740590Sesolom 	/*
741590Sesolom 	 * Load all volatile state under the protection of membar.
742590Sesolom 	 * cpu_acct[cpu_mstate] must be loaded to avoid double counting
743590Sesolom 	 * of (now - cpu_mstate_start) by a change in CPU mstate that
744590Sesolom 	 * arrives after we make our last check of cpu_mstate_gen.
745590Sesolom 	 */
746590Sesolom 
747590Sesolom 	now = gethrtime_unscaled();
748590Sesolom 	gen = cpu->cpu_mstate_gen;
749590Sesolom 
750590Sesolom 	membar_consumer();	/* guarantee load ordering */
751590Sesolom 	start = cpu->cpu_mstate_start;
752590Sesolom 	state = cpu->cpu_mstate;
753590Sesolom 	for (i = 0; i < NCMSTATES; i++) {
754590Sesolom 		intracct[i] = cpu->cpu_intracct[i];
755590Sesolom 		times[i] = cpu->cpu_acct[i];
756590Sesolom 	}
757590Sesolom 	membar_consumer();	/* guarantee load ordering */
758590Sesolom 
759590Sesolom 	if (gen != 0 && gen == cpu->cpu_mstate_gen && now > start)
760590Sesolom 		times[state] += now - start;
761590Sesolom 
762590Sesolom 	for (i = 0; i < NCMSTATES; i++) {
763590Sesolom 		scalehrtime(&times[i]);
764590Sesolom 		intracct[i] = tick2ns((hrtime_t)intracct[i], cpu->cpu_id);
765590Sesolom 	}
766590Sesolom 
767590Sesolom 	for (i = 0; i < NCMSTATES; i++) {
768590Sesolom 		if (i == CMS_SYSTEM)
769590Sesolom 			continue;
770590Sesolom 		times[i] -= intracct[i];
771590Sesolom 		if (times[i] < 0) {
772590Sesolom 			intracct[i] += times[i];
773590Sesolom 			times[i] = 0;
774590Sesolom 		}
775590Sesolom 		times[CMS_SYSTEM] += intracct[i];
776590Sesolom 	}
777590Sesolom }
778