xref: /onnv-gate/usr/src/uts/common/io/mem.c (revision 1463:48d4046e5f1a)
10Sstevel@tonic-gate /*
20Sstevel@tonic-gate  * CDDL HEADER START
30Sstevel@tonic-gate  *
40Sstevel@tonic-gate  * The contents of this file are subject to the terms of the
5*1463Sayznaga  * Common Development and Distribution License (the "License").
6*1463Sayznaga  * You may not use this file except in compliance with the License.
70Sstevel@tonic-gate  *
80Sstevel@tonic-gate  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
90Sstevel@tonic-gate  * or http://www.opensolaris.org/os/licensing.
100Sstevel@tonic-gate  * See the License for the specific language governing permissions
110Sstevel@tonic-gate  * and limitations under the License.
120Sstevel@tonic-gate  *
130Sstevel@tonic-gate  * When distributing Covered Code, include this CDDL HEADER in each
140Sstevel@tonic-gate  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
150Sstevel@tonic-gate  * If applicable, add the following below this CDDL HEADER, with the
160Sstevel@tonic-gate  * fields enclosed by brackets "[]" replaced with your own identifying
170Sstevel@tonic-gate  * information: Portions Copyright [yyyy] [name of copyright owner]
180Sstevel@tonic-gate  *
190Sstevel@tonic-gate  * CDDL HEADER END
200Sstevel@tonic-gate  */
210Sstevel@tonic-gate /*
221283Sayznaga  * Copyright 2006 Sun Microsystems, Inc.  All rights reserved.
230Sstevel@tonic-gate  * Use is subject to license terms.
240Sstevel@tonic-gate  */
250Sstevel@tonic-gate 
260Sstevel@tonic-gate #pragma ident	"%Z%%M%	%I%	%E% SMI"
270Sstevel@tonic-gate 
280Sstevel@tonic-gate /*
290Sstevel@tonic-gate  * Memory special file
300Sstevel@tonic-gate  */
310Sstevel@tonic-gate 
320Sstevel@tonic-gate #include <sys/types.h>
330Sstevel@tonic-gate #include <sys/param.h>
340Sstevel@tonic-gate #include <sys/user.h>
350Sstevel@tonic-gate #include <sys/buf.h>
360Sstevel@tonic-gate #include <sys/systm.h>
370Sstevel@tonic-gate #include <sys/cred.h>
380Sstevel@tonic-gate #include <sys/vm.h>
390Sstevel@tonic-gate #include <sys/uio.h>
400Sstevel@tonic-gate #include <sys/mman.h>
410Sstevel@tonic-gate #include <sys/kmem.h>
420Sstevel@tonic-gate #include <vm/seg.h>
430Sstevel@tonic-gate #include <vm/page.h>
440Sstevel@tonic-gate #include <sys/stat.h>
450Sstevel@tonic-gate #include <sys/vmem.h>
460Sstevel@tonic-gate #include <sys/memlist.h>
470Sstevel@tonic-gate #include <sys/bootconf.h>
480Sstevel@tonic-gate 
490Sstevel@tonic-gate #include <vm/seg_vn.h>
500Sstevel@tonic-gate #include <vm/seg_dev.h>
510Sstevel@tonic-gate #include <vm/seg_kmem.h>
520Sstevel@tonic-gate #include <vm/seg_kp.h>
530Sstevel@tonic-gate #include <vm/seg_kpm.h>
540Sstevel@tonic-gate #include <vm/hat.h>
550Sstevel@tonic-gate 
560Sstevel@tonic-gate #include <sys/conf.h>
570Sstevel@tonic-gate #include <sys/mem.h>
580Sstevel@tonic-gate #include <sys/types.h>
590Sstevel@tonic-gate #include <sys/conf.h>
600Sstevel@tonic-gate #include <sys/param.h>
610Sstevel@tonic-gate #include <sys/systm.h>
620Sstevel@tonic-gate #include <sys/errno.h>
630Sstevel@tonic-gate #include <sys/modctl.h>
640Sstevel@tonic-gate #include <sys/memlist.h>
650Sstevel@tonic-gate #include <sys/ddi.h>
660Sstevel@tonic-gate #include <sys/sunddi.h>
670Sstevel@tonic-gate #include <sys/debug.h>
681186Sayznaga #include <sys/fm/protocol.h>
690Sstevel@tonic-gate 
701414Scindi #if defined(__sparc)
710Sstevel@tonic-gate extern int cpu_get_mem_name(uint64_t, uint64_t *, uint64_t, char *, int, int *);
720Sstevel@tonic-gate extern int cpu_get_mem_info(uint64_t, uint64_t, uint64_t *, uint64_t *,
730Sstevel@tonic-gate     uint64_t *, int *, int *, int *);
740Sstevel@tonic-gate extern size_t cpu_get_name_bufsize(void);
751186Sayznaga extern int cpu_get_mem_sid(char *, char *, int, int *);
761186Sayznaga extern int cpu_get_mem_addr(char *, char *, uint64_t, uint64_t *);
771414Scindi #elif defined(__i386) || defined(__amd64)
781414Scindi #include <sys/cpu_module.h>
791186Sayznaga #endif	/* __sparc */
800Sstevel@tonic-gate 
810Sstevel@tonic-gate /*
820Sstevel@tonic-gate  * Turn a byte length into a pagecount.  The DDI btop takes a
830Sstevel@tonic-gate  * 32-bit size on 32-bit machines, this handles 64-bit sizes for
840Sstevel@tonic-gate  * large physical-memory 32-bit machines.
850Sstevel@tonic-gate  */
860Sstevel@tonic-gate #define	BTOP(x)	((pgcnt_t)((x) >> _pageshift))
870Sstevel@tonic-gate 
880Sstevel@tonic-gate static kmutex_t mm_lock;
890Sstevel@tonic-gate static caddr_t mm_map;
900Sstevel@tonic-gate 
910Sstevel@tonic-gate static dev_info_t *mm_dip;	/* private copy of devinfo pointer */
920Sstevel@tonic-gate 
930Sstevel@tonic-gate static int mm_kmem_io_access;
940Sstevel@tonic-gate 
950Sstevel@tonic-gate static int mm_kstat_update(kstat_t *ksp, int rw);
960Sstevel@tonic-gate static int mm_kstat_snapshot(kstat_t *ksp, void *buf, int rw);
970Sstevel@tonic-gate 
981186Sayznaga static int mm_read_mem_name(intptr_t data, mem_name_t *mem_name);
991186Sayznaga static int mm_read_mem_page(intptr_t data, mem_page_t *mpage);
1001186Sayznaga static int mm_get_mem_fmri(mem_page_t *mpage, nvlist_t **nvl);
1011186Sayznaga static int mm_get_paddr(nvlist_t *nvl, uint64_t *paddr);
1021186Sayznaga 
1030Sstevel@tonic-gate /*ARGSUSED1*/
1040Sstevel@tonic-gate static int
1050Sstevel@tonic-gate mm_attach(dev_info_t *devi, ddi_attach_cmd_t cmd)
1060Sstevel@tonic-gate {
1070Sstevel@tonic-gate 	int i;
1080Sstevel@tonic-gate 	struct mem_minor {
1090Sstevel@tonic-gate 		char *name;
1100Sstevel@tonic-gate 		minor_t minor;
1110Sstevel@tonic-gate 		int privonly;
1120Sstevel@tonic-gate 		const char *rdpriv;
1130Sstevel@tonic-gate 		const char *wrpriv;
1140Sstevel@tonic-gate 		mode_t priv_mode;
1150Sstevel@tonic-gate 	} mm[] = {
1160Sstevel@tonic-gate 		{ "mem",	M_MEM,		0,	NULL,	"all",	0640 },
1170Sstevel@tonic-gate 		{ "kmem",	M_KMEM,		0,	NULL,	"all",	0640 },
1180Sstevel@tonic-gate 		{ "allkmem",	M_ALLKMEM,	0,	"all",	"all",	0600 },
1190Sstevel@tonic-gate 		{ "null",	M_NULL,	PRIVONLY_DEV,	NULL,	NULL,	0666 },
1200Sstevel@tonic-gate 		{ "zero",	M_ZERO, PRIVONLY_DEV,	NULL,	NULL,	0666 },
1210Sstevel@tonic-gate 	};
1220Sstevel@tonic-gate 	kstat_t *ksp;
1230Sstevel@tonic-gate 
1240Sstevel@tonic-gate 	mutex_init(&mm_lock, NULL, MUTEX_DEFAULT, NULL);
1250Sstevel@tonic-gate 	mm_map = vmem_alloc(heap_arena, PAGESIZE, VM_SLEEP);
1260Sstevel@tonic-gate 
1270Sstevel@tonic-gate 	for (i = 0; i < (sizeof (mm) / sizeof (mm[0])); i++) {
1280Sstevel@tonic-gate 		if (ddi_create_priv_minor_node(devi, mm[i].name, S_IFCHR,
1290Sstevel@tonic-gate 		    mm[i].minor, DDI_PSEUDO, mm[i].privonly,
1300Sstevel@tonic-gate 		    mm[i].rdpriv, mm[i].wrpriv, mm[i].priv_mode) ==
1310Sstevel@tonic-gate 		    DDI_FAILURE) {
1320Sstevel@tonic-gate 			ddi_remove_minor_node(devi, NULL);
1330Sstevel@tonic-gate 			return (DDI_FAILURE);
1340Sstevel@tonic-gate 		}
1350Sstevel@tonic-gate 	}
1360Sstevel@tonic-gate 
1370Sstevel@tonic-gate 	mm_dip = devi;
1380Sstevel@tonic-gate 
1390Sstevel@tonic-gate 	ksp = kstat_create("mm", 0, "phys_installed", "misc",
1400Sstevel@tonic-gate 	    KSTAT_TYPE_RAW, 0, KSTAT_FLAG_VAR_SIZE | KSTAT_FLAG_VIRTUAL);
1410Sstevel@tonic-gate 	if (ksp != NULL) {
1420Sstevel@tonic-gate 		ksp->ks_update = mm_kstat_update;
1430Sstevel@tonic-gate 		ksp->ks_snapshot = mm_kstat_snapshot;
1440Sstevel@tonic-gate 		ksp->ks_lock = &mm_lock; /* XXX - not really needed */
1450Sstevel@tonic-gate 		kstat_install(ksp);
1460Sstevel@tonic-gate 	}
1470Sstevel@tonic-gate 
1480Sstevel@tonic-gate 	mm_kmem_io_access = ddi_getprop(DDI_DEV_T_ANY, devi, DDI_PROP_DONTPASS,
1490Sstevel@tonic-gate 	    "kmem_io_access", 0);
1500Sstevel@tonic-gate 
1510Sstevel@tonic-gate 	return (DDI_SUCCESS);
1520Sstevel@tonic-gate }
1530Sstevel@tonic-gate 
1540Sstevel@tonic-gate /*ARGSUSED*/
1550Sstevel@tonic-gate static int
1560Sstevel@tonic-gate mm_info(dev_info_t *dip, ddi_info_cmd_t infocmd, void *arg, void **result)
1570Sstevel@tonic-gate {
1580Sstevel@tonic-gate 	register int error;
1590Sstevel@tonic-gate 
1600Sstevel@tonic-gate 	switch (infocmd) {
1610Sstevel@tonic-gate 	case DDI_INFO_DEVT2DEVINFO:
1620Sstevel@tonic-gate 		*result = (void *)mm_dip;
1630Sstevel@tonic-gate 		error = DDI_SUCCESS;
1640Sstevel@tonic-gate 		break;
1650Sstevel@tonic-gate 	case DDI_INFO_DEVT2INSTANCE:
1660Sstevel@tonic-gate 		*result = (void *)0;
1670Sstevel@tonic-gate 		error = DDI_SUCCESS;
1680Sstevel@tonic-gate 		break;
1690Sstevel@tonic-gate 	default:
1700Sstevel@tonic-gate 		error = DDI_FAILURE;
1710Sstevel@tonic-gate 	}
1720Sstevel@tonic-gate 	return (error);
1730Sstevel@tonic-gate }
1740Sstevel@tonic-gate 
1750Sstevel@tonic-gate /*ARGSUSED1*/
1760Sstevel@tonic-gate static int
1770Sstevel@tonic-gate mmopen(dev_t *devp, int flag, int typ, struct cred *cred)
1780Sstevel@tonic-gate {
1790Sstevel@tonic-gate 	switch (getminor(*devp)) {
1800Sstevel@tonic-gate 	case M_NULL:
1810Sstevel@tonic-gate 	case M_ZERO:
1820Sstevel@tonic-gate 	case M_MEM:
1830Sstevel@tonic-gate 	case M_KMEM:
1840Sstevel@tonic-gate 	case M_ALLKMEM:
1850Sstevel@tonic-gate 		/* standard devices */
1860Sstevel@tonic-gate 		break;
1870Sstevel@tonic-gate 
1880Sstevel@tonic-gate 	default:
1890Sstevel@tonic-gate 		/* Unsupported or unknown type */
1900Sstevel@tonic-gate 		return (EINVAL);
1910Sstevel@tonic-gate 	}
1920Sstevel@tonic-gate 	return (0);
1930Sstevel@tonic-gate }
1940Sstevel@tonic-gate 
1950Sstevel@tonic-gate struct pollhead	mm_pollhd;
1960Sstevel@tonic-gate 
1970Sstevel@tonic-gate /*ARGSUSED*/
1980Sstevel@tonic-gate static int
1990Sstevel@tonic-gate mmchpoll(dev_t dev, short events, int anyyet, short *reventsp,
2000Sstevel@tonic-gate     struct pollhead **phpp)
2010Sstevel@tonic-gate {
2020Sstevel@tonic-gate 	switch (getminor(dev)) {
2030Sstevel@tonic-gate 	case M_NULL:
2040Sstevel@tonic-gate 	case M_ZERO:
2050Sstevel@tonic-gate 	case M_MEM:
2060Sstevel@tonic-gate 	case M_KMEM:
2070Sstevel@tonic-gate 	case M_ALLKMEM:
2080Sstevel@tonic-gate 		*reventsp = events & (POLLIN | POLLOUT | POLLPRI | POLLRDNORM |
2090Sstevel@tonic-gate 			POLLWRNORM | POLLRDBAND | POLLWRBAND);
2100Sstevel@tonic-gate 		/*
2110Sstevel@tonic-gate 		 * A non NULL pollhead pointer should be returned in case
2120Sstevel@tonic-gate 		 * user polls for 0 events.
2130Sstevel@tonic-gate 		 */
2140Sstevel@tonic-gate 		*phpp = !anyyet && !*reventsp ?
2150Sstevel@tonic-gate 		    &mm_pollhd : (struct pollhead *)NULL;
2160Sstevel@tonic-gate 		return (0);
2170Sstevel@tonic-gate 	default:
2180Sstevel@tonic-gate 		/* no other devices currently support polling */
2190Sstevel@tonic-gate 		return (ENXIO);
2200Sstevel@tonic-gate 	}
2210Sstevel@tonic-gate }
2220Sstevel@tonic-gate 
2230Sstevel@tonic-gate static int
2240Sstevel@tonic-gate mmpropop(dev_t dev, dev_info_t *dip, ddi_prop_op_t prop_op, int flags,
2250Sstevel@tonic-gate     char *name, caddr_t valuep, int *lengthp)
2260Sstevel@tonic-gate {
2270Sstevel@tonic-gate 	/*
2280Sstevel@tonic-gate 	 * implement zero size to reduce overhead (avoid two failing
2290Sstevel@tonic-gate 	 * property lookups per stat).
2300Sstevel@tonic-gate 	 */
2310Sstevel@tonic-gate 	return (ddi_prop_op_size(dev, dip, prop_op,
2320Sstevel@tonic-gate 	    flags, name, valuep, lengthp, 0));
2330Sstevel@tonic-gate }
2340Sstevel@tonic-gate 
2350Sstevel@tonic-gate static int
2360Sstevel@tonic-gate mmio(struct uio *uio, enum uio_rw rw, pfn_t pfn, off_t pageoff, int allowio)
2370Sstevel@tonic-gate {
2380Sstevel@tonic-gate 	int error = 0;
2390Sstevel@tonic-gate 	size_t nbytes = MIN((size_t)(PAGESIZE - pageoff),
2400Sstevel@tonic-gate 	    (size_t)uio->uio_iov->iov_len);
2410Sstevel@tonic-gate 
2420Sstevel@tonic-gate 	mutex_enter(&mm_lock);
2430Sstevel@tonic-gate 	hat_devload(kas.a_hat, mm_map, PAGESIZE, pfn,
2440Sstevel@tonic-gate 	    (uint_t)(rw == UIO_READ ? PROT_READ : PROT_READ | PROT_WRITE),
2450Sstevel@tonic-gate 	    HAT_LOAD_NOCONSIST | HAT_LOAD_LOCK);
2460Sstevel@tonic-gate 
2470Sstevel@tonic-gate 	if (!pf_is_memory(pfn)) {
2480Sstevel@tonic-gate 		if (allowio) {
2490Sstevel@tonic-gate 			size_t c = uio->uio_iov->iov_len;
2500Sstevel@tonic-gate 
2510Sstevel@tonic-gate 			if (ddi_peekpokeio(NULL, uio, rw,
2520Sstevel@tonic-gate 			    (caddr_t)(uintptr_t)uio->uio_loffset, c,
2530Sstevel@tonic-gate 			    sizeof (int32_t)) != DDI_SUCCESS)
2540Sstevel@tonic-gate 				error = EFAULT;
2550Sstevel@tonic-gate 		} else
2560Sstevel@tonic-gate 			error = EIO;
2570Sstevel@tonic-gate 	} else
2580Sstevel@tonic-gate 		error = uiomove(&mm_map[pageoff], nbytes, rw, uio);
2590Sstevel@tonic-gate 
2600Sstevel@tonic-gate 	hat_unload(kas.a_hat, mm_map, PAGESIZE, HAT_UNLOAD_UNLOCK);
2610Sstevel@tonic-gate 	mutex_exit(&mm_lock);
2620Sstevel@tonic-gate 	return (error);
2630Sstevel@tonic-gate }
2640Sstevel@tonic-gate 
#ifdef	__sparc

/*
 * Look up the segment of address space 'as' that contains va and
 * return the result of its S_CAPABILITY_NOMINFLT capability query.
 * Returns 0 when no segment maps va.  The address space lock is held
 * as reader for the duration of the lookup.
 */
static int
mmpagelock(struct as *as, caddr_t va)
{
	struct seg *seg;
	int capable = 0;

	AS_LOCK_ENTER(as, &as->a_lock, RW_READER);
	seg = as_segat(as, va);
	if (seg != NULL)
		capable = SEGOP_CAPABLE(seg, S_CAPABILITY_NOMINFLT);
	AS_LOCK_EXIT(as, &as->a_lock);

	return (capable);
}

/* Nonzero when mmrw() should try as_pagelock() on a kernel address. */
#define	NEED_LOCK_KVADDR(kva)	mmpagelock(&kas, kva)

#else	/* __i386, __amd64 */

/* Page locking of kernel addresses is never attempted here. */
#define	NEED_LOCK_KVADDR(va)	0

#endif	/* __sparc */
2880Sstevel@tonic-gate 
2890Sstevel@tonic-gate /*ARGSUSED3*/
2900Sstevel@tonic-gate static int
2910Sstevel@tonic-gate mmrw(dev_t dev, struct uio *uio, enum uio_rw rw, cred_t *cred)
2920Sstevel@tonic-gate {
2930Sstevel@tonic-gate 	pfn_t v;
2940Sstevel@tonic-gate 	struct iovec *iov;
2950Sstevel@tonic-gate 	int error = 0;
2960Sstevel@tonic-gate 	size_t c;
2970Sstevel@tonic-gate 	ssize_t oresid = uio->uio_resid;
2980Sstevel@tonic-gate 	minor_t minor = getminor(dev);
2990Sstevel@tonic-gate 
3000Sstevel@tonic-gate 	while (uio->uio_resid > 0 && error == 0) {
3010Sstevel@tonic-gate 		iov = uio->uio_iov;
3020Sstevel@tonic-gate 		if (iov->iov_len == 0) {
3030Sstevel@tonic-gate 			uio->uio_iov++;
3040Sstevel@tonic-gate 			uio->uio_iovcnt--;
3050Sstevel@tonic-gate 			if (uio->uio_iovcnt < 0)
3060Sstevel@tonic-gate 				panic("mmrw");
3070Sstevel@tonic-gate 			continue;
3080Sstevel@tonic-gate 		}
3090Sstevel@tonic-gate 		switch (minor) {
3100Sstevel@tonic-gate 
3110Sstevel@tonic-gate 		case M_MEM:
3120Sstevel@tonic-gate 			memlist_read_lock();
3130Sstevel@tonic-gate 			if (!address_in_memlist(phys_install,
3140Sstevel@tonic-gate 			    (uint64_t)uio->uio_loffset, 1)) {
3150Sstevel@tonic-gate 				memlist_read_unlock();
3160Sstevel@tonic-gate 				error = EFAULT;
3170Sstevel@tonic-gate 				break;
3180Sstevel@tonic-gate 			}
3190Sstevel@tonic-gate 			memlist_read_unlock();
3200Sstevel@tonic-gate 
3210Sstevel@tonic-gate 			v = BTOP((u_offset_t)uio->uio_loffset);
3220Sstevel@tonic-gate 			error = mmio(uio, rw, v,
3230Sstevel@tonic-gate 			    uio->uio_loffset & PAGEOFFSET, 0);
3240Sstevel@tonic-gate 			break;
3250Sstevel@tonic-gate 
3260Sstevel@tonic-gate 		case M_KMEM:
3270Sstevel@tonic-gate 		case M_ALLKMEM:
3280Sstevel@tonic-gate 			{
3290Sstevel@tonic-gate 			page_t **ppp;
3300Sstevel@tonic-gate 			caddr_t vaddr = (caddr_t)uio->uio_offset;
3310Sstevel@tonic-gate 			int try_lock = NEED_LOCK_KVADDR(vaddr);
3320Sstevel@tonic-gate 			int locked = 0;
3330Sstevel@tonic-gate 
3340Sstevel@tonic-gate 			/*
3350Sstevel@tonic-gate 			 * If vaddr does not map a valid page, as_pagelock()
3360Sstevel@tonic-gate 			 * will return failure. Hence we can't check the
3370Sstevel@tonic-gate 			 * return value and return EFAULT here as we'd like.
3380Sstevel@tonic-gate 			 * seg_kp and seg_kpm do not properly support
3390Sstevel@tonic-gate 			 * as_pagelock() for this context so we avoid it
3400Sstevel@tonic-gate 			 * using the try_lock set check above.  Some day when
3410Sstevel@tonic-gate 			 * the kernel page locking gets redesigned all this
3420Sstevel@tonic-gate 			 * muck can be cleaned up.
3430Sstevel@tonic-gate 			 */
3440Sstevel@tonic-gate 			if (try_lock)
3450Sstevel@tonic-gate 				locked = (as_pagelock(&kas, &ppp, vaddr,
3460Sstevel@tonic-gate 				    PAGESIZE, S_WRITE) == 0);
3470Sstevel@tonic-gate 
348513Sjongkis 			v = hat_getpfnum(kas.a_hat,
349513Sjongkis 			    (caddr_t)(uintptr_t)uio->uio_loffset);
3500Sstevel@tonic-gate 			if (v == PFN_INVALID) {
3510Sstevel@tonic-gate 				if (locked)
3520Sstevel@tonic-gate 					as_pageunlock(&kas, ppp, vaddr,
3530Sstevel@tonic-gate 					    PAGESIZE, S_WRITE);
3540Sstevel@tonic-gate 				error = EFAULT;
3550Sstevel@tonic-gate 				break;
3560Sstevel@tonic-gate 			}
3570Sstevel@tonic-gate 
3580Sstevel@tonic-gate 			error = mmio(uio, rw, v, uio->uio_loffset & PAGEOFFSET,
3590Sstevel@tonic-gate 			    minor == M_ALLKMEM || mm_kmem_io_access);
3600Sstevel@tonic-gate 			if (locked)
3610Sstevel@tonic-gate 				as_pageunlock(&kas, ppp, vaddr, PAGESIZE,
3620Sstevel@tonic-gate 				    S_WRITE);
3630Sstevel@tonic-gate 			}
3640Sstevel@tonic-gate 
3650Sstevel@tonic-gate 			break;
3660Sstevel@tonic-gate 
3670Sstevel@tonic-gate 		case M_ZERO:
3680Sstevel@tonic-gate 			if (rw == UIO_READ) {
3690Sstevel@tonic-gate 				label_t ljb;
3700Sstevel@tonic-gate 
3710Sstevel@tonic-gate 				if (on_fault(&ljb)) {
3720Sstevel@tonic-gate 					no_fault();
3730Sstevel@tonic-gate 					error = EFAULT;
3740Sstevel@tonic-gate 					break;
3750Sstevel@tonic-gate 				}
3760Sstevel@tonic-gate 				uzero(iov->iov_base, iov->iov_len);
3770Sstevel@tonic-gate 				no_fault();
3780Sstevel@tonic-gate 				uio->uio_resid -= iov->iov_len;
3790Sstevel@tonic-gate 				uio->uio_loffset += iov->iov_len;
3800Sstevel@tonic-gate 				break;
3810Sstevel@tonic-gate 			}
3820Sstevel@tonic-gate 			/* else it's a write, fall through to NULL case */
3830Sstevel@tonic-gate 			/*FALLTHROUGH*/
3840Sstevel@tonic-gate 
3850Sstevel@tonic-gate 		case M_NULL:
3860Sstevel@tonic-gate 			if (rw == UIO_READ)
3870Sstevel@tonic-gate 				return (0);
3880Sstevel@tonic-gate 			c = iov->iov_len;
3890Sstevel@tonic-gate 			iov->iov_base += c;
3900Sstevel@tonic-gate 			iov->iov_len -= c;
3910Sstevel@tonic-gate 			uio->uio_loffset += c;
3920Sstevel@tonic-gate 			uio->uio_resid -= c;
3930Sstevel@tonic-gate 			break;
3940Sstevel@tonic-gate 
3950Sstevel@tonic-gate 		}
3960Sstevel@tonic-gate 	}
3970Sstevel@tonic-gate 	return (uio->uio_resid == oresid ? error : 0);
3980Sstevel@tonic-gate }
3990Sstevel@tonic-gate 
4000Sstevel@tonic-gate static int
4010Sstevel@tonic-gate mmread(dev_t dev, struct uio *uio, cred_t *cred)
4020Sstevel@tonic-gate {
4030Sstevel@tonic-gate 	return (mmrw(dev, uio, UIO_READ, cred));
4040Sstevel@tonic-gate }
4050Sstevel@tonic-gate 
4060Sstevel@tonic-gate static int
4070Sstevel@tonic-gate mmwrite(dev_t dev, struct uio *uio, cred_t *cred)
4080Sstevel@tonic-gate {
4090Sstevel@tonic-gate 	return (mmrw(dev, uio, UIO_WRITE, cred));
4100Sstevel@tonic-gate }
4110Sstevel@tonic-gate 
4120Sstevel@tonic-gate /*
4130Sstevel@tonic-gate  * Private ioctl for libkvm to support kvm_physaddr().
4140Sstevel@tonic-gate  * Given an address space and a VA, compute the PA.
4150Sstevel@tonic-gate  */
4160Sstevel@tonic-gate static int
4170Sstevel@tonic-gate mmioctl_vtop(intptr_t data)
4180Sstevel@tonic-gate {
4191414Scindi #ifdef _SYSCALL32
4201414Scindi 	mem_vtop32_t vtop32;
4211414Scindi #endif
4220Sstevel@tonic-gate 	mem_vtop_t mem_vtop;
4230Sstevel@tonic-gate 	proc_t *p;
4240Sstevel@tonic-gate 	pfn_t pfn = (pfn_t)PFN_INVALID;
4250Sstevel@tonic-gate 	pid_t pid = 0;
4260Sstevel@tonic-gate 	struct as *as;
4270Sstevel@tonic-gate 	struct seg *seg;
4280Sstevel@tonic-gate 
4291414Scindi 	if (get_udatamodel() == DATAMODEL_NATIVE) {
4301414Scindi 		if (copyin((void *)data, &mem_vtop, sizeof (mem_vtop_t)))
4311414Scindi 			return (EFAULT);
4321414Scindi 	}
4331414Scindi #ifdef _SYSCALL32
4341414Scindi 	else {
4351414Scindi 		if (copyin((void *)data, &vtop32, sizeof (mem_vtop32_t)))
4361414Scindi 			return (EFAULT);
4371414Scindi 		mem_vtop.m_as = (struct as *)vtop32.m_as;
4381414Scindi 		mem_vtop.m_va = (void *)vtop32.m_va;
4391414Scindi 
4401414Scindi 		if (mem_vtop.m_as != NULL)
4411414Scindi 			return (EINVAL);
4421414Scindi 	}
4431414Scindi #endif
4441414Scindi 
4450Sstevel@tonic-gate 	if (mem_vtop.m_as == &kas) {
4460Sstevel@tonic-gate 		pfn = hat_getpfnum(kas.a_hat, mem_vtop.m_va);
4470Sstevel@tonic-gate 	} else {
4481414Scindi 		if (mem_vtop.m_as == NULL) {
4491414Scindi 			/*
4501414Scindi 			 * Assume the calling process's address space if the
4511414Scindi 			 * caller didn't specify one.
4521414Scindi 			 */
4531414Scindi 			p = curthread->t_procp;
4541414Scindi 			if (p == NULL)
4551414Scindi 				return (EIO);
4561414Scindi 			mem_vtop.m_as = p->p_as;
4571414Scindi 		}
4581414Scindi 
4590Sstevel@tonic-gate 		mutex_enter(&pidlock);
4600Sstevel@tonic-gate 		for (p = practive; p != NULL; p = p->p_next) {
4610Sstevel@tonic-gate 			if (p->p_as == mem_vtop.m_as) {
4620Sstevel@tonic-gate 				pid = p->p_pid;
4630Sstevel@tonic-gate 				break;
4640Sstevel@tonic-gate 			}
4650Sstevel@tonic-gate 		}
4660Sstevel@tonic-gate 		mutex_exit(&pidlock);
4670Sstevel@tonic-gate 		if (p == NULL)
4680Sstevel@tonic-gate 			return (EIO);
4690Sstevel@tonic-gate 		p = sprlock(pid);
4700Sstevel@tonic-gate 		if (p == NULL)
4710Sstevel@tonic-gate 			return (EIO);
4720Sstevel@tonic-gate 		as = p->p_as;
4730Sstevel@tonic-gate 		if (as == mem_vtop.m_as) {
4740Sstevel@tonic-gate 			mutex_exit(&p->p_lock);
4750Sstevel@tonic-gate 			AS_LOCK_ENTER(as, &as->a_lock, RW_READER);
4760Sstevel@tonic-gate 			for (seg = AS_SEGFIRST(as); seg != NULL;
4770Sstevel@tonic-gate 			    seg = AS_SEGNEXT(as, seg))
4780Sstevel@tonic-gate 				if ((uintptr_t)mem_vtop.m_va -
4790Sstevel@tonic-gate 				    (uintptr_t)seg->s_base < seg->s_size)
4800Sstevel@tonic-gate 					break;
4810Sstevel@tonic-gate 			if (seg != NULL)
4820Sstevel@tonic-gate 				pfn = hat_getpfnum(as->a_hat, mem_vtop.m_va);
4830Sstevel@tonic-gate 			AS_LOCK_EXIT(as, &as->a_lock);
4840Sstevel@tonic-gate 			mutex_enter(&p->p_lock);
4850Sstevel@tonic-gate 		}
4860Sstevel@tonic-gate 		sprunlock(p);
4870Sstevel@tonic-gate 	}
4880Sstevel@tonic-gate 	mem_vtop.m_pfn = pfn;
4890Sstevel@tonic-gate 	if (pfn == PFN_INVALID)
4900Sstevel@tonic-gate 		return (EIO);
4911414Scindi 
4921414Scindi 	if (get_udatamodel() == DATAMODEL_NATIVE) {
4931414Scindi 		if (copyout(&mem_vtop, (void *)data, sizeof (mem_vtop_t)))
4941414Scindi 			return (EFAULT);
4951414Scindi 	}
4961414Scindi #ifdef _SYSCALL32
4971414Scindi 	else {
4981414Scindi 		vtop32.m_pfn = mem_vtop.m_pfn;
4991414Scindi 		if (copyout(&vtop32, (void *)data, sizeof (mem_vtop32_t)))
5001414Scindi 			return (EFAULT);
5011414Scindi 	}
5021414Scindi #endif
5030Sstevel@tonic-gate 
5040Sstevel@tonic-gate 	return (0);
5050Sstevel@tonic-gate }
5060Sstevel@tonic-gate 
5070Sstevel@tonic-gate /*
508917Selowe  * Given a PA, execute the given page retire command on it.
5090Sstevel@tonic-gate  */
5100Sstevel@tonic-gate static int
5110Sstevel@tonic-gate mmioctl_page_retire(int cmd, intptr_t data)
5120Sstevel@tonic-gate {
513917Selowe 	extern int page_retire_test(void);
5140Sstevel@tonic-gate 	uint64_t pa;
5150Sstevel@tonic-gate 
516917Selowe 	if (copyin((void *)data, &pa, sizeof (uint64_t))) {
517917Selowe 		return (EFAULT);
5180Sstevel@tonic-gate 	}
5190Sstevel@tonic-gate 
520917Selowe 	switch (cmd) {
521917Selowe 	case MEM_PAGE_ISRETIRED:
522917Selowe 		return (page_retire_check(pa, NULL));
523917Selowe 
524917Selowe 	case MEM_PAGE_UNRETIRE:
525917Selowe 		return (page_unretire(pa));
526917Selowe 
527917Selowe 	case MEM_PAGE_RETIRE:
528917Selowe 		return (page_retire(pa, PR_FMA));
529917Selowe 
530917Selowe 	case MEM_PAGE_RETIRE_MCE:
531917Selowe 		return (page_retire(pa, PR_MCE));
532917Selowe 
533917Selowe 	case MEM_PAGE_RETIRE_UE:
534917Selowe 		return (page_retire(pa, PR_UE));
5350Sstevel@tonic-gate 
536917Selowe 	case MEM_PAGE_GETERRORS:
537917Selowe 		{
538917Selowe 			uint64_t page_errors;
539917Selowe 			int rc = page_retire_check(pa, &page_errors);
540917Selowe 			if (copyout(&page_errors, (void *)data,
541917Selowe 			    sizeof (uint64_t))) {
542917Selowe 				return (EFAULT);
543917Selowe 			}
544917Selowe 			return (rc);
545917Selowe 		}
546917Selowe 
547917Selowe 	case MEM_PAGE_RETIRE_TEST:
548917Selowe 		return (page_retire_test());
549917Selowe 
550917Selowe 	}
551917Selowe 
552917Selowe 	return (EINVAL);
5530Sstevel@tonic-gate }
5540Sstevel@tonic-gate 
5551186Sayznaga /*
5561186Sayznaga  * Given a mem-scheme FMRI for a page, execute the given page retire
5571186Sayznaga  * command on it.
5581186Sayznaga  */
5591186Sayznaga static int
5601186Sayznaga mmioctl_page_fmri_retire(int cmd, intptr_t data)
5611186Sayznaga {
5621186Sayznaga 	mem_page_t mpage;
5631186Sayznaga 	uint64_t pa;
5641186Sayznaga 	nvlist_t *nvl;
5651186Sayznaga 	int err;
5661186Sayznaga 
5671186Sayznaga 	if ((err = mm_read_mem_page(data, &mpage)) < 0)
5681186Sayznaga 		return (err);
5691186Sayznaga 
5701186Sayznaga 	if ((err = mm_get_mem_fmri(&mpage, &nvl)) < 0)
5711186Sayznaga 		return (err);
5721186Sayznaga 
5731414Scindi 	if ((err = mm_get_paddr(nvl, &pa)) != 0) {
5741186Sayznaga 		nvlist_free(nvl);
5751186Sayznaga 		return (err);
5761186Sayznaga 	}
5771186Sayznaga 
5781186Sayznaga 	nvlist_free(nvl);
5791186Sayznaga 
5801186Sayznaga 	switch (cmd) {
5811186Sayznaga 	case MEM_PAGE_FMRI_ISRETIRED:
5821186Sayznaga 		return (page_retire_check(pa, NULL));
5831186Sayznaga 
5841186Sayznaga 	case MEM_PAGE_FMRI_RETIRE:
5851186Sayznaga 		return (page_retire(pa, PR_FMA));
5861186Sayznaga 	}
5871186Sayznaga 
5881186Sayznaga 	return (EINVAL);
5891186Sayznaga }
5901186Sayznaga 
5910Sstevel@tonic-gate #ifdef __sparc
5920Sstevel@tonic-gate /*
5930Sstevel@tonic-gate  * Given a syndrome, syndrome type, and address return the
5940Sstevel@tonic-gate  * associated memory name in the provided data buffer.
5950Sstevel@tonic-gate  */
5960Sstevel@tonic-gate static int
5970Sstevel@tonic-gate mmioctl_get_mem_name(intptr_t data)
5980Sstevel@tonic-gate {
5990Sstevel@tonic-gate 	mem_name_t mem_name;
6000Sstevel@tonic-gate 	void *buf;
6010Sstevel@tonic-gate 	size_t bufsize;
6020Sstevel@tonic-gate 	int len, err;
6030Sstevel@tonic-gate 
6040Sstevel@tonic-gate 	if ((bufsize = cpu_get_name_bufsize()) == 0)
6050Sstevel@tonic-gate 		return (ENOTSUP);
6060Sstevel@tonic-gate 
6071186Sayznaga 	if ((err = mm_read_mem_name(data, &mem_name)) < 0)
6081186Sayznaga 		return (err);
6090Sstevel@tonic-gate 
6100Sstevel@tonic-gate 	buf = kmem_alloc(bufsize, KM_SLEEP);
6110Sstevel@tonic-gate 
6120Sstevel@tonic-gate 	/*
6130Sstevel@tonic-gate 	 * Call into cpu specific code to do the lookup.
6140Sstevel@tonic-gate 	 */
6150Sstevel@tonic-gate 	if ((err = cpu_get_mem_name(mem_name.m_synd, mem_name.m_type,
6160Sstevel@tonic-gate 	    mem_name.m_addr, buf, bufsize, &len)) != 0) {
6170Sstevel@tonic-gate 		kmem_free(buf, bufsize);
6180Sstevel@tonic-gate 		return (err);
6190Sstevel@tonic-gate 	}
6200Sstevel@tonic-gate 
6210Sstevel@tonic-gate 	if (len >= mem_name.m_namelen) {
6220Sstevel@tonic-gate 		kmem_free(buf, bufsize);
6230Sstevel@tonic-gate 		return (ENAMETOOLONG);
6240Sstevel@tonic-gate 	}
6250Sstevel@tonic-gate 
6260Sstevel@tonic-gate 	if (copyoutstr(buf, (char *)mem_name.m_name,
6270Sstevel@tonic-gate 	    mem_name.m_namelen, NULL) != 0) {
6280Sstevel@tonic-gate 		kmem_free(buf, bufsize);
6290Sstevel@tonic-gate 		return (EFAULT);
6300Sstevel@tonic-gate 	}
6310Sstevel@tonic-gate 
6320Sstevel@tonic-gate 	kmem_free(buf, bufsize);
6330Sstevel@tonic-gate 	return (0);
6340Sstevel@tonic-gate }
6350Sstevel@tonic-gate 
6360Sstevel@tonic-gate /*
6370Sstevel@tonic-gate  * Given a syndrome and address return information about the associated memory.
6380Sstevel@tonic-gate  */
6390Sstevel@tonic-gate static int
6400Sstevel@tonic-gate mmioctl_get_mem_info(intptr_t data)
6410Sstevel@tonic-gate {
6420Sstevel@tonic-gate 	mem_info_t mem_info;
6430Sstevel@tonic-gate 	int err;
6440Sstevel@tonic-gate 
6450Sstevel@tonic-gate 	if (copyin((void *)data, &mem_info, sizeof (mem_info_t)))
6460Sstevel@tonic-gate 		return (EFAULT);
6470Sstevel@tonic-gate 
6480Sstevel@tonic-gate 	if ((err = cpu_get_mem_info(mem_info.m_synd, mem_info.m_addr,
6490Sstevel@tonic-gate 	    &mem_info.m_mem_size, &mem_info.m_seg_size, &mem_info.m_bank_size,
6500Sstevel@tonic-gate 	    &mem_info.m_segments, &mem_info.m_banks, &mem_info.m_mcid)) != 0)
6510Sstevel@tonic-gate 		return (err);
6520Sstevel@tonic-gate 
6530Sstevel@tonic-gate 	if (copyout(&mem_info, (void *)data, sizeof (mem_info_t)) != 0)
6540Sstevel@tonic-gate 		return (EFAULT);
6550Sstevel@tonic-gate 
6560Sstevel@tonic-gate 	return (0);
6570Sstevel@tonic-gate }
6581186Sayznaga 
6591186Sayznaga /*
6601186Sayznaga  * Given a memory name, return its associated serial id
6611186Sayznaga  */
6621186Sayznaga static int
6631186Sayznaga mmioctl_get_mem_sid(intptr_t data)
6641186Sayznaga {
6651186Sayznaga 	mem_name_t mem_name;
6661186Sayznaga 	void *buf;
6671186Sayznaga 	void *name;
6681186Sayznaga 	size_t	name_len;
6691186Sayznaga 	size_t bufsize;
6701186Sayznaga 	int len, err;
6711186Sayznaga 
6721186Sayznaga 	if ((bufsize = cpu_get_name_bufsize()) == 0)
6731186Sayznaga 		return (ENOTSUP);
6741186Sayznaga 
6751186Sayznaga 	if ((err = mm_read_mem_name(data, &mem_name)) < 0)
6761186Sayznaga 		return (err);
6771186Sayznaga 
6781186Sayznaga 	buf = kmem_alloc(bufsize, KM_SLEEP);
6791186Sayznaga 
6801186Sayznaga 	if (mem_name.m_namelen > 1024)
6811186Sayznaga 		mem_name.m_namelen = 1024; /* cap at 1024 bytes */
6821186Sayznaga 
6831186Sayznaga 	name = kmem_alloc(mem_name.m_namelen, KM_SLEEP);
6841186Sayznaga 
6851186Sayznaga 	if ((err = copyinstr((char *)mem_name.m_name, (char *)name,
6861186Sayznaga 	    mem_name.m_namelen, &name_len)) != 0) {
6871186Sayznaga 		kmem_free(buf, bufsize);
6881186Sayznaga 		kmem_free(name, mem_name.m_namelen);
6891186Sayznaga 		return (err);
6901186Sayznaga 	}
6911186Sayznaga 
6921186Sayznaga 	/*
6931186Sayznaga 	 * Call into cpu specific code to do the lookup.
6941186Sayznaga 	 */
6951186Sayznaga 	if ((err = cpu_get_mem_sid(name, buf, bufsize, &len)) != 0) {
6961186Sayznaga 		kmem_free(buf, bufsize);
6971186Sayznaga 		kmem_free(name, mem_name.m_namelen);
6981186Sayznaga 		return (err);
6991186Sayznaga 	}
7001186Sayznaga 
7011186Sayznaga 	if (len > mem_name.m_sidlen) {
7021186Sayznaga 		kmem_free(buf, bufsize);
7031186Sayznaga 		kmem_free(name, mem_name.m_namelen);
7041186Sayznaga 		return (ENAMETOOLONG);
7051186Sayznaga 	}
7061186Sayznaga 
7071186Sayznaga 	if (copyoutstr(buf, (char *)mem_name.m_sid,
7081186Sayznaga 	    mem_name.m_sidlen, NULL) != 0) {
7091186Sayznaga 		kmem_free(buf, bufsize);
7101186Sayznaga 		kmem_free(name, mem_name.m_namelen);
7111186Sayznaga 		return (EFAULT);
7121186Sayznaga 	}
7131186Sayznaga 
7141186Sayznaga 	kmem_free(buf, bufsize);
7151186Sayznaga 	kmem_free(name, mem_name.m_namelen);
7161186Sayznaga 	return (0);
7171186Sayznaga }
7180Sstevel@tonic-gate #endif	/* __sparc */
7190Sstevel@tonic-gate 
7200Sstevel@tonic-gate /*
7210Sstevel@tonic-gate  * Private ioctls for
7220Sstevel@tonic-gate  *	libkvm to support kvm_physaddr().
7230Sstevel@tonic-gate  *	FMA support for page_retire() and memory attribute information.
7240Sstevel@tonic-gate  */
7250Sstevel@tonic-gate /*ARGSUSED*/
7260Sstevel@tonic-gate static int
7270Sstevel@tonic-gate mmioctl(dev_t dev, int cmd, intptr_t data, int flag, cred_t *cred, int *rvalp)
7280Sstevel@tonic-gate {
7291283Sayznaga 	if ((cmd == MEM_VTOP && getminor(dev) != M_KMEM) ||
7301283Sayznaga 	    (cmd != MEM_VTOP && getminor(dev) != M_MEM))
7311186Sayznaga 		return (ENXIO);
7321186Sayznaga 
7330Sstevel@tonic-gate 	switch (cmd) {
7340Sstevel@tonic-gate 	case MEM_VTOP:
7350Sstevel@tonic-gate 		return (mmioctl_vtop(data));
7360Sstevel@tonic-gate 
7370Sstevel@tonic-gate 	case MEM_PAGE_RETIRE:
7380Sstevel@tonic-gate 	case MEM_PAGE_ISRETIRED:
739917Selowe 	case MEM_PAGE_UNRETIRE:
740917Selowe 	case MEM_PAGE_RETIRE_MCE:
741917Selowe 	case MEM_PAGE_RETIRE_UE:
742917Selowe 	case MEM_PAGE_GETERRORS:
743917Selowe 	case MEM_PAGE_RETIRE_TEST:
7440Sstevel@tonic-gate 		return (mmioctl_page_retire(cmd, data));
7450Sstevel@tonic-gate 
7461186Sayznaga 	case MEM_PAGE_FMRI_RETIRE:
7471186Sayznaga 	case MEM_PAGE_FMRI_ISRETIRED:
7481186Sayznaga 		return (mmioctl_page_fmri_retire(cmd, data));
7491186Sayznaga 
7500Sstevel@tonic-gate #ifdef __sparc
7511186Sayznaga 	case MEM_NAME:
7520Sstevel@tonic-gate 		return (mmioctl_get_mem_name(data));
7530Sstevel@tonic-gate 
7540Sstevel@tonic-gate 	case MEM_INFO:
7550Sstevel@tonic-gate 		return (mmioctl_get_mem_info(data));
7561186Sayznaga 
7571186Sayznaga 	case MEM_SID:
7581186Sayznaga 		return (mmioctl_get_mem_sid(data));
7590Sstevel@tonic-gate #else
7601186Sayznaga 	case MEM_NAME:
7611186Sayznaga 	case MEM_INFO:
7621186Sayznaga 	case MEM_SID:
7630Sstevel@tonic-gate 		return (ENOTSUP);
7641186Sayznaga #endif	/* __sparc */
7650Sstevel@tonic-gate 	}
7660Sstevel@tonic-gate 	return (ENXIO);
7670Sstevel@tonic-gate }
7680Sstevel@tonic-gate 
7690Sstevel@tonic-gate /*ARGSUSED2*/
7700Sstevel@tonic-gate static int
7710Sstevel@tonic-gate mmmmap(dev_t dev, off_t off, int prot)
7720Sstevel@tonic-gate {
7730Sstevel@tonic-gate 	pfn_t pf;
7740Sstevel@tonic-gate 	struct memlist *pmem;
7750Sstevel@tonic-gate 	minor_t minor = getminor(dev);
7760Sstevel@tonic-gate 
7770Sstevel@tonic-gate 	switch (minor) {
7780Sstevel@tonic-gate 	case M_MEM:
7790Sstevel@tonic-gate 		pf = btop(off);
7800Sstevel@tonic-gate 		memlist_read_lock();
7810Sstevel@tonic-gate 		for (pmem = phys_install; pmem != NULL; pmem = pmem->next) {
7820Sstevel@tonic-gate 			if (pf >= BTOP(pmem->address) &&
7830Sstevel@tonic-gate 			    pf < BTOP(pmem->address + pmem->size)) {
7840Sstevel@tonic-gate 				memlist_read_unlock();
7850Sstevel@tonic-gate 				return (impl_obmem_pfnum(pf));
7860Sstevel@tonic-gate 			}
7870Sstevel@tonic-gate 		}
7880Sstevel@tonic-gate 		memlist_read_unlock();
7890Sstevel@tonic-gate 		break;
7900Sstevel@tonic-gate 
7910Sstevel@tonic-gate 	case M_KMEM:
7920Sstevel@tonic-gate 	case M_ALLKMEM:
7930Sstevel@tonic-gate 		/* no longer supported with KPR */
7940Sstevel@tonic-gate 		return (-1);
7950Sstevel@tonic-gate 
7960Sstevel@tonic-gate 	case M_ZERO:
7970Sstevel@tonic-gate 		/*
7980Sstevel@tonic-gate 		 * We shouldn't be mmap'ing to /dev/zero here as
7990Sstevel@tonic-gate 		 * mmsegmap() should have already converted
8000Sstevel@tonic-gate 		 * a mapping request for this device to a mapping
8010Sstevel@tonic-gate 		 * using seg_vn for anonymous memory.
8020Sstevel@tonic-gate 		 */
8030Sstevel@tonic-gate 		break;
8040Sstevel@tonic-gate 
8050Sstevel@tonic-gate 	}
8060Sstevel@tonic-gate 	return (-1);
8070Sstevel@tonic-gate }
8080Sstevel@tonic-gate 
8090Sstevel@tonic-gate /*
8100Sstevel@tonic-gate  * This function is called when a memory device is mmap'ed.
8110Sstevel@tonic-gate  * Set up the mapping to the correct device driver.
8120Sstevel@tonic-gate  */
8130Sstevel@tonic-gate static int
8140Sstevel@tonic-gate mmsegmap(dev_t dev, off_t off, struct as *as, caddr_t *addrp, off_t len,
8150Sstevel@tonic-gate     uint_t prot, uint_t maxprot, uint_t flags, struct cred *cred)
8160Sstevel@tonic-gate {
8170Sstevel@tonic-gate 	struct segvn_crargs vn_a;
8180Sstevel@tonic-gate 	struct segdev_crargs dev_a;
8190Sstevel@tonic-gate 	int error;
8200Sstevel@tonic-gate 	minor_t minor;
8210Sstevel@tonic-gate 	off_t i;
8220Sstevel@tonic-gate 
8230Sstevel@tonic-gate 	minor = getminor(dev);
8240Sstevel@tonic-gate 
8250Sstevel@tonic-gate 	as_rangelock(as);
8260Sstevel@tonic-gate 	if ((flags & MAP_FIXED) == 0) {
8270Sstevel@tonic-gate 		/*
8280Sstevel@tonic-gate 		 * No need to worry about vac alignment on /dev/zero
8290Sstevel@tonic-gate 		 * since this is a "clone" object that doesn't yet exist.
8300Sstevel@tonic-gate 		 */
8310Sstevel@tonic-gate 		map_addr(addrp, len, (offset_t)off,
8320Sstevel@tonic-gate 				(minor == M_MEM) || (minor == M_KMEM), flags);
8330Sstevel@tonic-gate 
8340Sstevel@tonic-gate 		if (*addrp == NULL) {
8350Sstevel@tonic-gate 			as_rangeunlock(as);
8360Sstevel@tonic-gate 			return (ENOMEM);
8370Sstevel@tonic-gate 		}
8380Sstevel@tonic-gate 	} else {
8390Sstevel@tonic-gate 		/*
8400Sstevel@tonic-gate 		 * User specified address -
8410Sstevel@tonic-gate 		 * Blow away any previous mappings.
8420Sstevel@tonic-gate 		 */
8430Sstevel@tonic-gate 		(void) as_unmap(as, *addrp, len);
8440Sstevel@tonic-gate 	}
8450Sstevel@tonic-gate 
8460Sstevel@tonic-gate 	switch (minor) {
8470Sstevel@tonic-gate 	case M_MEM:
8480Sstevel@tonic-gate 		/* /dev/mem cannot be mmap'ed with MAP_PRIVATE */
8490Sstevel@tonic-gate 		if ((flags & MAP_TYPE) != MAP_SHARED) {
8500Sstevel@tonic-gate 			as_rangeunlock(as);
8510Sstevel@tonic-gate 			return (EINVAL);
8520Sstevel@tonic-gate 		}
8530Sstevel@tonic-gate 
8540Sstevel@tonic-gate 		/*
8550Sstevel@tonic-gate 		 * Check to ensure that the entire range is
8560Sstevel@tonic-gate 		 * legal and we are not trying to map in
8570Sstevel@tonic-gate 		 * more than the device will let us.
8580Sstevel@tonic-gate 		 */
8590Sstevel@tonic-gate 		for (i = 0; i < len; i += PAGESIZE) {
8600Sstevel@tonic-gate 			if (mmmmap(dev, off + i, maxprot) == -1) {
8610Sstevel@tonic-gate 				as_rangeunlock(as);
8620Sstevel@tonic-gate 				return (ENXIO);
8630Sstevel@tonic-gate 			}
8640Sstevel@tonic-gate 		}
8650Sstevel@tonic-gate 
8660Sstevel@tonic-gate 		/*
8670Sstevel@tonic-gate 		 * Use seg_dev segment driver for /dev/mem mapping.
8680Sstevel@tonic-gate 		 */
8690Sstevel@tonic-gate 		dev_a.mapfunc = mmmmap;
8700Sstevel@tonic-gate 		dev_a.dev = dev;
8710Sstevel@tonic-gate 		dev_a.offset = off;
8720Sstevel@tonic-gate 		dev_a.type = (flags & MAP_TYPE);
8730Sstevel@tonic-gate 		dev_a.prot = (uchar_t)prot;
8740Sstevel@tonic-gate 		dev_a.maxprot = (uchar_t)maxprot;
8750Sstevel@tonic-gate 		dev_a.hat_attr = 0;
8760Sstevel@tonic-gate 
8770Sstevel@tonic-gate 		/*
8780Sstevel@tonic-gate 		 * Make /dev/mem mappings non-consistent since we can't
8790Sstevel@tonic-gate 		 * alias pages that don't have page structs behind them,
8800Sstevel@tonic-gate 		 * such as kernel stack pages. If someone mmap()s a kernel
8810Sstevel@tonic-gate 		 * stack page and if we give him a tte with cv, a line from
8820Sstevel@tonic-gate 		 * that page can get into both pages of the spitfire d$.
8830Sstevel@tonic-gate 		 * But snoop from another processor will only invalidate
8840Sstevel@tonic-gate 		 * the first page. This later caused kernel (xc_attention)
8850Sstevel@tonic-gate 		 * to go into an infinite loop at pil 13 and no interrupts
8860Sstevel@tonic-gate 		 * could come in. See 1203630.
8870Sstevel@tonic-gate 		 *
8880Sstevel@tonic-gate 		 */
8890Sstevel@tonic-gate 		dev_a.hat_flags = HAT_LOAD_NOCONSIST;
8900Sstevel@tonic-gate 		dev_a.devmap_data = NULL;
8910Sstevel@tonic-gate 
8920Sstevel@tonic-gate 		error = as_map(as, *addrp, len, segdev_create, &dev_a);
8930Sstevel@tonic-gate 		break;
8940Sstevel@tonic-gate 
8950Sstevel@tonic-gate 	case M_ZERO:
8960Sstevel@tonic-gate 		/*
8970Sstevel@tonic-gate 		 * Use seg_vn segment driver for /dev/zero mapping.
8980Sstevel@tonic-gate 		 * Passing in a NULL amp gives us the "cloning" effect.
8990Sstevel@tonic-gate 		 */
9000Sstevel@tonic-gate 		vn_a.vp = NULL;
9010Sstevel@tonic-gate 		vn_a.offset = 0;
9020Sstevel@tonic-gate 		vn_a.type = (flags & MAP_TYPE);
9030Sstevel@tonic-gate 		vn_a.prot = prot;
9040Sstevel@tonic-gate 		vn_a.maxprot = maxprot;
9050Sstevel@tonic-gate 		vn_a.flags = flags & ~MAP_TYPE;
9060Sstevel@tonic-gate 		vn_a.cred = cred;
9070Sstevel@tonic-gate 		vn_a.amp = NULL;
9080Sstevel@tonic-gate 		vn_a.szc = 0;
9090Sstevel@tonic-gate 		vn_a.lgrp_mem_policy_flags = 0;
9100Sstevel@tonic-gate 		error = as_map(as, *addrp, len, segvn_create, &vn_a);
9110Sstevel@tonic-gate 		break;
9120Sstevel@tonic-gate 
9130Sstevel@tonic-gate 	case M_KMEM:
9140Sstevel@tonic-gate 	case M_ALLKMEM:
9150Sstevel@tonic-gate 		/* No longer supported with KPR. */
9160Sstevel@tonic-gate 		error = ENXIO;
9170Sstevel@tonic-gate 		break;
9180Sstevel@tonic-gate 
9190Sstevel@tonic-gate 	case M_NULL:
9200Sstevel@tonic-gate 		/*
9210Sstevel@tonic-gate 		 * Use seg_dev segment driver for /dev/null mapping.
9220Sstevel@tonic-gate 		 */
9230Sstevel@tonic-gate 		dev_a.mapfunc = mmmmap;
9240Sstevel@tonic-gate 		dev_a.dev = dev;
9250Sstevel@tonic-gate 		dev_a.offset = off;
9260Sstevel@tonic-gate 		dev_a.type = 0;		/* neither PRIVATE nor SHARED */
9270Sstevel@tonic-gate 		dev_a.prot = dev_a.maxprot = (uchar_t)PROT_NONE;
9280Sstevel@tonic-gate 		dev_a.hat_attr = 0;
9290Sstevel@tonic-gate 		dev_a.hat_flags = 0;
9300Sstevel@tonic-gate 		error = as_map(as, *addrp, len, segdev_create, &dev_a);
9310Sstevel@tonic-gate 		break;
9320Sstevel@tonic-gate 
9330Sstevel@tonic-gate 	default:
9340Sstevel@tonic-gate 		error = ENXIO;
9350Sstevel@tonic-gate 	}
9360Sstevel@tonic-gate 
9370Sstevel@tonic-gate 	as_rangeunlock(as);
9380Sstevel@tonic-gate 	return (error);
9390Sstevel@tonic-gate }
9400Sstevel@tonic-gate 
9410Sstevel@tonic-gate static struct cb_ops mm_cb_ops = {
9420Sstevel@tonic-gate 	mmopen,			/* open */
9430Sstevel@tonic-gate 	nulldev,		/* close */
9440Sstevel@tonic-gate 	nodev,			/* strategy */
9450Sstevel@tonic-gate 	nodev,			/* print */
9460Sstevel@tonic-gate 	nodev,			/* dump */
9470Sstevel@tonic-gate 	mmread,			/* read */
9480Sstevel@tonic-gate 	mmwrite,		/* write */
9490Sstevel@tonic-gate 	mmioctl,		/* ioctl */
9500Sstevel@tonic-gate 	nodev,			/* devmap */
9510Sstevel@tonic-gate 	mmmmap,			/* mmap */
9520Sstevel@tonic-gate 	mmsegmap,		/* segmap */
9530Sstevel@tonic-gate 	mmchpoll,		/* poll */
9540Sstevel@tonic-gate 	mmpropop,		/* prop_op */
9550Sstevel@tonic-gate 	0,			/* streamtab  */
9560Sstevel@tonic-gate 	D_NEW | D_MP | D_64BIT | D_U64BIT
9570Sstevel@tonic-gate };
9580Sstevel@tonic-gate 
9590Sstevel@tonic-gate static struct dev_ops mm_ops = {
9600Sstevel@tonic-gate 	DEVO_REV,		/* devo_rev, */
9610Sstevel@tonic-gate 	0,			/* refcnt  */
9620Sstevel@tonic-gate 	mm_info,		/* get_dev_info */
9630Sstevel@tonic-gate 	nulldev,		/* identify */
9640Sstevel@tonic-gate 	nulldev,		/* probe */
9650Sstevel@tonic-gate 	mm_attach,		/* attach */
9660Sstevel@tonic-gate 	nodev,			/* detach */
9670Sstevel@tonic-gate 	nodev,			/* reset */
9680Sstevel@tonic-gate 	&mm_cb_ops,		/* driver operations */
9690Sstevel@tonic-gate 	(struct bus_ops *)0	/* bus operations */
9700Sstevel@tonic-gate };
9710Sstevel@tonic-gate 
9720Sstevel@tonic-gate static struct modldrv modldrv = {
9730Sstevel@tonic-gate 	&mod_driverops, "memory driver %I%", &mm_ops,
9740Sstevel@tonic-gate };
9750Sstevel@tonic-gate 
9760Sstevel@tonic-gate static struct modlinkage modlinkage = {
9770Sstevel@tonic-gate 	MODREV_1, &modldrv, NULL
9780Sstevel@tonic-gate };
9790Sstevel@tonic-gate 
9800Sstevel@tonic-gate int
9810Sstevel@tonic-gate _init(void)
9820Sstevel@tonic-gate {
9830Sstevel@tonic-gate 	return (mod_install(&modlinkage));
9840Sstevel@tonic-gate }
9850Sstevel@tonic-gate 
9860Sstevel@tonic-gate int
9870Sstevel@tonic-gate _info(struct modinfo *modinfop)
9880Sstevel@tonic-gate {
9890Sstevel@tonic-gate 	return (mod_info(&modlinkage, modinfop));
9900Sstevel@tonic-gate }
9910Sstevel@tonic-gate 
9920Sstevel@tonic-gate int
9930Sstevel@tonic-gate _fini(void)
9940Sstevel@tonic-gate {
9950Sstevel@tonic-gate 	return (mod_remove(&modlinkage));
9960Sstevel@tonic-gate }
9970Sstevel@tonic-gate 
9980Sstevel@tonic-gate static int
9990Sstevel@tonic-gate mm_kstat_update(kstat_t *ksp, int rw)
10000Sstevel@tonic-gate {
10010Sstevel@tonic-gate 	struct memlist *pmem;
10020Sstevel@tonic-gate 	uint_t count;
10030Sstevel@tonic-gate 
10040Sstevel@tonic-gate 	if (rw == KSTAT_WRITE)
10050Sstevel@tonic-gate 		return (EACCES);
10060Sstevel@tonic-gate 
10070Sstevel@tonic-gate 	count = 0;
10080Sstevel@tonic-gate 	memlist_read_lock();
10090Sstevel@tonic-gate 	for (pmem = phys_install; pmem != NULL; pmem = pmem->next) {
10100Sstevel@tonic-gate 		count++;
10110Sstevel@tonic-gate 	}
10120Sstevel@tonic-gate 	memlist_read_unlock();
10130Sstevel@tonic-gate 
10140Sstevel@tonic-gate 	ksp->ks_ndata = count;
10150Sstevel@tonic-gate 	ksp->ks_data_size = count * 2 * sizeof (uint64_t);
10160Sstevel@tonic-gate 
10170Sstevel@tonic-gate 	return (0);
10180Sstevel@tonic-gate }
10190Sstevel@tonic-gate 
10200Sstevel@tonic-gate static int
10210Sstevel@tonic-gate mm_kstat_snapshot(kstat_t *ksp, void *buf, int rw)
10220Sstevel@tonic-gate {
10230Sstevel@tonic-gate 	struct memlist *pmem;
10240Sstevel@tonic-gate 	struct memunit {
10250Sstevel@tonic-gate 		uint64_t address;
10260Sstevel@tonic-gate 		uint64_t size;
10270Sstevel@tonic-gate 	} *kspmem;
10280Sstevel@tonic-gate 
10290Sstevel@tonic-gate 	if (rw == KSTAT_WRITE)
10300Sstevel@tonic-gate 		return (EACCES);
10310Sstevel@tonic-gate 
10320Sstevel@tonic-gate 	ksp->ks_snaptime = gethrtime();
10330Sstevel@tonic-gate 
10340Sstevel@tonic-gate 	kspmem = (struct memunit *)buf;
10350Sstevel@tonic-gate 	memlist_read_lock();
10360Sstevel@tonic-gate 	for (pmem = phys_install; pmem != NULL; pmem = pmem->next, kspmem++) {
10370Sstevel@tonic-gate 		if ((caddr_t)kspmem >= (caddr_t)buf + ksp->ks_data_size)
10380Sstevel@tonic-gate 			break;
10390Sstevel@tonic-gate 		kspmem->address = pmem->address;
10400Sstevel@tonic-gate 		kspmem->size = pmem->size;
10410Sstevel@tonic-gate 	}
10420Sstevel@tonic-gate 	memlist_read_unlock();
10430Sstevel@tonic-gate 
10440Sstevel@tonic-gate 	return (0);
10450Sstevel@tonic-gate }
10461186Sayznaga 
10471186Sayznaga /*
10481186Sayznaga  * Read a mem_name_t from user-space and store it in the mem_name_t
10491186Sayznaga  * pointed to by the mem_name argument.
10501186Sayznaga  */
10511186Sayznaga static int
10521186Sayznaga mm_read_mem_name(intptr_t data, mem_name_t *mem_name)
10531186Sayznaga {
10541186Sayznaga 	if (get_udatamodel() == DATAMODEL_NATIVE) {
10551186Sayznaga 		if (copyin((void *)data, mem_name, sizeof (mem_name_t)))
10561186Sayznaga 			return (EFAULT);
10571186Sayznaga 	}
10581186Sayznaga #ifdef	_SYSCALL32
10591186Sayznaga 	else {
10601186Sayznaga 		mem_name32_t mem_name32;
10611186Sayznaga 
10621186Sayznaga 		if (copyin((void *)data, &mem_name32, sizeof (mem_name32_t)))
10631186Sayznaga 			return (EFAULT);
10641186Sayznaga 		mem_name->m_addr = mem_name32.m_addr;
10651186Sayznaga 		mem_name->m_synd = mem_name32.m_synd;
10661186Sayznaga 		mem_name->m_type[0] = mem_name32.m_type[0];
10671186Sayznaga 		mem_name->m_type[1] = mem_name32.m_type[1];
10681283Sayznaga 		mem_name->m_name = (caddr_t)(uintptr_t)mem_name32.m_name;
10691186Sayznaga 		mem_name->m_namelen = (size_t)mem_name32.m_namelen;
10701283Sayznaga 		mem_name->m_sid = (caddr_t)(uintptr_t)mem_name32.m_sid;
10711186Sayznaga 		mem_name->m_sidlen = (size_t)mem_name32.m_sidlen;
10721186Sayznaga 	}
10731186Sayznaga #endif	/* _SYSCALL32 */
10741186Sayznaga 
10751186Sayznaga 	return (0);
10761186Sayznaga }
10771186Sayznaga 
10781186Sayznaga /*
10791186Sayznaga  * Read a mem_page_t from user-space and store it in the mem_page_t
10801186Sayznaga  * pointed to by the mpage argument.
10811186Sayznaga  */
10821186Sayznaga static int
10831186Sayznaga mm_read_mem_page(intptr_t data, mem_page_t *mpage)
10841186Sayznaga {
10851186Sayznaga 	if (get_udatamodel() == DATAMODEL_NATIVE) {
10861186Sayznaga 		if (copyin((void *)data, mpage, sizeof (mem_page_t)) != 0)
10871186Sayznaga 			return (EFAULT);
10881186Sayznaga 	}
10891186Sayznaga #ifdef _SYSCALL32
10901186Sayznaga 	else {
10911186Sayznaga 		mem_page32_t	mpage32;
10921186Sayznaga 
10931186Sayznaga 		if (copyin((void *)data, &mpage32, sizeof (mem_page32_t)) != 0)
10941186Sayznaga 			return (EFAULT);
10951186Sayznaga 
10961186Sayznaga 		mpage->m_fmri = (caddr_t)(uintptr_t)mpage32.m_fmri;
10971186Sayznaga 		mpage->m_fmrisz = mpage32.m_fmrisz;
10981186Sayznaga 	}
10991186Sayznaga #endif	/* _SYSCALL32 */
11001186Sayznaga 
11011186Sayznaga 	return (0);
11021186Sayznaga }
11031186Sayznaga 
11041186Sayznaga /*
11051186Sayznaga  * Expand an FMRI from a mem_page_t.
11061186Sayznaga  */
11071186Sayznaga static int
11081186Sayznaga mm_get_mem_fmri(mem_page_t *mpage, nvlist_t **nvl)
11091186Sayznaga {
11101186Sayznaga 	char *buf;
11111186Sayznaga 	int err;
11121186Sayznaga 
11131186Sayznaga 	if (mpage->m_fmri == NULL || mpage->m_fmrisz > MEM_FMRI_MAX_BUFSIZE)
11141186Sayznaga 		return (EINVAL);
11151186Sayznaga 
11161186Sayznaga 	buf = kmem_alloc(mpage->m_fmrisz, KM_SLEEP);
11171186Sayznaga 	if (copyin(mpage->m_fmri, buf, mpage->m_fmrisz) != 0) {
11181186Sayznaga 		kmem_free(buf, mpage->m_fmrisz);
11191186Sayznaga 		return (EFAULT);
11201186Sayznaga 	}
11211186Sayznaga 
11221186Sayznaga 	err = nvlist_unpack(buf, mpage->m_fmrisz, nvl, KM_SLEEP);
11231186Sayznaga 	kmem_free(buf, mpage->m_fmrisz);
11241186Sayznaga 
11251186Sayznaga 	return (err);
11261186Sayznaga }
11271186Sayznaga 
11281186Sayznaga static int
11291186Sayznaga mm_get_paddr(nvlist_t *nvl, uint64_t *paddr)
11301186Sayznaga {
11311186Sayznaga 	uint8_t version;
11321189Sayznaga 	uint64_t pa;
11331186Sayznaga 	char *scheme;
11341189Sayznaga #ifdef __sparc
11351189Sayznaga 	uint64_t offset;
11361186Sayznaga 	char *unum;
11371186Sayznaga 	char **serids;
11381186Sayznaga 	uint_t nserids;
11391186Sayznaga 	int err;
11401189Sayznaga #endif
11411186Sayznaga 
11421186Sayznaga 	/* Verify FMRI scheme name and version number */
11431186Sayznaga 	if ((nvlist_lookup_string(nvl, FM_FMRI_SCHEME, &scheme) != 0) ||
11441186Sayznaga 	    (strcmp(scheme, FM_FMRI_SCHEME_MEM) != 0) ||
11451186Sayznaga 	    (nvlist_lookup_uint8(nvl, FM_VERSION, &version) != 0) ||
11461186Sayznaga 	    version > FM_MEM_SCHEME_VERSION) {
11471186Sayznaga 		return (EINVAL);
11481186Sayznaga 	}
11491186Sayznaga 
11501186Sayznaga 	/*
11511186Sayznaga 	 * There are two ways a physical address can be  obtained from a mem
11521186Sayznaga 	 * scheme FMRI.  One way is to use the "offset" and  "serial"
11531186Sayznaga 	 * members, if they are present, together with the "unum" member to
11541186Sayznaga 	 * calculate a physical address.  This is the preferred way since
11551186Sayznaga 	 * it is independent of possible changes to the programming of
11561186Sayznaga 	 * underlying hardware registers that may change the physical address.
11571186Sayznaga 	 * If the "offset" member is not present, then the address is
11581186Sayznaga 	 * retrieved from the "physaddr" member.
11591186Sayznaga 	 */
11601414Scindi #if defined(__sparc)
11611186Sayznaga 	if (nvlist_lookup_uint64(nvl, FM_FMRI_MEM_OFFSET, &offset) != 0) {
11621186Sayznaga 		if (nvlist_lookup_uint64(nvl, FM_FMRI_MEM_PHYSADDR, &pa) !=
11631186Sayznaga 		    0) {
11641186Sayznaga 			return (EINVAL);
11651186Sayznaga 		}
11661186Sayznaga 	} else if (nvlist_lookup_string(nvl, FM_FMRI_MEM_UNUM, &unum) != 0 ||
11671186Sayznaga 	    nvlist_lookup_string_array(nvl, FM_FMRI_MEM_SERIAL_ID, &serids,
11681186Sayznaga 	    &nserids) != 0) {
11691186Sayznaga 		return (EINVAL);
11701186Sayznaga 	} else {
1171*1463Sayznaga 		err = cpu_get_mem_addr(unum, serids[0], offset, &pa);
1172*1463Sayznaga 		if (err != 0) {
1173*1463Sayznaga 			if (err == ENOTSUP) {
1174*1463Sayznaga 				/* Fall back to physaddr */
1175*1463Sayznaga 				if (nvlist_lookup_uint64(nvl,
1176*1463Sayznaga 				    FM_FMRI_MEM_PHYSADDR, &pa) != 0)
1177*1463Sayznaga 					return (EINVAL);
1178*1463Sayznaga 			} else
1179*1463Sayznaga 				return (err);
1180*1463Sayznaga 		}
11811186Sayznaga 	}
11821414Scindi #elif defined(__i386) || defined(__amd64)
11831414Scindi 	if (cmi_mc_unumtopa(NULL, nvl, &pa) == 0)
11841187Sayznaga 		return (EINVAL);
11851414Scindi #else
11861414Scindi #error "port me"
11871187Sayznaga #endif /* __sparc */
11881186Sayznaga 
11891186Sayznaga 	*paddr = pa;
11901186Sayznaga 	return (0);
11911186Sayznaga }
1192