/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */
/*
 * Copyright 2008 Sun Microsystems, Inc. All rights reserved.
 * Use is subject to license terms.
240Sstevel@tonic-gate */ 250Sstevel@tonic-gate 260Sstevel@tonic-gate #pragma ident "%Z%%M% %I% %E% SMI" 270Sstevel@tonic-gate 280Sstevel@tonic-gate /* 290Sstevel@tonic-gate * Memory special file 300Sstevel@tonic-gate */ 310Sstevel@tonic-gate 320Sstevel@tonic-gate #include <sys/types.h> 330Sstevel@tonic-gate #include <sys/param.h> 340Sstevel@tonic-gate #include <sys/user.h> 350Sstevel@tonic-gate #include <sys/buf.h> 360Sstevel@tonic-gate #include <sys/systm.h> 370Sstevel@tonic-gate #include <sys/cred.h> 380Sstevel@tonic-gate #include <sys/vm.h> 390Sstevel@tonic-gate #include <sys/uio.h> 400Sstevel@tonic-gate #include <sys/mman.h> 410Sstevel@tonic-gate #include <sys/kmem.h> 420Sstevel@tonic-gate #include <vm/seg.h> 430Sstevel@tonic-gate #include <vm/page.h> 440Sstevel@tonic-gate #include <sys/stat.h> 450Sstevel@tonic-gate #include <sys/vmem.h> 460Sstevel@tonic-gate #include <sys/memlist.h> 470Sstevel@tonic-gate #include <sys/bootconf.h> 480Sstevel@tonic-gate 490Sstevel@tonic-gate #include <vm/seg_vn.h> 500Sstevel@tonic-gate #include <vm/seg_dev.h> 510Sstevel@tonic-gate #include <vm/seg_kmem.h> 520Sstevel@tonic-gate #include <vm/seg_kp.h> 530Sstevel@tonic-gate #include <vm/seg_kpm.h> 540Sstevel@tonic-gate #include <vm/hat.h> 550Sstevel@tonic-gate 560Sstevel@tonic-gate #include <sys/conf.h> 570Sstevel@tonic-gate #include <sys/mem.h> 580Sstevel@tonic-gate #include <sys/types.h> 590Sstevel@tonic-gate #include <sys/conf.h> 600Sstevel@tonic-gate #include <sys/param.h> 610Sstevel@tonic-gate #include <sys/systm.h> 620Sstevel@tonic-gate #include <sys/errno.h> 630Sstevel@tonic-gate #include <sys/modctl.h> 640Sstevel@tonic-gate #include <sys/memlist.h> 650Sstevel@tonic-gate #include <sys/ddi.h> 660Sstevel@tonic-gate #include <sys/sunddi.h> 670Sstevel@tonic-gate #include <sys/debug.h> 681186Sayznaga #include <sys/fm/protocol.h> 690Sstevel@tonic-gate 701414Scindi #if defined(__sparc) 710Sstevel@tonic-gate extern int cpu_get_mem_name(uint64_t, uint64_t *, uint64_t, char *, int, 
int *); 720Sstevel@tonic-gate extern int cpu_get_mem_info(uint64_t, uint64_t, uint64_t *, uint64_t *, 730Sstevel@tonic-gate uint64_t *, int *, int *, int *); 740Sstevel@tonic-gate extern size_t cpu_get_name_bufsize(void); 751186Sayznaga extern int cpu_get_mem_sid(char *, char *, int, int *); 761186Sayznaga extern int cpu_get_mem_addr(char *, char *, uint64_t, uint64_t *); 773446Smrj #elif defined(__x86) 781414Scindi #include <sys/cpu_module.h> 791186Sayznaga #endif /* __sparc */ 800Sstevel@tonic-gate 810Sstevel@tonic-gate /* 820Sstevel@tonic-gate * Turn a byte length into a pagecount. The DDI btop takes a 830Sstevel@tonic-gate * 32-bit size on 32-bit machines, this handles 64-bit sizes for 840Sstevel@tonic-gate * large physical-memory 32-bit machines. 850Sstevel@tonic-gate */ 860Sstevel@tonic-gate #define BTOP(x) ((pgcnt_t)((x) >> _pageshift)) 870Sstevel@tonic-gate 880Sstevel@tonic-gate static kmutex_t mm_lock; 890Sstevel@tonic-gate static caddr_t mm_map; 900Sstevel@tonic-gate 910Sstevel@tonic-gate static dev_info_t *mm_dip; /* private copy of devinfo pointer */ 920Sstevel@tonic-gate 930Sstevel@tonic-gate static int mm_kmem_io_access; 940Sstevel@tonic-gate 950Sstevel@tonic-gate static int mm_kstat_update(kstat_t *ksp, int rw); 960Sstevel@tonic-gate static int mm_kstat_snapshot(kstat_t *ksp, void *buf, int rw); 970Sstevel@tonic-gate 981186Sayznaga static int mm_read_mem_name(intptr_t data, mem_name_t *mem_name); 991186Sayznaga static int mm_read_mem_page(intptr_t data, mem_page_t *mpage); 1001186Sayznaga static int mm_get_mem_fmri(mem_page_t *mpage, nvlist_t **nvl); 1011186Sayznaga static int mm_get_paddr(nvlist_t *nvl, uint64_t *paddr); 1021186Sayznaga 1030Sstevel@tonic-gate /*ARGSUSED1*/ 1040Sstevel@tonic-gate static int 1050Sstevel@tonic-gate mm_attach(dev_info_t *devi, ddi_attach_cmd_t cmd) 1060Sstevel@tonic-gate { 1070Sstevel@tonic-gate int i; 1080Sstevel@tonic-gate struct mem_minor { 1090Sstevel@tonic-gate char *name; 1100Sstevel@tonic-gate minor_t minor; 
1110Sstevel@tonic-gate int privonly; 1120Sstevel@tonic-gate const char *rdpriv; 1130Sstevel@tonic-gate const char *wrpriv; 1140Sstevel@tonic-gate mode_t priv_mode; 1150Sstevel@tonic-gate } mm[] = { 1160Sstevel@tonic-gate { "mem", M_MEM, 0, NULL, "all", 0640 }, 1170Sstevel@tonic-gate { "kmem", M_KMEM, 0, NULL, "all", 0640 }, 1180Sstevel@tonic-gate { "allkmem", M_ALLKMEM, 0, "all", "all", 0600 }, 1190Sstevel@tonic-gate { "null", M_NULL, PRIVONLY_DEV, NULL, NULL, 0666 }, 1200Sstevel@tonic-gate { "zero", M_ZERO, PRIVONLY_DEV, NULL, NULL, 0666 }, 1210Sstevel@tonic-gate }; 1220Sstevel@tonic-gate kstat_t *ksp; 1230Sstevel@tonic-gate 1240Sstevel@tonic-gate mutex_init(&mm_lock, NULL, MUTEX_DEFAULT, NULL); 1250Sstevel@tonic-gate mm_map = vmem_alloc(heap_arena, PAGESIZE, VM_SLEEP); 1260Sstevel@tonic-gate 1270Sstevel@tonic-gate for (i = 0; i < (sizeof (mm) / sizeof (mm[0])); i++) { 1280Sstevel@tonic-gate if (ddi_create_priv_minor_node(devi, mm[i].name, S_IFCHR, 1290Sstevel@tonic-gate mm[i].minor, DDI_PSEUDO, mm[i].privonly, 1300Sstevel@tonic-gate mm[i].rdpriv, mm[i].wrpriv, mm[i].priv_mode) == 1310Sstevel@tonic-gate DDI_FAILURE) { 1320Sstevel@tonic-gate ddi_remove_minor_node(devi, NULL); 1330Sstevel@tonic-gate return (DDI_FAILURE); 1340Sstevel@tonic-gate } 1350Sstevel@tonic-gate } 1360Sstevel@tonic-gate 1370Sstevel@tonic-gate mm_dip = devi; 1380Sstevel@tonic-gate 1390Sstevel@tonic-gate ksp = kstat_create("mm", 0, "phys_installed", "misc", 1400Sstevel@tonic-gate KSTAT_TYPE_RAW, 0, KSTAT_FLAG_VAR_SIZE | KSTAT_FLAG_VIRTUAL); 1410Sstevel@tonic-gate if (ksp != NULL) { 1420Sstevel@tonic-gate ksp->ks_update = mm_kstat_update; 1430Sstevel@tonic-gate ksp->ks_snapshot = mm_kstat_snapshot; 1440Sstevel@tonic-gate ksp->ks_lock = &mm_lock; /* XXX - not really needed */ 1450Sstevel@tonic-gate kstat_install(ksp); 1460Sstevel@tonic-gate } 1470Sstevel@tonic-gate 1480Sstevel@tonic-gate mm_kmem_io_access = ddi_getprop(DDI_DEV_T_ANY, devi, DDI_PROP_DONTPASS, 1490Sstevel@tonic-gate 
"kmem_io_access", 0); 1500Sstevel@tonic-gate 1510Sstevel@tonic-gate return (DDI_SUCCESS); 1520Sstevel@tonic-gate } 1530Sstevel@tonic-gate 1540Sstevel@tonic-gate /*ARGSUSED*/ 1550Sstevel@tonic-gate static int 1560Sstevel@tonic-gate mm_info(dev_info_t *dip, ddi_info_cmd_t infocmd, void *arg, void **result) 1570Sstevel@tonic-gate { 1580Sstevel@tonic-gate register int error; 1590Sstevel@tonic-gate 1600Sstevel@tonic-gate switch (infocmd) { 1610Sstevel@tonic-gate case DDI_INFO_DEVT2DEVINFO: 1620Sstevel@tonic-gate *result = (void *)mm_dip; 1630Sstevel@tonic-gate error = DDI_SUCCESS; 1640Sstevel@tonic-gate break; 1650Sstevel@tonic-gate case DDI_INFO_DEVT2INSTANCE: 1660Sstevel@tonic-gate *result = (void *)0; 1670Sstevel@tonic-gate error = DDI_SUCCESS; 1680Sstevel@tonic-gate break; 1690Sstevel@tonic-gate default: 1700Sstevel@tonic-gate error = DDI_FAILURE; 1710Sstevel@tonic-gate } 1720Sstevel@tonic-gate return (error); 1730Sstevel@tonic-gate } 1740Sstevel@tonic-gate 1750Sstevel@tonic-gate /*ARGSUSED1*/ 1760Sstevel@tonic-gate static int 1770Sstevel@tonic-gate mmopen(dev_t *devp, int flag, int typ, struct cred *cred) 1780Sstevel@tonic-gate { 1790Sstevel@tonic-gate switch (getminor(*devp)) { 1800Sstevel@tonic-gate case M_NULL: 1810Sstevel@tonic-gate case M_ZERO: 1820Sstevel@tonic-gate case M_MEM: 1830Sstevel@tonic-gate case M_KMEM: 1840Sstevel@tonic-gate case M_ALLKMEM: 1850Sstevel@tonic-gate /* standard devices */ 1860Sstevel@tonic-gate break; 1870Sstevel@tonic-gate 1880Sstevel@tonic-gate default: 1890Sstevel@tonic-gate /* Unsupported or unknown type */ 1900Sstevel@tonic-gate return (EINVAL); 1910Sstevel@tonic-gate } 1926731Scth /* must be character device */ 1936731Scth if (typ != OTYP_CHR) 1946731Scth return (EINVAL); 1950Sstevel@tonic-gate return (0); 1960Sstevel@tonic-gate } 1970Sstevel@tonic-gate 1980Sstevel@tonic-gate struct pollhead mm_pollhd; 1990Sstevel@tonic-gate 2000Sstevel@tonic-gate /*ARGSUSED*/ 2010Sstevel@tonic-gate static int 2020Sstevel@tonic-gate 
mmchpoll(dev_t dev, short events, int anyyet, short *reventsp, 2030Sstevel@tonic-gate struct pollhead **phpp) 2040Sstevel@tonic-gate { 2050Sstevel@tonic-gate switch (getminor(dev)) { 2060Sstevel@tonic-gate case M_NULL: 2070Sstevel@tonic-gate case M_ZERO: 2080Sstevel@tonic-gate case M_MEM: 2090Sstevel@tonic-gate case M_KMEM: 2100Sstevel@tonic-gate case M_ALLKMEM: 2110Sstevel@tonic-gate *reventsp = events & (POLLIN | POLLOUT | POLLPRI | POLLRDNORM | 2124374Smb91622 POLLWRNORM | POLLRDBAND | POLLWRBAND); 2130Sstevel@tonic-gate /* 2140Sstevel@tonic-gate * A non NULL pollhead pointer should be returned in case 2150Sstevel@tonic-gate * user polls for 0 events. 2160Sstevel@tonic-gate */ 2170Sstevel@tonic-gate *phpp = !anyyet && !*reventsp ? 2180Sstevel@tonic-gate &mm_pollhd : (struct pollhead *)NULL; 2190Sstevel@tonic-gate return (0); 2200Sstevel@tonic-gate default: 2210Sstevel@tonic-gate /* no other devices currently support polling */ 2220Sstevel@tonic-gate return (ENXIO); 2230Sstevel@tonic-gate } 2240Sstevel@tonic-gate } 2250Sstevel@tonic-gate 2260Sstevel@tonic-gate static int 2270Sstevel@tonic-gate mmpropop(dev_t dev, dev_info_t *dip, ddi_prop_op_t prop_op, int flags, 2280Sstevel@tonic-gate char *name, caddr_t valuep, int *lengthp) 2290Sstevel@tonic-gate { 2300Sstevel@tonic-gate /* 2310Sstevel@tonic-gate * implement zero size to reduce overhead (avoid two failing 2320Sstevel@tonic-gate * property lookups per stat). 
2330Sstevel@tonic-gate */ 2340Sstevel@tonic-gate return (ddi_prop_op_size(dev, dip, prop_op, 2350Sstevel@tonic-gate flags, name, valuep, lengthp, 0)); 2360Sstevel@tonic-gate } 2370Sstevel@tonic-gate 2380Sstevel@tonic-gate static int 2390Sstevel@tonic-gate mmio(struct uio *uio, enum uio_rw rw, pfn_t pfn, off_t pageoff, int allowio) 2400Sstevel@tonic-gate { 2410Sstevel@tonic-gate int error = 0; 2420Sstevel@tonic-gate size_t nbytes = MIN((size_t)(PAGESIZE - pageoff), 2430Sstevel@tonic-gate (size_t)uio->uio_iov->iov_len); 2440Sstevel@tonic-gate 2450Sstevel@tonic-gate mutex_enter(&mm_lock); 2460Sstevel@tonic-gate hat_devload(kas.a_hat, mm_map, PAGESIZE, pfn, 2470Sstevel@tonic-gate (uint_t)(rw == UIO_READ ? PROT_READ : PROT_READ | PROT_WRITE), 2480Sstevel@tonic-gate HAT_LOAD_NOCONSIST | HAT_LOAD_LOCK); 2490Sstevel@tonic-gate 2500Sstevel@tonic-gate if (!pf_is_memory(pfn)) { 2510Sstevel@tonic-gate if (allowio) { 2520Sstevel@tonic-gate size_t c = uio->uio_iov->iov_len; 2530Sstevel@tonic-gate 2540Sstevel@tonic-gate if (ddi_peekpokeio(NULL, uio, rw, 2550Sstevel@tonic-gate (caddr_t)(uintptr_t)uio->uio_loffset, c, 2560Sstevel@tonic-gate sizeof (int32_t)) != DDI_SUCCESS) 2570Sstevel@tonic-gate error = EFAULT; 2580Sstevel@tonic-gate } else 2590Sstevel@tonic-gate error = EIO; 2600Sstevel@tonic-gate } else 2610Sstevel@tonic-gate error = uiomove(&mm_map[pageoff], nbytes, rw, uio); 2620Sstevel@tonic-gate 2630Sstevel@tonic-gate hat_unload(kas.a_hat, mm_map, PAGESIZE, HAT_UNLOAD_UNLOCK); 2640Sstevel@tonic-gate mutex_exit(&mm_lock); 2650Sstevel@tonic-gate return (error); 2660Sstevel@tonic-gate } 2670Sstevel@tonic-gate 268670Selowe static int 269670Selowe mmpagelock(struct as *as, caddr_t va) 270670Selowe { 271670Selowe struct seg *seg; 272670Selowe int i; 273670Selowe 274670Selowe AS_LOCK_ENTER(as, &as->a_lock, RW_READER); 275670Selowe seg = as_segat(as, va); 276670Selowe i = (seg != NULL)? 
SEGOP_CAPABLE(seg, S_CAPABILITY_NOMINFLT) : 0; 277670Selowe AS_LOCK_EXIT(as, &as->a_lock); 278670Selowe 279670Selowe return (i); 280670Selowe } 281670Selowe 2825084Sjohnlev #ifdef __sparc 2835084Sjohnlev 284670Selowe #define NEED_LOCK_KVADDR(kva) mmpagelock(&kas, kva) 2850Sstevel@tonic-gate 2860Sstevel@tonic-gate #else /* __i386, __amd64 */ 2870Sstevel@tonic-gate 2880Sstevel@tonic-gate #define NEED_LOCK_KVADDR(va) 0 2890Sstevel@tonic-gate 2900Sstevel@tonic-gate #endif /* __sparc */ 2910Sstevel@tonic-gate 2920Sstevel@tonic-gate /*ARGSUSED3*/ 2930Sstevel@tonic-gate static int 2940Sstevel@tonic-gate mmrw(dev_t dev, struct uio *uio, enum uio_rw rw, cred_t *cred) 2950Sstevel@tonic-gate { 2960Sstevel@tonic-gate pfn_t v; 2970Sstevel@tonic-gate struct iovec *iov; 2980Sstevel@tonic-gate int error = 0; 2990Sstevel@tonic-gate size_t c; 3000Sstevel@tonic-gate ssize_t oresid = uio->uio_resid; 3010Sstevel@tonic-gate minor_t minor = getminor(dev); 3020Sstevel@tonic-gate 3030Sstevel@tonic-gate while (uio->uio_resid > 0 && error == 0) { 3040Sstevel@tonic-gate iov = uio->uio_iov; 3050Sstevel@tonic-gate if (iov->iov_len == 0) { 3060Sstevel@tonic-gate uio->uio_iov++; 3070Sstevel@tonic-gate uio->uio_iovcnt--; 3080Sstevel@tonic-gate if (uio->uio_iovcnt < 0) 3090Sstevel@tonic-gate panic("mmrw"); 3100Sstevel@tonic-gate continue; 3110Sstevel@tonic-gate } 3120Sstevel@tonic-gate switch (minor) { 3130Sstevel@tonic-gate 3140Sstevel@tonic-gate case M_MEM: 3150Sstevel@tonic-gate memlist_read_lock(); 3160Sstevel@tonic-gate if (!address_in_memlist(phys_install, 3170Sstevel@tonic-gate (uint64_t)uio->uio_loffset, 1)) { 3180Sstevel@tonic-gate memlist_read_unlock(); 3190Sstevel@tonic-gate error = EFAULT; 3200Sstevel@tonic-gate break; 3210Sstevel@tonic-gate } 3220Sstevel@tonic-gate memlist_read_unlock(); 3230Sstevel@tonic-gate 3240Sstevel@tonic-gate v = BTOP((u_offset_t)uio->uio_loffset); 3250Sstevel@tonic-gate error = mmio(uio, rw, v, 3260Sstevel@tonic-gate uio->uio_loffset & PAGEOFFSET, 0); 
3270Sstevel@tonic-gate break; 3280Sstevel@tonic-gate 3290Sstevel@tonic-gate case M_KMEM: 3300Sstevel@tonic-gate case M_ALLKMEM: 3310Sstevel@tonic-gate { 3320Sstevel@tonic-gate page_t **ppp; 3330Sstevel@tonic-gate caddr_t vaddr = (caddr_t)uio->uio_offset; 3340Sstevel@tonic-gate int try_lock = NEED_LOCK_KVADDR(vaddr); 3350Sstevel@tonic-gate int locked = 0; 3360Sstevel@tonic-gate 3375084Sjohnlev if ((error = plat_mem_do_mmio(uio, rw)) != ENOTSUP) 3383446Smrj break; 3393446Smrj 3400Sstevel@tonic-gate /* 3410Sstevel@tonic-gate * If vaddr does not map a valid page, as_pagelock() 3420Sstevel@tonic-gate * will return failure. Hence we can't check the 3430Sstevel@tonic-gate * return value and return EFAULT here as we'd like. 3440Sstevel@tonic-gate * seg_kp and seg_kpm do not properly support 3450Sstevel@tonic-gate * as_pagelock() for this context so we avoid it 3460Sstevel@tonic-gate * using the try_lock set check above. Some day when 3470Sstevel@tonic-gate * the kernel page locking gets redesigned all this 3480Sstevel@tonic-gate * muck can be cleaned up. 
3490Sstevel@tonic-gate */ 3500Sstevel@tonic-gate if (try_lock) 3510Sstevel@tonic-gate locked = (as_pagelock(&kas, &ppp, vaddr, 3520Sstevel@tonic-gate PAGESIZE, S_WRITE) == 0); 3530Sstevel@tonic-gate 354513Sjongkis v = hat_getpfnum(kas.a_hat, 355513Sjongkis (caddr_t)(uintptr_t)uio->uio_loffset); 3560Sstevel@tonic-gate if (v == PFN_INVALID) { 3570Sstevel@tonic-gate if (locked) 3580Sstevel@tonic-gate as_pageunlock(&kas, ppp, vaddr, 3590Sstevel@tonic-gate PAGESIZE, S_WRITE); 3600Sstevel@tonic-gate error = EFAULT; 3610Sstevel@tonic-gate break; 3620Sstevel@tonic-gate } 3630Sstevel@tonic-gate 3640Sstevel@tonic-gate error = mmio(uio, rw, v, uio->uio_loffset & PAGEOFFSET, 3650Sstevel@tonic-gate minor == M_ALLKMEM || mm_kmem_io_access); 3660Sstevel@tonic-gate if (locked) 3670Sstevel@tonic-gate as_pageunlock(&kas, ppp, vaddr, PAGESIZE, 3680Sstevel@tonic-gate S_WRITE); 3690Sstevel@tonic-gate } 3700Sstevel@tonic-gate 3710Sstevel@tonic-gate break; 3720Sstevel@tonic-gate 3730Sstevel@tonic-gate case M_ZERO: 3740Sstevel@tonic-gate if (rw == UIO_READ) { 3750Sstevel@tonic-gate label_t ljb; 3760Sstevel@tonic-gate 3770Sstevel@tonic-gate if (on_fault(&ljb)) { 3780Sstevel@tonic-gate no_fault(); 3790Sstevel@tonic-gate error = EFAULT; 3800Sstevel@tonic-gate break; 3810Sstevel@tonic-gate } 3820Sstevel@tonic-gate uzero(iov->iov_base, iov->iov_len); 3830Sstevel@tonic-gate no_fault(); 3840Sstevel@tonic-gate uio->uio_resid -= iov->iov_len; 3850Sstevel@tonic-gate uio->uio_loffset += iov->iov_len; 3860Sstevel@tonic-gate break; 3870Sstevel@tonic-gate } 3880Sstevel@tonic-gate /* else it's a write, fall through to NULL case */ 3890Sstevel@tonic-gate /*FALLTHROUGH*/ 3900Sstevel@tonic-gate 3910Sstevel@tonic-gate case M_NULL: 3920Sstevel@tonic-gate if (rw == UIO_READ) 3930Sstevel@tonic-gate return (0); 3940Sstevel@tonic-gate c = iov->iov_len; 3950Sstevel@tonic-gate iov->iov_base += c; 3960Sstevel@tonic-gate iov->iov_len -= c; 3970Sstevel@tonic-gate uio->uio_loffset += c; 3980Sstevel@tonic-gate 
uio->uio_resid -= c; 3990Sstevel@tonic-gate break; 4000Sstevel@tonic-gate 4010Sstevel@tonic-gate } 4020Sstevel@tonic-gate } 4030Sstevel@tonic-gate return (uio->uio_resid == oresid ? error : 0); 4040Sstevel@tonic-gate } 4050Sstevel@tonic-gate 4060Sstevel@tonic-gate static int 4070Sstevel@tonic-gate mmread(dev_t dev, struct uio *uio, cred_t *cred) 4080Sstevel@tonic-gate { 4090Sstevel@tonic-gate return (mmrw(dev, uio, UIO_READ, cred)); 4100Sstevel@tonic-gate } 4110Sstevel@tonic-gate 4120Sstevel@tonic-gate static int 4130Sstevel@tonic-gate mmwrite(dev_t dev, struct uio *uio, cred_t *cred) 4140Sstevel@tonic-gate { 4150Sstevel@tonic-gate return (mmrw(dev, uio, UIO_WRITE, cred)); 4160Sstevel@tonic-gate } 4170Sstevel@tonic-gate 4180Sstevel@tonic-gate /* 4190Sstevel@tonic-gate * Private ioctl for libkvm to support kvm_physaddr(). 4200Sstevel@tonic-gate * Given an address space and a VA, compute the PA. 4210Sstevel@tonic-gate */ 4220Sstevel@tonic-gate static int 4230Sstevel@tonic-gate mmioctl_vtop(intptr_t data) 4240Sstevel@tonic-gate { 4251414Scindi #ifdef _SYSCALL32 4261414Scindi mem_vtop32_t vtop32; 4271414Scindi #endif 4280Sstevel@tonic-gate mem_vtop_t mem_vtop; 4290Sstevel@tonic-gate proc_t *p; 4300Sstevel@tonic-gate pfn_t pfn = (pfn_t)PFN_INVALID; 4310Sstevel@tonic-gate pid_t pid = 0; 4320Sstevel@tonic-gate struct as *as; 4330Sstevel@tonic-gate struct seg *seg; 4340Sstevel@tonic-gate 4351414Scindi if (get_udatamodel() == DATAMODEL_NATIVE) { 4361414Scindi if (copyin((void *)data, &mem_vtop, sizeof (mem_vtop_t))) 4371414Scindi return (EFAULT); 4381414Scindi } 4391414Scindi #ifdef _SYSCALL32 4401414Scindi else { 4411414Scindi if (copyin((void *)data, &vtop32, sizeof (mem_vtop32_t))) 4421414Scindi return (EFAULT); 4431717Swesolows mem_vtop.m_as = (struct as *)(uintptr_t)vtop32.m_as; 4441717Swesolows mem_vtop.m_va = (void *)(uintptr_t)vtop32.m_va; 4451414Scindi 4461414Scindi if (mem_vtop.m_as != NULL) 4471414Scindi return (EINVAL); 4481414Scindi } 4491414Scindi #endif 
4501414Scindi 4510Sstevel@tonic-gate if (mem_vtop.m_as == &kas) { 4520Sstevel@tonic-gate pfn = hat_getpfnum(kas.a_hat, mem_vtop.m_va); 4530Sstevel@tonic-gate } else { 4541414Scindi if (mem_vtop.m_as == NULL) { 4551414Scindi /* 4561414Scindi * Assume the calling process's address space if the 4571414Scindi * caller didn't specify one. 4581414Scindi */ 4591414Scindi p = curthread->t_procp; 4601414Scindi if (p == NULL) 4611414Scindi return (EIO); 4621414Scindi mem_vtop.m_as = p->p_as; 4631414Scindi } 4641414Scindi 4650Sstevel@tonic-gate mutex_enter(&pidlock); 4660Sstevel@tonic-gate for (p = practive; p != NULL; p = p->p_next) { 4670Sstevel@tonic-gate if (p->p_as == mem_vtop.m_as) { 4680Sstevel@tonic-gate pid = p->p_pid; 4690Sstevel@tonic-gate break; 4700Sstevel@tonic-gate } 4710Sstevel@tonic-gate } 4720Sstevel@tonic-gate mutex_exit(&pidlock); 4730Sstevel@tonic-gate if (p == NULL) 4740Sstevel@tonic-gate return (EIO); 4750Sstevel@tonic-gate p = sprlock(pid); 4760Sstevel@tonic-gate if (p == NULL) 4770Sstevel@tonic-gate return (EIO); 4780Sstevel@tonic-gate as = p->p_as; 4790Sstevel@tonic-gate if (as == mem_vtop.m_as) { 4800Sstevel@tonic-gate mutex_exit(&p->p_lock); 4810Sstevel@tonic-gate AS_LOCK_ENTER(as, &as->a_lock, RW_READER); 4820Sstevel@tonic-gate for (seg = AS_SEGFIRST(as); seg != NULL; 4830Sstevel@tonic-gate seg = AS_SEGNEXT(as, seg)) 4840Sstevel@tonic-gate if ((uintptr_t)mem_vtop.m_va - 4850Sstevel@tonic-gate (uintptr_t)seg->s_base < seg->s_size) 4860Sstevel@tonic-gate break; 4870Sstevel@tonic-gate if (seg != NULL) 4880Sstevel@tonic-gate pfn = hat_getpfnum(as->a_hat, mem_vtop.m_va); 4890Sstevel@tonic-gate AS_LOCK_EXIT(as, &as->a_lock); 4900Sstevel@tonic-gate mutex_enter(&p->p_lock); 4910Sstevel@tonic-gate } 4920Sstevel@tonic-gate sprunlock(p); 4930Sstevel@tonic-gate } 4940Sstevel@tonic-gate mem_vtop.m_pfn = pfn; 4950Sstevel@tonic-gate if (pfn == PFN_INVALID) 4960Sstevel@tonic-gate return (EIO); 4971414Scindi 4981414Scindi if (get_udatamodel() == DATAMODEL_NATIVE) 
{ 4991414Scindi if (copyout(&mem_vtop, (void *)data, sizeof (mem_vtop_t))) 5001414Scindi return (EFAULT); 5011414Scindi } 5021414Scindi #ifdef _SYSCALL32 5031414Scindi else { 5041414Scindi vtop32.m_pfn = mem_vtop.m_pfn; 5051414Scindi if (copyout(&vtop32, (void *)data, sizeof (mem_vtop32_t))) 5061414Scindi return (EFAULT); 5071414Scindi } 5081414Scindi #endif 5090Sstevel@tonic-gate 5100Sstevel@tonic-gate return (0); 5110Sstevel@tonic-gate } 5120Sstevel@tonic-gate 5130Sstevel@tonic-gate /* 514917Selowe * Given a PA, execute the given page retire command on it. 5150Sstevel@tonic-gate */ 5160Sstevel@tonic-gate static int 5170Sstevel@tonic-gate mmioctl_page_retire(int cmd, intptr_t data) 5180Sstevel@tonic-gate { 519917Selowe extern int page_retire_test(void); 5200Sstevel@tonic-gate uint64_t pa; 5210Sstevel@tonic-gate 522917Selowe if (copyin((void *)data, &pa, sizeof (uint64_t))) { 523917Selowe return (EFAULT); 5240Sstevel@tonic-gate } 5250Sstevel@tonic-gate 526917Selowe switch (cmd) { 527917Selowe case MEM_PAGE_ISRETIRED: 528917Selowe return (page_retire_check(pa, NULL)); 529917Selowe 530917Selowe case MEM_PAGE_UNRETIRE: 531917Selowe return (page_unretire(pa)); 532917Selowe 533917Selowe case MEM_PAGE_RETIRE: 534917Selowe return (page_retire(pa, PR_FMA)); 535917Selowe 536917Selowe case MEM_PAGE_RETIRE_MCE: 537917Selowe return (page_retire(pa, PR_MCE)); 538917Selowe 539917Selowe case MEM_PAGE_RETIRE_UE: 540917Selowe return (page_retire(pa, PR_UE)); 5410Sstevel@tonic-gate 542917Selowe case MEM_PAGE_GETERRORS: 543917Selowe { 544917Selowe uint64_t page_errors; 545917Selowe int rc = page_retire_check(pa, &page_errors); 546917Selowe if (copyout(&page_errors, (void *)data, 547917Selowe sizeof (uint64_t))) { 548917Selowe return (EFAULT); 549917Selowe } 550917Selowe return (rc); 551917Selowe } 552917Selowe 553917Selowe case MEM_PAGE_RETIRE_TEST: 554917Selowe return (page_retire_test()); 555917Selowe 556917Selowe } 557917Selowe 558917Selowe return (EINVAL); 5590Sstevel@tonic-gate 
} 5600Sstevel@tonic-gate 5611186Sayznaga /* 5621186Sayznaga * Given a mem-scheme FMRI for a page, execute the given page retire 5631186Sayznaga * command on it. 5641186Sayznaga */ 5651186Sayznaga static int 5661186Sayznaga mmioctl_page_fmri_retire(int cmd, intptr_t data) 5671186Sayznaga { 5681186Sayznaga mem_page_t mpage; 5691186Sayznaga uint64_t pa; 5701186Sayznaga nvlist_t *nvl; 5711186Sayznaga int err; 5721186Sayznaga 5731186Sayznaga if ((err = mm_read_mem_page(data, &mpage)) < 0) 5741186Sayznaga return (err); 5751186Sayznaga 5764374Smb91622 if ((err = mm_get_mem_fmri(&mpage, &nvl)) != 0) 5771186Sayznaga return (err); 5781186Sayznaga 5791414Scindi if ((err = mm_get_paddr(nvl, &pa)) != 0) { 5801186Sayznaga nvlist_free(nvl); 5811186Sayznaga return (err); 5821186Sayznaga } 5831186Sayznaga 5841186Sayznaga nvlist_free(nvl); 5851186Sayznaga 5861186Sayznaga switch (cmd) { 5871186Sayznaga case MEM_PAGE_FMRI_ISRETIRED: 5881186Sayznaga return (page_retire_check(pa, NULL)); 5891186Sayznaga 5901186Sayznaga case MEM_PAGE_FMRI_RETIRE: 5911186Sayznaga return (page_retire(pa, PR_FMA)); 5926111Scy152378 5936111Scy152378 case MEM_PAGE_FMRI_UNRETIRE: 5946111Scy152378 return (page_unretire(pa)); 5951186Sayznaga } 5961186Sayznaga 5971186Sayznaga return (EINVAL); 5981186Sayznaga } 5991186Sayznaga 6000Sstevel@tonic-gate #ifdef __sparc 6010Sstevel@tonic-gate /* 6020Sstevel@tonic-gate * Given a syndrome, syndrome type, and address return the 6030Sstevel@tonic-gate * associated memory name in the provided data buffer. 
6040Sstevel@tonic-gate */ 6050Sstevel@tonic-gate static int 6060Sstevel@tonic-gate mmioctl_get_mem_name(intptr_t data) 6070Sstevel@tonic-gate { 6080Sstevel@tonic-gate mem_name_t mem_name; 6090Sstevel@tonic-gate void *buf; 6100Sstevel@tonic-gate size_t bufsize; 6110Sstevel@tonic-gate int len, err; 6120Sstevel@tonic-gate 6130Sstevel@tonic-gate if ((bufsize = cpu_get_name_bufsize()) == 0) 6140Sstevel@tonic-gate return (ENOTSUP); 6150Sstevel@tonic-gate 6161186Sayznaga if ((err = mm_read_mem_name(data, &mem_name)) < 0) 6171186Sayznaga return (err); 6180Sstevel@tonic-gate 6190Sstevel@tonic-gate buf = kmem_alloc(bufsize, KM_SLEEP); 6200Sstevel@tonic-gate 6210Sstevel@tonic-gate /* 6220Sstevel@tonic-gate * Call into cpu specific code to do the lookup. 6230Sstevel@tonic-gate */ 6240Sstevel@tonic-gate if ((err = cpu_get_mem_name(mem_name.m_synd, mem_name.m_type, 6250Sstevel@tonic-gate mem_name.m_addr, buf, bufsize, &len)) != 0) { 6260Sstevel@tonic-gate kmem_free(buf, bufsize); 6270Sstevel@tonic-gate return (err); 6280Sstevel@tonic-gate } 6290Sstevel@tonic-gate 6300Sstevel@tonic-gate if (len >= mem_name.m_namelen) { 6310Sstevel@tonic-gate kmem_free(buf, bufsize); 632*6803Spothier return (ENOSPC); 6330Sstevel@tonic-gate } 6340Sstevel@tonic-gate 6350Sstevel@tonic-gate if (copyoutstr(buf, (char *)mem_name.m_name, 6360Sstevel@tonic-gate mem_name.m_namelen, NULL) != 0) { 6370Sstevel@tonic-gate kmem_free(buf, bufsize); 6380Sstevel@tonic-gate return (EFAULT); 6390Sstevel@tonic-gate } 6400Sstevel@tonic-gate 6410Sstevel@tonic-gate kmem_free(buf, bufsize); 6420Sstevel@tonic-gate return (0); 6430Sstevel@tonic-gate } 6440Sstevel@tonic-gate 6450Sstevel@tonic-gate /* 6460Sstevel@tonic-gate * Given a syndrome and address return information about the associated memory. 
6470Sstevel@tonic-gate */ 6480Sstevel@tonic-gate static int 6490Sstevel@tonic-gate mmioctl_get_mem_info(intptr_t data) 6500Sstevel@tonic-gate { 6510Sstevel@tonic-gate mem_info_t mem_info; 6520Sstevel@tonic-gate int err; 6530Sstevel@tonic-gate 6540Sstevel@tonic-gate if (copyin((void *)data, &mem_info, sizeof (mem_info_t))) 6550Sstevel@tonic-gate return (EFAULT); 6560Sstevel@tonic-gate 6570Sstevel@tonic-gate if ((err = cpu_get_mem_info(mem_info.m_synd, mem_info.m_addr, 6580Sstevel@tonic-gate &mem_info.m_mem_size, &mem_info.m_seg_size, &mem_info.m_bank_size, 6590Sstevel@tonic-gate &mem_info.m_segments, &mem_info.m_banks, &mem_info.m_mcid)) != 0) 6600Sstevel@tonic-gate return (err); 6610Sstevel@tonic-gate 6620Sstevel@tonic-gate if (copyout(&mem_info, (void *)data, sizeof (mem_info_t)) != 0) 6630Sstevel@tonic-gate return (EFAULT); 6640Sstevel@tonic-gate 6650Sstevel@tonic-gate return (0); 6660Sstevel@tonic-gate } 6671186Sayznaga 6681186Sayznaga /* 6691186Sayznaga * Given a memory name, return its associated serial id 6701186Sayznaga */ 6711186Sayznaga static int 6721186Sayznaga mmioctl_get_mem_sid(intptr_t data) 6731186Sayznaga { 6741186Sayznaga mem_name_t mem_name; 6751186Sayznaga void *buf; 6761186Sayznaga void *name; 6771186Sayznaga size_t name_len; 6781186Sayznaga size_t bufsize; 6791186Sayznaga int len, err; 6801186Sayznaga 6811186Sayznaga if ((bufsize = cpu_get_name_bufsize()) == 0) 6821186Sayznaga return (ENOTSUP); 6831186Sayznaga 6841186Sayznaga if ((err = mm_read_mem_name(data, &mem_name)) < 0) 6851186Sayznaga return (err); 6861186Sayznaga 6871186Sayznaga buf = kmem_alloc(bufsize, KM_SLEEP); 6881186Sayznaga 6891186Sayznaga if (mem_name.m_namelen > 1024) 6901186Sayznaga mem_name.m_namelen = 1024; /* cap at 1024 bytes */ 6911186Sayznaga 6921186Sayznaga name = kmem_alloc(mem_name.m_namelen, KM_SLEEP); 6931186Sayznaga 6941186Sayznaga if ((err = copyinstr((char *)mem_name.m_name, (char *)name, 6951186Sayznaga mem_name.m_namelen, &name_len)) != 0) { 6961186Sayznaga 
kmem_free(buf, bufsize); 6971186Sayznaga kmem_free(name, mem_name.m_namelen); 6981186Sayznaga return (err); 6991186Sayznaga } 7001186Sayznaga 7011186Sayznaga /* 7021186Sayznaga * Call into cpu specific code to do the lookup. 7031186Sayznaga */ 7041186Sayznaga if ((err = cpu_get_mem_sid(name, buf, bufsize, &len)) != 0) { 7051186Sayznaga kmem_free(buf, bufsize); 7061186Sayznaga kmem_free(name, mem_name.m_namelen); 7071186Sayznaga return (err); 7081186Sayznaga } 7091186Sayznaga 7101186Sayznaga if (len > mem_name.m_sidlen) { 7111186Sayznaga kmem_free(buf, bufsize); 7121186Sayznaga kmem_free(name, mem_name.m_namelen); 7131186Sayznaga return (ENAMETOOLONG); 7141186Sayznaga } 7151186Sayznaga 7161186Sayznaga if (copyoutstr(buf, (char *)mem_name.m_sid, 7171186Sayznaga mem_name.m_sidlen, NULL) != 0) { 7181186Sayznaga kmem_free(buf, bufsize); 7191186Sayznaga kmem_free(name, mem_name.m_namelen); 7201186Sayznaga return (EFAULT); 7211186Sayznaga } 7221186Sayznaga 7231186Sayznaga kmem_free(buf, bufsize); 7241186Sayznaga kmem_free(name, mem_name.m_namelen); 7251186Sayznaga return (0); 7261186Sayznaga } 7270Sstevel@tonic-gate #endif /* __sparc */ 7280Sstevel@tonic-gate 7290Sstevel@tonic-gate /* 7300Sstevel@tonic-gate * Private ioctls for 7310Sstevel@tonic-gate * libkvm to support kvm_physaddr(). 7320Sstevel@tonic-gate * FMA support for page_retire() and memory attribute information. 
7330Sstevel@tonic-gate */ 7340Sstevel@tonic-gate /*ARGSUSED*/ 7350Sstevel@tonic-gate static int 7360Sstevel@tonic-gate mmioctl(dev_t dev, int cmd, intptr_t data, int flag, cred_t *cred, int *rvalp) 7370Sstevel@tonic-gate { 7381283Sayznaga if ((cmd == MEM_VTOP && getminor(dev) != M_KMEM) || 7391283Sayznaga (cmd != MEM_VTOP && getminor(dev) != M_MEM)) 7401186Sayznaga return (ENXIO); 7411186Sayznaga 7420Sstevel@tonic-gate switch (cmd) { 7430Sstevel@tonic-gate case MEM_VTOP: 7440Sstevel@tonic-gate return (mmioctl_vtop(data)); 7450Sstevel@tonic-gate 7460Sstevel@tonic-gate case MEM_PAGE_RETIRE: 7470Sstevel@tonic-gate case MEM_PAGE_ISRETIRED: 748917Selowe case MEM_PAGE_UNRETIRE: 749917Selowe case MEM_PAGE_RETIRE_MCE: 750917Selowe case MEM_PAGE_RETIRE_UE: 751917Selowe case MEM_PAGE_GETERRORS: 752917Selowe case MEM_PAGE_RETIRE_TEST: 7530Sstevel@tonic-gate return (mmioctl_page_retire(cmd, data)); 7540Sstevel@tonic-gate 7551186Sayznaga case MEM_PAGE_FMRI_RETIRE: 7561186Sayznaga case MEM_PAGE_FMRI_ISRETIRED: 7576111Scy152378 case MEM_PAGE_FMRI_UNRETIRE: 7581186Sayznaga return (mmioctl_page_fmri_retire(cmd, data)); 7591186Sayznaga 7600Sstevel@tonic-gate #ifdef __sparc 7611186Sayznaga case MEM_NAME: 7620Sstevel@tonic-gate return (mmioctl_get_mem_name(data)); 7630Sstevel@tonic-gate 7640Sstevel@tonic-gate case MEM_INFO: 7650Sstevel@tonic-gate return (mmioctl_get_mem_info(data)); 7661186Sayznaga 7671186Sayznaga case MEM_SID: 7681186Sayznaga return (mmioctl_get_mem_sid(data)); 7690Sstevel@tonic-gate #else 7701186Sayznaga case MEM_NAME: 7711186Sayznaga case MEM_INFO: 7721186Sayznaga case MEM_SID: 7730Sstevel@tonic-gate return (ENOTSUP); 7741186Sayznaga #endif /* __sparc */ 7750Sstevel@tonic-gate } 7760Sstevel@tonic-gate return (ENXIO); 7770Sstevel@tonic-gate } 7780Sstevel@tonic-gate 7790Sstevel@tonic-gate /*ARGSUSED2*/ 7800Sstevel@tonic-gate static int 7810Sstevel@tonic-gate mmmmap(dev_t dev, off_t off, int prot) 7820Sstevel@tonic-gate { 7830Sstevel@tonic-gate pfn_t pf; 
7840Sstevel@tonic-gate struct memlist *pmem; 7850Sstevel@tonic-gate minor_t minor = getminor(dev); 7860Sstevel@tonic-gate 7870Sstevel@tonic-gate switch (minor) { 7880Sstevel@tonic-gate case M_MEM: 7890Sstevel@tonic-gate pf = btop(off); 7900Sstevel@tonic-gate memlist_read_lock(); 7910Sstevel@tonic-gate for (pmem = phys_install; pmem != NULL; pmem = pmem->next) { 7920Sstevel@tonic-gate if (pf >= BTOP(pmem->address) && 7930Sstevel@tonic-gate pf < BTOP(pmem->address + pmem->size)) { 7940Sstevel@tonic-gate memlist_read_unlock(); 7950Sstevel@tonic-gate return (impl_obmem_pfnum(pf)); 7960Sstevel@tonic-gate } 7970Sstevel@tonic-gate } 7980Sstevel@tonic-gate memlist_read_unlock(); 7990Sstevel@tonic-gate break; 8000Sstevel@tonic-gate 8010Sstevel@tonic-gate case M_KMEM: 8020Sstevel@tonic-gate case M_ALLKMEM: 8030Sstevel@tonic-gate /* no longer supported with KPR */ 8040Sstevel@tonic-gate return (-1); 8050Sstevel@tonic-gate 8060Sstevel@tonic-gate case M_ZERO: 8070Sstevel@tonic-gate /* 8080Sstevel@tonic-gate * We shouldn't be mmap'ing to /dev/zero here as 8090Sstevel@tonic-gate * mmsegmap() should have already converted 8100Sstevel@tonic-gate * a mapping request for this device to a mapping 8110Sstevel@tonic-gate * using seg_vn for anonymous memory. 8120Sstevel@tonic-gate */ 8130Sstevel@tonic-gate break; 8140Sstevel@tonic-gate 8150Sstevel@tonic-gate } 8160Sstevel@tonic-gate return (-1); 8170Sstevel@tonic-gate } 8180Sstevel@tonic-gate 8190Sstevel@tonic-gate /* 8200Sstevel@tonic-gate * This function is called when a memory device is mmap'ed. 8210Sstevel@tonic-gate * Set up the mapping to the correct device driver. 
8220Sstevel@tonic-gate */ 8230Sstevel@tonic-gate static int 8240Sstevel@tonic-gate mmsegmap(dev_t dev, off_t off, struct as *as, caddr_t *addrp, off_t len, 8250Sstevel@tonic-gate uint_t prot, uint_t maxprot, uint_t flags, struct cred *cred) 8260Sstevel@tonic-gate { 8270Sstevel@tonic-gate struct segvn_crargs vn_a; 8280Sstevel@tonic-gate struct segdev_crargs dev_a; 8290Sstevel@tonic-gate int error; 8300Sstevel@tonic-gate minor_t minor; 8310Sstevel@tonic-gate off_t i; 8320Sstevel@tonic-gate 8330Sstevel@tonic-gate minor = getminor(dev); 8340Sstevel@tonic-gate 8350Sstevel@tonic-gate as_rangelock(as); 8366036Smec /* 8376036Smec * No need to worry about vac alignment on /dev/zero 8386036Smec * since this is a "clone" object that doesn't yet exist. 8396036Smec */ 8406036Smec error = choose_addr(as, addrp, len, off, 8416036Smec (minor == M_MEM) || (minor == M_KMEM), flags); 8426036Smec if (error != 0) { 8436036Smec as_rangeunlock(as); 8446036Smec return (error); 8450Sstevel@tonic-gate } 8460Sstevel@tonic-gate 8470Sstevel@tonic-gate switch (minor) { 8480Sstevel@tonic-gate case M_MEM: 8490Sstevel@tonic-gate /* /dev/mem cannot be mmap'ed with MAP_PRIVATE */ 8500Sstevel@tonic-gate if ((flags & MAP_TYPE) != MAP_SHARED) { 8510Sstevel@tonic-gate as_rangeunlock(as); 8520Sstevel@tonic-gate return (EINVAL); 8530Sstevel@tonic-gate } 8540Sstevel@tonic-gate 8550Sstevel@tonic-gate /* 8560Sstevel@tonic-gate * Check to ensure that the entire range is 8570Sstevel@tonic-gate * legal and we are not trying to map in 8580Sstevel@tonic-gate * more than the device will let us. 8590Sstevel@tonic-gate */ 8600Sstevel@tonic-gate for (i = 0; i < len; i += PAGESIZE) { 8610Sstevel@tonic-gate if (mmmmap(dev, off + i, maxprot) == -1) { 8620Sstevel@tonic-gate as_rangeunlock(as); 8630Sstevel@tonic-gate return (ENXIO); 8640Sstevel@tonic-gate } 8650Sstevel@tonic-gate } 8660Sstevel@tonic-gate 8670Sstevel@tonic-gate /* 8680Sstevel@tonic-gate * Use seg_dev segment driver for /dev/mem mapping. 
8690Sstevel@tonic-gate */ 8700Sstevel@tonic-gate dev_a.mapfunc = mmmmap; 8710Sstevel@tonic-gate dev_a.dev = dev; 8720Sstevel@tonic-gate dev_a.offset = off; 8730Sstevel@tonic-gate dev_a.type = (flags & MAP_TYPE); 8740Sstevel@tonic-gate dev_a.prot = (uchar_t)prot; 8750Sstevel@tonic-gate dev_a.maxprot = (uchar_t)maxprot; 8760Sstevel@tonic-gate dev_a.hat_attr = 0; 8770Sstevel@tonic-gate 8780Sstevel@tonic-gate /* 8790Sstevel@tonic-gate * Make /dev/mem mappings non-consistent since we can't 8800Sstevel@tonic-gate * alias pages that don't have page structs behind them, 8810Sstevel@tonic-gate * such as kernel stack pages. If someone mmap()s a kernel 8820Sstevel@tonic-gate * stack page and if we give him a tte with cv, a line from 8830Sstevel@tonic-gate * that page can get into both pages of the spitfire d$. 8840Sstevel@tonic-gate * But snoop from another processor will only invalidate 8850Sstevel@tonic-gate * the first page. This later caused kernel (xc_attention) 8860Sstevel@tonic-gate * to go into an infinite loop at pil 13 and no interrupts 8870Sstevel@tonic-gate * could come in. See 1203630. 8880Sstevel@tonic-gate * 8890Sstevel@tonic-gate */ 8900Sstevel@tonic-gate dev_a.hat_flags = HAT_LOAD_NOCONSIST; 8910Sstevel@tonic-gate dev_a.devmap_data = NULL; 8920Sstevel@tonic-gate 8930Sstevel@tonic-gate error = as_map(as, *addrp, len, segdev_create, &dev_a); 8940Sstevel@tonic-gate break; 8950Sstevel@tonic-gate 8960Sstevel@tonic-gate case M_ZERO: 8970Sstevel@tonic-gate /* 8980Sstevel@tonic-gate * Use seg_vn segment driver for /dev/zero mapping. 8990Sstevel@tonic-gate * Passing in a NULL amp gives us the "cloning" effect. 
9000Sstevel@tonic-gate */ 9010Sstevel@tonic-gate vn_a.vp = NULL; 9020Sstevel@tonic-gate vn_a.offset = 0; 9030Sstevel@tonic-gate vn_a.type = (flags & MAP_TYPE); 9040Sstevel@tonic-gate vn_a.prot = prot; 9050Sstevel@tonic-gate vn_a.maxprot = maxprot; 9060Sstevel@tonic-gate vn_a.flags = flags & ~MAP_TYPE; 9070Sstevel@tonic-gate vn_a.cred = cred; 9080Sstevel@tonic-gate vn_a.amp = NULL; 9090Sstevel@tonic-gate vn_a.szc = 0; 9100Sstevel@tonic-gate vn_a.lgrp_mem_policy_flags = 0; 9110Sstevel@tonic-gate error = as_map(as, *addrp, len, segvn_create, &vn_a); 9120Sstevel@tonic-gate break; 9130Sstevel@tonic-gate 9140Sstevel@tonic-gate case M_KMEM: 9150Sstevel@tonic-gate case M_ALLKMEM: 9160Sstevel@tonic-gate /* No longer supported with KPR. */ 9170Sstevel@tonic-gate error = ENXIO; 9180Sstevel@tonic-gate break; 9190Sstevel@tonic-gate 9200Sstevel@tonic-gate case M_NULL: 9210Sstevel@tonic-gate /* 9220Sstevel@tonic-gate * Use seg_dev segment driver for /dev/null mapping. 9230Sstevel@tonic-gate */ 9240Sstevel@tonic-gate dev_a.mapfunc = mmmmap; 9250Sstevel@tonic-gate dev_a.dev = dev; 9260Sstevel@tonic-gate dev_a.offset = off; 9270Sstevel@tonic-gate dev_a.type = 0; /* neither PRIVATE nor SHARED */ 9280Sstevel@tonic-gate dev_a.prot = dev_a.maxprot = (uchar_t)PROT_NONE; 9290Sstevel@tonic-gate dev_a.hat_attr = 0; 9300Sstevel@tonic-gate dev_a.hat_flags = 0; 9310Sstevel@tonic-gate error = as_map(as, *addrp, len, segdev_create, &dev_a); 9320Sstevel@tonic-gate break; 9330Sstevel@tonic-gate 9340Sstevel@tonic-gate default: 9350Sstevel@tonic-gate error = ENXIO; 9360Sstevel@tonic-gate } 9370Sstevel@tonic-gate 9380Sstevel@tonic-gate as_rangeunlock(as); 9390Sstevel@tonic-gate return (error); 9400Sstevel@tonic-gate } 9410Sstevel@tonic-gate 9420Sstevel@tonic-gate static struct cb_ops mm_cb_ops = { 9430Sstevel@tonic-gate mmopen, /* open */ 9440Sstevel@tonic-gate nulldev, /* close */ 9450Sstevel@tonic-gate nodev, /* strategy */ 9460Sstevel@tonic-gate nodev, /* print */ 9470Sstevel@tonic-gate nodev, /* 
dump */ 9480Sstevel@tonic-gate mmread, /* read */ 9490Sstevel@tonic-gate mmwrite, /* write */ 9500Sstevel@tonic-gate mmioctl, /* ioctl */ 9510Sstevel@tonic-gate nodev, /* devmap */ 9520Sstevel@tonic-gate mmmmap, /* mmap */ 9530Sstevel@tonic-gate mmsegmap, /* segmap */ 9540Sstevel@tonic-gate mmchpoll, /* poll */ 9550Sstevel@tonic-gate mmpropop, /* prop_op */ 9560Sstevel@tonic-gate 0, /* streamtab */ 9570Sstevel@tonic-gate D_NEW | D_MP | D_64BIT | D_U64BIT 9580Sstevel@tonic-gate }; 9590Sstevel@tonic-gate 9600Sstevel@tonic-gate static struct dev_ops mm_ops = { 9610Sstevel@tonic-gate DEVO_REV, /* devo_rev, */ 9620Sstevel@tonic-gate 0, /* refcnt */ 9630Sstevel@tonic-gate mm_info, /* get_dev_info */ 9640Sstevel@tonic-gate nulldev, /* identify */ 9650Sstevel@tonic-gate nulldev, /* probe */ 9660Sstevel@tonic-gate mm_attach, /* attach */ 9670Sstevel@tonic-gate nodev, /* detach */ 9680Sstevel@tonic-gate nodev, /* reset */ 9690Sstevel@tonic-gate &mm_cb_ops, /* driver operations */ 9700Sstevel@tonic-gate (struct bus_ops *)0 /* bus operations */ 9710Sstevel@tonic-gate }; 9720Sstevel@tonic-gate 9730Sstevel@tonic-gate static struct modldrv modldrv = { 9740Sstevel@tonic-gate &mod_driverops, "memory driver %I%", &mm_ops, 9750Sstevel@tonic-gate }; 9760Sstevel@tonic-gate 9770Sstevel@tonic-gate static struct modlinkage modlinkage = { 9780Sstevel@tonic-gate MODREV_1, &modldrv, NULL 9790Sstevel@tonic-gate }; 9800Sstevel@tonic-gate 9810Sstevel@tonic-gate int 9820Sstevel@tonic-gate _init(void) 9830Sstevel@tonic-gate { 9840Sstevel@tonic-gate return (mod_install(&modlinkage)); 9850Sstevel@tonic-gate } 9860Sstevel@tonic-gate 9870Sstevel@tonic-gate int 9880Sstevel@tonic-gate _info(struct modinfo *modinfop) 9890Sstevel@tonic-gate { 9900Sstevel@tonic-gate return (mod_info(&modlinkage, modinfop)); 9910Sstevel@tonic-gate } 9920Sstevel@tonic-gate 9930Sstevel@tonic-gate int 9940Sstevel@tonic-gate _fini(void) 9950Sstevel@tonic-gate { 9960Sstevel@tonic-gate return (mod_remove(&modlinkage)); 
9970Sstevel@tonic-gate } 9980Sstevel@tonic-gate 9990Sstevel@tonic-gate static int 10000Sstevel@tonic-gate mm_kstat_update(kstat_t *ksp, int rw) 10010Sstevel@tonic-gate { 10020Sstevel@tonic-gate struct memlist *pmem; 10030Sstevel@tonic-gate uint_t count; 10040Sstevel@tonic-gate 10050Sstevel@tonic-gate if (rw == KSTAT_WRITE) 10060Sstevel@tonic-gate return (EACCES); 10070Sstevel@tonic-gate 10080Sstevel@tonic-gate count = 0; 10090Sstevel@tonic-gate memlist_read_lock(); 10100Sstevel@tonic-gate for (pmem = phys_install; pmem != NULL; pmem = pmem->next) { 10110Sstevel@tonic-gate count++; 10120Sstevel@tonic-gate } 10130Sstevel@tonic-gate memlist_read_unlock(); 10140Sstevel@tonic-gate 10150Sstevel@tonic-gate ksp->ks_ndata = count; 10160Sstevel@tonic-gate ksp->ks_data_size = count * 2 * sizeof (uint64_t); 10170Sstevel@tonic-gate 10180Sstevel@tonic-gate return (0); 10190Sstevel@tonic-gate } 10200Sstevel@tonic-gate 10210Sstevel@tonic-gate static int 10220Sstevel@tonic-gate mm_kstat_snapshot(kstat_t *ksp, void *buf, int rw) 10230Sstevel@tonic-gate { 10240Sstevel@tonic-gate struct memlist *pmem; 10250Sstevel@tonic-gate struct memunit { 10260Sstevel@tonic-gate uint64_t address; 10270Sstevel@tonic-gate uint64_t size; 10280Sstevel@tonic-gate } *kspmem; 10290Sstevel@tonic-gate 10300Sstevel@tonic-gate if (rw == KSTAT_WRITE) 10310Sstevel@tonic-gate return (EACCES); 10320Sstevel@tonic-gate 10330Sstevel@tonic-gate ksp->ks_snaptime = gethrtime(); 10340Sstevel@tonic-gate 10350Sstevel@tonic-gate kspmem = (struct memunit *)buf; 10360Sstevel@tonic-gate memlist_read_lock(); 10370Sstevel@tonic-gate for (pmem = phys_install; pmem != NULL; pmem = pmem->next, kspmem++) { 10380Sstevel@tonic-gate if ((caddr_t)kspmem >= (caddr_t)buf + ksp->ks_data_size) 10390Sstevel@tonic-gate break; 10400Sstevel@tonic-gate kspmem->address = pmem->address; 10410Sstevel@tonic-gate kspmem->size = pmem->size; 10420Sstevel@tonic-gate } 10430Sstevel@tonic-gate memlist_read_unlock(); 10440Sstevel@tonic-gate 
10450Sstevel@tonic-gate return (0); 10460Sstevel@tonic-gate } 10471186Sayznaga 10481186Sayznaga /* 10491186Sayznaga * Read a mem_name_t from user-space and store it in the mem_name_t 10501186Sayznaga * pointed to by the mem_name argument. 10511186Sayznaga */ 10521186Sayznaga static int 10531186Sayznaga mm_read_mem_name(intptr_t data, mem_name_t *mem_name) 10541186Sayznaga { 10551186Sayznaga if (get_udatamodel() == DATAMODEL_NATIVE) { 10561186Sayznaga if (copyin((void *)data, mem_name, sizeof (mem_name_t))) 10571186Sayznaga return (EFAULT); 10581186Sayznaga } 10591186Sayznaga #ifdef _SYSCALL32 10601186Sayznaga else { 10611186Sayznaga mem_name32_t mem_name32; 10621186Sayznaga 10631186Sayznaga if (copyin((void *)data, &mem_name32, sizeof (mem_name32_t))) 10641186Sayznaga return (EFAULT); 10651186Sayznaga mem_name->m_addr = mem_name32.m_addr; 10661186Sayznaga mem_name->m_synd = mem_name32.m_synd; 10671186Sayznaga mem_name->m_type[0] = mem_name32.m_type[0]; 10681186Sayznaga mem_name->m_type[1] = mem_name32.m_type[1]; 10691283Sayznaga mem_name->m_name = (caddr_t)(uintptr_t)mem_name32.m_name; 10701186Sayznaga mem_name->m_namelen = (size_t)mem_name32.m_namelen; 10711283Sayznaga mem_name->m_sid = (caddr_t)(uintptr_t)mem_name32.m_sid; 10721186Sayznaga mem_name->m_sidlen = (size_t)mem_name32.m_sidlen; 10731186Sayznaga } 10741186Sayznaga #endif /* _SYSCALL32 */ 10751186Sayznaga 10761186Sayznaga return (0); 10771186Sayznaga } 10781186Sayznaga 10791186Sayznaga /* 10801186Sayznaga * Read a mem_page_t from user-space and store it in the mem_page_t 10811186Sayznaga * pointed to by the mpage argument. 
10821186Sayznaga */ 10831186Sayznaga static int 10841186Sayznaga mm_read_mem_page(intptr_t data, mem_page_t *mpage) 10851186Sayznaga { 10861186Sayznaga if (get_udatamodel() == DATAMODEL_NATIVE) { 10871186Sayznaga if (copyin((void *)data, mpage, sizeof (mem_page_t)) != 0) 10881186Sayznaga return (EFAULT); 10891186Sayznaga } 10901186Sayznaga #ifdef _SYSCALL32 10911186Sayznaga else { 10921186Sayznaga mem_page32_t mpage32; 10931186Sayznaga 10941186Sayznaga if (copyin((void *)data, &mpage32, sizeof (mem_page32_t)) != 0) 10951186Sayznaga return (EFAULT); 10961186Sayznaga 10971186Sayznaga mpage->m_fmri = (caddr_t)(uintptr_t)mpage32.m_fmri; 10981186Sayznaga mpage->m_fmrisz = mpage32.m_fmrisz; 10991186Sayznaga } 11001186Sayznaga #endif /* _SYSCALL32 */ 11011186Sayznaga 11021186Sayznaga return (0); 11031186Sayznaga } 11041186Sayznaga 11051186Sayznaga /* 11061186Sayznaga * Expand an FMRI from a mem_page_t. 11071186Sayznaga */ 11081186Sayznaga static int 11091186Sayznaga mm_get_mem_fmri(mem_page_t *mpage, nvlist_t **nvl) 11101186Sayznaga { 11111186Sayznaga char *buf; 11121186Sayznaga int err; 11131186Sayznaga 11141186Sayznaga if (mpage->m_fmri == NULL || mpage->m_fmrisz > MEM_FMRI_MAX_BUFSIZE) 11151186Sayznaga return (EINVAL); 11161186Sayznaga 11171186Sayznaga buf = kmem_alloc(mpage->m_fmrisz, KM_SLEEP); 11181186Sayznaga if (copyin(mpage->m_fmri, buf, mpage->m_fmrisz) != 0) { 11191186Sayznaga kmem_free(buf, mpage->m_fmrisz); 11201186Sayznaga return (EFAULT); 11211186Sayznaga } 11221186Sayznaga 11231186Sayznaga err = nvlist_unpack(buf, mpage->m_fmrisz, nvl, KM_SLEEP); 11241186Sayznaga kmem_free(buf, mpage->m_fmrisz); 11251186Sayznaga 11261186Sayznaga return (err); 11271186Sayznaga } 11281186Sayznaga 11291186Sayznaga static int 11301186Sayznaga mm_get_paddr(nvlist_t *nvl, uint64_t *paddr) 11311186Sayznaga { 11321186Sayznaga uint8_t version; 11331189Sayznaga uint64_t pa; 11341186Sayznaga char *scheme; 11355254Sgavinm int err; 11361189Sayznaga #ifdef __sparc 11371189Sayznaga 
uint64_t offset; 11381186Sayznaga char *unum; 11391186Sayznaga char **serids; 11401186Sayznaga uint_t nserids; 11411189Sayznaga #endif 11421186Sayznaga 11431186Sayznaga /* Verify FMRI scheme name and version number */ 11441186Sayznaga if ((nvlist_lookup_string(nvl, FM_FMRI_SCHEME, &scheme) != 0) || 11451186Sayznaga (strcmp(scheme, FM_FMRI_SCHEME_MEM) != 0) || 11461186Sayznaga (nvlist_lookup_uint8(nvl, FM_VERSION, &version) != 0) || 11471186Sayznaga version > FM_MEM_SCHEME_VERSION) { 11481186Sayznaga return (EINVAL); 11491186Sayznaga } 11501186Sayznaga 11511186Sayznaga /* 11521186Sayznaga * There are two ways a physical address can be obtained from a mem 11531186Sayznaga * scheme FMRI. One way is to use the "offset" and "serial" 11541186Sayznaga * members, if they are present, together with the "unum" member to 11551186Sayznaga * calculate a physical address. This is the preferred way since 11561186Sayznaga * it is independent of possible changes to the programming of 11571186Sayznaga * underlying hardware registers that may change the physical address. 11581186Sayznaga * If the "offset" member is not present, then the address is 11591186Sayznaga * retrieved from the "physaddr" member. 
11601186Sayznaga */ 11611414Scindi #if defined(__sparc) 11621186Sayznaga if (nvlist_lookup_uint64(nvl, FM_FMRI_MEM_OFFSET, &offset) != 0) { 11631186Sayznaga if (nvlist_lookup_uint64(nvl, FM_FMRI_MEM_PHYSADDR, &pa) != 11641186Sayznaga 0) { 11651186Sayznaga return (EINVAL); 11661186Sayznaga } 11671186Sayznaga } else if (nvlist_lookup_string(nvl, FM_FMRI_MEM_UNUM, &unum) != 0 || 11681186Sayznaga nvlist_lookup_string_array(nvl, FM_FMRI_MEM_SERIAL_ID, &serids, 11691186Sayznaga &nserids) != 0) { 11701186Sayznaga return (EINVAL); 11711186Sayznaga } else { 11721463Sayznaga err = cpu_get_mem_addr(unum, serids[0], offset, &pa); 11731463Sayznaga if (err != 0) { 11741463Sayznaga if (err == ENOTSUP) { 11751463Sayznaga /* Fall back to physaddr */ 11761463Sayznaga if (nvlist_lookup_uint64(nvl, 11771463Sayznaga FM_FMRI_MEM_PHYSADDR, &pa) != 0) 11781463Sayznaga return (EINVAL); 11791463Sayznaga } else 11801463Sayznaga return (err); 11811463Sayznaga } 11821186Sayznaga } 11833446Smrj #elif defined(__x86) 11845254Sgavinm if ((err = cmi_mc_unumtopa(NULL, nvl, &pa)) != CMI_SUCCESS && 11855254Sgavinm err != CMIERR_MC_PARTIALUNUMTOPA) 11861187Sayznaga return (EINVAL); 11871414Scindi #else 11881414Scindi #error "port me" 11891187Sayznaga #endif /* __sparc */ 11901186Sayznaga 11911186Sayznaga *paddr = pa; 11921186Sayznaga return (0); 11931186Sayznaga } 1194