xref: /illumos-gate/usr/src/uts/common/io/mem.c (revision db874c57ae335a07060499f1492b0d0e2593e26c)
17c478bd9Sstevel@tonic-gate /*
27c478bd9Sstevel@tonic-gate  * CDDL HEADER START
37c478bd9Sstevel@tonic-gate  *
47c478bd9Sstevel@tonic-gate  * The contents of this file are subject to the terms of the
57c478bd9Sstevel@tonic-gate  * Common Development and Distribution License, Version 1.0 only
67c478bd9Sstevel@tonic-gate  * (the "License").  You may not use this file except in compliance
77c478bd9Sstevel@tonic-gate  * with the License.
87c478bd9Sstevel@tonic-gate  *
97c478bd9Sstevel@tonic-gate  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
107c478bd9Sstevel@tonic-gate  * or http://www.opensolaris.org/os/licensing.
117c478bd9Sstevel@tonic-gate  * See the License for the specific language governing permissions
127c478bd9Sstevel@tonic-gate  * and limitations under the License.
137c478bd9Sstevel@tonic-gate  *
147c478bd9Sstevel@tonic-gate  * When distributing Covered Code, include this CDDL HEADER in each
157c478bd9Sstevel@tonic-gate  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
167c478bd9Sstevel@tonic-gate  * If applicable, add the following below this CDDL HEADER, with the
177c478bd9Sstevel@tonic-gate  * fields enclosed by brackets "[]" replaced with your own identifying
187c478bd9Sstevel@tonic-gate  * information: Portions Copyright [yyyy] [name of copyright owner]
197c478bd9Sstevel@tonic-gate  *
207c478bd9Sstevel@tonic-gate  * CDDL HEADER END
217c478bd9Sstevel@tonic-gate  */
227c478bd9Sstevel@tonic-gate /*
237c478bd9Sstevel@tonic-gate  * Copyright 2005 Sun Microsystems, Inc.  All rights reserved.
247c478bd9Sstevel@tonic-gate  * Use is subject to license terms.
257c478bd9Sstevel@tonic-gate  */
267c478bd9Sstevel@tonic-gate 
277c478bd9Sstevel@tonic-gate #pragma ident	"%Z%%M%	%I%	%E% SMI"
287c478bd9Sstevel@tonic-gate 
297c478bd9Sstevel@tonic-gate /*
307c478bd9Sstevel@tonic-gate  * Memory special file
317c478bd9Sstevel@tonic-gate  */
327c478bd9Sstevel@tonic-gate 
337c478bd9Sstevel@tonic-gate #include <sys/types.h>
347c478bd9Sstevel@tonic-gate #include <sys/param.h>
357c478bd9Sstevel@tonic-gate #include <sys/user.h>
367c478bd9Sstevel@tonic-gate #include <sys/buf.h>
377c478bd9Sstevel@tonic-gate #include <sys/systm.h>
387c478bd9Sstevel@tonic-gate #include <sys/cred.h>
397c478bd9Sstevel@tonic-gate #include <sys/vm.h>
407c478bd9Sstevel@tonic-gate #include <sys/uio.h>
417c478bd9Sstevel@tonic-gate #include <sys/mman.h>
427c478bd9Sstevel@tonic-gate #include <sys/kmem.h>
437c478bd9Sstevel@tonic-gate #include <vm/seg.h>
447c478bd9Sstevel@tonic-gate #include <vm/page.h>
457c478bd9Sstevel@tonic-gate #include <sys/stat.h>
467c478bd9Sstevel@tonic-gate #include <sys/vmem.h>
477c478bd9Sstevel@tonic-gate #include <sys/memlist.h>
487c478bd9Sstevel@tonic-gate #include <sys/bootconf.h>
497c478bd9Sstevel@tonic-gate 
507c478bd9Sstevel@tonic-gate #include <vm/seg_vn.h>
517c478bd9Sstevel@tonic-gate #include <vm/seg_dev.h>
527c478bd9Sstevel@tonic-gate #include <vm/seg_kmem.h>
537c478bd9Sstevel@tonic-gate #include <vm/seg_kp.h>
547c478bd9Sstevel@tonic-gate #include <vm/seg_kpm.h>
557c478bd9Sstevel@tonic-gate #include <vm/hat.h>
567c478bd9Sstevel@tonic-gate 
577c478bd9Sstevel@tonic-gate #include <sys/conf.h>
587c478bd9Sstevel@tonic-gate #include <sys/mem.h>
597c478bd9Sstevel@tonic-gate #include <sys/types.h>
607c478bd9Sstevel@tonic-gate #include <sys/conf.h>
617c478bd9Sstevel@tonic-gate #include <sys/param.h>
627c478bd9Sstevel@tonic-gate #include <sys/systm.h>
637c478bd9Sstevel@tonic-gate #include <sys/errno.h>
647c478bd9Sstevel@tonic-gate #include <sys/modctl.h>
657c478bd9Sstevel@tonic-gate #include <sys/memlist.h>
667c478bd9Sstevel@tonic-gate #include <sys/ddi.h>
677c478bd9Sstevel@tonic-gate #include <sys/sunddi.h>
687c478bd9Sstevel@tonic-gate #include <sys/debug.h>
697c478bd9Sstevel@tonic-gate 
#ifdef __sparc
/*
 * CPU-module routines used by the MEM_NAME and MEM_INFO ioctl handlers.
 */
extern int cpu_get_mem_name(uint64_t synd, uint64_t *type, uint64_t addr,
    char *buf, int buflen, int *lenp);
extern int cpu_get_mem_info(uint64_t synd, uint64_t addr,
    uint64_t *mem_sizep, uint64_t *seg_sizep, uint64_t *bank_sizep,
    int *segmentsp, int *banksp, int *mcidp);
extern size_t cpu_get_name_bufsize(void);
#endif
767c478bd9Sstevel@tonic-gate 
777c478bd9Sstevel@tonic-gate /*
787c478bd9Sstevel@tonic-gate  * Turn a byte length into a pagecount.  The DDI btop takes a
797c478bd9Sstevel@tonic-gate  * 32-bit size on 32-bit machines, this handles 64-bit sizes for
807c478bd9Sstevel@tonic-gate  * large physical-memory 32-bit machines.
817c478bd9Sstevel@tonic-gate  */
827c478bd9Sstevel@tonic-gate #define	BTOP(x)	((pgcnt_t)((x) >> _pageshift))
837c478bd9Sstevel@tonic-gate 
847c478bd9Sstevel@tonic-gate static kmutex_t mm_lock;
857c478bd9Sstevel@tonic-gate static caddr_t mm_map;
867c478bd9Sstevel@tonic-gate 
877c478bd9Sstevel@tonic-gate static dev_info_t *mm_dip;	/* private copy of devinfo pointer */
887c478bd9Sstevel@tonic-gate 
897c478bd9Sstevel@tonic-gate static int mm_kmem_io_access;
907c478bd9Sstevel@tonic-gate 
917c478bd9Sstevel@tonic-gate static int mm_kstat_update(kstat_t *ksp, int rw);
927c478bd9Sstevel@tonic-gate static int mm_kstat_snapshot(kstat_t *ksp, void *buf, int rw);
937c478bd9Sstevel@tonic-gate 
947c478bd9Sstevel@tonic-gate /*ARGSUSED1*/
957c478bd9Sstevel@tonic-gate static int
967c478bd9Sstevel@tonic-gate mm_attach(dev_info_t *devi, ddi_attach_cmd_t cmd)
977c478bd9Sstevel@tonic-gate {
987c478bd9Sstevel@tonic-gate 	int i;
997c478bd9Sstevel@tonic-gate 	struct mem_minor {
1007c478bd9Sstevel@tonic-gate 		char *name;
1017c478bd9Sstevel@tonic-gate 		minor_t minor;
1027c478bd9Sstevel@tonic-gate 		int privonly;
1037c478bd9Sstevel@tonic-gate 		const char *rdpriv;
1047c478bd9Sstevel@tonic-gate 		const char *wrpriv;
1057c478bd9Sstevel@tonic-gate 		mode_t priv_mode;
1067c478bd9Sstevel@tonic-gate 	} mm[] = {
1077c478bd9Sstevel@tonic-gate 		{ "mem",	M_MEM,		0,	NULL,	"all",	0640 },
1087c478bd9Sstevel@tonic-gate 		{ "kmem",	M_KMEM,		0,	NULL,	"all",	0640 },
1097c478bd9Sstevel@tonic-gate 		{ "allkmem",	M_ALLKMEM,	0,	"all",	"all",	0600 },
1107c478bd9Sstevel@tonic-gate 		{ "null",	M_NULL,	PRIVONLY_DEV,	NULL,	NULL,	0666 },
1117c478bd9Sstevel@tonic-gate 		{ "zero",	M_ZERO, PRIVONLY_DEV,	NULL,	NULL,	0666 },
1127c478bd9Sstevel@tonic-gate 	};
1137c478bd9Sstevel@tonic-gate 	kstat_t *ksp;
1147c478bd9Sstevel@tonic-gate 
1157c478bd9Sstevel@tonic-gate 	mutex_init(&mm_lock, NULL, MUTEX_DEFAULT, NULL);
1167c478bd9Sstevel@tonic-gate 	mm_map = vmem_alloc(heap_arena, PAGESIZE, VM_SLEEP);
1177c478bd9Sstevel@tonic-gate 
1187c478bd9Sstevel@tonic-gate 	for (i = 0; i < (sizeof (mm) / sizeof (mm[0])); i++) {
1197c478bd9Sstevel@tonic-gate 		if (ddi_create_priv_minor_node(devi, mm[i].name, S_IFCHR,
1207c478bd9Sstevel@tonic-gate 		    mm[i].minor, DDI_PSEUDO, mm[i].privonly,
1217c478bd9Sstevel@tonic-gate 		    mm[i].rdpriv, mm[i].wrpriv, mm[i].priv_mode) ==
1227c478bd9Sstevel@tonic-gate 		    DDI_FAILURE) {
1237c478bd9Sstevel@tonic-gate 			ddi_remove_minor_node(devi, NULL);
1247c478bd9Sstevel@tonic-gate 			return (DDI_FAILURE);
1257c478bd9Sstevel@tonic-gate 		}
1267c478bd9Sstevel@tonic-gate 	}
1277c478bd9Sstevel@tonic-gate 
1287c478bd9Sstevel@tonic-gate 	mm_dip = devi;
1297c478bd9Sstevel@tonic-gate 
1307c478bd9Sstevel@tonic-gate 	ksp = kstat_create("mm", 0, "phys_installed", "misc",
1317c478bd9Sstevel@tonic-gate 	    KSTAT_TYPE_RAW, 0, KSTAT_FLAG_VAR_SIZE | KSTAT_FLAG_VIRTUAL);
1327c478bd9Sstevel@tonic-gate 	if (ksp != NULL) {
1337c478bd9Sstevel@tonic-gate 		ksp->ks_update = mm_kstat_update;
1347c478bd9Sstevel@tonic-gate 		ksp->ks_snapshot = mm_kstat_snapshot;
1357c478bd9Sstevel@tonic-gate 		ksp->ks_lock = &mm_lock; /* XXX - not really needed */
1367c478bd9Sstevel@tonic-gate 		kstat_install(ksp);
1377c478bd9Sstevel@tonic-gate 	}
1387c478bd9Sstevel@tonic-gate 
1397c478bd9Sstevel@tonic-gate 	mm_kmem_io_access = ddi_getprop(DDI_DEV_T_ANY, devi, DDI_PROP_DONTPASS,
1407c478bd9Sstevel@tonic-gate 	    "kmem_io_access", 0);
1417c478bd9Sstevel@tonic-gate 
1427c478bd9Sstevel@tonic-gate 	return (DDI_SUCCESS);
1437c478bd9Sstevel@tonic-gate }
1447c478bd9Sstevel@tonic-gate 
1457c478bd9Sstevel@tonic-gate /*ARGSUSED*/
1467c478bd9Sstevel@tonic-gate static int
1477c478bd9Sstevel@tonic-gate mm_info(dev_info_t *dip, ddi_info_cmd_t infocmd, void *arg, void **result)
1487c478bd9Sstevel@tonic-gate {
1497c478bd9Sstevel@tonic-gate 	register int error;
1507c478bd9Sstevel@tonic-gate 
1517c478bd9Sstevel@tonic-gate 	switch (infocmd) {
1527c478bd9Sstevel@tonic-gate 	case DDI_INFO_DEVT2DEVINFO:
1537c478bd9Sstevel@tonic-gate 		*result = (void *)mm_dip;
1547c478bd9Sstevel@tonic-gate 		error = DDI_SUCCESS;
1557c478bd9Sstevel@tonic-gate 		break;
1567c478bd9Sstevel@tonic-gate 	case DDI_INFO_DEVT2INSTANCE:
1577c478bd9Sstevel@tonic-gate 		*result = (void *)0;
1587c478bd9Sstevel@tonic-gate 		error = DDI_SUCCESS;
1597c478bd9Sstevel@tonic-gate 		break;
1607c478bd9Sstevel@tonic-gate 	default:
1617c478bd9Sstevel@tonic-gate 		error = DDI_FAILURE;
1627c478bd9Sstevel@tonic-gate 	}
1637c478bd9Sstevel@tonic-gate 	return (error);
1647c478bd9Sstevel@tonic-gate }
1657c478bd9Sstevel@tonic-gate 
1667c478bd9Sstevel@tonic-gate /*ARGSUSED1*/
1677c478bd9Sstevel@tonic-gate static int
1687c478bd9Sstevel@tonic-gate mmopen(dev_t *devp, int flag, int typ, struct cred *cred)
1697c478bd9Sstevel@tonic-gate {
1707c478bd9Sstevel@tonic-gate 	switch (getminor(*devp)) {
1717c478bd9Sstevel@tonic-gate 	case M_NULL:
1727c478bd9Sstevel@tonic-gate 	case M_ZERO:
1737c478bd9Sstevel@tonic-gate 	case M_MEM:
1747c478bd9Sstevel@tonic-gate 	case M_KMEM:
1757c478bd9Sstevel@tonic-gate 	case M_ALLKMEM:
1767c478bd9Sstevel@tonic-gate 		/* standard devices */
1777c478bd9Sstevel@tonic-gate 		break;
1787c478bd9Sstevel@tonic-gate 
1797c478bd9Sstevel@tonic-gate 	default:
1807c478bd9Sstevel@tonic-gate 		/* Unsupported or unknown type */
1817c478bd9Sstevel@tonic-gate 		return (EINVAL);
1827c478bd9Sstevel@tonic-gate 	}
1837c478bd9Sstevel@tonic-gate 	return (0);
1847c478bd9Sstevel@tonic-gate }
1857c478bd9Sstevel@tonic-gate 
1867c478bd9Sstevel@tonic-gate struct pollhead	mm_pollhd;
1877c478bd9Sstevel@tonic-gate 
1887c478bd9Sstevel@tonic-gate /*ARGSUSED*/
1897c478bd9Sstevel@tonic-gate static int
1907c478bd9Sstevel@tonic-gate mmchpoll(dev_t dev, short events, int anyyet, short *reventsp,
1917c478bd9Sstevel@tonic-gate     struct pollhead **phpp)
1927c478bd9Sstevel@tonic-gate {
1937c478bd9Sstevel@tonic-gate 	switch (getminor(dev)) {
1947c478bd9Sstevel@tonic-gate 	case M_NULL:
1957c478bd9Sstevel@tonic-gate 	case M_ZERO:
1967c478bd9Sstevel@tonic-gate 	case M_MEM:
1977c478bd9Sstevel@tonic-gate 	case M_KMEM:
1987c478bd9Sstevel@tonic-gate 	case M_ALLKMEM:
1997c478bd9Sstevel@tonic-gate 		*reventsp = events & (POLLIN | POLLOUT | POLLPRI | POLLRDNORM |
2007c478bd9Sstevel@tonic-gate 			POLLWRNORM | POLLRDBAND | POLLWRBAND);
2017c478bd9Sstevel@tonic-gate 		/*
2027c478bd9Sstevel@tonic-gate 		 * A non NULL pollhead pointer should be returned in case
2037c478bd9Sstevel@tonic-gate 		 * user polls for 0 events.
2047c478bd9Sstevel@tonic-gate 		 */
2057c478bd9Sstevel@tonic-gate 		*phpp = !anyyet && !*reventsp ?
2067c478bd9Sstevel@tonic-gate 		    &mm_pollhd : (struct pollhead *)NULL;
2077c478bd9Sstevel@tonic-gate 		return (0);
2087c478bd9Sstevel@tonic-gate 	default:
2097c478bd9Sstevel@tonic-gate 		/* no other devices currently support polling */
2107c478bd9Sstevel@tonic-gate 		return (ENXIO);
2117c478bd9Sstevel@tonic-gate 	}
2127c478bd9Sstevel@tonic-gate }
2137c478bd9Sstevel@tonic-gate 
2147c478bd9Sstevel@tonic-gate static int
2157c478bd9Sstevel@tonic-gate mmpropop(dev_t dev, dev_info_t *dip, ddi_prop_op_t prop_op, int flags,
2167c478bd9Sstevel@tonic-gate     char *name, caddr_t valuep, int *lengthp)
2177c478bd9Sstevel@tonic-gate {
2187c478bd9Sstevel@tonic-gate 	/*
2197c478bd9Sstevel@tonic-gate 	 * implement zero size to reduce overhead (avoid two failing
2207c478bd9Sstevel@tonic-gate 	 * property lookups per stat).
2217c478bd9Sstevel@tonic-gate 	 */
2227c478bd9Sstevel@tonic-gate 	return (ddi_prop_op_size(dev, dip, prop_op,
2237c478bd9Sstevel@tonic-gate 	    flags, name, valuep, lengthp, 0));
2247c478bd9Sstevel@tonic-gate }
2257c478bd9Sstevel@tonic-gate 
2267c478bd9Sstevel@tonic-gate static int
2277c478bd9Sstevel@tonic-gate mmio(struct uio *uio, enum uio_rw rw, pfn_t pfn, off_t pageoff, int allowio)
2287c478bd9Sstevel@tonic-gate {
2297c478bd9Sstevel@tonic-gate 	int error = 0;
2307c478bd9Sstevel@tonic-gate 	size_t nbytes = MIN((size_t)(PAGESIZE - pageoff),
2317c478bd9Sstevel@tonic-gate 	    (size_t)uio->uio_iov->iov_len);
2327c478bd9Sstevel@tonic-gate 
2337c478bd9Sstevel@tonic-gate 	mutex_enter(&mm_lock);
2347c478bd9Sstevel@tonic-gate 	hat_devload(kas.a_hat, mm_map, PAGESIZE, pfn,
2357c478bd9Sstevel@tonic-gate 	    (uint_t)(rw == UIO_READ ? PROT_READ : PROT_READ | PROT_WRITE),
2367c478bd9Sstevel@tonic-gate 	    HAT_LOAD_NOCONSIST | HAT_LOAD_LOCK);
2377c478bd9Sstevel@tonic-gate 
2387c478bd9Sstevel@tonic-gate 	if (!pf_is_memory(pfn)) {
2397c478bd9Sstevel@tonic-gate 		if (allowio) {
2407c478bd9Sstevel@tonic-gate 			size_t c = uio->uio_iov->iov_len;
2417c478bd9Sstevel@tonic-gate 
2427c478bd9Sstevel@tonic-gate 			if (ddi_peekpokeio(NULL, uio, rw,
2437c478bd9Sstevel@tonic-gate 			    (caddr_t)(uintptr_t)uio->uio_loffset, c,
2447c478bd9Sstevel@tonic-gate 			    sizeof (int32_t)) != DDI_SUCCESS)
2457c478bd9Sstevel@tonic-gate 				error = EFAULT;
2467c478bd9Sstevel@tonic-gate 		} else
2477c478bd9Sstevel@tonic-gate 			error = EIO;
2487c478bd9Sstevel@tonic-gate 	} else
2497c478bd9Sstevel@tonic-gate 		error = uiomove(&mm_map[pageoff], nbytes, rw, uio);
2507c478bd9Sstevel@tonic-gate 
2517c478bd9Sstevel@tonic-gate 	hat_unload(kas.a_hat, mm_map, PAGESIZE, HAT_UNLOAD_UNLOCK);
2527c478bd9Sstevel@tonic-gate 	mutex_exit(&mm_lock);
2537c478bd9Sstevel@tonic-gate 	return (error);
2547c478bd9Sstevel@tonic-gate }
2557c478bd9Sstevel@tonic-gate 
#ifdef	__sparc

/*
 * Report whether the segment containing `va' in address space `as' has
 * the S_CAPABILITY_NOMINFLT capability.  Returns 0 when no segment
 * contains va.  The address space lock is held as reader for the lookup.
 */
static int
mmpagelock(struct as *as, caddr_t va)
{
	struct seg *seg;
	int capable = 0;

	AS_LOCK_ENTER(as, &as->a_lock, RW_READER);
	seg = as_segat(as, va);
	if (seg != NULL)
		capable = SEGOP_CAPABLE(seg, S_CAPABILITY_NOMINFLT);
	AS_LOCK_EXIT(as, &as->a_lock);

	return (capable);
}

#define	NEED_LOCK_KVADDR(kva)	mmpagelock(&kas, kva)

#else	/* __i386, __amd64 */

/* Kernel addresses are never page-locked by mmrw() on these platforms. */
#define	NEED_LOCK_KVADDR(va)	0

#endif	/* __sparc */
2797c478bd9Sstevel@tonic-gate 
2807c478bd9Sstevel@tonic-gate /*ARGSUSED3*/
2817c478bd9Sstevel@tonic-gate static int
2827c478bd9Sstevel@tonic-gate mmrw(dev_t dev, struct uio *uio, enum uio_rw rw, cred_t *cred)
2837c478bd9Sstevel@tonic-gate {
2847c478bd9Sstevel@tonic-gate 	pfn_t v;
2857c478bd9Sstevel@tonic-gate 	struct iovec *iov;
2867c478bd9Sstevel@tonic-gate 	int error = 0;
2877c478bd9Sstevel@tonic-gate 	size_t c;
2887c478bd9Sstevel@tonic-gate 	ssize_t oresid = uio->uio_resid;
2897c478bd9Sstevel@tonic-gate 	minor_t minor = getminor(dev);
2907c478bd9Sstevel@tonic-gate 
2917c478bd9Sstevel@tonic-gate 	while (uio->uio_resid > 0 && error == 0) {
2927c478bd9Sstevel@tonic-gate 		iov = uio->uio_iov;
2937c478bd9Sstevel@tonic-gate 		if (iov->iov_len == 0) {
2947c478bd9Sstevel@tonic-gate 			uio->uio_iov++;
2957c478bd9Sstevel@tonic-gate 			uio->uio_iovcnt--;
2967c478bd9Sstevel@tonic-gate 			if (uio->uio_iovcnt < 0)
2977c478bd9Sstevel@tonic-gate 				panic("mmrw");
2987c478bd9Sstevel@tonic-gate 			continue;
2997c478bd9Sstevel@tonic-gate 		}
3007c478bd9Sstevel@tonic-gate 		switch (minor) {
3017c478bd9Sstevel@tonic-gate 
3027c478bd9Sstevel@tonic-gate 		case M_MEM:
3037c478bd9Sstevel@tonic-gate 			memlist_read_lock();
3047c478bd9Sstevel@tonic-gate 			if (!address_in_memlist(phys_install,
3057c478bd9Sstevel@tonic-gate 			    (uint64_t)uio->uio_loffset, 1)) {
3067c478bd9Sstevel@tonic-gate 				memlist_read_unlock();
3077c478bd9Sstevel@tonic-gate 				error = EFAULT;
3087c478bd9Sstevel@tonic-gate 				break;
3097c478bd9Sstevel@tonic-gate 			}
3107c478bd9Sstevel@tonic-gate 			memlist_read_unlock();
3117c478bd9Sstevel@tonic-gate 
3127c478bd9Sstevel@tonic-gate 			v = BTOP((u_offset_t)uio->uio_loffset);
3137c478bd9Sstevel@tonic-gate 			error = mmio(uio, rw, v,
3147c478bd9Sstevel@tonic-gate 			    uio->uio_loffset & PAGEOFFSET, 0);
3157c478bd9Sstevel@tonic-gate 			break;
3167c478bd9Sstevel@tonic-gate 
3177c478bd9Sstevel@tonic-gate 		case M_KMEM:
3187c478bd9Sstevel@tonic-gate 		case M_ALLKMEM:
3197c478bd9Sstevel@tonic-gate 			{
3207c478bd9Sstevel@tonic-gate 			page_t **ppp;
3217c478bd9Sstevel@tonic-gate 			caddr_t vaddr = (caddr_t)uio->uio_offset;
3227c478bd9Sstevel@tonic-gate 			int try_lock = NEED_LOCK_KVADDR(vaddr);
3237c478bd9Sstevel@tonic-gate 			int locked = 0;
3247c478bd9Sstevel@tonic-gate 
3257c478bd9Sstevel@tonic-gate 			/*
3267c478bd9Sstevel@tonic-gate 			 * If vaddr does not map a valid page, as_pagelock()
3277c478bd9Sstevel@tonic-gate 			 * will return failure. Hence we can't check the
3287c478bd9Sstevel@tonic-gate 			 * return value and return EFAULT here as we'd like.
3297c478bd9Sstevel@tonic-gate 			 * seg_kp and seg_kpm do not properly support
3307c478bd9Sstevel@tonic-gate 			 * as_pagelock() for this context so we avoid it
3317c478bd9Sstevel@tonic-gate 			 * using the try_lock set check above.  Some day when
3327c478bd9Sstevel@tonic-gate 			 * the kernel page locking gets redesigned all this
3337c478bd9Sstevel@tonic-gate 			 * muck can be cleaned up.
3347c478bd9Sstevel@tonic-gate 			 */
3357c478bd9Sstevel@tonic-gate 			if (try_lock)
3367c478bd9Sstevel@tonic-gate 				locked = (as_pagelock(&kas, &ppp, vaddr,
3377c478bd9Sstevel@tonic-gate 				    PAGESIZE, S_WRITE) == 0);
3387c478bd9Sstevel@tonic-gate 
339e42d2a1cSjongkis 			v = hat_getpfnum(kas.a_hat,
340e42d2a1cSjongkis 			    (caddr_t)(uintptr_t)uio->uio_loffset);
3417c478bd9Sstevel@tonic-gate 			if (v == PFN_INVALID) {
3427c478bd9Sstevel@tonic-gate 				if (locked)
3437c478bd9Sstevel@tonic-gate 					as_pageunlock(&kas, ppp, vaddr,
3447c478bd9Sstevel@tonic-gate 					    PAGESIZE, S_WRITE);
3457c478bd9Sstevel@tonic-gate 				error = EFAULT;
3467c478bd9Sstevel@tonic-gate 				break;
3477c478bd9Sstevel@tonic-gate 			}
3487c478bd9Sstevel@tonic-gate 
3497c478bd9Sstevel@tonic-gate 			error = mmio(uio, rw, v, uio->uio_loffset & PAGEOFFSET,
3507c478bd9Sstevel@tonic-gate 			    minor == M_ALLKMEM || mm_kmem_io_access);
3517c478bd9Sstevel@tonic-gate 			if (locked)
3527c478bd9Sstevel@tonic-gate 				as_pageunlock(&kas, ppp, vaddr, PAGESIZE,
3537c478bd9Sstevel@tonic-gate 				    S_WRITE);
3547c478bd9Sstevel@tonic-gate 			}
3557c478bd9Sstevel@tonic-gate 
3567c478bd9Sstevel@tonic-gate 			break;
3577c478bd9Sstevel@tonic-gate 
3587c478bd9Sstevel@tonic-gate 		case M_ZERO:
3597c478bd9Sstevel@tonic-gate 			if (rw == UIO_READ) {
3607c478bd9Sstevel@tonic-gate 				label_t ljb;
3617c478bd9Sstevel@tonic-gate 
3627c478bd9Sstevel@tonic-gate 				if (on_fault(&ljb)) {
3637c478bd9Sstevel@tonic-gate 					no_fault();
3647c478bd9Sstevel@tonic-gate 					error = EFAULT;
3657c478bd9Sstevel@tonic-gate 					break;
3667c478bd9Sstevel@tonic-gate 				}
3677c478bd9Sstevel@tonic-gate 				uzero(iov->iov_base, iov->iov_len);
3687c478bd9Sstevel@tonic-gate 				no_fault();
3697c478bd9Sstevel@tonic-gate 				uio->uio_resid -= iov->iov_len;
3707c478bd9Sstevel@tonic-gate 				uio->uio_loffset += iov->iov_len;
3717c478bd9Sstevel@tonic-gate 				break;
3727c478bd9Sstevel@tonic-gate 			}
3737c478bd9Sstevel@tonic-gate 			/* else it's a write, fall through to NULL case */
3747c478bd9Sstevel@tonic-gate 			/*FALLTHROUGH*/
3757c478bd9Sstevel@tonic-gate 
3767c478bd9Sstevel@tonic-gate 		case M_NULL:
3777c478bd9Sstevel@tonic-gate 			if (rw == UIO_READ)
3787c478bd9Sstevel@tonic-gate 				return (0);
3797c478bd9Sstevel@tonic-gate 			c = iov->iov_len;
3807c478bd9Sstevel@tonic-gate 			iov->iov_base += c;
3817c478bd9Sstevel@tonic-gate 			iov->iov_len -= c;
3827c478bd9Sstevel@tonic-gate 			uio->uio_loffset += c;
3837c478bd9Sstevel@tonic-gate 			uio->uio_resid -= c;
3847c478bd9Sstevel@tonic-gate 			break;
3857c478bd9Sstevel@tonic-gate 
3867c478bd9Sstevel@tonic-gate 		}
3877c478bd9Sstevel@tonic-gate 	}
3887c478bd9Sstevel@tonic-gate 	return (uio->uio_resid == oresid ? error : 0);
3897c478bd9Sstevel@tonic-gate }
3907c478bd9Sstevel@tonic-gate 
3917c478bd9Sstevel@tonic-gate static int
3927c478bd9Sstevel@tonic-gate mmread(dev_t dev, struct uio *uio, cred_t *cred)
3937c478bd9Sstevel@tonic-gate {
3947c478bd9Sstevel@tonic-gate 	return (mmrw(dev, uio, UIO_READ, cred));
3957c478bd9Sstevel@tonic-gate }
3967c478bd9Sstevel@tonic-gate 
3977c478bd9Sstevel@tonic-gate static int
3987c478bd9Sstevel@tonic-gate mmwrite(dev_t dev, struct uio *uio, cred_t *cred)
3997c478bd9Sstevel@tonic-gate {
4007c478bd9Sstevel@tonic-gate 	return (mmrw(dev, uio, UIO_WRITE, cred));
4017c478bd9Sstevel@tonic-gate }
4027c478bd9Sstevel@tonic-gate 
4037c478bd9Sstevel@tonic-gate /*
4047c478bd9Sstevel@tonic-gate  * Private ioctl for libkvm to support kvm_physaddr().
4057c478bd9Sstevel@tonic-gate  * Given an address space and a VA, compute the PA.
4067c478bd9Sstevel@tonic-gate  */
4077c478bd9Sstevel@tonic-gate static int
4087c478bd9Sstevel@tonic-gate mmioctl_vtop(intptr_t data)
4097c478bd9Sstevel@tonic-gate {
4107c478bd9Sstevel@tonic-gate 	mem_vtop_t mem_vtop;
4117c478bd9Sstevel@tonic-gate 	proc_t *p;
4127c478bd9Sstevel@tonic-gate 	pfn_t pfn = (pfn_t)PFN_INVALID;
4137c478bd9Sstevel@tonic-gate 	pid_t pid = 0;
4147c478bd9Sstevel@tonic-gate 	struct as *as;
4157c478bd9Sstevel@tonic-gate 	struct seg *seg;
4167c478bd9Sstevel@tonic-gate 
4177c478bd9Sstevel@tonic-gate 	if (copyin((void *)data, &mem_vtop, sizeof (mem_vtop_t)))
4187c478bd9Sstevel@tonic-gate 		return (EFAULT);
4197c478bd9Sstevel@tonic-gate 	if (mem_vtop.m_as == &kas) {
4207c478bd9Sstevel@tonic-gate 		pfn = hat_getpfnum(kas.a_hat, mem_vtop.m_va);
4217c478bd9Sstevel@tonic-gate 	} else if (mem_vtop.m_as == NULL) {
4227c478bd9Sstevel@tonic-gate 		return (EIO);
4237c478bd9Sstevel@tonic-gate 	} else {
4247c478bd9Sstevel@tonic-gate 		mutex_enter(&pidlock);
4257c478bd9Sstevel@tonic-gate 		for (p = practive; p != NULL; p = p->p_next) {
4267c478bd9Sstevel@tonic-gate 			if (p->p_as == mem_vtop.m_as) {
4277c478bd9Sstevel@tonic-gate 				pid = p->p_pid;
4287c478bd9Sstevel@tonic-gate 				break;
4297c478bd9Sstevel@tonic-gate 			}
4307c478bd9Sstevel@tonic-gate 		}
4317c478bd9Sstevel@tonic-gate 		mutex_exit(&pidlock);
4327c478bd9Sstevel@tonic-gate 		if (p == NULL)
4337c478bd9Sstevel@tonic-gate 			return (EIO);
4347c478bd9Sstevel@tonic-gate 		p = sprlock(pid);
4357c478bd9Sstevel@tonic-gate 		if (p == NULL)
4367c478bd9Sstevel@tonic-gate 			return (EIO);
4377c478bd9Sstevel@tonic-gate 		as = p->p_as;
4387c478bd9Sstevel@tonic-gate 		if (as == mem_vtop.m_as) {
4397c478bd9Sstevel@tonic-gate 			mutex_exit(&p->p_lock);
4407c478bd9Sstevel@tonic-gate 			AS_LOCK_ENTER(as, &as->a_lock, RW_READER);
4417c478bd9Sstevel@tonic-gate 			for (seg = AS_SEGFIRST(as); seg != NULL;
4427c478bd9Sstevel@tonic-gate 			    seg = AS_SEGNEXT(as, seg))
4437c478bd9Sstevel@tonic-gate 				if ((uintptr_t)mem_vtop.m_va -
4447c478bd9Sstevel@tonic-gate 				    (uintptr_t)seg->s_base < seg->s_size)
4457c478bd9Sstevel@tonic-gate 					break;
4467c478bd9Sstevel@tonic-gate 			if (seg != NULL)
4477c478bd9Sstevel@tonic-gate 				pfn = hat_getpfnum(as->a_hat, mem_vtop.m_va);
4487c478bd9Sstevel@tonic-gate 			AS_LOCK_EXIT(as, &as->a_lock);
4497c478bd9Sstevel@tonic-gate 			mutex_enter(&p->p_lock);
4507c478bd9Sstevel@tonic-gate 		}
4517c478bd9Sstevel@tonic-gate 		sprunlock(p);
4527c478bd9Sstevel@tonic-gate 	}
4537c478bd9Sstevel@tonic-gate 	mem_vtop.m_pfn = pfn;
4547c478bd9Sstevel@tonic-gate 	if (pfn == PFN_INVALID)
4557c478bd9Sstevel@tonic-gate 		return (EIO);
4567c478bd9Sstevel@tonic-gate 	if (copyout(&mem_vtop, (void *)data, sizeof (mem_vtop_t)))
4577c478bd9Sstevel@tonic-gate 		return (EFAULT);
4587c478bd9Sstevel@tonic-gate 
4597c478bd9Sstevel@tonic-gate 	return (0);
4607c478bd9Sstevel@tonic-gate }
4617c478bd9Sstevel@tonic-gate 
4627c478bd9Sstevel@tonic-gate /*
463*db874c57Selowe  * Given a PA, execute the given page retire command on it.
4647c478bd9Sstevel@tonic-gate  */
4657c478bd9Sstevel@tonic-gate static int
4667c478bd9Sstevel@tonic-gate mmioctl_page_retire(int cmd, intptr_t data)
4677c478bd9Sstevel@tonic-gate {
468*db874c57Selowe 	extern int page_retire_test(void);
4697c478bd9Sstevel@tonic-gate 	uint64_t pa;
4707c478bd9Sstevel@tonic-gate 
471*db874c57Selowe 	if (copyin((void *)data, &pa, sizeof (uint64_t))) {
4727c478bd9Sstevel@tonic-gate 		return (EFAULT);
4737c478bd9Sstevel@tonic-gate 	}
4747c478bd9Sstevel@tonic-gate 
475*db874c57Selowe 	switch (cmd) {
476*db874c57Selowe 	case MEM_PAGE_ISRETIRED:
477*db874c57Selowe 		return (page_retire_check(pa, NULL));
4787c478bd9Sstevel@tonic-gate 
479*db874c57Selowe 	case MEM_PAGE_UNRETIRE:
480*db874c57Selowe 		return (page_unretire(pa));
481*db874c57Selowe 
482*db874c57Selowe 	case MEM_PAGE_RETIRE:
483*db874c57Selowe 		return (page_retire(pa, PR_FMA));
484*db874c57Selowe 
485*db874c57Selowe 	case MEM_PAGE_RETIRE_MCE:
486*db874c57Selowe 		return (page_retire(pa, PR_MCE));
487*db874c57Selowe 
488*db874c57Selowe 	case MEM_PAGE_RETIRE_UE:
489*db874c57Selowe 		return (page_retire(pa, PR_UE));
490*db874c57Selowe 
491*db874c57Selowe 	case MEM_PAGE_GETERRORS:
492*db874c57Selowe 		{
493*db874c57Selowe 			uint64_t page_errors;
494*db874c57Selowe 			int rc = page_retire_check(pa, &page_errors);
495*db874c57Selowe 			if (copyout(&page_errors, (void *)data,
496*db874c57Selowe 			    sizeof (uint64_t))) {
497*db874c57Selowe 				return (EFAULT);
498*db874c57Selowe 			}
499*db874c57Selowe 			return (rc);
500*db874c57Selowe 		}
501*db874c57Selowe 
502*db874c57Selowe 	case MEM_PAGE_RETIRE_TEST:
503*db874c57Selowe 		return (page_retire_test());
504*db874c57Selowe 
505*db874c57Selowe 	}
506*db874c57Selowe 
507*db874c57Selowe 	return (EINVAL);
5087c478bd9Sstevel@tonic-gate }
5097c478bd9Sstevel@tonic-gate 
5107c478bd9Sstevel@tonic-gate #ifdef __sparc
5117c478bd9Sstevel@tonic-gate /*
5127c478bd9Sstevel@tonic-gate  * Given a syndrome, syndrome type, and address return the
5137c478bd9Sstevel@tonic-gate  * associated memory name in the provided data buffer.
5147c478bd9Sstevel@tonic-gate  */
5157c478bd9Sstevel@tonic-gate static int
5167c478bd9Sstevel@tonic-gate mmioctl_get_mem_name(intptr_t data)
5177c478bd9Sstevel@tonic-gate {
5187c478bd9Sstevel@tonic-gate 	mem_name_t mem_name;
5197c478bd9Sstevel@tonic-gate #ifdef	_SYSCALL32
5207c478bd9Sstevel@tonic-gate 	mem_name32_t mem_name32;
5217c478bd9Sstevel@tonic-gate #endif
5227c478bd9Sstevel@tonic-gate 	void *buf;
5237c478bd9Sstevel@tonic-gate 	size_t bufsize;
5247c478bd9Sstevel@tonic-gate 	int len, err;
5257c478bd9Sstevel@tonic-gate 
5267c478bd9Sstevel@tonic-gate 	if ((bufsize = cpu_get_name_bufsize()) == 0)
5277c478bd9Sstevel@tonic-gate 		return (ENOTSUP);
5287c478bd9Sstevel@tonic-gate 
5297c478bd9Sstevel@tonic-gate 	if (get_udatamodel() == DATAMODEL_NATIVE) {
5307c478bd9Sstevel@tonic-gate 		if (copyin((void *)data, &mem_name, sizeof (mem_name_t)))
5317c478bd9Sstevel@tonic-gate 			return (EFAULT);
5327c478bd9Sstevel@tonic-gate 	}
5337c478bd9Sstevel@tonic-gate #ifdef	_SYSCALL32
5347c478bd9Sstevel@tonic-gate 	else {
5357c478bd9Sstevel@tonic-gate 		if (copyin((void *)data, &mem_name32, sizeof (mem_name32_t)))
5367c478bd9Sstevel@tonic-gate 			return (EFAULT);
5377c478bd9Sstevel@tonic-gate 		mem_name.m_addr = mem_name32.m_addr;
5387c478bd9Sstevel@tonic-gate 		mem_name.m_synd = mem_name32.m_synd;
5397c478bd9Sstevel@tonic-gate 		mem_name.m_type[0] = mem_name32.m_type[0];
5407c478bd9Sstevel@tonic-gate 		mem_name.m_type[1] = mem_name32.m_type[1];
541e42d2a1cSjongkis 		mem_name.m_name = (caddr_t)(uintptr_t)mem_name32.m_name;
5427c478bd9Sstevel@tonic-gate 		mem_name.m_namelen = (size_t)mem_name32.m_namelen;
5437c478bd9Sstevel@tonic-gate 	}
5447c478bd9Sstevel@tonic-gate #endif	/* _SYSCALL32 */
5457c478bd9Sstevel@tonic-gate 
5467c478bd9Sstevel@tonic-gate 	buf = kmem_alloc(bufsize, KM_SLEEP);
5477c478bd9Sstevel@tonic-gate 
5487c478bd9Sstevel@tonic-gate 	/*
5497c478bd9Sstevel@tonic-gate 	 * Call into cpu specific code to do the lookup.
5507c478bd9Sstevel@tonic-gate 	 */
5517c478bd9Sstevel@tonic-gate 	if ((err = cpu_get_mem_name(mem_name.m_synd, mem_name.m_type,
5527c478bd9Sstevel@tonic-gate 	    mem_name.m_addr, buf, bufsize, &len)) != 0) {
5537c478bd9Sstevel@tonic-gate 		kmem_free(buf, bufsize);
5547c478bd9Sstevel@tonic-gate 		return (err);
5557c478bd9Sstevel@tonic-gate 	}
5567c478bd9Sstevel@tonic-gate 
5577c478bd9Sstevel@tonic-gate 	if (len >= mem_name.m_namelen) {
5587c478bd9Sstevel@tonic-gate 		kmem_free(buf, bufsize);
5597c478bd9Sstevel@tonic-gate 		return (ENAMETOOLONG);
5607c478bd9Sstevel@tonic-gate 	}
5617c478bd9Sstevel@tonic-gate 
5627c478bd9Sstevel@tonic-gate 	if (copyoutstr(buf, (char *)mem_name.m_name,
5637c478bd9Sstevel@tonic-gate 	    mem_name.m_namelen, NULL) != 0) {
5647c478bd9Sstevel@tonic-gate 		kmem_free(buf, bufsize);
5657c478bd9Sstevel@tonic-gate 		return (EFAULT);
5667c478bd9Sstevel@tonic-gate 	}
5677c478bd9Sstevel@tonic-gate 
5687c478bd9Sstevel@tonic-gate 	kmem_free(buf, bufsize);
5697c478bd9Sstevel@tonic-gate 	return (0);
5707c478bd9Sstevel@tonic-gate }
5717c478bd9Sstevel@tonic-gate 
5727c478bd9Sstevel@tonic-gate /*
5737c478bd9Sstevel@tonic-gate  * Given a syndrome and address return information about the associated memory.
5747c478bd9Sstevel@tonic-gate  */
5757c478bd9Sstevel@tonic-gate static int
5767c478bd9Sstevel@tonic-gate mmioctl_get_mem_info(intptr_t data)
5777c478bd9Sstevel@tonic-gate {
5787c478bd9Sstevel@tonic-gate 	mem_info_t mem_info;
5797c478bd9Sstevel@tonic-gate 	int err;
5807c478bd9Sstevel@tonic-gate 
5817c478bd9Sstevel@tonic-gate 	if (copyin((void *)data, &mem_info, sizeof (mem_info_t)))
5827c478bd9Sstevel@tonic-gate 		return (EFAULT);
5837c478bd9Sstevel@tonic-gate 
5847c478bd9Sstevel@tonic-gate 	if ((err = cpu_get_mem_info(mem_info.m_synd, mem_info.m_addr,
5857c478bd9Sstevel@tonic-gate 	    &mem_info.m_mem_size, &mem_info.m_seg_size, &mem_info.m_bank_size,
5867c478bd9Sstevel@tonic-gate 	    &mem_info.m_segments, &mem_info.m_banks, &mem_info.m_mcid)) != 0)
5877c478bd9Sstevel@tonic-gate 		return (err);
5887c478bd9Sstevel@tonic-gate 
5897c478bd9Sstevel@tonic-gate 	if (copyout(&mem_info, (void *)data, sizeof (mem_info_t)) != 0)
5907c478bd9Sstevel@tonic-gate 		return (EFAULT);
5917c478bd9Sstevel@tonic-gate 
5927c478bd9Sstevel@tonic-gate 	return (0);
5937c478bd9Sstevel@tonic-gate }
5947c478bd9Sstevel@tonic-gate #endif	/* __sparc */
5957c478bd9Sstevel@tonic-gate 
5967c478bd9Sstevel@tonic-gate /*
5977c478bd9Sstevel@tonic-gate  * Private ioctls for
5987c478bd9Sstevel@tonic-gate  *	libkvm to support kvm_physaddr().
5997c478bd9Sstevel@tonic-gate  *	FMA support for page_retire() and memory attribute information.
6007c478bd9Sstevel@tonic-gate  */
6017c478bd9Sstevel@tonic-gate /*ARGSUSED*/
6027c478bd9Sstevel@tonic-gate static int
6037c478bd9Sstevel@tonic-gate mmioctl(dev_t dev, int cmd, intptr_t data, int flag, cred_t *cred, int *rvalp)
6047c478bd9Sstevel@tonic-gate {
6057c478bd9Sstevel@tonic-gate 	switch (cmd) {
6067c478bd9Sstevel@tonic-gate 	case MEM_VTOP:
6077c478bd9Sstevel@tonic-gate 		if (getminor(dev) != M_KMEM)
6087c478bd9Sstevel@tonic-gate 			return (ENXIO);
6097c478bd9Sstevel@tonic-gate 		return (mmioctl_vtop(data));
6107c478bd9Sstevel@tonic-gate 
6117c478bd9Sstevel@tonic-gate 	case MEM_PAGE_RETIRE:
6127c478bd9Sstevel@tonic-gate 	case MEM_PAGE_ISRETIRED:
613*db874c57Selowe 	case MEM_PAGE_UNRETIRE:
614*db874c57Selowe 	case MEM_PAGE_RETIRE_MCE:
615*db874c57Selowe 	case MEM_PAGE_RETIRE_UE:
616*db874c57Selowe 	case MEM_PAGE_GETERRORS:
617*db874c57Selowe 	case MEM_PAGE_RETIRE_TEST:
6187c478bd9Sstevel@tonic-gate 		if (getminor(dev) != M_MEM)
6197c478bd9Sstevel@tonic-gate 			return (ENXIO);
6207c478bd9Sstevel@tonic-gate 		return (mmioctl_page_retire(cmd, data));
6217c478bd9Sstevel@tonic-gate 
6227c478bd9Sstevel@tonic-gate 	case MEM_NAME:
6237c478bd9Sstevel@tonic-gate 		if (getminor(dev) != M_MEM)
6247c478bd9Sstevel@tonic-gate 			return (ENXIO);
6257c478bd9Sstevel@tonic-gate #ifdef __sparc
6267c478bd9Sstevel@tonic-gate 		return (mmioctl_get_mem_name(data));
6277c478bd9Sstevel@tonic-gate #else
6287c478bd9Sstevel@tonic-gate 		return (ENOTSUP);
6297c478bd9Sstevel@tonic-gate #endif
6307c478bd9Sstevel@tonic-gate 
6317c478bd9Sstevel@tonic-gate 	case MEM_INFO:
6327c478bd9Sstevel@tonic-gate 		if (getminor(dev) != M_MEM)
6337c478bd9Sstevel@tonic-gate 			return (ENXIO);
6347c478bd9Sstevel@tonic-gate #ifdef __sparc
6357c478bd9Sstevel@tonic-gate 		return (mmioctl_get_mem_info(data));
6367c478bd9Sstevel@tonic-gate #else
6377c478bd9Sstevel@tonic-gate 		return (ENOTSUP);
6387c478bd9Sstevel@tonic-gate #endif
6397c478bd9Sstevel@tonic-gate 	}
6407c478bd9Sstevel@tonic-gate 	return (ENXIO);
6417c478bd9Sstevel@tonic-gate }
6427c478bd9Sstevel@tonic-gate 
6437c478bd9Sstevel@tonic-gate /*ARGSUSED2*/
6447c478bd9Sstevel@tonic-gate static int
6457c478bd9Sstevel@tonic-gate mmmmap(dev_t dev, off_t off, int prot)
6467c478bd9Sstevel@tonic-gate {
6477c478bd9Sstevel@tonic-gate 	pfn_t pf;
6487c478bd9Sstevel@tonic-gate 	struct memlist *pmem;
6497c478bd9Sstevel@tonic-gate 	minor_t minor = getminor(dev);
6507c478bd9Sstevel@tonic-gate 
6517c478bd9Sstevel@tonic-gate 	switch (minor) {
6527c478bd9Sstevel@tonic-gate 	case M_MEM:
6537c478bd9Sstevel@tonic-gate 		pf = btop(off);
6547c478bd9Sstevel@tonic-gate 		memlist_read_lock();
6557c478bd9Sstevel@tonic-gate 		for (pmem = phys_install; pmem != NULL; pmem = pmem->next) {
6567c478bd9Sstevel@tonic-gate 			if (pf >= BTOP(pmem->address) &&
6577c478bd9Sstevel@tonic-gate 			    pf < BTOP(pmem->address + pmem->size)) {
6587c478bd9Sstevel@tonic-gate 				memlist_read_unlock();
6597c478bd9Sstevel@tonic-gate 				return (impl_obmem_pfnum(pf));
6607c478bd9Sstevel@tonic-gate 			}
6617c478bd9Sstevel@tonic-gate 		}
6627c478bd9Sstevel@tonic-gate 		memlist_read_unlock();
6637c478bd9Sstevel@tonic-gate 		break;
6647c478bd9Sstevel@tonic-gate 
6657c478bd9Sstevel@tonic-gate 	case M_KMEM:
6667c478bd9Sstevel@tonic-gate 	case M_ALLKMEM:
6677c478bd9Sstevel@tonic-gate 		/* no longer supported with KPR */
6687c478bd9Sstevel@tonic-gate 		return (-1);
6697c478bd9Sstevel@tonic-gate 
6707c478bd9Sstevel@tonic-gate 	case M_ZERO:
6717c478bd9Sstevel@tonic-gate 		/*
6727c478bd9Sstevel@tonic-gate 		 * We shouldn't be mmap'ing to /dev/zero here as
6737c478bd9Sstevel@tonic-gate 		 * mmsegmap() should have already converted
6747c478bd9Sstevel@tonic-gate 		 * a mapping request for this device to a mapping
6757c478bd9Sstevel@tonic-gate 		 * using seg_vn for anonymous memory.
6767c478bd9Sstevel@tonic-gate 		 */
6777c478bd9Sstevel@tonic-gate 		break;
6787c478bd9Sstevel@tonic-gate 
6797c478bd9Sstevel@tonic-gate 	}
6807c478bd9Sstevel@tonic-gate 	return (-1);
6817c478bd9Sstevel@tonic-gate }
6827c478bd9Sstevel@tonic-gate 
6837c478bd9Sstevel@tonic-gate /*
6847c478bd9Sstevel@tonic-gate  * This function is called when a memory device is mmap'ed.
6857c478bd9Sstevel@tonic-gate  * Set up the mapping to the correct device driver.
6867c478bd9Sstevel@tonic-gate  */
6877c478bd9Sstevel@tonic-gate static int
6887c478bd9Sstevel@tonic-gate mmsegmap(dev_t dev, off_t off, struct as *as, caddr_t *addrp, off_t len,
6897c478bd9Sstevel@tonic-gate     uint_t prot, uint_t maxprot, uint_t flags, struct cred *cred)
6907c478bd9Sstevel@tonic-gate {
6917c478bd9Sstevel@tonic-gate 	struct segvn_crargs vn_a;
6927c478bd9Sstevel@tonic-gate 	struct segdev_crargs dev_a;
6937c478bd9Sstevel@tonic-gate 	int error;
6947c478bd9Sstevel@tonic-gate 	minor_t minor;
6957c478bd9Sstevel@tonic-gate 	off_t i;
6967c478bd9Sstevel@tonic-gate 
6977c478bd9Sstevel@tonic-gate 	minor = getminor(dev);
6987c478bd9Sstevel@tonic-gate 
6997c478bd9Sstevel@tonic-gate 	as_rangelock(as);
7007c478bd9Sstevel@tonic-gate 	if ((flags & MAP_FIXED) == 0) {
7017c478bd9Sstevel@tonic-gate 		/*
7027c478bd9Sstevel@tonic-gate 		 * No need to worry about vac alignment on /dev/zero
7037c478bd9Sstevel@tonic-gate 		 * since this is a "clone" object that doesn't yet exist.
7047c478bd9Sstevel@tonic-gate 		 */
7057c478bd9Sstevel@tonic-gate 		map_addr(addrp, len, (offset_t)off,
7067c478bd9Sstevel@tonic-gate 				(minor == M_MEM) || (minor == M_KMEM), flags);
7077c478bd9Sstevel@tonic-gate 
7087c478bd9Sstevel@tonic-gate 		if (*addrp == NULL) {
7097c478bd9Sstevel@tonic-gate 			as_rangeunlock(as);
7107c478bd9Sstevel@tonic-gate 			return (ENOMEM);
7117c478bd9Sstevel@tonic-gate 		}
7127c478bd9Sstevel@tonic-gate 	} else {
7137c478bd9Sstevel@tonic-gate 		/*
7147c478bd9Sstevel@tonic-gate 		 * User specified address -
7157c478bd9Sstevel@tonic-gate 		 * Blow away any previous mappings.
7167c478bd9Sstevel@tonic-gate 		 */
7177c478bd9Sstevel@tonic-gate 		(void) as_unmap(as, *addrp, len);
7187c478bd9Sstevel@tonic-gate 	}
7197c478bd9Sstevel@tonic-gate 
7207c478bd9Sstevel@tonic-gate 	switch (minor) {
7217c478bd9Sstevel@tonic-gate 	case M_MEM:
7227c478bd9Sstevel@tonic-gate 		/* /dev/mem cannot be mmap'ed with MAP_PRIVATE */
7237c478bd9Sstevel@tonic-gate 		if ((flags & MAP_TYPE) != MAP_SHARED) {
7247c478bd9Sstevel@tonic-gate 			as_rangeunlock(as);
7257c478bd9Sstevel@tonic-gate 			return (EINVAL);
7267c478bd9Sstevel@tonic-gate 		}
7277c478bd9Sstevel@tonic-gate 
7287c478bd9Sstevel@tonic-gate 		/*
7297c478bd9Sstevel@tonic-gate 		 * Check to ensure that the entire range is
7307c478bd9Sstevel@tonic-gate 		 * legal and we are not trying to map in
7317c478bd9Sstevel@tonic-gate 		 * more than the device will let us.
7327c478bd9Sstevel@tonic-gate 		 */
7337c478bd9Sstevel@tonic-gate 		for (i = 0; i < len; i += PAGESIZE) {
7347c478bd9Sstevel@tonic-gate 			if (mmmmap(dev, off + i, maxprot) == -1) {
7357c478bd9Sstevel@tonic-gate 				as_rangeunlock(as);
7367c478bd9Sstevel@tonic-gate 				return (ENXIO);
7377c478bd9Sstevel@tonic-gate 			}
7387c478bd9Sstevel@tonic-gate 		}
7397c478bd9Sstevel@tonic-gate 
7407c478bd9Sstevel@tonic-gate 		/*
7417c478bd9Sstevel@tonic-gate 		 * Use seg_dev segment driver for /dev/mem mapping.
7427c478bd9Sstevel@tonic-gate 		 */
7437c478bd9Sstevel@tonic-gate 		dev_a.mapfunc = mmmmap;
7447c478bd9Sstevel@tonic-gate 		dev_a.dev = dev;
7457c478bd9Sstevel@tonic-gate 		dev_a.offset = off;
7467c478bd9Sstevel@tonic-gate 		dev_a.type = (flags & MAP_TYPE);
7477c478bd9Sstevel@tonic-gate 		dev_a.prot = (uchar_t)prot;
7487c478bd9Sstevel@tonic-gate 		dev_a.maxprot = (uchar_t)maxprot;
7497c478bd9Sstevel@tonic-gate 		dev_a.hat_attr = 0;
7507c478bd9Sstevel@tonic-gate 
7517c478bd9Sstevel@tonic-gate 		/*
7527c478bd9Sstevel@tonic-gate 		 * Make /dev/mem mappings non-consistent since we can't
7537c478bd9Sstevel@tonic-gate 		 * alias pages that don't have page structs behind them,
7547c478bd9Sstevel@tonic-gate 		 * such as kernel stack pages. If someone mmap()s a kernel
7557c478bd9Sstevel@tonic-gate 		 * stack page and if we give him a tte with cv, a line from
7567c478bd9Sstevel@tonic-gate 		 * that page can get into both pages of the spitfire d$.
7577c478bd9Sstevel@tonic-gate 		 * But snoop from another processor will only invalidate
7587c478bd9Sstevel@tonic-gate 		 * the first page. This later caused kernel (xc_attention)
7597c478bd9Sstevel@tonic-gate 		 * to go into an infinite loop at pil 13 and no interrupts
7607c478bd9Sstevel@tonic-gate 		 * could come in. See 1203630.
7617c478bd9Sstevel@tonic-gate 		 *
7627c478bd9Sstevel@tonic-gate 		 */
7637c478bd9Sstevel@tonic-gate 		dev_a.hat_flags = HAT_LOAD_NOCONSIST;
7647c478bd9Sstevel@tonic-gate 		dev_a.devmap_data = NULL;
7657c478bd9Sstevel@tonic-gate 
7667c478bd9Sstevel@tonic-gate 		error = as_map(as, *addrp, len, segdev_create, &dev_a);
7677c478bd9Sstevel@tonic-gate 		break;
7687c478bd9Sstevel@tonic-gate 
7697c478bd9Sstevel@tonic-gate 	case M_ZERO:
7707c478bd9Sstevel@tonic-gate 		/*
7717c478bd9Sstevel@tonic-gate 		 * Use seg_vn segment driver for /dev/zero mapping.
7727c478bd9Sstevel@tonic-gate 		 * Passing in a NULL amp gives us the "cloning" effect.
7737c478bd9Sstevel@tonic-gate 		 */
7747c478bd9Sstevel@tonic-gate 		vn_a.vp = NULL;
7757c478bd9Sstevel@tonic-gate 		vn_a.offset = 0;
7767c478bd9Sstevel@tonic-gate 		vn_a.type = (flags & MAP_TYPE);
7777c478bd9Sstevel@tonic-gate 		vn_a.prot = prot;
7787c478bd9Sstevel@tonic-gate 		vn_a.maxprot = maxprot;
7797c478bd9Sstevel@tonic-gate 		vn_a.flags = flags & ~MAP_TYPE;
7807c478bd9Sstevel@tonic-gate 		vn_a.cred = cred;
7817c478bd9Sstevel@tonic-gate 		vn_a.amp = NULL;
7827c478bd9Sstevel@tonic-gate 		vn_a.szc = 0;
7837c478bd9Sstevel@tonic-gate 		vn_a.lgrp_mem_policy_flags = 0;
7847c478bd9Sstevel@tonic-gate 		error = as_map(as, *addrp, len, segvn_create, &vn_a);
7857c478bd9Sstevel@tonic-gate 		break;
7867c478bd9Sstevel@tonic-gate 
7877c478bd9Sstevel@tonic-gate 	case M_KMEM:
7887c478bd9Sstevel@tonic-gate 	case M_ALLKMEM:
7897c478bd9Sstevel@tonic-gate 		/* No longer supported with KPR. */
7907c478bd9Sstevel@tonic-gate 		error = ENXIO;
7917c478bd9Sstevel@tonic-gate 		break;
7927c478bd9Sstevel@tonic-gate 
7937c478bd9Sstevel@tonic-gate 	case M_NULL:
7947c478bd9Sstevel@tonic-gate 		/*
7957c478bd9Sstevel@tonic-gate 		 * Use seg_dev segment driver for /dev/null mapping.
7967c478bd9Sstevel@tonic-gate 		 */
7977c478bd9Sstevel@tonic-gate 		dev_a.mapfunc = mmmmap;
7987c478bd9Sstevel@tonic-gate 		dev_a.dev = dev;
7997c478bd9Sstevel@tonic-gate 		dev_a.offset = off;
8007c478bd9Sstevel@tonic-gate 		dev_a.type = 0;		/* neither PRIVATE nor SHARED */
8017c478bd9Sstevel@tonic-gate 		dev_a.prot = dev_a.maxprot = (uchar_t)PROT_NONE;
8027c478bd9Sstevel@tonic-gate 		dev_a.hat_attr = 0;
8037c478bd9Sstevel@tonic-gate 		dev_a.hat_flags = 0;
8047c478bd9Sstevel@tonic-gate 		error = as_map(as, *addrp, len, segdev_create, &dev_a);
8057c478bd9Sstevel@tonic-gate 		break;
8067c478bd9Sstevel@tonic-gate 
8077c478bd9Sstevel@tonic-gate 	default:
8087c478bd9Sstevel@tonic-gate 		error = ENXIO;
8097c478bd9Sstevel@tonic-gate 	}
8107c478bd9Sstevel@tonic-gate 
8117c478bd9Sstevel@tonic-gate 	as_rangeunlock(as);
8127c478bd9Sstevel@tonic-gate 	return (error);
8137c478bd9Sstevel@tonic-gate }
8147c478bd9Sstevel@tonic-gate 
8157c478bd9Sstevel@tonic-gate static struct cb_ops mm_cb_ops = {
8167c478bd9Sstevel@tonic-gate 	mmopen,			/* open */
8177c478bd9Sstevel@tonic-gate 	nulldev,		/* close */
8187c478bd9Sstevel@tonic-gate 	nodev,			/* strategy */
8197c478bd9Sstevel@tonic-gate 	nodev,			/* print */
8207c478bd9Sstevel@tonic-gate 	nodev,			/* dump */
8217c478bd9Sstevel@tonic-gate 	mmread,			/* read */
8227c478bd9Sstevel@tonic-gate 	mmwrite,		/* write */
8237c478bd9Sstevel@tonic-gate 	mmioctl,		/* ioctl */
8247c478bd9Sstevel@tonic-gate 	nodev,			/* devmap */
8257c478bd9Sstevel@tonic-gate 	mmmmap,			/* mmap */
8267c478bd9Sstevel@tonic-gate 	mmsegmap,		/* segmap */
8277c478bd9Sstevel@tonic-gate 	mmchpoll,		/* poll */
8287c478bd9Sstevel@tonic-gate 	mmpropop,		/* prop_op */
8297c478bd9Sstevel@tonic-gate 	0,			/* streamtab  */
8307c478bd9Sstevel@tonic-gate 	D_NEW | D_MP | D_64BIT | D_U64BIT
8317c478bd9Sstevel@tonic-gate };
8327c478bd9Sstevel@tonic-gate 
8337c478bd9Sstevel@tonic-gate static struct dev_ops mm_ops = {
8347c478bd9Sstevel@tonic-gate 	DEVO_REV,		/* devo_rev, */
8357c478bd9Sstevel@tonic-gate 	0,			/* refcnt  */
8367c478bd9Sstevel@tonic-gate 	mm_info,		/* get_dev_info */
8377c478bd9Sstevel@tonic-gate 	nulldev,		/* identify */
8387c478bd9Sstevel@tonic-gate 	nulldev,		/* probe */
8397c478bd9Sstevel@tonic-gate 	mm_attach,		/* attach */
8407c478bd9Sstevel@tonic-gate 	nodev,			/* detach */
8417c478bd9Sstevel@tonic-gate 	nodev,			/* reset */
8427c478bd9Sstevel@tonic-gate 	&mm_cb_ops,		/* driver operations */
8437c478bd9Sstevel@tonic-gate 	(struct bus_ops *)0	/* bus operations */
8447c478bd9Sstevel@tonic-gate };
8457c478bd9Sstevel@tonic-gate 
8467c478bd9Sstevel@tonic-gate static struct modldrv modldrv = {
8477c478bd9Sstevel@tonic-gate 	&mod_driverops, "memory driver %I%", &mm_ops,
8487c478bd9Sstevel@tonic-gate };
8497c478bd9Sstevel@tonic-gate 
8507c478bd9Sstevel@tonic-gate static struct modlinkage modlinkage = {
8517c478bd9Sstevel@tonic-gate 	MODREV_1, &modldrv, NULL
8527c478bd9Sstevel@tonic-gate };
8537c478bd9Sstevel@tonic-gate 
8547c478bd9Sstevel@tonic-gate int
8557c478bd9Sstevel@tonic-gate _init(void)
8567c478bd9Sstevel@tonic-gate {
8577c478bd9Sstevel@tonic-gate 	return (mod_install(&modlinkage));
8587c478bd9Sstevel@tonic-gate }
8597c478bd9Sstevel@tonic-gate 
8607c478bd9Sstevel@tonic-gate int
8617c478bd9Sstevel@tonic-gate _info(struct modinfo *modinfop)
8627c478bd9Sstevel@tonic-gate {
8637c478bd9Sstevel@tonic-gate 	return (mod_info(&modlinkage, modinfop));
8647c478bd9Sstevel@tonic-gate }
8657c478bd9Sstevel@tonic-gate 
8667c478bd9Sstevel@tonic-gate int
8677c478bd9Sstevel@tonic-gate _fini(void)
8687c478bd9Sstevel@tonic-gate {
8697c478bd9Sstevel@tonic-gate 	return (mod_remove(&modlinkage));
8707c478bd9Sstevel@tonic-gate }
8717c478bd9Sstevel@tonic-gate 
8727c478bd9Sstevel@tonic-gate static int
8737c478bd9Sstevel@tonic-gate mm_kstat_update(kstat_t *ksp, int rw)
8747c478bd9Sstevel@tonic-gate {
8757c478bd9Sstevel@tonic-gate 	struct memlist *pmem;
8767c478bd9Sstevel@tonic-gate 	uint_t count;
8777c478bd9Sstevel@tonic-gate 
8787c478bd9Sstevel@tonic-gate 	if (rw == KSTAT_WRITE)
8797c478bd9Sstevel@tonic-gate 		return (EACCES);
8807c478bd9Sstevel@tonic-gate 
8817c478bd9Sstevel@tonic-gate 	count = 0;
8827c478bd9Sstevel@tonic-gate 	memlist_read_lock();
8837c478bd9Sstevel@tonic-gate 	for (pmem = phys_install; pmem != NULL; pmem = pmem->next) {
8847c478bd9Sstevel@tonic-gate 		count++;
8857c478bd9Sstevel@tonic-gate 	}
8867c478bd9Sstevel@tonic-gate 	memlist_read_unlock();
8877c478bd9Sstevel@tonic-gate 
8887c478bd9Sstevel@tonic-gate 	ksp->ks_ndata = count;
8897c478bd9Sstevel@tonic-gate 	ksp->ks_data_size = count * 2 * sizeof (uint64_t);
8907c478bd9Sstevel@tonic-gate 
8917c478bd9Sstevel@tonic-gate 	return (0);
8927c478bd9Sstevel@tonic-gate }
8937c478bd9Sstevel@tonic-gate 
8947c478bd9Sstevel@tonic-gate static int
8957c478bd9Sstevel@tonic-gate mm_kstat_snapshot(kstat_t *ksp, void *buf, int rw)
8967c478bd9Sstevel@tonic-gate {
8977c478bd9Sstevel@tonic-gate 	struct memlist *pmem;
8987c478bd9Sstevel@tonic-gate 	struct memunit {
8997c478bd9Sstevel@tonic-gate 		uint64_t address;
9007c478bd9Sstevel@tonic-gate 		uint64_t size;
9017c478bd9Sstevel@tonic-gate 	} *kspmem;
9027c478bd9Sstevel@tonic-gate 
9037c478bd9Sstevel@tonic-gate 	if (rw == KSTAT_WRITE)
9047c478bd9Sstevel@tonic-gate 		return (EACCES);
9057c478bd9Sstevel@tonic-gate 
9067c478bd9Sstevel@tonic-gate 	ksp->ks_snaptime = gethrtime();
9077c478bd9Sstevel@tonic-gate 
9087c478bd9Sstevel@tonic-gate 	kspmem = (struct memunit *)buf;
9097c478bd9Sstevel@tonic-gate 	memlist_read_lock();
9107c478bd9Sstevel@tonic-gate 	for (pmem = phys_install; pmem != NULL; pmem = pmem->next, kspmem++) {
9117c478bd9Sstevel@tonic-gate 		if ((caddr_t)kspmem >= (caddr_t)buf + ksp->ks_data_size)
9127c478bd9Sstevel@tonic-gate 			break;
9137c478bd9Sstevel@tonic-gate 		kspmem->address = pmem->address;
9147c478bd9Sstevel@tonic-gate 		kspmem->size = pmem->size;
9157c478bd9Sstevel@tonic-gate 	}
9167c478bd9Sstevel@tonic-gate 	memlist_read_unlock();
9177c478bd9Sstevel@tonic-gate 
9187c478bd9Sstevel@tonic-gate 	return (0);
9197c478bd9Sstevel@tonic-gate }
920