xref: /freebsd/sys/dev/xen/privcmd/privcmd.c (revision 0012f373e43db2341c20329163ed2d5ad3b0f341)
/*
 * Copyright (c) 2014 Roger Pau Monné <roger.pau@citrix.com>
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */
26bf7313e3SRoger Pau Monné 
27bf7313e3SRoger Pau Monné #include <sys/cdefs.h>
28bf7313e3SRoger Pau Monné __FBSDID("$FreeBSD$");
29bf7313e3SRoger Pau Monné 
30bf7313e3SRoger Pau Monné #include <sys/param.h>
31bf7313e3SRoger Pau Monné #include <sys/systm.h>
32bf7313e3SRoger Pau Monné #include <sys/uio.h>
33bf7313e3SRoger Pau Monné #include <sys/bus.h>
34bf7313e3SRoger Pau Monné #include <sys/malloc.h>
35bf7313e3SRoger Pau Monné #include <sys/kernel.h>
36bf7313e3SRoger Pau Monné #include <sys/lock.h>
37bf7313e3SRoger Pau Monné #include <sys/mutex.h>
38bf7313e3SRoger Pau Monné #include <sys/rwlock.h>
39bf7313e3SRoger Pau Monné #include <sys/selinfo.h>
40bf7313e3SRoger Pau Monné #include <sys/poll.h>
41bf7313e3SRoger Pau Monné #include <sys/conf.h>
42bf7313e3SRoger Pau Monné #include <sys/fcntl.h>
43bf7313e3SRoger Pau Monné #include <sys/ioccom.h>
44bf7313e3SRoger Pau Monné #include <sys/rman.h>
45bf7313e3SRoger Pau Monné #include <sys/tree.h>
46bf7313e3SRoger Pau Monné #include <sys/module.h>
47bf7313e3SRoger Pau Monné #include <sys/proc.h>
48288b2385SRoger Pau Monné #include <sys/bitset.h>
49bf7313e3SRoger Pau Monné 
50bf7313e3SRoger Pau Monné #include <vm/vm.h>
51bf7313e3SRoger Pau Monné #include <vm/vm_param.h>
52bf7313e3SRoger Pau Monné #include <vm/vm_extern.h>
53bf7313e3SRoger Pau Monné #include <vm/vm_kern.h>
54bf7313e3SRoger Pau Monné #include <vm/vm_page.h>
55bf7313e3SRoger Pau Monné #include <vm/vm_map.h>
56bf7313e3SRoger Pau Monné #include <vm/vm_object.h>
57bf7313e3SRoger Pau Monné #include <vm/vm_pager.h>
58bf7313e3SRoger Pau Monné 
59bf7313e3SRoger Pau Monné #include <machine/md_var.h>
60bf7313e3SRoger Pau Monné 
61bf7313e3SRoger Pau Monné #include <xen/xen-os.h>
62bf7313e3SRoger Pau Monné #include <xen/hypervisor.h>
63bf7313e3SRoger Pau Monné #include <xen/privcmd.h>
64bf7313e3SRoger Pau Monné #include <xen/error.h>
65bf7313e3SRoger Pau Monné 
66bf7313e3SRoger Pau Monné MALLOC_DEFINE(M_PRIVCMD, "privcmd_dev", "Xen privcmd user-space device");
67bf7313e3SRoger Pau Monné 
68bf7313e3SRoger Pau Monné struct privcmd_map {
69bf7313e3SRoger Pau Monné 	vm_object_t mem;
70bf7313e3SRoger Pau Monné 	vm_size_t size;
71bf7313e3SRoger Pau Monné 	struct resource *pseudo_phys_res;
72bf7313e3SRoger Pau Monné 	int pseudo_phys_res_id;
73bf7313e3SRoger Pau Monné 	vm_paddr_t phys_base_addr;
74bf7313e3SRoger Pau Monné 	boolean_t mapped;
75288b2385SRoger Pau Monné 	BITSET_DEFINE_VAR() *err;
76bf7313e3SRoger Pau Monné };
77bf7313e3SRoger Pau Monné 
78bf7313e3SRoger Pau Monné static d_ioctl_t     privcmd_ioctl;
79bf7313e3SRoger Pau Monné static d_mmap_single_t	privcmd_mmap_single;
80bf7313e3SRoger Pau Monné 
81bf7313e3SRoger Pau Monné static struct cdevsw privcmd_devsw = {
82bf7313e3SRoger Pau Monné 	.d_version = D_VERSION,
83bf7313e3SRoger Pau Monné 	.d_ioctl = privcmd_ioctl,
84bf7313e3SRoger Pau Monné 	.d_mmap_single = privcmd_mmap_single,
85bf7313e3SRoger Pau Monné 	.d_name = "privcmd",
86bf7313e3SRoger Pau Monné };
87bf7313e3SRoger Pau Monné 
88bf7313e3SRoger Pau Monné static int privcmd_pg_ctor(void *handle, vm_ooffset_t size, vm_prot_t prot,
89bf7313e3SRoger Pau Monné     vm_ooffset_t foff, struct ucred *cred, u_short *color);
90bf7313e3SRoger Pau Monné static void privcmd_pg_dtor(void *handle);
91bf7313e3SRoger Pau Monné static int privcmd_pg_fault(vm_object_t object, vm_ooffset_t offset,
92bf7313e3SRoger Pau Monné     int prot, vm_page_t *mres);
93bf7313e3SRoger Pau Monné 
94bf7313e3SRoger Pau Monné static struct cdev_pager_ops privcmd_pg_ops = {
95bf7313e3SRoger Pau Monné 	.cdev_pg_fault = privcmd_pg_fault,
96bf7313e3SRoger Pau Monné 	.cdev_pg_ctor =	privcmd_pg_ctor,
97bf7313e3SRoger Pau Monné 	.cdev_pg_dtor =	privcmd_pg_dtor,
98bf7313e3SRoger Pau Monné };
99bf7313e3SRoger Pau Monné 
100bf7313e3SRoger Pau Monné static device_t privcmd_dev = NULL;
101bf7313e3SRoger Pau Monné 
102bf7313e3SRoger Pau Monné /*------------------------- Privcmd Pager functions --------------------------*/
103bf7313e3SRoger Pau Monné static int
104bf7313e3SRoger Pau Monné privcmd_pg_ctor(void *handle, vm_ooffset_t size, vm_prot_t prot,
105bf7313e3SRoger Pau Monné     vm_ooffset_t foff, struct ucred *cred, u_short *color)
106bf7313e3SRoger Pau Monné {
107bf7313e3SRoger Pau Monné 
108bf7313e3SRoger Pau Monné 	return (0);
109bf7313e3SRoger Pau Monné }
110bf7313e3SRoger Pau Monné 
111bf7313e3SRoger Pau Monné static void
112bf7313e3SRoger Pau Monné privcmd_pg_dtor(void *handle)
113bf7313e3SRoger Pau Monné {
114bf7313e3SRoger Pau Monné 	struct xen_remove_from_physmap rm = { .domid = DOMID_SELF };
115bf7313e3SRoger Pau Monné 	struct privcmd_map *map = handle;
116bf7313e3SRoger Pau Monné 	int error;
117bf7313e3SRoger Pau Monné 	vm_size_t i;
118bf7313e3SRoger Pau Monné 	vm_page_t m;
119bf7313e3SRoger Pau Monné 
120bf7313e3SRoger Pau Monné 	/*
121bf7313e3SRoger Pau Monné 	 * Remove the mappings from the used pages. This will remove the
122bf7313e3SRoger Pau Monné 	 * underlying p2m bindings in Xen second stage translation.
123bf7313e3SRoger Pau Monné 	 */
124bf7313e3SRoger Pau Monné 	if (map->mapped == true) {
125bf7313e3SRoger Pau Monné 		VM_OBJECT_WLOCK(map->mem);
126bf7313e3SRoger Pau Monné retry:
127bf7313e3SRoger Pau Monné 		for (i = 0; i < map->size; i++) {
128bf7313e3SRoger Pau Monné 			m = vm_page_lookup(map->mem, i);
129bf7313e3SRoger Pau Monné 			if (m == NULL)
130bf7313e3SRoger Pau Monné 				continue;
131c7575748SJeff Roberson 			if (vm_page_busy_acquire(m, VM_ALLOC_WAITFAIL) == 0)
132bf7313e3SRoger Pau Monné 				goto retry;
133bf7313e3SRoger Pau Monné 			cdev_pager_free_page(map->mem, m);
134bf7313e3SRoger Pau Monné 		}
135bf7313e3SRoger Pau Monné 		VM_OBJECT_WUNLOCK(map->mem);
136bf7313e3SRoger Pau Monné 
137bf7313e3SRoger Pau Monné 		for (i = 0; i < map->size; i++) {
138bf7313e3SRoger Pau Monné 			rm.gpfn = atop(map->phys_base_addr) + i;
139bf7313e3SRoger Pau Monné 			HYPERVISOR_memory_op(XENMEM_remove_from_physmap, &rm);
140bf7313e3SRoger Pau Monné 		}
141288b2385SRoger Pau Monné 		free(map->err, M_PRIVCMD);
142bf7313e3SRoger Pau Monné 	}
143bf7313e3SRoger Pau Monné 
1440df8b29dSRoger Pau Monné 	error = xenmem_free(privcmd_dev, map->pseudo_phys_res_id,
1450df8b29dSRoger Pau Monné 	    map->pseudo_phys_res);
146bf7313e3SRoger Pau Monné 	KASSERT(error == 0, ("Unable to release memory resource: %d", error));
147bf7313e3SRoger Pau Monné 
148bf7313e3SRoger Pau Monné 	free(map, M_PRIVCMD);
149bf7313e3SRoger Pau Monné }
150bf7313e3SRoger Pau Monné 
151bf7313e3SRoger Pau Monné static int
152bf7313e3SRoger Pau Monné privcmd_pg_fault(vm_object_t object, vm_ooffset_t offset,
153bf7313e3SRoger Pau Monné     int prot, vm_page_t *mres)
154bf7313e3SRoger Pau Monné {
155bf7313e3SRoger Pau Monné 	struct privcmd_map *map = object->handle;
156bf7313e3SRoger Pau Monné 	vm_pindex_t pidx;
157bf7313e3SRoger Pau Monné 	vm_page_t page, oldm;
158bf7313e3SRoger Pau Monné 
159bf7313e3SRoger Pau Monné 	if (map->mapped != true)
160bf7313e3SRoger Pau Monné 		return (VM_PAGER_FAIL);
161bf7313e3SRoger Pau Monné 
162bf7313e3SRoger Pau Monné 	pidx = OFF_TO_IDX(offset);
163288b2385SRoger Pau Monné 	if (pidx >= map->size || BIT_ISSET(map->size, pidx, map->err))
164bf7313e3SRoger Pau Monné 		return (VM_PAGER_FAIL);
165bf7313e3SRoger Pau Monné 
166bf7313e3SRoger Pau Monné 	page = PHYS_TO_VM_PAGE(map->phys_base_addr + offset);
167bf7313e3SRoger Pau Monné 	if (page == NULL)
168bf7313e3SRoger Pau Monné 		return (VM_PAGER_FAIL);
169bf7313e3SRoger Pau Monné 
170bf7313e3SRoger Pau Monné 	KASSERT((page->flags & PG_FICTITIOUS) != 0,
171bf7313e3SRoger Pau Monné 	    ("not fictitious %p", page));
172fee2a2faSMark Johnston 	KASSERT(vm_page_wired(page), ("page %p not wired", page));
173fee2a2faSMark Johnston 	KASSERT(!vm_page_busied(page), ("page %p is busy", page));
174bf7313e3SRoger Pau Monné 
175bf7313e3SRoger Pau Monné 	if (*mres != NULL) {
176bf7313e3SRoger Pau Monné 		oldm = *mres;
177bf7313e3SRoger Pau Monné 		vm_page_free(oldm);
178bf7313e3SRoger Pau Monné 		*mres = NULL;
179bf7313e3SRoger Pau Monné 	}
180bf7313e3SRoger Pau Monné 
18163e97555SJeff Roberson 	vm_page_busy_acquire(page, 0);
182*0012f373SJeff Roberson 	vm_page_valid(page);
183bf7313e3SRoger Pau Monné 	vm_page_insert(page, object, pidx);
184bf7313e3SRoger Pau Monné 	*mres = page;
185bf7313e3SRoger Pau Monné 	return (VM_PAGER_OK);
186bf7313e3SRoger Pau Monné }
187bf7313e3SRoger Pau Monné 
188bf7313e3SRoger Pau Monné /*----------------------- Privcmd char device methods ------------------------*/
189bf7313e3SRoger Pau Monné static int
190bf7313e3SRoger Pau Monné privcmd_mmap_single(struct cdev *cdev, vm_ooffset_t *offset, vm_size_t size,
191bf7313e3SRoger Pau Monné     vm_object_t *object, int nprot)
192bf7313e3SRoger Pau Monné {
193bf7313e3SRoger Pau Monné 	struct privcmd_map *map;
194bf7313e3SRoger Pau Monné 
195bf7313e3SRoger Pau Monné 	map = malloc(sizeof(*map), M_PRIVCMD, M_WAITOK | M_ZERO);
196bf7313e3SRoger Pau Monné 
197bf7313e3SRoger Pau Monné 	map->size = OFF_TO_IDX(size);
198bf7313e3SRoger Pau Monné 	map->pseudo_phys_res_id = 0;
199bf7313e3SRoger Pau Monné 
2000df8b29dSRoger Pau Monné 	map->pseudo_phys_res = xenmem_alloc(privcmd_dev,
2010df8b29dSRoger Pau Monné 	    &map->pseudo_phys_res_id, size);
202bf7313e3SRoger Pau Monné 	if (map->pseudo_phys_res == NULL) {
203bf7313e3SRoger Pau Monné 		free(map, M_PRIVCMD);
204bf7313e3SRoger Pau Monné 		return (ENOMEM);
205bf7313e3SRoger Pau Monné 	}
206bf7313e3SRoger Pau Monné 
207bf7313e3SRoger Pau Monné 	map->phys_base_addr = rman_get_start(map->pseudo_phys_res);
208bf7313e3SRoger Pau Monné 	map->mem = cdev_pager_allocate(map, OBJT_MGTDEVICE, &privcmd_pg_ops,
209bf7313e3SRoger Pau Monné 	    size, nprot, *offset, NULL);
210bf7313e3SRoger Pau Monné 	if (map->mem == NULL) {
2110df8b29dSRoger Pau Monné 		xenmem_free(privcmd_dev, map->pseudo_phys_res_id,
2120df8b29dSRoger Pau Monné 		    map->pseudo_phys_res);
213bf7313e3SRoger Pau Monné 		free(map, M_PRIVCMD);
214bf7313e3SRoger Pau Monné 		return (ENOMEM);
215bf7313e3SRoger Pau Monné 	}
216bf7313e3SRoger Pau Monné 
217bf7313e3SRoger Pau Monné 	*object = map->mem;
218bf7313e3SRoger Pau Monné 
219bf7313e3SRoger Pau Monné 	return (0);
220bf7313e3SRoger Pau Monné }
221bf7313e3SRoger Pau Monné 
222bf7313e3SRoger Pau Monné static int
223bf7313e3SRoger Pau Monné privcmd_ioctl(struct cdev *dev, unsigned long cmd, caddr_t arg,
224bf7313e3SRoger Pau Monné 	      int mode, struct thread *td)
225bf7313e3SRoger Pau Monné {
226bf7313e3SRoger Pau Monné 	int error, i;
227bf7313e3SRoger Pau Monné 
228bf7313e3SRoger Pau Monné 	switch (cmd) {
229bf7313e3SRoger Pau Monné 	case IOCTL_PRIVCMD_HYPERCALL: {
230bf7313e3SRoger Pau Monné 		struct ioctl_privcmd_hypercall *hcall;
231bf7313e3SRoger Pau Monné 
232bf7313e3SRoger Pau Monné 		hcall = (struct ioctl_privcmd_hypercall *)arg;
2335ff6c7f3SRoger Pau Monné #ifdef __amd64__
2345ff6c7f3SRoger Pau Monné 		/*
2355ff6c7f3SRoger Pau Monné 		 * The hypervisor page table walker will refuse to access
2365ff6c7f3SRoger Pau Monné 		 * user-space pages if SMAP is enabled, so temporary disable it
2375ff6c7f3SRoger Pau Monné 		 * while performing the hypercall.
2385ff6c7f3SRoger Pau Monné 		 */
2395ff6c7f3SRoger Pau Monné 		if (cpu_stdext_feature & CPUID_STDEXT_SMAP)
2405ff6c7f3SRoger Pau Monné 			stac();
2415ff6c7f3SRoger Pau Monné #endif
242bf7313e3SRoger Pau Monné 		error = privcmd_hypercall(hcall->op, hcall->arg[0],
243bf7313e3SRoger Pau Monné 		    hcall->arg[1], hcall->arg[2], hcall->arg[3], hcall->arg[4]);
2445ff6c7f3SRoger Pau Monné #ifdef __amd64__
2455ff6c7f3SRoger Pau Monné 		if (cpu_stdext_feature & CPUID_STDEXT_SMAP)
2465ff6c7f3SRoger Pau Monné 			clac();
2475ff6c7f3SRoger Pau Monné #endif
248bf7313e3SRoger Pau Monné 		if (error >= 0) {
249bf7313e3SRoger Pau Monné 			hcall->retval = error;
250bf7313e3SRoger Pau Monné 			error = 0;
251bf7313e3SRoger Pau Monné 		} else {
252bf7313e3SRoger Pau Monné 			error = xen_translate_error(error);
253bf7313e3SRoger Pau Monné 			hcall->retval = 0;
254bf7313e3SRoger Pau Monné 		}
255bf7313e3SRoger Pau Monné 		break;
256bf7313e3SRoger Pau Monné 	}
257bf7313e3SRoger Pau Monné 	case IOCTL_PRIVCMD_MMAPBATCH: {
258bf7313e3SRoger Pau Monné 		struct ioctl_privcmd_mmapbatch *mmap;
259bf7313e3SRoger Pau Monné 		vm_map_t map;
260bf7313e3SRoger Pau Monné 		vm_map_entry_t entry;
261bf7313e3SRoger Pau Monné 		vm_object_t mem;
262288b2385SRoger Pau Monné 		vm_pindex_t pindex;
263bf7313e3SRoger Pau Monné 		vm_prot_t prot;
264bf7313e3SRoger Pau Monné 		boolean_t wired;
265bf7313e3SRoger Pau Monné 		struct xen_add_to_physmap_range add;
266bf7313e3SRoger Pau Monné 		xen_ulong_t *idxs;
267bf7313e3SRoger Pau Monné 		xen_pfn_t *gpfns;
268288b2385SRoger Pau Monné 		int *errs, index;
269bf7313e3SRoger Pau Monné 		struct privcmd_map *umap;
270288b2385SRoger Pau Monné 		uint16_t num;
271bf7313e3SRoger Pau Monné 
272bf7313e3SRoger Pau Monné 		mmap = (struct ioctl_privcmd_mmapbatch *)arg;
273bf7313e3SRoger Pau Monné 
274bf7313e3SRoger Pau Monné 		if ((mmap->num == 0) ||
275bf7313e3SRoger Pau Monné 		    ((mmap->addr & PAGE_MASK) != 0)) {
276bf7313e3SRoger Pau Monné 			error = EINVAL;
277bf7313e3SRoger Pau Monné 			break;
278bf7313e3SRoger Pau Monné 		}
279bf7313e3SRoger Pau Monné 
280bf7313e3SRoger Pau Monné 		map = &td->td_proc->p_vmspace->vm_map;
281bf7313e3SRoger Pau Monné 		error = vm_map_lookup(&map, mmap->addr, VM_PROT_NONE, &entry,
282288b2385SRoger Pau Monné 		    &mem, &pindex, &prot, &wired);
283bf7313e3SRoger Pau Monné 		if (error != KERN_SUCCESS) {
284bf7313e3SRoger Pau Monné 			error = EINVAL;
285bf7313e3SRoger Pau Monné 			break;
286bf7313e3SRoger Pau Monné 		}
287bf7313e3SRoger Pau Monné 		if ((entry->start != mmap->addr) ||
288bf7313e3SRoger Pau Monné 		    (entry->end != mmap->addr + (mmap->num * PAGE_SIZE))) {
289bf7313e3SRoger Pau Monné 			vm_map_lookup_done(map, entry);
290bf7313e3SRoger Pau Monné 			error = EINVAL;
291bf7313e3SRoger Pau Monné 			break;
292bf7313e3SRoger Pau Monné 		}
293bf7313e3SRoger Pau Monné 		vm_map_lookup_done(map, entry);
294bf7313e3SRoger Pau Monné 		if ((mem->type != OBJT_MGTDEVICE) ||
295bf7313e3SRoger Pau Monné 		    (mem->un_pager.devp.ops != &privcmd_pg_ops)) {
296bf7313e3SRoger Pau Monné 			error = EINVAL;
297bf7313e3SRoger Pau Monné 			break;
298bf7313e3SRoger Pau Monné 		}
299bf7313e3SRoger Pau Monné 		umap = mem->handle;
300bf7313e3SRoger Pau Monné 
301bf7313e3SRoger Pau Monné 		add.domid = DOMID_SELF;
302bf7313e3SRoger Pau Monné 		add.space = XENMAPSPACE_gmfn_foreign;
303bf7313e3SRoger Pau Monné 		add.foreign_domid = mmap->dom;
304bf7313e3SRoger Pau Monné 
305288b2385SRoger Pau Monné 		/*
306288b2385SRoger Pau Monné 		 * The 'size' field in the xen_add_to_physmap_range only
307288b2385SRoger Pau Monné 		 * allows for UINT16_MAX mappings in a single hypercall.
308288b2385SRoger Pau Monné 		 */
309288b2385SRoger Pau Monné 		num = MIN(mmap->num, UINT16_MAX);
310288b2385SRoger Pau Monné 
311288b2385SRoger Pau Monné 		idxs = malloc(sizeof(*idxs) * num, M_PRIVCMD, M_WAITOK);
312288b2385SRoger Pau Monné 		gpfns = malloc(sizeof(*gpfns) * num, M_PRIVCMD, M_WAITOK);
313288b2385SRoger Pau Monné 		errs = malloc(sizeof(*errs) * num, M_PRIVCMD, M_WAITOK);
314bf7313e3SRoger Pau Monné 
315bf7313e3SRoger Pau Monné 		set_xen_guest_handle(add.idxs, idxs);
316bf7313e3SRoger Pau Monné 		set_xen_guest_handle(add.gpfns, gpfns);
317bf7313e3SRoger Pau Monné 		set_xen_guest_handle(add.errs, errs);
318bf7313e3SRoger Pau Monné 
319288b2385SRoger Pau Monné 		/* Allocate a bitset to store broken page mappings. */
320288b2385SRoger Pau Monné 		umap->err = BITSET_ALLOC(mmap->num, M_PRIVCMD,
321288b2385SRoger Pau Monné 		    M_WAITOK | M_ZERO);
322288b2385SRoger Pau Monné 
323288b2385SRoger Pau Monné 		for (index = 0; index < mmap->num; index += num) {
324288b2385SRoger Pau Monné 			num = MIN(mmap->num - index, UINT16_MAX);
325288b2385SRoger Pau Monné 			add.size = num;
326288b2385SRoger Pau Monné 
327288b2385SRoger Pau Monné 			error = copyin(&mmap->arr[index], idxs,
328288b2385SRoger Pau Monné 			    sizeof(idxs[0]) * num);
329bf7313e3SRoger Pau Monné 			if (error != 0)
330bf7313e3SRoger Pau Monné 				goto mmap_out;
331bf7313e3SRoger Pau Monné 
332288b2385SRoger Pau Monné 			for (i = 0; i < num; i++)
333288b2385SRoger Pau Monné 				gpfns[i] = atop(umap->phys_base_addr +
334288b2385SRoger Pau Monné 				    (i + index) * PAGE_SIZE);
335bf7313e3SRoger Pau Monné 
336288b2385SRoger Pau Monné 			bzero(errs, sizeof(*errs) * num);
337288b2385SRoger Pau Monné 
338288b2385SRoger Pau Monné 			error = HYPERVISOR_memory_op(
339288b2385SRoger Pau Monné 			    XENMEM_add_to_physmap_range, &add);
340288b2385SRoger Pau Monné 			if (error != 0) {
341bf7313e3SRoger Pau Monné 				error = xen_translate_error(error);
342bf7313e3SRoger Pau Monné 				goto mmap_out;
343bf7313e3SRoger Pau Monné 			}
344bf7313e3SRoger Pau Monné 
345288b2385SRoger Pau Monné 			for (i = 0; i < num; i++) {
346288b2385SRoger Pau Monné 				if (errs[i] != 0) {
347bf7313e3SRoger Pau Monné 					errs[i] = xen_translate_error(errs[i]);
348288b2385SRoger Pau Monné 
349288b2385SRoger Pau Monné 					/* Mark the page as invalid. */
350288b2385SRoger Pau Monné 					BIT_SET(mmap->num, index + i,
351288b2385SRoger Pau Monné 					    umap->err);
352288b2385SRoger Pau Monné 				}
353bf7313e3SRoger Pau Monné 			}
354bf7313e3SRoger Pau Monné 
355288b2385SRoger Pau Monné 			error = copyout(errs, &mmap->err[index],
356288b2385SRoger Pau Monné 			    sizeof(errs[0]) * num);
357288b2385SRoger Pau Monné 			if (error != 0)
358288b2385SRoger Pau Monné 				goto mmap_out;
359288b2385SRoger Pau Monné 		}
360bf7313e3SRoger Pau Monné 
361288b2385SRoger Pau Monné 		umap->mapped = true;
362bf7313e3SRoger Pau Monné 
363bf7313e3SRoger Pau Monné mmap_out:
364bf7313e3SRoger Pau Monné 		free(idxs, M_PRIVCMD);
365bf7313e3SRoger Pau Monné 		free(gpfns, M_PRIVCMD);
366bf7313e3SRoger Pau Monné 		free(errs, M_PRIVCMD);
367288b2385SRoger Pau Monné 		if (!umap->mapped)
368288b2385SRoger Pau Monné 			free(umap->err, M_PRIVCMD);
369bf7313e3SRoger Pau Monné 
370bf7313e3SRoger Pau Monné 		break;
371bf7313e3SRoger Pau Monné 	}
372bf7313e3SRoger Pau Monné 
373bf7313e3SRoger Pau Monné 	default:
374bf7313e3SRoger Pau Monné 		error = ENOSYS;
375bf7313e3SRoger Pau Monné 		break;
376bf7313e3SRoger Pau Monné 	}
377bf7313e3SRoger Pau Monné 
378bf7313e3SRoger Pau Monné 	return (error);
379bf7313e3SRoger Pau Monné }
380bf7313e3SRoger Pau Monné 
381bf7313e3SRoger Pau Monné /*------------------ Private Device Attachment Functions  --------------------*/
382bf7313e3SRoger Pau Monné static void
383bf7313e3SRoger Pau Monné privcmd_identify(driver_t *driver, device_t parent)
384bf7313e3SRoger Pau Monné {
385bf7313e3SRoger Pau Monné 
386bf7313e3SRoger Pau Monné 	KASSERT(xen_domain(),
387bf7313e3SRoger Pau Monné 	    ("Trying to attach privcmd device on non Xen domain"));
388bf7313e3SRoger Pau Monné 
389bf7313e3SRoger Pau Monné 	if (BUS_ADD_CHILD(parent, 0, "privcmd", 0) == NULL)
390bf7313e3SRoger Pau Monné 		panic("unable to attach privcmd user-space device");
391bf7313e3SRoger Pau Monné }
392bf7313e3SRoger Pau Monné 
393bf7313e3SRoger Pau Monné static int
394bf7313e3SRoger Pau Monné privcmd_probe(device_t dev)
395bf7313e3SRoger Pau Monné {
396bf7313e3SRoger Pau Monné 
397bf7313e3SRoger Pau Monné 	privcmd_dev = dev;
398bf7313e3SRoger Pau Monné 	device_set_desc(dev, "Xen privileged interface user-space device");
399bf7313e3SRoger Pau Monné 	return (BUS_PROBE_NOWILDCARD);
400bf7313e3SRoger Pau Monné }
401bf7313e3SRoger Pau Monné 
402bf7313e3SRoger Pau Monné static int
403bf7313e3SRoger Pau Monné privcmd_attach(device_t dev)
404bf7313e3SRoger Pau Monné {
405bf7313e3SRoger Pau Monné 
406bf7313e3SRoger Pau Monné 	make_dev_credf(MAKEDEV_ETERNAL, &privcmd_devsw, 0, NULL, UID_ROOT,
407bf7313e3SRoger Pau Monné 	    GID_WHEEL, 0600, "xen/privcmd");
408bf7313e3SRoger Pau Monné 	return (0);
409bf7313e3SRoger Pau Monné }
410bf7313e3SRoger Pau Monné 
411bf7313e3SRoger Pau Monné /*-------------------- Private Device Attachment Data  -----------------------*/
412bf7313e3SRoger Pau Monné static device_method_t privcmd_methods[] = {
413bf7313e3SRoger Pau Monné 	DEVMETHOD(device_identify,	privcmd_identify),
414bf7313e3SRoger Pau Monné 	DEVMETHOD(device_probe,		privcmd_probe),
415bf7313e3SRoger Pau Monné 	DEVMETHOD(device_attach,	privcmd_attach),
416bf7313e3SRoger Pau Monné 
417bf7313e3SRoger Pau Monné 	DEVMETHOD_END
418bf7313e3SRoger Pau Monné };
419bf7313e3SRoger Pau Monné 
420bf7313e3SRoger Pau Monné static driver_t privcmd_driver = {
421bf7313e3SRoger Pau Monné 	"privcmd",
422bf7313e3SRoger Pau Monné 	privcmd_methods,
423bf7313e3SRoger Pau Monné 	0,
424bf7313e3SRoger Pau Monné };
425bf7313e3SRoger Pau Monné 
426bf7313e3SRoger Pau Monné devclass_t privcmd_devclass;
427bf7313e3SRoger Pau Monné 
428bf7313e3SRoger Pau Monné DRIVER_MODULE(privcmd, xenpv, privcmd_driver, privcmd_devclass, 0, 0);
429bf7313e3SRoger Pau Monné MODULE_DEPEND(privcmd, xenpv, 1, 1, 1);
430