xref: /freebsd/lib/libvmmapi/vmmapi.c (revision 23a28fe7776f6d76643a6ac16758d114dfbbeec2)
1366f6083SPeter Grehan /*-
24d846d26SWarner Losh  * SPDX-License-Identifier: BSD-2-Clause
35e53a4f9SPedro F. Giffuni  *
4366f6083SPeter Grehan  * Copyright (c) 2011 NetApp, Inc.
5366f6083SPeter Grehan  * All rights reserved.
6366f6083SPeter Grehan  *
7366f6083SPeter Grehan  * Redistribution and use in source and binary forms, with or without
8366f6083SPeter Grehan  * modification, are permitted provided that the following conditions
9366f6083SPeter Grehan  * are met:
10366f6083SPeter Grehan  * 1. Redistributions of source code must retain the above copyright
11366f6083SPeter Grehan  *    notice, this list of conditions and the following disclaimer.
12366f6083SPeter Grehan  * 2. Redistributions in binary form must reproduce the above copyright
13366f6083SPeter Grehan  *    notice, this list of conditions and the following disclaimer in the
14366f6083SPeter Grehan  *    documentation and/or other materials provided with the distribution.
15366f6083SPeter Grehan  *
16366f6083SPeter Grehan  * THIS SOFTWARE IS PROVIDED BY NETAPP, INC ``AS IS'' AND
17366f6083SPeter Grehan  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18366f6083SPeter Grehan  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19366f6083SPeter Grehan  * ARE DISCLAIMED.  IN NO EVENT SHALL NETAPP, INC OR CONTRIBUTORS BE LIABLE
20366f6083SPeter Grehan  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
21366f6083SPeter Grehan  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
22366f6083SPeter Grehan  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
23366f6083SPeter Grehan  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
24366f6083SPeter Grehan  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
25366f6083SPeter Grehan  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26366f6083SPeter Grehan  * SUCH DAMAGE.
27366f6083SPeter Grehan  */
28366f6083SPeter Grehan 
2995ebc360SNeel Natu #include <sys/param.h>
303e9b4532SMark Johnston #include <sys/capsicum.h>
31366f6083SPeter Grehan #include <sys/sysctl.h>
32366f6083SPeter Grehan #include <sys/ioctl.h>
33366f6083SPeter Grehan #include <sys/mman.h>
34967264cfSMark Johnston #include <sys/linker.h>
35a71dc724SMarcelo Araujo #include <sys/module.h>
366303b65dSNeel Natu #include <sys/_iovec.h>
3795ebc360SNeel Natu #include <sys/cpuset.h>
38366f6083SPeter Grehan 
393e9b4532SMark Johnston #include <capsicum_helpers.h>
4099127fd1SMark Johnston #include <err.h>
419c4d5478SNeel Natu #include <errno.h>
42483d953aSJohn Baldwin #include <stdbool.h>
43366f6083SPeter Grehan #include <stdio.h>
44366f6083SPeter Grehan #include <stdlib.h>
45366f6083SPeter Grehan #include <assert.h>
46366f6083SPeter Grehan #include <string.h>
47366f6083SPeter Grehan #include <fcntl.h>
48366f6083SPeter Grehan #include <unistd.h>
49366f6083SPeter Grehan 
50200758f1SNeel Natu #include <libutil.h>
51200758f1SNeel Natu 
52483d953aSJohn Baldwin #include <vm/vm.h>
53366f6083SPeter Grehan #include <machine/vmm.h>
5456a26fc1SMark Johnston #ifdef WITH_VMMAPI_SNAPSHOT
55483d953aSJohn Baldwin #include <machine/vmm_snapshot.h>
5656a26fc1SMark Johnston #endif
57366f6083SPeter Grehan 
5899127fd1SMark Johnston #include <dev/vmm/vmm_dev.h>
5999127fd1SMark Johnston 
60366f6083SPeter Grehan #include "vmmapi.h"
617d9ef309SJohn Baldwin #include "internal.h"
62366f6083SPeter Grehan 
63200758f1SNeel Natu #define	MB	(1024 * 1024UL)
64b060ba50SNeel Natu #define	GB	(1024 * 1024 * 1024UL)
65b060ba50SNeel Natu 
665ec6c300SMark Johnston #ifdef __amd64__
677e0fa794SMark Johnston #define	VM_LOWMEM_LIMIT	(3 * GB)
685ec6c300SMark Johnston #else
695ec6c300SMark Johnston #define	VM_LOWMEM_LIMIT	0
705ec6c300SMark Johnston #endif
717e0fa794SMark Johnston #define	VM_HIGHMEM_BASE	(4 * GB)
727e0fa794SMark Johnston 
739b1aa8d6SNeel Natu /*
749b1aa8d6SNeel Natu  * Size of the guard region before and after the virtual address space
759b1aa8d6SNeel Natu  * mapping the guest physical memory. This must be a multiple of the
769b1aa8d6SNeel Natu  * superpage size for performance reasons.
779b1aa8d6SNeel Natu  */
789b1aa8d6SNeel Natu #define	VM_MMAP_GUARD_SIZE	(4 * MB)
799b1aa8d6SNeel Natu 
809b1aa8d6SNeel Natu #define	PROT_RW		(PROT_READ | PROT_WRITE)
819b1aa8d6SNeel Natu #define	PROT_ALL	(PROT_READ | PROT_WRITE | PROT_EXEC)
829b1aa8d6SNeel Natu 
83366f6083SPeter Grehan static int
vm_device_open(const char * name)84366f6083SPeter Grehan vm_device_open(const char *name)
85366f6083SPeter Grehan {
8699127fd1SMark Johnston 	char devpath[PATH_MAX];
87366f6083SPeter Grehan 
8899127fd1SMark Johnston 	assert(strlen(name) <= VM_MAX_NAMELEN);
8999127fd1SMark Johnston 	(void)snprintf(devpath, sizeof(devpath), "/dev/vmm/%s", name);
9099127fd1SMark Johnston 	return (open(devpath, O_RDWR));
9199127fd1SMark Johnston }
92366f6083SPeter Grehan 
9399127fd1SMark Johnston static int
vm_ctl_open(void)94*23a28fe7SMark Johnston vm_ctl_open(void)
95*23a28fe7SMark Johnston {
96*23a28fe7SMark Johnston 	if (modfind("vmm") < 0)
97*23a28fe7SMark Johnston 		(void)kldload("vmm");
98*23a28fe7SMark Johnston 	return (open("/dev/vmmctl", O_RDWR, 0));
99*23a28fe7SMark Johnston }
100*23a28fe7SMark Johnston 
101*23a28fe7SMark Johnston static int
vm_ctl_create(const char * name,int ctlfd)10299127fd1SMark Johnston vm_ctl_create(const char *name, int ctlfd)
10399127fd1SMark Johnston {
10499127fd1SMark Johnston 	struct vmmctl_vm_create vmc;
105366f6083SPeter Grehan 
10699127fd1SMark Johnston 	memset(&vmc, 0, sizeof(vmc));
10799127fd1SMark Johnston 	if (strlcpy(vmc.name, name, sizeof(vmc.name)) >= sizeof(vmc.name)) {
10899127fd1SMark Johnston 		errno = ENAMETOOLONG;
10999127fd1SMark Johnston 		return (-1);
11099127fd1SMark Johnston 	}
11199127fd1SMark Johnston 	return (ioctl(ctlfd, VMMCTL_VM_CREATE, &vmc));
112366f6083SPeter Grehan }
113366f6083SPeter Grehan 
114366f6083SPeter Grehan int
vm_create(const char * name)115366f6083SPeter Grehan vm_create(const char *name)
116366f6083SPeter Grehan {
11799127fd1SMark Johnston 	int error, fd;
11899127fd1SMark Johnston 
119*23a28fe7SMark Johnston 	fd = vm_ctl_open();
12099127fd1SMark Johnston 	if (fd < 0)
121*23a28fe7SMark Johnston 		return (-1);
122*23a28fe7SMark Johnston 
12399127fd1SMark Johnston 	error = vm_ctl_create(name, fd);
12499127fd1SMark Johnston 	if (error != 0) {
12599127fd1SMark Johnston 		error = errno;
12699127fd1SMark Johnston 		(void)close(fd);
12799127fd1SMark Johnston 		errno = error;
12899127fd1SMark Johnston 		return (-1);
12999127fd1SMark Johnston 	}
13099127fd1SMark Johnston 	(void)close(fd);
13199127fd1SMark Johnston 	return (0);
132366f6083SPeter Grehan }
133366f6083SPeter Grehan 
134366f6083SPeter Grehan struct vmctx *
vm_open(const char * name)135366f6083SPeter Grehan vm_open(const char *name)
136366f6083SPeter Grehan {
13799127fd1SMark Johnston 	return (vm_openf(name, 0));
13899127fd1SMark Johnston }
13999127fd1SMark Johnston 
14099127fd1SMark Johnston struct vmctx *
vm_openf(const char * name,int flags)14199127fd1SMark Johnston vm_openf(const char *name, int flags)
14299127fd1SMark Johnston {
143366f6083SPeter Grehan 	struct vmctx *vm;
144a7f81b48SRobert Wing 	int saved_errno;
14599127fd1SMark Johnston 	bool created;
14699127fd1SMark Johnston 
14799127fd1SMark Johnston 	created = false;
148366f6083SPeter Grehan 
149366f6083SPeter Grehan 	vm = malloc(sizeof(struct vmctx) + strlen(name) + 1);
150366f6083SPeter Grehan 	assert(vm != NULL);
151366f6083SPeter Grehan 
15299127fd1SMark Johnston 	vm->fd = vm->ctlfd = -1;
1530dd10c00SNeel Natu 	vm->memflags = 0;
154366f6083SPeter Grehan 	vm->name = (char *)(vm + 1);
155366f6083SPeter Grehan 	strcpy(vm->name, name);
1567e0fa794SMark Johnston 	memset(vm->memsegs, 0, sizeof(vm->memsegs));
157366f6083SPeter Grehan 
158*23a28fe7SMark Johnston 	if ((vm->ctlfd = vm_ctl_open()) < 0)
15999127fd1SMark Johnston 		goto err;
16099127fd1SMark Johnston 
16199127fd1SMark Johnston 	vm->fd = vm_device_open(vm->name);
16299127fd1SMark Johnston 	if (vm->fd < 0 && errno == ENOENT) {
16399127fd1SMark Johnston 		if (flags & VMMAPI_OPEN_CREATE) {
16499127fd1SMark Johnston 			if (vm_ctl_create(vm->name, vm->ctlfd) != 0)
16599127fd1SMark Johnston 				goto err;
16699127fd1SMark Johnston 			vm->fd = vm_device_open(vm->name);
16799127fd1SMark Johnston 			created = true;
16899127fd1SMark Johnston 		}
16999127fd1SMark Johnston 	}
17099127fd1SMark Johnston 	if (vm->fd < 0)
17199127fd1SMark Johnston 		goto err;
17299127fd1SMark Johnston 
17399127fd1SMark Johnston 	if (!created && (flags & VMMAPI_OPEN_REINIT) != 0 && vm_reinit(vm) != 0)
174366f6083SPeter Grehan 		goto err;
175366f6083SPeter Grehan 
176366f6083SPeter Grehan 	return (vm);
177366f6083SPeter Grehan err:
178a7f81b48SRobert Wing 	saved_errno = errno;
17999127fd1SMark Johnston 	if (created)
18099127fd1SMark Johnston 		vm_destroy(vm);
18199127fd1SMark Johnston 	else
18299127fd1SMark Johnston 		vm_close(vm);
183a7f81b48SRobert Wing 	errno = saved_errno;
184366f6083SPeter Grehan 	return (NULL);
185366f6083SPeter Grehan }
186366f6083SPeter Grehan 
187366f6083SPeter Grehan void
vm_close(struct vmctx * vm)188f0880ab7SVitaliy Gusev vm_close(struct vmctx *vm)
189f0880ab7SVitaliy Gusev {
190f0880ab7SVitaliy Gusev 	assert(vm != NULL);
191f0880ab7SVitaliy Gusev 
19299127fd1SMark Johnston 	if (vm->fd >= 0)
19399127fd1SMark Johnston 		(void)close(vm->fd);
19499127fd1SMark Johnston 	if (vm->ctlfd >= 0)
19599127fd1SMark Johnston 		(void)close(vm->ctlfd);
196f0880ab7SVitaliy Gusev 	free(vm);
197f0880ab7SVitaliy Gusev }
198f0880ab7SVitaliy Gusev 
199f0880ab7SVitaliy Gusev void
vm_destroy(struct vmctx * vm)200366f6083SPeter Grehan vm_destroy(struct vmctx *vm)
201366f6083SPeter Grehan {
20299127fd1SMark Johnston 	struct vmmctl_vm_destroy vmd;
203366f6083SPeter Grehan 
20499127fd1SMark Johnston 	memset(&vmd, 0, sizeof(vmd));
20599127fd1SMark Johnston 	(void)strlcpy(vmd.name, vm->name, sizeof(vmd.name));
20699127fd1SMark Johnston 	if (ioctl(vm->ctlfd, VMMCTL_VM_DESTROY, &vmd) != 0)
20799127fd1SMark Johnston 		warn("ioctl(VMMCTL_VM_DESTROY)");
208f7d51510SNeel Natu 
20999127fd1SMark Johnston 	vm_close(vm);
210366f6083SPeter Grehan }
211366f6083SPeter Grehan 
2127d9ef309SJohn Baldwin struct vcpu *
vm_vcpu_open(struct vmctx * ctx,int vcpuid)2137d9ef309SJohn Baldwin vm_vcpu_open(struct vmctx *ctx, int vcpuid)
2147d9ef309SJohn Baldwin {
2157d9ef309SJohn Baldwin 	struct vcpu *vcpu;
2167d9ef309SJohn Baldwin 
2177d9ef309SJohn Baldwin 	vcpu = malloc(sizeof(*vcpu));
2187d9ef309SJohn Baldwin 	vcpu->ctx = ctx;
2197d9ef309SJohn Baldwin 	vcpu->vcpuid = vcpuid;
2207d9ef309SJohn Baldwin 	return (vcpu);
2217d9ef309SJohn Baldwin }
2227d9ef309SJohn Baldwin 
2237d9ef309SJohn Baldwin void
vm_vcpu_close(struct vcpu * vcpu)2247d9ef309SJohn Baldwin vm_vcpu_close(struct vcpu *vcpu)
2257d9ef309SJohn Baldwin {
2267d9ef309SJohn Baldwin 	free(vcpu);
2277d9ef309SJohn Baldwin }
2287d9ef309SJohn Baldwin 
2297d9ef309SJohn Baldwin int
vcpu_id(struct vcpu * vcpu)2307d9ef309SJohn Baldwin vcpu_id(struct vcpu *vcpu)
2317d9ef309SJohn Baldwin {
2327d9ef309SJohn Baldwin 	return (vcpu->vcpuid);
2337d9ef309SJohn Baldwin }
2347d9ef309SJohn Baldwin 
235366f6083SPeter Grehan int
vm_parse_memsize(const char * opt,size_t * ret_memsize)23645cd18ecSMark Johnston vm_parse_memsize(const char *opt, size_t *ret_memsize)
237200758f1SNeel Natu {
238200758f1SNeel Natu 	char *endptr;
239200758f1SNeel Natu 	size_t optval;
240200758f1SNeel Natu 	int error;
241200758f1SNeel Natu 
24245cd18ecSMark Johnston 	optval = strtoul(opt, &endptr, 0);
24345cd18ecSMark Johnston 	if (*opt != '\0' && *endptr == '\0') {
244200758f1SNeel Natu 		/*
245200758f1SNeel Natu 		 * For the sake of backward compatibility if the memory size
246200758f1SNeel Natu 		 * specified on the command line is less than a megabyte then
247200758f1SNeel Natu 		 * it is interpreted as being in units of MB.
248200758f1SNeel Natu 		 */
249200758f1SNeel Natu 		if (optval < MB)
250200758f1SNeel Natu 			optval *= MB;
251200758f1SNeel Natu 		*ret_memsize = optval;
252200758f1SNeel Natu 		error = 0;
253200758f1SNeel Natu 	} else
25445cd18ecSMark Johnston 		error = expand_number(opt, ret_memsize);
255200758f1SNeel Natu 
256200758f1SNeel Natu 	return (error);
257200758f1SNeel Natu }
258200758f1SNeel Natu 
259b060ba50SNeel Natu uint32_t
vm_get_lowmem_limit(struct vmctx * ctx __unused)2607e0fa794SMark Johnston vm_get_lowmem_limit(struct vmctx *ctx __unused)
261b060ba50SNeel Natu {
262b060ba50SNeel Natu 
2637e0fa794SMark Johnston 	return (VM_LOWMEM_LIMIT);
264b060ba50SNeel Natu }
265b060ba50SNeel Natu 
2660dd10c00SNeel Natu void
vm_set_memflags(struct vmctx * ctx,int flags)2670dd10c00SNeel Natu vm_set_memflags(struct vmctx *ctx, int flags)
2680dd10c00SNeel Natu {
2690dd10c00SNeel Natu 
2700dd10c00SNeel Natu 	ctx->memflags = flags;
2710dd10c00SNeel Natu }
2720dd10c00SNeel Natu 
2739b1aa8d6SNeel Natu int
vm_get_memflags(struct vmctx * ctx)2749b1aa8d6SNeel Natu vm_get_memflags(struct vmctx *ctx)
275366f6083SPeter Grehan {
2769b1aa8d6SNeel Natu 
2779b1aa8d6SNeel Natu 	return (ctx->memflags);
2789b1aa8d6SNeel Natu }
279366f6083SPeter Grehan 
280366f6083SPeter Grehan /*
2819b1aa8d6SNeel Natu  * Map segment 'segid' starting at 'off' into guest address range [gpa,gpa+len).
282366f6083SPeter Grehan  */
2839b1aa8d6SNeel Natu int
vm_mmap_memseg(struct vmctx * ctx,vm_paddr_t gpa,int segid,vm_ooffset_t off,size_t len,int prot)2849b1aa8d6SNeel Natu vm_mmap_memseg(struct vmctx *ctx, vm_paddr_t gpa, int segid, vm_ooffset_t off,
2859b1aa8d6SNeel Natu     size_t len, int prot)
2869b1aa8d6SNeel Natu {
2879b1aa8d6SNeel Natu 	struct vm_memmap memmap;
2889b1aa8d6SNeel Natu 	int error, flags;
2899b1aa8d6SNeel Natu 
2909b1aa8d6SNeel Natu 	memmap.gpa = gpa;
2919b1aa8d6SNeel Natu 	memmap.segid = segid;
2929b1aa8d6SNeel Natu 	memmap.segoff = off;
2939b1aa8d6SNeel Natu 	memmap.len = len;
2949b1aa8d6SNeel Natu 	memmap.prot = prot;
2959b1aa8d6SNeel Natu 	memmap.flags = 0;
2969b1aa8d6SNeel Natu 
2979b1aa8d6SNeel Natu 	if (ctx->memflags & VM_MEM_F_WIRED)
2989b1aa8d6SNeel Natu 		memmap.flags |= VM_MEMMAP_F_WIRED;
2999b1aa8d6SNeel Natu 
3009b1aa8d6SNeel Natu 	/*
3019b1aa8d6SNeel Natu 	 * If this mapping already exists then don't create it again. This
3029b1aa8d6SNeel Natu 	 * is the common case for SYSMEM mappings created by bhyveload(8).
3039b1aa8d6SNeel Natu 	 */
3049b1aa8d6SNeel Natu 	error = vm_mmap_getnext(ctx, &gpa, &segid, &off, &len, &prot, &flags);
3059b1aa8d6SNeel Natu 	if (error == 0 && gpa == memmap.gpa) {
3069b1aa8d6SNeel Natu 		if (segid != memmap.segid || off != memmap.segoff ||
3079b1aa8d6SNeel Natu 		    prot != memmap.prot || flags != memmap.flags) {
3089b1aa8d6SNeel Natu 			errno = EEXIST;
3099b1aa8d6SNeel Natu 			return (-1);
3109b1aa8d6SNeel Natu 		} else {
3119b1aa8d6SNeel Natu 			return (0);
3129b1aa8d6SNeel Natu 		}
3139b1aa8d6SNeel Natu 	}
3149b1aa8d6SNeel Natu 
3159b1aa8d6SNeel Natu 	error = ioctl(ctx->fd, VM_MMAP_MEMSEG, &memmap);
3169b1aa8d6SNeel Natu 	return (error);
3179b1aa8d6SNeel Natu }
3189b1aa8d6SNeel Natu 
3199b1aa8d6SNeel Natu int
vm_get_guestmem_from_ctx(struct vmctx * ctx,char ** guest_baseaddr,size_t * lowmem_size,size_t * highmem_size)320483d953aSJohn Baldwin vm_get_guestmem_from_ctx(struct vmctx *ctx, char **guest_baseaddr,
321483d953aSJohn Baldwin     size_t *lowmem_size, size_t *highmem_size)
322483d953aSJohn Baldwin {
323483d953aSJohn Baldwin 
324483d953aSJohn Baldwin 	*guest_baseaddr = ctx->baseaddr;
3257e0fa794SMark Johnston 	*lowmem_size = ctx->memsegs[VM_MEMSEG_LOW].size;
3267e0fa794SMark Johnston 	*highmem_size = ctx->memsegs[VM_MEMSEG_HIGH].size;
327483d953aSJohn Baldwin 	return (0);
328483d953aSJohn Baldwin }
329483d953aSJohn Baldwin 
330483d953aSJohn Baldwin int
vm_munmap_memseg(struct vmctx * ctx,vm_paddr_t gpa,size_t len)331f8a6ec2dSD Scott Phillips vm_munmap_memseg(struct vmctx *ctx, vm_paddr_t gpa, size_t len)
332f8a6ec2dSD Scott Phillips {
333f8a6ec2dSD Scott Phillips 	struct vm_munmap munmap;
334f8a6ec2dSD Scott Phillips 	int error;
335f8a6ec2dSD Scott Phillips 
336f8a6ec2dSD Scott Phillips 	munmap.gpa = gpa;
337f8a6ec2dSD Scott Phillips 	munmap.len = len;
338f8a6ec2dSD Scott Phillips 
339f8a6ec2dSD Scott Phillips 	error = ioctl(ctx->fd, VM_MUNMAP_MEMSEG, &munmap);
340f8a6ec2dSD Scott Phillips 	return (error);
341f8a6ec2dSD Scott Phillips }
342f8a6ec2dSD Scott Phillips 
343f8a6ec2dSD Scott Phillips int
vm_mmap_getnext(struct vmctx * ctx,vm_paddr_t * gpa,int * segid,vm_ooffset_t * segoff,size_t * len,int * prot,int * flags)3449b1aa8d6SNeel Natu vm_mmap_getnext(struct vmctx *ctx, vm_paddr_t *gpa, int *segid,
3459b1aa8d6SNeel Natu     vm_ooffset_t *segoff, size_t *len, int *prot, int *flags)
3469b1aa8d6SNeel Natu {
3479b1aa8d6SNeel Natu 	struct vm_memmap memmap;
3489b1aa8d6SNeel Natu 	int error;
3499b1aa8d6SNeel Natu 
3509b1aa8d6SNeel Natu 	bzero(&memmap, sizeof(struct vm_memmap));
3519b1aa8d6SNeel Natu 	memmap.gpa = *gpa;
3529b1aa8d6SNeel Natu 	error = ioctl(ctx->fd, VM_MMAP_GETNEXT, &memmap);
3539b1aa8d6SNeel Natu 	if (error == 0) {
3549b1aa8d6SNeel Natu 		*gpa = memmap.gpa;
3559b1aa8d6SNeel Natu 		*segid = memmap.segid;
3569b1aa8d6SNeel Natu 		*segoff = memmap.segoff;
3579b1aa8d6SNeel Natu 		*len = memmap.len;
3589b1aa8d6SNeel Natu 		*prot = memmap.prot;
3599b1aa8d6SNeel Natu 		*flags = memmap.flags;
360366f6083SPeter Grehan 	}
361366f6083SPeter Grehan 	return (error);
362366f6083SPeter Grehan }
363366f6083SPeter Grehan 
3649b1aa8d6SNeel Natu /*
3659b1aa8d6SNeel Natu  * Return 0 if the segments are identical and non-zero otherwise.
3669b1aa8d6SNeel Natu  *
3679b1aa8d6SNeel Natu  * This is slightly complicated by the fact that only device memory segments
3689b1aa8d6SNeel Natu  * are named.
3699b1aa8d6SNeel Natu  */
3709b1aa8d6SNeel Natu static int
cmpseg(size_t len,const char * str,size_t len2,const char * str2)3719b1aa8d6SNeel Natu cmpseg(size_t len, const char *str, size_t len2, const char *str2)
3729b1aa8d6SNeel Natu {
3739b1aa8d6SNeel Natu 
3749b1aa8d6SNeel Natu 	if (len == len2) {
3759b1aa8d6SNeel Natu 		if ((!str && !str2) || (str && str2 && !strcmp(str, str2)))
3769b1aa8d6SNeel Natu 			return (0);
3779b1aa8d6SNeel Natu 	}
3789b1aa8d6SNeel Natu 	return (-1);
3799b1aa8d6SNeel Natu }
3809b1aa8d6SNeel Natu 
3819b1aa8d6SNeel Natu static int
vm_alloc_memseg(struct vmctx * ctx,int segid,size_t len,const char * name)3829b1aa8d6SNeel Natu vm_alloc_memseg(struct vmctx *ctx, int segid, size_t len, const char *name)
3839b1aa8d6SNeel Natu {
3849b1aa8d6SNeel Natu 	struct vm_memseg memseg;
3859b1aa8d6SNeel Natu 	size_t n;
3869b1aa8d6SNeel Natu 	int error;
3879b1aa8d6SNeel Natu 
3889b1aa8d6SNeel Natu 	/*
3899b1aa8d6SNeel Natu 	 * If the memory segment has already been created then just return.
3909b1aa8d6SNeel Natu 	 * This is the usual case for the SYSMEM segment created by userspace
3919b1aa8d6SNeel Natu 	 * loaders like bhyveload(8).
3929b1aa8d6SNeel Natu 	 */
3939b1aa8d6SNeel Natu 	error = vm_get_memseg(ctx, segid, &memseg.len, memseg.name,
3949b1aa8d6SNeel Natu 	    sizeof(memseg.name));
3959b1aa8d6SNeel Natu 	if (error)
3969b1aa8d6SNeel Natu 		return (error);
3979b1aa8d6SNeel Natu 
3989b1aa8d6SNeel Natu 	if (memseg.len != 0) {
3999b1aa8d6SNeel Natu 		if (cmpseg(len, name, memseg.len, VM_MEMSEG_NAME(&memseg))) {
4009b1aa8d6SNeel Natu 			errno = EINVAL;
4019b1aa8d6SNeel Natu 			return (-1);
4029b1aa8d6SNeel Natu 		} else {
4039b1aa8d6SNeel Natu 			return (0);
4049b1aa8d6SNeel Natu 		}
4059b1aa8d6SNeel Natu 	}
4069b1aa8d6SNeel Natu 
4079b1aa8d6SNeel Natu 	bzero(&memseg, sizeof(struct vm_memseg));
4089b1aa8d6SNeel Natu 	memseg.segid = segid;
4099b1aa8d6SNeel Natu 	memseg.len = len;
4109b1aa8d6SNeel Natu 	if (name != NULL) {
4119b1aa8d6SNeel Natu 		n = strlcpy(memseg.name, name, sizeof(memseg.name));
4129b1aa8d6SNeel Natu 		if (n >= sizeof(memseg.name)) {
4139b1aa8d6SNeel Natu 			errno = ENAMETOOLONG;
4149b1aa8d6SNeel Natu 			return (-1);
4159b1aa8d6SNeel Natu 		}
4169b1aa8d6SNeel Natu 	}
4179b1aa8d6SNeel Natu 
4189b1aa8d6SNeel Natu 	error = ioctl(ctx->fd, VM_ALLOC_MEMSEG, &memseg);
4199b1aa8d6SNeel Natu 	return (error);
4209b1aa8d6SNeel Natu }
4219b1aa8d6SNeel Natu 
4229b1aa8d6SNeel Natu int
vm_get_memseg(struct vmctx * ctx,int segid,size_t * lenp,char * namebuf,size_t bufsize)4239b1aa8d6SNeel Natu vm_get_memseg(struct vmctx *ctx, int segid, size_t *lenp, char *namebuf,
4249b1aa8d6SNeel Natu     size_t bufsize)
4259b1aa8d6SNeel Natu {
4269b1aa8d6SNeel Natu 	struct vm_memseg memseg;
4279b1aa8d6SNeel Natu 	size_t n;
4289b1aa8d6SNeel Natu 	int error;
4299b1aa8d6SNeel Natu 
430e499fdcbSMark Johnston 	bzero(&memseg, sizeof(memseg));
4319b1aa8d6SNeel Natu 	memseg.segid = segid;
4329b1aa8d6SNeel Natu 	error = ioctl(ctx->fd, VM_GET_MEMSEG, &memseg);
4339b1aa8d6SNeel Natu 	if (error == 0) {
4349b1aa8d6SNeel Natu 		*lenp = memseg.len;
4359b1aa8d6SNeel Natu 		n = strlcpy(namebuf, memseg.name, bufsize);
4369b1aa8d6SNeel Natu 		if (n >= bufsize) {
4379b1aa8d6SNeel Natu 			errno = ENAMETOOLONG;
4389b1aa8d6SNeel Natu 			error = -1;
4399b1aa8d6SNeel Natu 		}
4409b1aa8d6SNeel Natu 	}
4419b1aa8d6SNeel Natu 	return (error);
4429b1aa8d6SNeel Natu }
4439b1aa8d6SNeel Natu 
4449b1aa8d6SNeel Natu static int
setup_memory_segment(struct vmctx * ctx,vm_paddr_t gpa,size_t len,char * base)4459b1aa8d6SNeel Natu setup_memory_segment(struct vmctx *ctx, vm_paddr_t gpa, size_t len, char *base)
4469b1aa8d6SNeel Natu {
4479b1aa8d6SNeel Natu 	char *ptr;
4489b1aa8d6SNeel Natu 	int error, flags;
4499b1aa8d6SNeel Natu 
4509b1aa8d6SNeel Natu 	/* Map 'len' bytes starting at 'gpa' in the guest address space */
4519b1aa8d6SNeel Natu 	error = vm_mmap_memseg(ctx, gpa, VM_SYSMEM, gpa, len, PROT_ALL);
4529b1aa8d6SNeel Natu 	if (error)
4539b1aa8d6SNeel Natu 		return (error);
4549b1aa8d6SNeel Natu 
4559b1aa8d6SNeel Natu 	flags = MAP_SHARED | MAP_FIXED;
4569b1aa8d6SNeel Natu 	if ((ctx->memflags & VM_MEM_F_INCORE) == 0)
4579b1aa8d6SNeel Natu 		flags |= MAP_NOCORE;
4589b1aa8d6SNeel Natu 
4599b1aa8d6SNeel Natu 	/* mmap into the process address space on the host */
4609b1aa8d6SNeel Natu 	ptr = mmap(base + gpa, len, PROT_RW, flags, ctx->fd, gpa);
4619b1aa8d6SNeel Natu 	if (ptr == MAP_FAILED)
4629b1aa8d6SNeel Natu 		return (-1);
4639b1aa8d6SNeel Natu 
4649b1aa8d6SNeel Natu 	return (0);
4659b1aa8d6SNeel Natu }
4669b1aa8d6SNeel Natu 
467b060ba50SNeel Natu int
vm_setup_memory(struct vmctx * ctx,size_t memsize,enum vm_mmap_style vms)468b060ba50SNeel Natu vm_setup_memory(struct vmctx *ctx, size_t memsize, enum vm_mmap_style vms)
469b060ba50SNeel Natu {
4709b1aa8d6SNeel Natu 	size_t objsize, len;
4719b1aa8d6SNeel Natu 	vm_paddr_t gpa;
4729b1aa8d6SNeel Natu 	char *baseaddr, *ptr;
4736a9648b5SJohn Baldwin 	int error;
474b060ba50SNeel Natu 
4759b1aa8d6SNeel Natu 	assert(vms == VM_MMAP_ALL);
476b060ba50SNeel Natu 
477b060ba50SNeel Natu 	/*
4787e0fa794SMark Johnston 	 * If 'memsize' cannot fit entirely in the 'lowmem' segment then create
4797e0fa794SMark Johnston 	 * another 'highmem' segment above VM_HIGHMEM_BASE for the remainder.
480b060ba50SNeel Natu 	 */
4817e0fa794SMark Johnston 	if (memsize > VM_LOWMEM_LIMIT) {
4827e0fa794SMark Johnston 		ctx->memsegs[VM_MEMSEG_LOW].size = VM_LOWMEM_LIMIT;
4837e0fa794SMark Johnston 		ctx->memsegs[VM_MEMSEG_HIGH].size = memsize - VM_LOWMEM_LIMIT;
4847e0fa794SMark Johnston 		objsize = VM_HIGHMEM_BASE + ctx->memsegs[VM_MEMSEG_HIGH].size;
485b060ba50SNeel Natu 	} else {
4867e0fa794SMark Johnston 		ctx->memsegs[VM_MEMSEG_LOW].size = memsize;
4877e0fa794SMark Johnston 		ctx->memsegs[VM_MEMSEG_HIGH].size = 0;
4887e0fa794SMark Johnston 		objsize = memsize;
4899b1aa8d6SNeel Natu 	}
4909b1aa8d6SNeel Natu 
4919b1aa8d6SNeel Natu 	error = vm_alloc_memseg(ctx, VM_SYSMEM, objsize, NULL);
4929b1aa8d6SNeel Natu 	if (error)
4939b1aa8d6SNeel Natu 		return (error);
4949b1aa8d6SNeel Natu 
4959b1aa8d6SNeel Natu 	/*
4969b1aa8d6SNeel Natu 	 * Stake out a contiguous region covering the guest physical memory
4979b1aa8d6SNeel Natu 	 * and the adjoining guard regions.
4989b1aa8d6SNeel Natu 	 */
4999b1aa8d6SNeel Natu 	len = VM_MMAP_GUARD_SIZE + objsize + VM_MMAP_GUARD_SIZE;
5006a9648b5SJohn Baldwin 	ptr = mmap(NULL, len, PROT_NONE, MAP_GUARD | MAP_ALIGNED_SUPER, -1, 0);
5019b1aa8d6SNeel Natu 	if (ptr == MAP_FAILED)
5029b1aa8d6SNeel Natu 		return (-1);
5039b1aa8d6SNeel Natu 
5049b1aa8d6SNeel Natu 	baseaddr = ptr + VM_MMAP_GUARD_SIZE;
5057e0fa794SMark Johnston 	if (ctx->memsegs[VM_MEMSEG_HIGH].size > 0) {
5067e0fa794SMark Johnston 		gpa = VM_HIGHMEM_BASE;
5077e0fa794SMark Johnston 		len = ctx->memsegs[VM_MEMSEG_HIGH].size;
5089b1aa8d6SNeel Natu 		error = setup_memory_segment(ctx, gpa, len, baseaddr);
5099b1aa8d6SNeel Natu 		if (error)
5109b1aa8d6SNeel Natu 			return (error);
511b060ba50SNeel Natu 	}
512b060ba50SNeel Natu 
5137e0fa794SMark Johnston 	if (ctx->memsegs[VM_MEMSEG_LOW].size > 0) {
5149b1aa8d6SNeel Natu 		gpa = 0;
5157e0fa794SMark Johnston 		len = ctx->memsegs[VM_MEMSEG_LOW].size;
5169b1aa8d6SNeel Natu 		error = setup_memory_segment(ctx, gpa, len, baseaddr);
517b060ba50SNeel Natu 		if (error)
518b060ba50SNeel Natu 			return (error);
519b060ba50SNeel Natu 	}
520b060ba50SNeel Natu 
5219b1aa8d6SNeel Natu 	ctx->baseaddr = baseaddr;
522b060ba50SNeel Natu 
523b060ba50SNeel Natu 	return (0);
524b060ba50SNeel Natu }
525b060ba50SNeel Natu 
52636e8356eSNeel Natu /*
52736e8356eSNeel Natu  * Returns a non-NULL pointer if [gaddr, gaddr+len) is entirely contained in
52836e8356eSNeel Natu  * the lowmem or highmem regions.
52936e8356eSNeel Natu  *
53036e8356eSNeel Natu  * In particular return NULL if [gaddr, gaddr+len) falls in guest MMIO region.
53136e8356eSNeel Natu  * The instruction emulation code depends on this behavior.
53236e8356eSNeel Natu  */
533b060ba50SNeel Natu void *
vm_map_gpa(struct vmctx * ctx,vm_paddr_t gaddr,size_t len)534b060ba50SNeel Natu vm_map_gpa(struct vmctx *ctx, vm_paddr_t gaddr, size_t len)
535366f6083SPeter Grehan {
5367e0fa794SMark Johnston 	vm_size_t lowsize, highsize;
537366f6083SPeter Grehan 
5387e0fa794SMark Johnston 	lowsize = ctx->memsegs[VM_MEMSEG_LOW].size;
5397e0fa794SMark Johnston 	if (lowsize > 0) {
5407e0fa794SMark Johnston 		if (gaddr < lowsize && len <= lowsize && gaddr + len <= lowsize)
54136e8356eSNeel Natu 			return (ctx->baseaddr + gaddr);
54236e8356eSNeel Natu 	}
543b060ba50SNeel Natu 
5447e0fa794SMark Johnston 	highsize = ctx->memsegs[VM_MEMSEG_HIGH].size;
5457e0fa794SMark Johnston 	if (highsize > 0 && gaddr >= VM_HIGHMEM_BASE) {
5467e0fa794SMark Johnston 		if (gaddr < VM_HIGHMEM_BASE + highsize && len <= highsize &&
5477e0fa794SMark Johnston 		    gaddr + len <= VM_HIGHMEM_BASE + highsize)
54836e8356eSNeel Natu 			return (ctx->baseaddr + gaddr);
54936e8356eSNeel Natu 	}
55036e8356eSNeel Natu 
551b060ba50SNeel Natu 	return (NULL);
552366f6083SPeter Grehan }
553366f6083SPeter Grehan 
554483d953aSJohn Baldwin vm_paddr_t
vm_rev_map_gpa(struct vmctx * ctx,void * addr)555483d953aSJohn Baldwin vm_rev_map_gpa(struct vmctx *ctx, void *addr)
556483d953aSJohn Baldwin {
557483d953aSJohn Baldwin 	vm_paddr_t offaddr;
5587e0fa794SMark Johnston 	vm_size_t lowsize, highsize;
559483d953aSJohn Baldwin 
560483d953aSJohn Baldwin 	offaddr = (char *)addr - ctx->baseaddr;
561483d953aSJohn Baldwin 
5627e0fa794SMark Johnston 	lowsize = ctx->memsegs[VM_MEMSEG_LOW].size;
5637e0fa794SMark Johnston 	if (lowsize > 0)
5647e0fa794SMark Johnston 		if (offaddr <= lowsize)
565483d953aSJohn Baldwin 			return (offaddr);
566483d953aSJohn Baldwin 
5677e0fa794SMark Johnston 	highsize = ctx->memsegs[VM_MEMSEG_HIGH].size;
5687e0fa794SMark Johnston 	if (highsize > 0)
5697e0fa794SMark Johnston 		if (offaddr >= VM_HIGHMEM_BASE &&
5707e0fa794SMark Johnston 		    offaddr < VM_HIGHMEM_BASE + highsize)
571483d953aSJohn Baldwin 			return (offaddr);
572483d953aSJohn Baldwin 
573483d953aSJohn Baldwin 	return ((vm_paddr_t)-1);
574483d953aSJohn Baldwin }
575483d953aSJohn Baldwin 
5763efc45f3SRobert Wing const char *
vm_get_name(struct vmctx * ctx)5773efc45f3SRobert Wing vm_get_name(struct vmctx *ctx)
578483d953aSJohn Baldwin {
579483d953aSJohn Baldwin 
5803efc45f3SRobert Wing 	return (ctx->name);
581483d953aSJohn Baldwin }
582483d953aSJohn Baldwin 
583be679db4SNeel Natu size_t
vm_get_lowmem_size(struct vmctx * ctx)584be679db4SNeel Natu vm_get_lowmem_size(struct vmctx *ctx)
585be679db4SNeel Natu {
586be679db4SNeel Natu 
5877e0fa794SMark Johnston 	return (ctx->memsegs[VM_MEMSEG_LOW].size);
5887e0fa794SMark Johnston }
5897e0fa794SMark Johnston 
5907e0fa794SMark Johnston vm_paddr_t
vm_get_highmem_base(struct vmctx * ctx __unused)5917e0fa794SMark Johnston vm_get_highmem_base(struct vmctx *ctx __unused)
5927e0fa794SMark Johnston {
5937e0fa794SMark Johnston 
5947e0fa794SMark Johnston 	return (VM_HIGHMEM_BASE);
595be679db4SNeel Natu }
596be679db4SNeel Natu 
597be679db4SNeel Natu size_t
vm_get_highmem_size(struct vmctx * ctx)598be679db4SNeel Natu vm_get_highmem_size(struct vmctx *ctx)
599be679db4SNeel Natu {
600be679db4SNeel Natu 
6017e0fa794SMark Johnston 	return (ctx->memsegs[VM_MEMSEG_HIGH].size);
602be679db4SNeel Natu }
603be679db4SNeel Natu 
6049b1aa8d6SNeel Natu void *
vm_create_devmem(struct vmctx * ctx,int segid,const char * name,size_t len)6059b1aa8d6SNeel Natu vm_create_devmem(struct vmctx *ctx, int segid, const char *name, size_t len)
6069b1aa8d6SNeel Natu {
6079b1aa8d6SNeel Natu 	char pathname[MAXPATHLEN];
6089b1aa8d6SNeel Natu 	size_t len2;
6099b1aa8d6SNeel Natu 	char *base, *ptr;
6109b1aa8d6SNeel Natu 	int fd, error, flags;
6119b1aa8d6SNeel Natu 
6129b1aa8d6SNeel Natu 	fd = -1;
6139b1aa8d6SNeel Natu 	ptr = MAP_FAILED;
6149b1aa8d6SNeel Natu 	if (name == NULL || strlen(name) == 0) {
6159b1aa8d6SNeel Natu 		errno = EINVAL;
6169b1aa8d6SNeel Natu 		goto done;
6179b1aa8d6SNeel Natu 	}
6189b1aa8d6SNeel Natu 
6199b1aa8d6SNeel Natu 	error = vm_alloc_memseg(ctx, segid, len, name);
6209b1aa8d6SNeel Natu 	if (error)
6219b1aa8d6SNeel Natu 		goto done;
6229b1aa8d6SNeel Natu 
6235e4f29c0SNeel Natu 	strlcpy(pathname, "/dev/vmm.io/", sizeof(pathname));
6249b1aa8d6SNeel Natu 	strlcat(pathname, ctx->name, sizeof(pathname));
6259b1aa8d6SNeel Natu 	strlcat(pathname, ".", sizeof(pathname));
6269b1aa8d6SNeel Natu 	strlcat(pathname, name, sizeof(pathname));
6279b1aa8d6SNeel Natu 
6289b1aa8d6SNeel Natu 	fd = open(pathname, O_RDWR);
6299b1aa8d6SNeel Natu 	if (fd < 0)
6309b1aa8d6SNeel Natu 		goto done;
6319b1aa8d6SNeel Natu 
6329b1aa8d6SNeel Natu 	/*
6339b1aa8d6SNeel Natu 	 * Stake out a contiguous region covering the device memory and the
6349b1aa8d6SNeel Natu 	 * adjoining guard regions.
6359b1aa8d6SNeel Natu 	 */
6369b1aa8d6SNeel Natu 	len2 = VM_MMAP_GUARD_SIZE + len + VM_MMAP_GUARD_SIZE;
6376a9648b5SJohn Baldwin 	base = mmap(NULL, len2, PROT_NONE, MAP_GUARD | MAP_ALIGNED_SUPER, -1,
6386a9648b5SJohn Baldwin 	    0);
6399b1aa8d6SNeel Natu 	if (base == MAP_FAILED)
6409b1aa8d6SNeel Natu 		goto done;
6419b1aa8d6SNeel Natu 
6429b1aa8d6SNeel Natu 	flags = MAP_SHARED | MAP_FIXED;
6439b1aa8d6SNeel Natu 	if ((ctx->memflags & VM_MEM_F_INCORE) == 0)
6449b1aa8d6SNeel Natu 		flags |= MAP_NOCORE;
6459b1aa8d6SNeel Natu 
6469b1aa8d6SNeel Natu 	/* mmap the devmem region in the host address space */
6479b1aa8d6SNeel Natu 	ptr = mmap(base + VM_MMAP_GUARD_SIZE, len, PROT_RW, flags, fd, 0);
6489b1aa8d6SNeel Natu done:
6499b1aa8d6SNeel Natu 	if (fd >= 0)
6509b1aa8d6SNeel Natu 		close(fd);
6519b1aa8d6SNeel Natu 	return (ptr);
6529b1aa8d6SNeel Natu }
6539b1aa8d6SNeel Natu 
654e4656e10SMark Johnston int
vcpu_ioctl(struct vcpu * vcpu,u_long cmd,void * arg)6557d9ef309SJohn Baldwin vcpu_ioctl(struct vcpu *vcpu, u_long cmd, void *arg)
6567d9ef309SJohn Baldwin {
6577d9ef309SJohn Baldwin 	/*
6587d9ef309SJohn Baldwin 	 * XXX: fragile, handle with care
6597d9ef309SJohn Baldwin 	 * Assumes that the first field of the ioctl data
6607d9ef309SJohn Baldwin 	 * is the vcpuid.
6617d9ef309SJohn Baldwin 	 */
6627d9ef309SJohn Baldwin 	*(int *)arg = vcpu->vcpuid;
6637d9ef309SJohn Baldwin 	return (ioctl(vcpu->ctx->fd, cmd, arg));
6647d9ef309SJohn Baldwin }
6657d9ef309SJohn Baldwin 
666366f6083SPeter Grehan int
vm_set_register(struct vcpu * vcpu,int reg,uint64_t val)6677d9ef309SJohn Baldwin vm_set_register(struct vcpu *vcpu, int reg, uint64_t val)
668366f6083SPeter Grehan {
669366f6083SPeter Grehan 	int error;
670366f6083SPeter Grehan 	struct vm_register vmreg;
671366f6083SPeter Grehan 
672366f6083SPeter Grehan 	bzero(&vmreg, sizeof(vmreg));
673366f6083SPeter Grehan 	vmreg.regnum = reg;
674366f6083SPeter Grehan 	vmreg.regval = val;
675366f6083SPeter Grehan 
6767d9ef309SJohn Baldwin 	error = vcpu_ioctl(vcpu, VM_SET_REGISTER, &vmreg);
677366f6083SPeter Grehan 	return (error);
678366f6083SPeter Grehan }
679366f6083SPeter Grehan 
680366f6083SPeter Grehan int
vm_get_register(struct vcpu * vcpu,int reg,uint64_t * ret_val)6817d9ef309SJohn Baldwin vm_get_register(struct vcpu *vcpu, int reg, uint64_t *ret_val)
682366f6083SPeter Grehan {
683366f6083SPeter Grehan 	int error;
684366f6083SPeter Grehan 	struct vm_register vmreg;
685366f6083SPeter Grehan 
686366f6083SPeter Grehan 	bzero(&vmreg, sizeof(vmreg));
687366f6083SPeter Grehan 	vmreg.regnum = reg;
688366f6083SPeter Grehan 
6897d9ef309SJohn Baldwin 	error = vcpu_ioctl(vcpu, VM_GET_REGISTER, &vmreg);
690366f6083SPeter Grehan 	*ret_val = vmreg.regval;
691366f6083SPeter Grehan 	return (error);
692366f6083SPeter Grehan }
693366f6083SPeter Grehan 
694366f6083SPeter Grehan int
vm_set_register_set(struct vcpu * vcpu,unsigned int count,const int * regnums,uint64_t * regvals)6957d9ef309SJohn Baldwin vm_set_register_set(struct vcpu *vcpu, unsigned int count,
6964f866698SJohn Baldwin     const int *regnums, uint64_t *regvals)
6974f866698SJohn Baldwin {
6984f866698SJohn Baldwin 	int error;
6994f866698SJohn Baldwin 	struct vm_register_set vmregset;
7004f866698SJohn Baldwin 
7014f866698SJohn Baldwin 	bzero(&vmregset, sizeof(vmregset));
7024f866698SJohn Baldwin 	vmregset.count = count;
7034f866698SJohn Baldwin 	vmregset.regnums = regnums;
7044f866698SJohn Baldwin 	vmregset.regvals = regvals;
7054f866698SJohn Baldwin 
7067d9ef309SJohn Baldwin 	error = vcpu_ioctl(vcpu, VM_SET_REGISTER_SET, &vmregset);
7074f866698SJohn Baldwin 	return (error);
7084f866698SJohn Baldwin }
7094f866698SJohn Baldwin 
7104f866698SJohn Baldwin int
vm_get_register_set(struct vcpu * vcpu,unsigned int count,const int * regnums,uint64_t * regvals)7117d9ef309SJohn Baldwin vm_get_register_set(struct vcpu *vcpu, unsigned int count,
7124f866698SJohn Baldwin     const int *regnums, uint64_t *regvals)
7134f866698SJohn Baldwin {
7144f866698SJohn Baldwin 	int error;
7154f866698SJohn Baldwin 	struct vm_register_set vmregset;
7164f866698SJohn Baldwin 
7174f866698SJohn Baldwin 	bzero(&vmregset, sizeof(vmregset));
7184f866698SJohn Baldwin 	vmregset.count = count;
7194f866698SJohn Baldwin 	vmregset.regnums = regnums;
7204f866698SJohn Baldwin 	vmregset.regvals = regvals;
7214f866698SJohn Baldwin 
7227d9ef309SJohn Baldwin 	error = vcpu_ioctl(vcpu, VM_GET_REGISTER_SET, &vmregset);
7234f866698SJohn Baldwin 	return (error);
7244f866698SJohn Baldwin }
7254f866698SJohn Baldwin 
7264f866698SJohn Baldwin int
vm_run(struct vcpu * vcpu,struct vm_run * vmrun)727e17eca32SMark Johnston vm_run(struct vcpu *vcpu, struct vm_run *vmrun)
728366f6083SPeter Grehan {
729e17eca32SMark Johnston 	return (vcpu_ioctl(vcpu, VM_RUN, vmrun));
730366f6083SPeter Grehan }
731366f6083SPeter Grehan 
732b15a09c0SNeel Natu int
vm_suspend(struct vmctx * ctx,enum vm_suspend_how how)733f0fdcfe2SNeel Natu vm_suspend(struct vmctx *ctx, enum vm_suspend_how how)
734b15a09c0SNeel Natu {
735f0fdcfe2SNeel Natu 	struct vm_suspend vmsuspend;
736b15a09c0SNeel Natu 
737f0fdcfe2SNeel Natu 	bzero(&vmsuspend, sizeof(vmsuspend));
738f0fdcfe2SNeel Natu 	vmsuspend.how = how;
739f0fdcfe2SNeel Natu 	return (ioctl(ctx->fd, VM_SUSPEND, &vmsuspend));
740b15a09c0SNeel Natu }
741b15a09c0SNeel Natu 
7425fcf252fSNeel Natu int
vm_reinit(struct vmctx * ctx)7435fcf252fSNeel Natu vm_reinit(struct vmctx *ctx)
7445fcf252fSNeel Natu {
7455fcf252fSNeel Natu 
7465fcf252fSNeel Natu 	return (ioctl(ctx->fd, VM_REINIT, 0));
7475fcf252fSNeel Natu }
7485fcf252fSNeel Natu 
749d087a399SNeel Natu int
vm_capability_name2type(const char * capname)75013f4cf6cSNeel Natu vm_capability_name2type(const char *capname)
75113f4cf6cSNeel Natu {
75213f4cf6cSNeel Natu 	int i;
75313f4cf6cSNeel Natu 
75485efb31dSMark Johnston 	for (i = 0; i < VM_CAP_MAX; i++) {
75585efb31dSMark Johnston 		if (vm_capstrmap[i] != NULL &&
75685efb31dSMark Johnston 		    strcmp(vm_capstrmap[i], capname) == 0)
757d000623aSJohn Baldwin 			return (i);
758366f6083SPeter Grehan 	}
759366f6083SPeter Grehan 
760366f6083SPeter Grehan 	return (-1);
761366f6083SPeter Grehan }
762366f6083SPeter Grehan 
76313f4cf6cSNeel Natu const char *
vm_capability_type2name(int type)76413f4cf6cSNeel Natu vm_capability_type2name(int type)
76513f4cf6cSNeel Natu {
76685efb31dSMark Johnston 	if (type >= 0 && type < VM_CAP_MAX)
76785efb31dSMark Johnston 		return (vm_capstrmap[type]);
76813f4cf6cSNeel Natu 
76913f4cf6cSNeel Natu 	return (NULL);
77013f4cf6cSNeel Natu }
77113f4cf6cSNeel Natu 
772366f6083SPeter Grehan int
vm_get_capability(struct vcpu * vcpu,enum vm_cap_type cap,int * retval)7737d9ef309SJohn Baldwin vm_get_capability(struct vcpu *vcpu, enum vm_cap_type cap, int *retval)
774366f6083SPeter Grehan {
775366f6083SPeter Grehan 	int error;
776366f6083SPeter Grehan 	struct vm_capability vmcap;
777366f6083SPeter Grehan 
778366f6083SPeter Grehan 	bzero(&vmcap, sizeof(vmcap));
779366f6083SPeter Grehan 	vmcap.captype = cap;
780366f6083SPeter Grehan 
7817d9ef309SJohn Baldwin 	error = vcpu_ioctl(vcpu, VM_GET_CAPABILITY, &vmcap);
782366f6083SPeter Grehan 	*retval = vmcap.capval;
783366f6083SPeter Grehan 	return (error);
784366f6083SPeter Grehan }
785366f6083SPeter Grehan 
786366f6083SPeter Grehan int
vm_set_capability(struct vcpu * vcpu,enum vm_cap_type cap,int val)7877d9ef309SJohn Baldwin vm_set_capability(struct vcpu *vcpu, enum vm_cap_type cap, int val)
788366f6083SPeter Grehan {
789366f6083SPeter Grehan 	struct vm_capability vmcap;
790366f6083SPeter Grehan 
791366f6083SPeter Grehan 	bzero(&vmcap, sizeof(vmcap));
792366f6083SPeter Grehan 	vmcap.captype = cap;
793366f6083SPeter Grehan 	vmcap.capval = val;
794366f6083SPeter Grehan 
7957d9ef309SJohn Baldwin 	return (vcpu_ioctl(vcpu, VM_SET_CAPABILITY, &vmcap));
796366f6083SPeter Grehan }
797366f6083SPeter Grehan 
798366f6083SPeter Grehan uint64_t *
vm_get_stats(struct vcpu * vcpu,struct timeval * ret_tv,int * ret_entries)7997d9ef309SJohn Baldwin vm_get_stats(struct vcpu *vcpu, struct timeval *ret_tv,
800366f6083SPeter Grehan 	     int *ret_entries)
801366f6083SPeter Grehan {
80264269786SJohn Baldwin 	static _Thread_local uint64_t *stats_buf;
80364269786SJohn Baldwin 	static _Thread_local u_int stats_count;
80464269786SJohn Baldwin 	uint64_t *new_stats;
80564269786SJohn Baldwin 	struct vm_stats vmstats;
80664269786SJohn Baldwin 	u_int count, index;
80764269786SJohn Baldwin 	bool have_stats;
808366f6083SPeter Grehan 
80964269786SJohn Baldwin 	have_stats = false;
81064269786SJohn Baldwin 	count = 0;
81164269786SJohn Baldwin 	for (index = 0;; index += nitems(vmstats.statbuf)) {
81264269786SJohn Baldwin 		vmstats.index = index;
8137d9ef309SJohn Baldwin 		if (vcpu_ioctl(vcpu, VM_STATS, &vmstats) != 0)
81464269786SJohn Baldwin 			break;
81564269786SJohn Baldwin 		if (stats_count < index + vmstats.num_entries) {
81664269786SJohn Baldwin 			new_stats = realloc(stats_buf,
81764269786SJohn Baldwin 			    (index + vmstats.num_entries) * sizeof(uint64_t));
81864269786SJohn Baldwin 			if (new_stats == NULL) {
81964269786SJohn Baldwin 				errno = ENOMEM;
82064269786SJohn Baldwin 				return (NULL);
82164269786SJohn Baldwin 			}
82264269786SJohn Baldwin 			stats_count = index + vmstats.num_entries;
82364269786SJohn Baldwin 			stats_buf = new_stats;
82464269786SJohn Baldwin 		}
82564269786SJohn Baldwin 		memcpy(stats_buf + index, vmstats.statbuf,
82664269786SJohn Baldwin 		    vmstats.num_entries * sizeof(uint64_t));
82764269786SJohn Baldwin 		count += vmstats.num_entries;
82864269786SJohn Baldwin 		have_stats = true;
829366f6083SPeter Grehan 
83064269786SJohn Baldwin 		if (vmstats.num_entries != nitems(vmstats.statbuf))
83164269786SJohn Baldwin 			break;
83264269786SJohn Baldwin 	}
83364269786SJohn Baldwin 	if (have_stats) {
834366f6083SPeter Grehan 		if (ret_entries)
83564269786SJohn Baldwin 			*ret_entries = count;
836366f6083SPeter Grehan 		if (ret_tv)
837366f6083SPeter Grehan 			*ret_tv = vmstats.tv;
83864269786SJohn Baldwin 		return (stats_buf);
839366f6083SPeter Grehan 	} else
840366f6083SPeter Grehan 		return (NULL);
841366f6083SPeter Grehan }
842366f6083SPeter Grehan 
843366f6083SPeter Grehan const char *
vm_get_stat_desc(struct vmctx * ctx,int index)844366f6083SPeter Grehan vm_get_stat_desc(struct vmctx *ctx, int index)
845366f6083SPeter Grehan {
846366f6083SPeter Grehan 	static struct vm_stat_desc statdesc;
847366f6083SPeter Grehan 
848366f6083SPeter Grehan 	statdesc.index = index;
849366f6083SPeter Grehan 	if (ioctl(ctx->fd, VM_STAT_DESC, &statdesc) == 0)
850366f6083SPeter Grehan 		return (statdesc.desc);
851366f6083SPeter Grehan 	else
852366f6083SPeter Grehan 		return (NULL);
853366f6083SPeter Grehan }
854366f6083SPeter Grehan 
85556a26fc1SMark Johnston #ifdef __amd64__
856e9027382SNeel Natu int
vm_get_gpa_pmap(struct vmctx * ctx,uint64_t gpa,uint64_t * pte,int * num)857318224bbSNeel Natu vm_get_gpa_pmap(struct vmctx *ctx, uint64_t gpa, uint64_t *pte, int *num)
858318224bbSNeel Natu {
859318224bbSNeel Natu 	int error, i;
860318224bbSNeel Natu 	struct vm_gpa_pte gpapte;
861318224bbSNeel Natu 
862318224bbSNeel Natu 	bzero(&gpapte, sizeof(gpapte));
863318224bbSNeel Natu 	gpapte.gpa = gpa;
864318224bbSNeel Natu 
865318224bbSNeel Natu 	error = ioctl(ctx->fd, VM_GET_GPA_PMAP, &gpapte);
866318224bbSNeel Natu 
867318224bbSNeel Natu 	if (error == 0) {
868318224bbSNeel Natu 		*num = gpapte.ptenum;
869318224bbSNeel Natu 		for (i = 0; i < gpapte.ptenum; i++)
870318224bbSNeel Natu 			pte[i] = gpapte.pte[i];
871318224bbSNeel Natu 	}
872318224bbSNeel Natu 
873318224bbSNeel Natu 	return (error);
874318224bbSNeel Natu }
87508e3ff32SNeel Natu 
87608e3ff32SNeel Natu int
vm_gla2gpa(struct vcpu * vcpu,struct vm_guest_paging * paging,uint64_t gla,int prot,uint64_t * gpa,int * fault)8777d9ef309SJohn Baldwin vm_gla2gpa(struct vcpu *vcpu, struct vm_guest_paging *paging,
8789c4d5478SNeel Natu     uint64_t gla, int prot, uint64_t *gpa, int *fault)
879da11f4aaSNeel Natu {
880da11f4aaSNeel Natu 	struct vm_gla2gpa gg;
881da11f4aaSNeel Natu 	int error;
882da11f4aaSNeel Natu 
883da11f4aaSNeel Natu 	bzero(&gg, sizeof(struct vm_gla2gpa));
884da11f4aaSNeel Natu 	gg.prot = prot;
885da11f4aaSNeel Natu 	gg.gla = gla;
886da11f4aaSNeel Natu 	gg.paging = *paging;
887da11f4aaSNeel Natu 
8887d9ef309SJohn Baldwin 	error = vcpu_ioctl(vcpu, VM_GLA2GPA, &gg);
889da11f4aaSNeel Natu 	if (error == 0) {
890da11f4aaSNeel Natu 		*fault = gg.fault;
891da11f4aaSNeel Natu 		*gpa = gg.gpa;
892da11f4aaSNeel Natu 	}
893da11f4aaSNeel Natu 	return (error);
894da11f4aaSNeel Natu }
89556a26fc1SMark Johnston #endif
896da11f4aaSNeel Natu 
8975f8754c0SJohn Baldwin int
vm_gla2gpa_nofault(struct vcpu * vcpu,struct vm_guest_paging * paging,uint64_t gla,int prot,uint64_t * gpa,int * fault)8987d9ef309SJohn Baldwin vm_gla2gpa_nofault(struct vcpu *vcpu, struct vm_guest_paging *paging,
8995f8754c0SJohn Baldwin     uint64_t gla, int prot, uint64_t *gpa, int *fault)
9005f8754c0SJohn Baldwin {
9015f8754c0SJohn Baldwin 	struct vm_gla2gpa gg;
9025f8754c0SJohn Baldwin 	int error;
9035f8754c0SJohn Baldwin 
9045f8754c0SJohn Baldwin 	bzero(&gg, sizeof(struct vm_gla2gpa));
9055f8754c0SJohn Baldwin 	gg.prot = prot;
9065f8754c0SJohn Baldwin 	gg.gla = gla;
9075f8754c0SJohn Baldwin 	gg.paging = *paging;
9085f8754c0SJohn Baldwin 
9097d9ef309SJohn Baldwin 	error = vcpu_ioctl(vcpu, VM_GLA2GPA_NOFAULT, &gg);
9105f8754c0SJohn Baldwin 	if (error == 0) {
9115f8754c0SJohn Baldwin 		*fault = gg.fault;
9125f8754c0SJohn Baldwin 		*gpa = gg.gpa;
9135f8754c0SJohn Baldwin 	}
9145f8754c0SJohn Baldwin 	return (error);
9155f8754c0SJohn Baldwin }
9165f8754c0SJohn Baldwin 
917da11f4aaSNeel Natu #ifndef min
918da11f4aaSNeel Natu #define	min(a,b)	(((a) < (b)) ? (a) : (b))
919da11f4aaSNeel Natu #endif
920da11f4aaSNeel Natu 
92156a26fc1SMark Johnston #ifdef __amd64__
922da11f4aaSNeel Natu int
vm_copy_setup(struct vcpu * vcpu,struct vm_guest_paging * paging,uint64_t gla,size_t len,int prot,struct iovec * iov,int iovcnt,int * fault)9237d9ef309SJohn Baldwin vm_copy_setup(struct vcpu *vcpu, struct vm_guest_paging *paging,
9249c4d5478SNeel Natu     uint64_t gla, size_t len, int prot, struct iovec *iov, int iovcnt,
9259c4d5478SNeel Natu     int *fault)
926da11f4aaSNeel Natu {
927009e2acbSNeel Natu 	void *va;
92845cd18ecSMark Johnston 	uint64_t gpa, off;
92945cd18ecSMark Johnston 	int error, i, n;
9306303b65dSNeel Natu 
9316303b65dSNeel Natu 	for (i = 0; i < iovcnt; i++) {
9326303b65dSNeel Natu 		iov[i].iov_base = 0;
9336303b65dSNeel Natu 		iov[i].iov_len = 0;
9346303b65dSNeel Natu 	}
9356303b65dSNeel Natu 
9366303b65dSNeel Natu 	while (len) {
9376303b65dSNeel Natu 		assert(iovcnt > 0);
9387d9ef309SJohn Baldwin 		error = vm_gla2gpa(vcpu, paging, gla, prot, &gpa, fault);
9399c4d5478SNeel Natu 		if (error || *fault)
9409c4d5478SNeel Natu 			return (error);
9416303b65dSNeel Natu 
9426303b65dSNeel Natu 		off = gpa & PAGE_MASK;
94345cd18ecSMark Johnston 		n = MIN(len, PAGE_SIZE - off);
9446303b65dSNeel Natu 
9457d9ef309SJohn Baldwin 		va = vm_map_gpa(vcpu->ctx, gpa, n);
946009e2acbSNeel Natu 		if (va == NULL)
9479c4d5478SNeel Natu 			return (EFAULT);
948009e2acbSNeel Natu 
949009e2acbSNeel Natu 		iov->iov_base = va;
9506303b65dSNeel Natu 		iov->iov_len = n;
9516303b65dSNeel Natu 		iov++;
9526303b65dSNeel Natu 		iovcnt--;
9536303b65dSNeel Natu 
9546303b65dSNeel Natu 		gla += n;
9556303b65dSNeel Natu 		len -= n;
9566303b65dSNeel Natu 	}
9576303b65dSNeel Natu 	return (0);
9586303b65dSNeel Natu }
95956a26fc1SMark Johnston #endif
9606303b65dSNeel Natu 
9616303b65dSNeel Natu void
vm_copy_teardown(struct iovec * iov __unused,int iovcnt __unused)9622b4fe856SJohn Baldwin vm_copy_teardown(struct iovec *iov __unused, int iovcnt __unused)
963009e2acbSNeel Natu {
9642b4fe856SJohn Baldwin 	/*
9652b4fe856SJohn Baldwin 	 * Intentionally empty.  This is used by the instruction
9662b4fe856SJohn Baldwin 	 * emulation code shared with the kernel.  The in-kernel
9672b4fe856SJohn Baldwin 	 * version of this is non-empty.
9682b4fe856SJohn Baldwin 	 */
969009e2acbSNeel Natu }
970009e2acbSNeel Natu 
971009e2acbSNeel Natu void
vm_copyin(struct iovec * iov,void * vp,size_t len)9722b4fe856SJohn Baldwin vm_copyin(struct iovec *iov, void *vp, size_t len)
9736303b65dSNeel Natu {
9746303b65dSNeel Natu 	const char *src;
9756303b65dSNeel Natu 	char *dst;
9766303b65dSNeel Natu 	size_t n;
977da11f4aaSNeel Natu 
978da11f4aaSNeel Natu 	dst = vp;
979da11f4aaSNeel Natu 	while (len) {
9806303b65dSNeel Natu 		assert(iov->iov_len);
9816303b65dSNeel Natu 		n = min(len, iov->iov_len);
982009e2acbSNeel Natu 		src = iov->iov_base;
983da11f4aaSNeel Natu 		bcopy(src, dst, n);
984da11f4aaSNeel Natu 
9856303b65dSNeel Natu 		iov++;
986da11f4aaSNeel Natu 		dst += n;
987da11f4aaSNeel Natu 		len -= n;
988da11f4aaSNeel Natu 	}
989da11f4aaSNeel Natu }
990da11f4aaSNeel Natu 
9916303b65dSNeel Natu void
vm_copyout(const void * vp,struct iovec * iov,size_t len)9922b4fe856SJohn Baldwin vm_copyout(const void *vp, struct iovec *iov, size_t len)
993da11f4aaSNeel Natu {
994da11f4aaSNeel Natu 	const char *src;
9956303b65dSNeel Natu 	char *dst;
9966303b65dSNeel Natu 	size_t n;
997da11f4aaSNeel Natu 
998da11f4aaSNeel Natu 	src = vp;
999da11f4aaSNeel Natu 	while (len) {
10006303b65dSNeel Natu 		assert(iov->iov_len);
10016303b65dSNeel Natu 		n = min(len, iov->iov_len);
1002009e2acbSNeel Natu 		dst = iov->iov_base;
1003da11f4aaSNeel Natu 		bcopy(src, dst, n);
1004da11f4aaSNeel Natu 
10056303b65dSNeel Natu 		iov++;
1006da11f4aaSNeel Natu 		src += n;
1007da11f4aaSNeel Natu 		len -= n;
1008da11f4aaSNeel Natu 	}
1009da11f4aaSNeel Natu }
101095ebc360SNeel Natu 
101195ebc360SNeel Natu static int
vm_get_cpus(struct vmctx * ctx,int which,cpuset_t * cpus)101295ebc360SNeel Natu vm_get_cpus(struct vmctx *ctx, int which, cpuset_t *cpus)
101395ebc360SNeel Natu {
101495ebc360SNeel Natu 	struct vm_cpuset vm_cpuset;
101595ebc360SNeel Natu 	int error;
101695ebc360SNeel Natu 
101795ebc360SNeel Natu 	bzero(&vm_cpuset, sizeof(struct vm_cpuset));
101895ebc360SNeel Natu 	vm_cpuset.which = which;
101995ebc360SNeel Natu 	vm_cpuset.cpusetsize = sizeof(cpuset_t);
102095ebc360SNeel Natu 	vm_cpuset.cpus = cpus;
102195ebc360SNeel Natu 
102295ebc360SNeel Natu 	error = ioctl(ctx->fd, VM_GET_CPUS, &vm_cpuset);
102395ebc360SNeel Natu 	return (error);
102495ebc360SNeel Natu }
102595ebc360SNeel Natu 
102695ebc360SNeel Natu int
vm_active_cpus(struct vmctx * ctx,cpuset_t * cpus)102795ebc360SNeel Natu vm_active_cpus(struct vmctx *ctx, cpuset_t *cpus)
102895ebc360SNeel Natu {
102995ebc360SNeel Natu 
103095ebc360SNeel Natu 	return (vm_get_cpus(ctx, VM_ACTIVE_CPUS, cpus));
103195ebc360SNeel Natu }
103295ebc360SNeel Natu 
103395ebc360SNeel Natu int
vm_suspended_cpus(struct vmctx * ctx,cpuset_t * cpus)103495ebc360SNeel Natu vm_suspended_cpus(struct vmctx *ctx, cpuset_t *cpus)
103595ebc360SNeel Natu {
103695ebc360SNeel Natu 
103795ebc360SNeel Natu 	return (vm_get_cpus(ctx, VM_SUSPENDED_CPUS, cpus));
103895ebc360SNeel Natu }
103995ebc360SNeel Natu 
104095ebc360SNeel Natu int
vm_debug_cpus(struct vmctx * ctx,cpuset_t * cpus)1041fc276d92SJohn Baldwin vm_debug_cpus(struct vmctx *ctx, cpuset_t *cpus)
1042fc276d92SJohn Baldwin {
1043fc276d92SJohn Baldwin 
1044fc276d92SJohn Baldwin 	return (vm_get_cpus(ctx, VM_DEBUG_CPUS, cpus));
1045fc276d92SJohn Baldwin }
1046fc276d92SJohn Baldwin 
1047fc276d92SJohn Baldwin int
vm_activate_cpu(struct vcpu * vcpu)10487d9ef309SJohn Baldwin vm_activate_cpu(struct vcpu *vcpu)
104995ebc360SNeel Natu {
105095ebc360SNeel Natu 	struct vm_activate_cpu ac;
105195ebc360SNeel Natu 	int error;
105295ebc360SNeel Natu 
105395ebc360SNeel Natu 	bzero(&ac, sizeof(struct vm_activate_cpu));
10547d9ef309SJohn Baldwin 	error = vcpu_ioctl(vcpu, VM_ACTIVATE_CPU, &ac);
105595ebc360SNeel Natu 	return (error);
105695ebc360SNeel Natu }
1057091d4532SNeel Natu 
1058091d4532SNeel Natu int
vm_suspend_all_cpus(struct vmctx * ctx)10597d9ef309SJohn Baldwin vm_suspend_all_cpus(struct vmctx *ctx)
1060fc276d92SJohn Baldwin {
1061fc276d92SJohn Baldwin 	struct vm_activate_cpu ac;
1062fc276d92SJohn Baldwin 	int error;
1063fc276d92SJohn Baldwin 
1064fc276d92SJohn Baldwin 	bzero(&ac, sizeof(struct vm_activate_cpu));
10657d9ef309SJohn Baldwin 	ac.vcpuid = -1;
1066fc276d92SJohn Baldwin 	error = ioctl(ctx->fd, VM_SUSPEND_CPU, &ac);
1067fc276d92SJohn Baldwin 	return (error);
1068fc276d92SJohn Baldwin }
1069fc276d92SJohn Baldwin 
1070fc276d92SJohn Baldwin int
vm_suspend_cpu(struct vcpu * vcpu)10717d9ef309SJohn Baldwin vm_suspend_cpu(struct vcpu *vcpu)
1072fc276d92SJohn Baldwin {
1073fc276d92SJohn Baldwin 	struct vm_activate_cpu ac;
1074fc276d92SJohn Baldwin 	int error;
1075fc276d92SJohn Baldwin 
1076fc276d92SJohn Baldwin 	bzero(&ac, sizeof(struct vm_activate_cpu));
10777d9ef309SJohn Baldwin 	error = vcpu_ioctl(vcpu, VM_SUSPEND_CPU, &ac);
10787d9ef309SJohn Baldwin 	return (error);
10797d9ef309SJohn Baldwin }
10807d9ef309SJohn Baldwin 
10817d9ef309SJohn Baldwin int
vm_resume_cpu(struct vcpu * vcpu)10827d9ef309SJohn Baldwin vm_resume_cpu(struct vcpu *vcpu)
10837d9ef309SJohn Baldwin {
10847d9ef309SJohn Baldwin 	struct vm_activate_cpu ac;
10857d9ef309SJohn Baldwin 	int error;
10867d9ef309SJohn Baldwin 
10877d9ef309SJohn Baldwin 	bzero(&ac, sizeof(struct vm_activate_cpu));
10887d9ef309SJohn Baldwin 	error = vcpu_ioctl(vcpu, VM_RESUME_CPU, &ac);
10897d9ef309SJohn Baldwin 	return (error);
10907d9ef309SJohn Baldwin }
10917d9ef309SJohn Baldwin 
10927d9ef309SJohn Baldwin int
vm_resume_all_cpus(struct vmctx * ctx)10937d9ef309SJohn Baldwin vm_resume_all_cpus(struct vmctx *ctx)
10947d9ef309SJohn Baldwin {
10957d9ef309SJohn Baldwin 	struct vm_activate_cpu ac;
10967d9ef309SJohn Baldwin 	int error;
10977d9ef309SJohn Baldwin 
10987d9ef309SJohn Baldwin 	bzero(&ac, sizeof(struct vm_activate_cpu));
10997d9ef309SJohn Baldwin 	ac.vcpuid = -1;
1100fc276d92SJohn Baldwin 	error = ioctl(ctx->fd, VM_RESUME_CPU, &ac);
1101fc276d92SJohn Baldwin 	return (error);
1102fc276d92SJohn Baldwin }
1103fc276d92SJohn Baldwin 
110456a26fc1SMark Johnston #ifdef __amd64__
1105fc276d92SJohn Baldwin int
vm_get_intinfo(struct vcpu * vcpu,uint64_t * info1,uint64_t * info2)11067d9ef309SJohn Baldwin vm_get_intinfo(struct vcpu *vcpu, uint64_t *info1, uint64_t *info2)
1107091d4532SNeel Natu {
1108091d4532SNeel Natu 	struct vm_intinfo vmii;
1109091d4532SNeel Natu 	int error;
1110091d4532SNeel Natu 
1111091d4532SNeel Natu 	bzero(&vmii, sizeof(struct vm_intinfo));
11127d9ef309SJohn Baldwin 	error = vcpu_ioctl(vcpu, VM_GET_INTINFO, &vmii);
1113091d4532SNeel Natu 	if (error == 0) {
1114091d4532SNeel Natu 		*info1 = vmii.info1;
1115091d4532SNeel Natu 		*info2 = vmii.info2;
1116091d4532SNeel Natu 	}
1117091d4532SNeel Natu 	return (error);
1118091d4532SNeel Natu }
1119091d4532SNeel Natu 
1120091d4532SNeel Natu int
vm_set_intinfo(struct vcpu * vcpu,uint64_t info1)11217d9ef309SJohn Baldwin vm_set_intinfo(struct vcpu *vcpu, uint64_t info1)
1122091d4532SNeel Natu {
1123091d4532SNeel Natu 	struct vm_intinfo vmii;
1124091d4532SNeel Natu 	int error;
1125091d4532SNeel Natu 
1126091d4532SNeel Natu 	bzero(&vmii, sizeof(struct vm_intinfo));
1127091d4532SNeel Natu 	vmii.info1 = info1;
11287d9ef309SJohn Baldwin 	error = vcpu_ioctl(vcpu, VM_SET_INTINFO, &vmii);
1129091d4532SNeel Natu 	return (error);
1130091d4532SNeel Natu }
113156a26fc1SMark Johnston #endif
11320dafa5cdSNeel Natu 
113356a26fc1SMark Johnston #ifdef WITH_VMMAPI_SNAPSHOT
11340dafa5cdSNeel Natu int
vm_restart_instruction(struct vcpu * vcpu)11357d9ef309SJohn Baldwin vm_restart_instruction(struct vcpu *vcpu)
1136d087a399SNeel Natu {
11377d9ef309SJohn Baldwin 	int arg;
1138d087a399SNeel Natu 
11397d9ef309SJohn Baldwin 	return (vcpu_ioctl(vcpu, VM_RESTART_INSTRUCTION, &arg));
1140d087a399SNeel Natu }
114100ef17beSBartek Rutkowski 
114200ef17beSBartek Rutkowski int
vm_snapshot_req(struct vmctx * ctx,struct vm_snapshot_meta * meta)11430f735657SJohn Baldwin vm_snapshot_req(struct vmctx *ctx, struct vm_snapshot_meta *meta)
1144483d953aSJohn Baldwin {
1145483d953aSJohn Baldwin 
11460f735657SJohn Baldwin 	if (ioctl(ctx->fd, VM_SNAPSHOT_REQ, meta) == -1) {
1147483d953aSJohn Baldwin #ifdef SNAPSHOT_DEBUG
1148483d953aSJohn Baldwin 		fprintf(stderr, "%s: snapshot failed for %s: %d\r\n",
1149483d953aSJohn Baldwin 		    __func__, meta->dev_name, errno);
1150483d953aSJohn Baldwin #endif
1151483d953aSJohn Baldwin 		return (-1);
1152483d953aSJohn Baldwin 	}
1153483d953aSJohn Baldwin 	return (0);
1154483d953aSJohn Baldwin }
1155483d953aSJohn Baldwin 
1156483d953aSJohn Baldwin int
vm_restore_time(struct vmctx * ctx)1157483d953aSJohn Baldwin vm_restore_time(struct vmctx *ctx)
1158483d953aSJohn Baldwin {
1159483d953aSJohn Baldwin 	int dummy;
1160483d953aSJohn Baldwin 
1161483d953aSJohn Baldwin 	dummy = 0;
1162483d953aSJohn Baldwin 	return (ioctl(ctx->fd, VM_RESTORE_TIME, &dummy));
1163483d953aSJohn Baldwin }
116456a26fc1SMark Johnston #endif
1165483d953aSJohn Baldwin 
1166483d953aSJohn Baldwin int
vm_set_topology(struct vmctx * ctx,uint16_t sockets,uint16_t cores,uint16_t threads,uint16_t maxcpus)116701d822d3SRodney W. Grimes vm_set_topology(struct vmctx *ctx,
116801d822d3SRodney W. Grimes     uint16_t sockets, uint16_t cores, uint16_t threads, uint16_t maxcpus)
116901d822d3SRodney W. Grimes {
117001d822d3SRodney W. Grimes 	struct vm_cpu_topology topology;
117101d822d3SRodney W. Grimes 
117201d822d3SRodney W. Grimes 	bzero(&topology, sizeof (struct vm_cpu_topology));
117301d822d3SRodney W. Grimes 	topology.sockets = sockets;
117401d822d3SRodney W. Grimes 	topology.cores = cores;
117501d822d3SRodney W. Grimes 	topology.threads = threads;
117601d822d3SRodney W. Grimes 	topology.maxcpus = maxcpus;
117701d822d3SRodney W. Grimes 	return (ioctl(ctx->fd, VM_SET_TOPOLOGY, &topology));
117801d822d3SRodney W. Grimes }
117901d822d3SRodney W. Grimes 
118001d822d3SRodney W. Grimes int
vm_get_topology(struct vmctx * ctx,uint16_t * sockets,uint16_t * cores,uint16_t * threads,uint16_t * maxcpus)118101d822d3SRodney W. Grimes vm_get_topology(struct vmctx *ctx,
118201d822d3SRodney W. Grimes     uint16_t *sockets, uint16_t *cores, uint16_t *threads, uint16_t *maxcpus)
118301d822d3SRodney W. Grimes {
118401d822d3SRodney W. Grimes 	struct vm_cpu_topology topology;
118501d822d3SRodney W. Grimes 	int error;
118601d822d3SRodney W. Grimes 
118701d822d3SRodney W. Grimes 	bzero(&topology, sizeof (struct vm_cpu_topology));
118801d822d3SRodney W. Grimes 	error = ioctl(ctx->fd, VM_GET_TOPOLOGY, &topology);
118901d822d3SRodney W. Grimes 	if (error == 0) {
119001d822d3SRodney W. Grimes 		*sockets = topology.sockets;
119101d822d3SRodney W. Grimes 		*cores = topology.cores;
119201d822d3SRodney W. Grimes 		*threads = topology.threads;
119301d822d3SRodney W. Grimes 		*maxcpus = topology.maxcpus;
119401d822d3SRodney W. Grimes 	}
119501d822d3SRodney W. Grimes 	return (error);
119601d822d3SRodney W. Grimes }
119701d822d3SRodney W. Grimes 
11983e9b4532SMark Johnston int
vm_limit_rights(struct vmctx * ctx)11993e9b4532SMark Johnston vm_limit_rights(struct vmctx *ctx)
12003e9b4532SMark Johnston {
12013e9b4532SMark Johnston 	cap_rights_t rights;
12023e9b4532SMark Johnston 
12033e9b4532SMark Johnston 	cap_rights_init(&rights, CAP_IOCTL, CAP_MMAP_RW);
12043e9b4532SMark Johnston 	if (caph_rights_limit(ctx->fd, &rights) != 0)
12053e9b4532SMark Johnston 		return (-1);
12067f00e46bSMark Johnston 	if (caph_ioctls_limit(ctx->fd, vm_ioctl_cmds, vm_ioctl_ncmds) != 0)
12073e9b4532SMark Johnston 		return (-1);
12083e9b4532SMark Johnston 	return (0);
12093e9b4532SMark Johnston }
12103e9b4532SMark Johnston 
12113e9b4532SMark Johnston /*
12123e9b4532SMark Johnston  * Avoid using in new code.  Operations on the fd should be wrapped here so that
12133e9b4532SMark Johnston  * capability rights can be kept in sync.
12143e9b4532SMark Johnston  */
12153e9b4532SMark Johnston int
vm_get_device_fd(struct vmctx * ctx)12163e9b4532SMark Johnston vm_get_device_fd(struct vmctx *ctx)
12173e9b4532SMark Johnston {
12183e9b4532SMark Johnston 
12193e9b4532SMark Johnston 	return (ctx->fd);
12203e9b4532SMark Johnston }
12213e9b4532SMark Johnston 
12223e9b4532SMark Johnston /* Legacy interface, do not use. */
12233e9b4532SMark Johnston const cap_ioctl_t *
vm_get_ioctls(size_t * len)12243e9b4532SMark Johnston vm_get_ioctls(size_t *len)
12253e9b4532SMark Johnston {
12263e9b4532SMark Johnston 	cap_ioctl_t *cmds;
12277f00e46bSMark Johnston 	size_t sz;
122800ef17beSBartek Rutkowski 
122900ef17beSBartek Rutkowski 	if (len == NULL) {
12307f00e46bSMark Johnston 		sz = vm_ioctl_ncmds * sizeof(vm_ioctl_cmds[0]);
12317f00e46bSMark Johnston 		cmds = malloc(sz);
123200ef17beSBartek Rutkowski 		if (cmds == NULL)
123300ef17beSBartek Rutkowski 			return (NULL);
12347f00e46bSMark Johnston 		bcopy(vm_ioctl_cmds, cmds, sz);
123500ef17beSBartek Rutkowski 		return (cmds);
123600ef17beSBartek Rutkowski 	}
123700ef17beSBartek Rutkowski 
12387f00e46bSMark Johnston 	*len = vm_ioctl_ncmds;
123900ef17beSBartek Rutkowski 	return (NULL);
124000ef17beSBartek Rutkowski }
1241