xref: /freebsd/sys/x86/iommu/intel_ctx.c (revision 1abfd35537153d63e6d8d1453de6271ee5860844)
186be9f0dSKonstantin Belousov /*-
286be9f0dSKonstantin Belousov  * Copyright (c) 2013 The FreeBSD Foundation
386be9f0dSKonstantin Belousov  * All rights reserved.
486be9f0dSKonstantin Belousov  *
586be9f0dSKonstantin Belousov  * This software was developed by Konstantin Belousov <kib@FreeBSD.org>
686be9f0dSKonstantin Belousov  * under sponsorship from the FreeBSD Foundation.
786be9f0dSKonstantin Belousov  *
886be9f0dSKonstantin Belousov  * Redistribution and use in source and binary forms, with or without
986be9f0dSKonstantin Belousov  * modification, are permitted provided that the following conditions
1086be9f0dSKonstantin Belousov  * are met:
1186be9f0dSKonstantin Belousov  * 1. Redistributions of source code must retain the above copyright
1286be9f0dSKonstantin Belousov  *    notice, this list of conditions and the following disclaimer.
1386be9f0dSKonstantin Belousov  * 2. Redistributions in binary form must reproduce the above copyright
1486be9f0dSKonstantin Belousov  *    notice, this list of conditions and the following disclaimer in the
1586be9f0dSKonstantin Belousov  *    documentation and/or other materials provided with the distribution.
1686be9f0dSKonstantin Belousov  *
1786be9f0dSKonstantin Belousov  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
1886be9f0dSKonstantin Belousov  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
1986be9f0dSKonstantin Belousov  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
2086be9f0dSKonstantin Belousov  * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
2186be9f0dSKonstantin Belousov  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
2286be9f0dSKonstantin Belousov  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
2386be9f0dSKonstantin Belousov  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
2486be9f0dSKonstantin Belousov  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
2586be9f0dSKonstantin Belousov  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
2686be9f0dSKonstantin Belousov  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
2786be9f0dSKonstantin Belousov  * SUCH DAMAGE.
2886be9f0dSKonstantin Belousov  */
2986be9f0dSKonstantin Belousov 
3086be9f0dSKonstantin Belousov #include <sys/cdefs.h>
3186be9f0dSKonstantin Belousov __FBSDID("$FreeBSD$");
3286be9f0dSKonstantin Belousov 
3386be9f0dSKonstantin Belousov #include <sys/param.h>
3486be9f0dSKonstantin Belousov #include <sys/systm.h>
3586be9f0dSKonstantin Belousov #include <sys/malloc.h>
3686be9f0dSKonstantin Belousov #include <sys/bus.h>
3786be9f0dSKonstantin Belousov #include <sys/interrupt.h>
3886be9f0dSKonstantin Belousov #include <sys/kernel.h>
3986be9f0dSKonstantin Belousov #include <sys/ktr.h>
4086be9f0dSKonstantin Belousov #include <sys/limits.h>
4186be9f0dSKonstantin Belousov #include <sys/lock.h>
4286be9f0dSKonstantin Belousov #include <sys/memdesc.h>
4386be9f0dSKonstantin Belousov #include <sys/mutex.h>
4486be9f0dSKonstantin Belousov #include <sys/proc.h>
4586be9f0dSKonstantin Belousov #include <sys/rwlock.h>
4686be9f0dSKonstantin Belousov #include <sys/rman.h>
4786be9f0dSKonstantin Belousov #include <sys/sysctl.h>
4886be9f0dSKonstantin Belousov #include <sys/taskqueue.h>
4986be9f0dSKonstantin Belousov #include <sys/tree.h>
5086be9f0dSKonstantin Belousov #include <sys/uio.h>
510a110d5bSKonstantin Belousov #include <sys/vmem.h>
5286be9f0dSKonstantin Belousov #include <vm/vm.h>
5386be9f0dSKonstantin Belousov #include <vm/vm_extern.h>
5486be9f0dSKonstantin Belousov #include <vm/vm_kern.h>
5586be9f0dSKonstantin Belousov #include <vm/vm_object.h>
5686be9f0dSKonstantin Belousov #include <vm/vm_page.h>
5786be9f0dSKonstantin Belousov #include <vm/vm_pager.h>
5886be9f0dSKonstantin Belousov #include <vm/vm_map.h>
5986be9f0dSKonstantin Belousov #include <machine/atomic.h>
6086be9f0dSKonstantin Belousov #include <machine/bus.h>
6186be9f0dSKonstantin Belousov #include <machine/md_var.h>
6286be9f0dSKonstantin Belousov #include <machine/specialreg.h>
6386be9f0dSKonstantin Belousov #include <x86/include/busdma_impl.h>
6486be9f0dSKonstantin Belousov #include <x86/iommu/intel_reg.h>
6586be9f0dSKonstantin Belousov #include <x86/iommu/busdma_dmar.h>
6686be9f0dSKonstantin Belousov #include <x86/iommu/intel_dmar.h>
6767499354SRyan Stone #include <dev/pci/pcireg.h>
6886be9f0dSKonstantin Belousov #include <dev/pci/pcivar.h>
6986be9f0dSKonstantin Belousov 
7086be9f0dSKonstantin Belousov static MALLOC_DEFINE(M_DMAR_CTX, "dmar_ctx", "Intel DMAR Context");
71*1abfd355SKonstantin Belousov static MALLOC_DEFINE(M_DMAR_DOMAIN, "dmar_dom", "Intel DMAR Domain");
7286be9f0dSKonstantin Belousov 
73*1abfd355SKonstantin Belousov static void dmar_domain_unload_task(void *arg, int pending);
74*1abfd355SKonstantin Belousov static void dmar_unref_domain_locked(struct dmar_unit *dmar,
75*1abfd355SKonstantin Belousov     struct dmar_domain *domain);
76*1abfd355SKonstantin Belousov static void dmar_domain_destroy(struct dmar_domain *domain);
77*1abfd355SKonstantin Belousov static void dmar_ctx_dtr(struct dmar_ctx *ctx);
7886be9f0dSKonstantin Belousov 
7986be9f0dSKonstantin Belousov static void
8086be9f0dSKonstantin Belousov dmar_ensure_ctx_page(struct dmar_unit *dmar, int bus)
8186be9f0dSKonstantin Belousov {
8286be9f0dSKonstantin Belousov 	struct sf_buf *sf;
8386be9f0dSKonstantin Belousov 	dmar_root_entry_t *re;
8486be9f0dSKonstantin Belousov 	vm_page_t ctxm;
8586be9f0dSKonstantin Belousov 
8686be9f0dSKonstantin Belousov 	/*
8786be9f0dSKonstantin Belousov 	 * Allocated context page must be linked.
8886be9f0dSKonstantin Belousov 	 */
8986be9f0dSKonstantin Belousov 	ctxm = dmar_pgalloc(dmar->ctx_obj, 1 + bus, DMAR_PGF_NOALLOC);
9086be9f0dSKonstantin Belousov 	if (ctxm != NULL)
9186be9f0dSKonstantin Belousov 		return;
9286be9f0dSKonstantin Belousov 
9386be9f0dSKonstantin Belousov 	/*
9486be9f0dSKonstantin Belousov 	 * Page not present, allocate and link.  Note that other
9586be9f0dSKonstantin Belousov 	 * thread might execute this sequence in parallel.  This
9686be9f0dSKonstantin Belousov 	 * should be safe, because the context entries written by both
9786be9f0dSKonstantin Belousov 	 * threads are equal.
9886be9f0dSKonstantin Belousov 	 */
9986be9f0dSKonstantin Belousov 	TD_PREP_PINNED_ASSERT;
10086be9f0dSKonstantin Belousov 	ctxm = dmar_pgalloc(dmar->ctx_obj, 1 + bus, DMAR_PGF_ZERO |
10186be9f0dSKonstantin Belousov 	    DMAR_PGF_WAITOK);
10286be9f0dSKonstantin Belousov 	re = dmar_map_pgtbl(dmar->ctx_obj, 0, DMAR_PGF_NOALLOC, &sf);
10386be9f0dSKonstantin Belousov 	re += bus;
10486be9f0dSKonstantin Belousov 	dmar_pte_store(&re->r1, DMAR_ROOT_R1_P | (DMAR_ROOT_R1_CTP_MASK &
10586be9f0dSKonstantin Belousov 	    VM_PAGE_TO_PHYS(ctxm)));
1066b7c46afSKonstantin Belousov 	dmar_flush_root_to_ram(dmar, re);
1076b7c46afSKonstantin Belousov 	dmar_unmap_pgtbl(sf);
10886be9f0dSKonstantin Belousov 	TD_PINNED_ASSERT;
10986be9f0dSKonstantin Belousov }
11086be9f0dSKonstantin Belousov 
11186be9f0dSKonstantin Belousov static dmar_ctx_entry_t *
11286be9f0dSKonstantin Belousov dmar_map_ctx_entry(struct dmar_ctx *ctx, struct sf_buf **sfp)
11386be9f0dSKonstantin Belousov {
11486be9f0dSKonstantin Belousov 	dmar_ctx_entry_t *ctxp;
11586be9f0dSKonstantin Belousov 
116*1abfd355SKonstantin Belousov 	ctxp = dmar_map_pgtbl(ctx->domain->dmar->ctx_obj, 1 +
117*1abfd355SKonstantin Belousov 	    PCI_RID2BUS(ctx->rid), DMAR_PGF_NOALLOC | DMAR_PGF_WAITOK, sfp);
11867499354SRyan Stone 	ctxp += ctx->rid & 0xff;
11986be9f0dSKonstantin Belousov 	return (ctxp);
12086be9f0dSKonstantin Belousov }
12186be9f0dSKonstantin Belousov 
12286be9f0dSKonstantin Belousov static void
12367499354SRyan Stone ctx_tag_init(struct dmar_ctx *ctx, device_t dev)
12486be9f0dSKonstantin Belousov {
12586be9f0dSKonstantin Belousov 	bus_addr_t maxaddr;
12686be9f0dSKonstantin Belousov 
127*1abfd355SKonstantin Belousov 	maxaddr = MIN(ctx->domain->end, BUS_SPACE_MAXADDR);
12886be9f0dSKonstantin Belousov 	ctx->ctx_tag.common.ref_count = 1; /* Prevent free */
12986be9f0dSKonstantin Belousov 	ctx->ctx_tag.common.impl = &bus_dma_dmar_impl;
13086be9f0dSKonstantin Belousov 	ctx->ctx_tag.common.boundary = PCI_DMA_BOUNDARY;
13186be9f0dSKonstantin Belousov 	ctx->ctx_tag.common.lowaddr = maxaddr;
13286be9f0dSKonstantin Belousov 	ctx->ctx_tag.common.highaddr = maxaddr;
13386be9f0dSKonstantin Belousov 	ctx->ctx_tag.common.maxsize = maxaddr;
13486be9f0dSKonstantin Belousov 	ctx->ctx_tag.common.nsegments = BUS_SPACE_UNRESTRICTED;
13586be9f0dSKonstantin Belousov 	ctx->ctx_tag.common.maxsegsz = maxaddr;
13686be9f0dSKonstantin Belousov 	ctx->ctx_tag.ctx = ctx;
13767499354SRyan Stone 	ctx->ctx_tag.owner = dev;
13886be9f0dSKonstantin Belousov }
13986be9f0dSKonstantin Belousov 
14086be9f0dSKonstantin Belousov static void
141*1abfd355SKonstantin Belousov ctx_id_entry_init(struct dmar_ctx *ctx, dmar_ctx_entry_t *ctxp, bool move)
14286be9f0dSKonstantin Belousov {
14386be9f0dSKonstantin Belousov 	struct dmar_unit *unit;
144*1abfd355SKonstantin Belousov 	struct dmar_domain *domain;
14586be9f0dSKonstantin Belousov 	vm_page_t ctx_root;
14686be9f0dSKonstantin Belousov 
147*1abfd355SKonstantin Belousov 	domain = ctx->domain;
148*1abfd355SKonstantin Belousov 	unit = domain->dmar;
149*1abfd355SKonstantin Belousov 	KASSERT(move || (ctxp->ctx1 == 0 && ctxp->ctx2 == 0),
15086be9f0dSKonstantin Belousov 	    ("dmar%d: initialized ctx entry %d:%d:%d 0x%jx 0x%jx",
15167499354SRyan Stone 	    unit->unit, pci_get_bus(ctx->ctx_tag.owner),
15267499354SRyan Stone 	    pci_get_slot(ctx->ctx_tag.owner),
15367499354SRyan Stone 	    pci_get_function(ctx->ctx_tag.owner),
154*1abfd355SKonstantin Belousov 	    ctxp->ctx1, ctxp->ctx2));
155*1abfd355SKonstantin Belousov 	/*
156*1abfd355SKonstantin Belousov 	 * For update due to move, the store is not atomic.  It is
157*1abfd355SKonstantin Belousov 	 * possible that DMAR read upper doubleword, while low
158*1abfd355SKonstantin Belousov 	 * doubleword is not yet updated.  The domain id is stored in
159*1abfd355SKonstantin Belousov 	 * the upper doubleword, while the table pointer in the lower.
160*1abfd355SKonstantin Belousov 	 *
161*1abfd355SKonstantin Belousov 	 * There is no good solution, for the same reason it is wrong
162*1abfd355SKonstantin Belousov 	 * to clear P bit in the ctx entry for update.
163*1abfd355SKonstantin Belousov 	 */
164*1abfd355SKonstantin Belousov 	dmar_pte_store1(&ctxp->ctx2, DMAR_CTX2_DID(domain->domain) |
165*1abfd355SKonstantin Belousov 	    domain->awlvl);
166*1abfd355SKonstantin Belousov 	if ((domain->flags & DMAR_DOMAIN_IDMAP) != 0 &&
16786be9f0dSKonstantin Belousov 	    (unit->hw_ecap & DMAR_ECAP_PT) != 0) {
168*1abfd355SKonstantin Belousov 		KASSERT(domain->pgtbl_obj == NULL,
16986be9f0dSKonstantin Belousov 		    ("ctx %p non-null pgtbl_obj", ctx));
170*1abfd355SKonstantin Belousov 		dmar_pte_store1(&ctxp->ctx1, DMAR_CTX1_T_PASS | DMAR_CTX1_P);
17186be9f0dSKonstantin Belousov 	} else {
172*1abfd355SKonstantin Belousov 		ctx_root = dmar_pgalloc(domain->pgtbl_obj, 0, DMAR_PGF_NOALLOC);
173*1abfd355SKonstantin Belousov 		dmar_pte_store1(&ctxp->ctx1, DMAR_CTX1_T_UNTR |
17486be9f0dSKonstantin Belousov 		    (DMAR_CTX1_ASR_MASK & VM_PAGE_TO_PHYS(ctx_root)) |
17586be9f0dSKonstantin Belousov 		    DMAR_CTX1_P);
17686be9f0dSKonstantin Belousov 	}
1776b7c46afSKonstantin Belousov 	dmar_flush_ctx_to_ram(unit, ctxp);
17886be9f0dSKonstantin Belousov }
17986be9f0dSKonstantin Belousov 
18086be9f0dSKonstantin Belousov static int
181*1abfd355SKonstantin Belousov dmar_flush_for_ctx_entry(struct dmar_unit *dmar, bool force)
182*1abfd355SKonstantin Belousov {
183*1abfd355SKonstantin Belousov 	int error;
184*1abfd355SKonstantin Belousov 
185*1abfd355SKonstantin Belousov 	/*
186*1abfd355SKonstantin Belousov 	 * If dmar declares Caching Mode as Set, follow 11.5 "Caching
187*1abfd355SKonstantin Belousov 	 * Mode Consideration" and do the (global) invalidation of the
188*1abfd355SKonstantin Belousov 	 * negative TLB entries.
189*1abfd355SKonstantin Belousov 	 */
190*1abfd355SKonstantin Belousov 	if ((dmar->hw_cap & DMAR_CAP_CM) == 0 && !force)
191*1abfd355SKonstantin Belousov 		return (0);
192*1abfd355SKonstantin Belousov 	if (dmar->qi_enabled) {
193*1abfd355SKonstantin Belousov 		dmar_qi_invalidate_ctx_glob_locked(dmar);
194*1abfd355SKonstantin Belousov 		if ((dmar->hw_ecap & DMAR_ECAP_DI) != 0 || force)
195*1abfd355SKonstantin Belousov 			dmar_qi_invalidate_iotlb_glob_locked(dmar);
196*1abfd355SKonstantin Belousov 		return (0);
197*1abfd355SKonstantin Belousov 	}
198*1abfd355SKonstantin Belousov 	error = dmar_inv_ctx_glob(dmar);
199*1abfd355SKonstantin Belousov 	if (error == 0 && ((dmar->hw_ecap & DMAR_ECAP_DI) != 0 || force))
200*1abfd355SKonstantin Belousov 		error = dmar_inv_iotlb_glob(dmar);
201*1abfd355SKonstantin Belousov 	return (error);
202*1abfd355SKonstantin Belousov }
203*1abfd355SKonstantin Belousov 
204*1abfd355SKonstantin Belousov static int
205*1abfd355SKonstantin Belousov domain_init_rmrr(struct dmar_domain *domain, device_t dev)
20686be9f0dSKonstantin Belousov {
20786be9f0dSKonstantin Belousov 	struct dmar_map_entries_tailq rmrr_entries;
20886be9f0dSKonstantin Belousov 	struct dmar_map_entry *entry, *entry1;
20986be9f0dSKonstantin Belousov 	vm_page_t *ma;
21086be9f0dSKonstantin Belousov 	dmar_gaddr_t start, end;
21186be9f0dSKonstantin Belousov 	vm_pindex_t size, i;
21286be9f0dSKonstantin Belousov 	int error, error1;
21386be9f0dSKonstantin Belousov 
21486be9f0dSKonstantin Belousov 	error = 0;
21586be9f0dSKonstantin Belousov 	TAILQ_INIT(&rmrr_entries);
216*1abfd355SKonstantin Belousov 	dmar_dev_parse_rmrr(domain, dev, &rmrr_entries);
21786be9f0dSKonstantin Belousov 	TAILQ_FOREACH_SAFE(entry, &rmrr_entries, unroll_link, entry1) {
21886be9f0dSKonstantin Belousov 		/*
21986be9f0dSKonstantin Belousov 		 * VT-d specification requires that the start of an
22086be9f0dSKonstantin Belousov 		 * RMRR entry is 4k-aligned.  Buggy BIOSes put
22186be9f0dSKonstantin Belousov 		 * anything into the start and end fields.  Truncate
22286be9f0dSKonstantin Belousov 		 * and round as neccesary.
22386be9f0dSKonstantin Belousov 		 *
22486be9f0dSKonstantin Belousov 		 * We also allow the overlapping RMRR entries, see
22586be9f0dSKonstantin Belousov 		 * dmar_gas_alloc_region().
22686be9f0dSKonstantin Belousov 		 */
22786be9f0dSKonstantin Belousov 		start = entry->start;
22886be9f0dSKonstantin Belousov 		end = entry->end;
22986be9f0dSKonstantin Belousov 		entry->start = trunc_page(start);
23086be9f0dSKonstantin Belousov 		entry->end = round_page(end);
231e02b05b3SKonstantin Belousov 		if (entry->start == entry->end) {
232e02b05b3SKonstantin Belousov 			/* Workaround for some AMI (?) BIOSes */
233e02b05b3SKonstantin Belousov 			if (bootverbose) {
234e02b05b3SKonstantin Belousov 				device_printf(dev, "BIOS bug: dmar%d RMRR "
235e02b05b3SKonstantin Belousov 				    "region (%jx, %jx) corrected\n",
236*1abfd355SKonstantin Belousov 				    domain->dmar->unit, start, end);
237e02b05b3SKonstantin Belousov 			}
238e02b05b3SKonstantin Belousov 			entry->end += DMAR_PAGE_SIZE * 0x20;
239e02b05b3SKonstantin Belousov 		}
24086be9f0dSKonstantin Belousov 		size = OFF_TO_IDX(entry->end - entry->start);
24186be9f0dSKonstantin Belousov 		ma = malloc(sizeof(vm_page_t) * size, M_TEMP, M_WAITOK);
24286be9f0dSKonstantin Belousov 		for (i = 0; i < size; i++) {
24386be9f0dSKonstantin Belousov 			ma[i] = vm_page_getfake(entry->start + PAGE_SIZE * i,
24486be9f0dSKonstantin Belousov 			    VM_MEMATTR_DEFAULT);
24586be9f0dSKonstantin Belousov 		}
246*1abfd355SKonstantin Belousov 		error1 = dmar_gas_map_region(domain, entry,
247*1abfd355SKonstantin Belousov 		    DMAR_MAP_ENTRY_READ | DMAR_MAP_ENTRY_WRITE,
248*1abfd355SKonstantin Belousov 		    DMAR_GM_CANWAIT, ma);
24986be9f0dSKonstantin Belousov 		/*
25086be9f0dSKonstantin Belousov 		 * Non-failed RMRR entries are owned by context rb
25186be9f0dSKonstantin Belousov 		 * tree.  Get rid of the failed entry, but do not stop
25286be9f0dSKonstantin Belousov 		 * the loop.  Rest of the parsed RMRR entries are
25386be9f0dSKonstantin Belousov 		 * loaded and removed on the context destruction.
25486be9f0dSKonstantin Belousov 		 */
25586be9f0dSKonstantin Belousov 		if (error1 == 0 && entry->end != entry->start) {
256*1abfd355SKonstantin Belousov 			DMAR_LOCK(domain->dmar);
257*1abfd355SKonstantin Belousov 			domain->refs++; /* XXXKIB prevent free */
258*1abfd355SKonstantin Belousov 			domain->flags |= DMAR_DOMAIN_RMRR;
259*1abfd355SKonstantin Belousov 			DMAR_UNLOCK(domain->dmar);
26086be9f0dSKonstantin Belousov 		} else {
26186be9f0dSKonstantin Belousov 			if (error1 != 0) {
26286be9f0dSKonstantin Belousov 				device_printf(dev,
26386be9f0dSKonstantin Belousov 			    "dmar%d failed to map RMRR region (%jx, %jx) %d\n",
264*1abfd355SKonstantin Belousov 				    domain->dmar->unit, start, end, error1);
26586be9f0dSKonstantin Belousov 				error = error1;
26686be9f0dSKonstantin Belousov 			}
26786be9f0dSKonstantin Belousov 			TAILQ_REMOVE(&rmrr_entries, entry, unroll_link);
268*1abfd355SKonstantin Belousov 			dmar_gas_free_entry(domain, entry);
26986be9f0dSKonstantin Belousov 		}
27086be9f0dSKonstantin Belousov 		for (i = 0; i < size; i++)
27186be9f0dSKonstantin Belousov 			vm_page_putfake(ma[i]);
27286be9f0dSKonstantin Belousov 		free(ma, M_TEMP);
27386be9f0dSKonstantin Belousov 	}
27486be9f0dSKonstantin Belousov 	return (error);
27586be9f0dSKonstantin Belousov }
27686be9f0dSKonstantin Belousov 
277*1abfd355SKonstantin Belousov static struct dmar_domain *
278*1abfd355SKonstantin Belousov dmar_domain_alloc(struct dmar_unit *dmar, bool id_mapped)
279*1abfd355SKonstantin Belousov {
280*1abfd355SKonstantin Belousov 	struct dmar_domain *domain;
281*1abfd355SKonstantin Belousov 	int error, id, mgaw;
282*1abfd355SKonstantin Belousov 
283*1abfd355SKonstantin Belousov 	id = alloc_unr(dmar->domids);
284*1abfd355SKonstantin Belousov 	if (id == -1)
285*1abfd355SKonstantin Belousov 		return (NULL);
286*1abfd355SKonstantin Belousov 	domain = malloc(sizeof(*domain), M_DMAR_DOMAIN, M_WAITOK | M_ZERO);
287*1abfd355SKonstantin Belousov 	domain->domain = id;
288*1abfd355SKonstantin Belousov 	LIST_INIT(&domain->contexts);
289*1abfd355SKonstantin Belousov 	RB_INIT(&domain->rb_root);
290*1abfd355SKonstantin Belousov 	TAILQ_INIT(&domain->unload_entries);
291*1abfd355SKonstantin Belousov 	TASK_INIT(&domain->unload_task, 0, dmar_domain_unload_task, domain);
292*1abfd355SKonstantin Belousov 	mtx_init(&domain->lock, "dmardom", NULL, MTX_DEF);
293*1abfd355SKonstantin Belousov 	domain->dmar = dmar;
294*1abfd355SKonstantin Belousov 
295*1abfd355SKonstantin Belousov 	/*
296*1abfd355SKonstantin Belousov 	 * For now, use the maximal usable physical address of the
297*1abfd355SKonstantin Belousov 	 * installed memory to calculate the mgaw on id_mapped domain.
298*1abfd355SKonstantin Belousov 	 * It is useful for the identity mapping, and less so for the
299*1abfd355SKonstantin Belousov 	 * virtualized bus address space.
300*1abfd355SKonstantin Belousov 	 */
301*1abfd355SKonstantin Belousov 	domain->end = id_mapped ? ptoa(Maxmem) : BUS_SPACE_MAXADDR;
302*1abfd355SKonstantin Belousov 	mgaw = dmar_maxaddr2mgaw(dmar, domain->end, !id_mapped);
303*1abfd355SKonstantin Belousov 	error = domain_set_agaw(domain, mgaw);
304*1abfd355SKonstantin Belousov 	if (error != 0)
305*1abfd355SKonstantin Belousov 		goto fail;
306*1abfd355SKonstantin Belousov 	if (!id_mapped)
307*1abfd355SKonstantin Belousov 		/* Use all supported address space for remapping. */
308*1abfd355SKonstantin Belousov 		domain->end = 1ULL << (domain->agaw - 1);
309*1abfd355SKonstantin Belousov 
310*1abfd355SKonstantin Belousov 	dmar_gas_init_domain(domain);
311*1abfd355SKonstantin Belousov 
312*1abfd355SKonstantin Belousov 	if (id_mapped) {
313*1abfd355SKonstantin Belousov 		if ((dmar->hw_ecap & DMAR_ECAP_PT) == 0) {
314*1abfd355SKonstantin Belousov 			domain->pgtbl_obj = domain_get_idmap_pgtbl(domain,
315*1abfd355SKonstantin Belousov 			    domain->end);
316*1abfd355SKonstantin Belousov 		}
317*1abfd355SKonstantin Belousov 		domain->flags |= DMAR_DOMAIN_IDMAP;
318*1abfd355SKonstantin Belousov 	} else {
319*1abfd355SKonstantin Belousov 		error = domain_alloc_pgtbl(domain);
320*1abfd355SKonstantin Belousov 		if (error != 0)
321*1abfd355SKonstantin Belousov 			goto fail;
322*1abfd355SKonstantin Belousov 		/* Disable local apic region access */
323*1abfd355SKonstantin Belousov 		error = dmar_gas_reserve_region(domain, 0xfee00000,
324*1abfd355SKonstantin Belousov 		    0xfeefffff + 1);
325*1abfd355SKonstantin Belousov 		if (error != 0)
326*1abfd355SKonstantin Belousov 			goto fail;
327*1abfd355SKonstantin Belousov 	}
328*1abfd355SKonstantin Belousov 	return (domain);
329*1abfd355SKonstantin Belousov 
330*1abfd355SKonstantin Belousov fail:
331*1abfd355SKonstantin Belousov 	dmar_domain_destroy(domain);
332*1abfd355SKonstantin Belousov 	return (NULL);
333*1abfd355SKonstantin Belousov }
334*1abfd355SKonstantin Belousov 
33586be9f0dSKonstantin Belousov static struct dmar_ctx *
336*1abfd355SKonstantin Belousov dmar_ctx_alloc(struct dmar_domain *domain, uint16_t rid)
33786be9f0dSKonstantin Belousov {
33886be9f0dSKonstantin Belousov 	struct dmar_ctx *ctx;
33986be9f0dSKonstantin Belousov 
34086be9f0dSKonstantin Belousov 	ctx = malloc(sizeof(*ctx), M_DMAR_CTX, M_WAITOK | M_ZERO);
341*1abfd355SKonstantin Belousov 	ctx->domain = domain;
34267499354SRyan Stone 	ctx->rid = rid;
343*1abfd355SKonstantin Belousov 	ctx->refs = 1;
34486be9f0dSKonstantin Belousov 	return (ctx);
34586be9f0dSKonstantin Belousov }
34686be9f0dSKonstantin Belousov 
34786be9f0dSKonstantin Belousov static void
348*1abfd355SKonstantin Belousov dmar_ctx_link(struct dmar_ctx *ctx)
349*1abfd355SKonstantin Belousov {
350*1abfd355SKonstantin Belousov 	struct dmar_domain *domain;
351*1abfd355SKonstantin Belousov 
352*1abfd355SKonstantin Belousov 	domain = ctx->domain;
353*1abfd355SKonstantin Belousov 	DMAR_ASSERT_LOCKED(domain->dmar);
354*1abfd355SKonstantin Belousov 	KASSERT(domain->refs >= domain->ctx_cnt,
355*1abfd355SKonstantin Belousov 	    ("dom %p ref underflow %d %d", domain, domain->refs,
356*1abfd355SKonstantin Belousov 	    domain->ctx_cnt));
357*1abfd355SKonstantin Belousov 	domain->refs++;
358*1abfd355SKonstantin Belousov 	domain->ctx_cnt++;
359*1abfd355SKonstantin Belousov 	LIST_INSERT_HEAD(&domain->contexts, ctx, link);
360*1abfd355SKonstantin Belousov }
361*1abfd355SKonstantin Belousov 
362*1abfd355SKonstantin Belousov static void
363*1abfd355SKonstantin Belousov dmar_ctx_unlink(struct dmar_ctx *ctx)
364*1abfd355SKonstantin Belousov {
365*1abfd355SKonstantin Belousov 	struct dmar_domain *domain;
366*1abfd355SKonstantin Belousov 
367*1abfd355SKonstantin Belousov 	domain = ctx->domain;
368*1abfd355SKonstantin Belousov 	DMAR_ASSERT_LOCKED(domain->dmar);
369*1abfd355SKonstantin Belousov 	KASSERT(domain->refs > 0,
370*1abfd355SKonstantin Belousov 	    ("domain %p ctx dtr refs %d", domain, domain->refs));
371*1abfd355SKonstantin Belousov 	KASSERT(domain->ctx_cnt >= domain->refs,
372*1abfd355SKonstantin Belousov 	    ("domain %p ctx dtr refs %d ctx_cnt %d", domain,
373*1abfd355SKonstantin Belousov 	    domain->refs, domain->ctx_cnt));
374*1abfd355SKonstantin Belousov 	domain->refs--;
375*1abfd355SKonstantin Belousov 	domain->ctx_cnt--;
376*1abfd355SKonstantin Belousov 	LIST_REMOVE(ctx, link);
377*1abfd355SKonstantin Belousov }
378*1abfd355SKonstantin Belousov 
379*1abfd355SKonstantin Belousov static void
380*1abfd355SKonstantin Belousov dmar_domain_destroy(struct dmar_domain *domain)
38186be9f0dSKonstantin Belousov {
38286be9f0dSKonstantin Belousov 
383*1abfd355SKonstantin Belousov 	KASSERT(TAILQ_EMPTY(&domain->unload_entries),
384*1abfd355SKonstantin Belousov 	    ("unfinished unloads %p", domain));
385*1abfd355SKonstantin Belousov 	KASSERT(LIST_EMPTY(&domain->contexts),
386*1abfd355SKonstantin Belousov 	    ("destroying dom %p with contexts", domain));
387*1abfd355SKonstantin Belousov 	KASSERT(domain->ctx_cnt == 0,
388*1abfd355SKonstantin Belousov 	    ("destroying dom %p with ctx_cnt %d", domain, domain->ctx_cnt));
389*1abfd355SKonstantin Belousov 	KASSERT(domain->refs == 0,
390*1abfd355SKonstantin Belousov 	    ("destroying dom %p with refs %d", domain, domain->refs));
391*1abfd355SKonstantin Belousov 	if ((domain->flags & DMAR_DOMAIN_GAS_INITED) != 0) {
392*1abfd355SKonstantin Belousov 		DMAR_DOMAIN_LOCK(domain);
393*1abfd355SKonstantin Belousov 		dmar_gas_fini_domain(domain);
394*1abfd355SKonstantin Belousov 		DMAR_DOMAIN_UNLOCK(domain);
39586be9f0dSKonstantin Belousov 	}
396*1abfd355SKonstantin Belousov 	if ((domain->flags & DMAR_DOMAIN_PGTBL_INITED) != 0) {
397*1abfd355SKonstantin Belousov 		if (domain->pgtbl_obj != NULL)
398*1abfd355SKonstantin Belousov 			DMAR_DOMAIN_PGLOCK(domain);
399*1abfd355SKonstantin Belousov 		domain_free_pgtbl(domain);
40086be9f0dSKonstantin Belousov 	}
401*1abfd355SKonstantin Belousov 	mtx_destroy(&domain->lock);
402*1abfd355SKonstantin Belousov 	free_unr(domain->dmar->domids, domain->domain);
403*1abfd355SKonstantin Belousov 	free(domain, M_DMAR_DOMAIN);
40486be9f0dSKonstantin Belousov }
40586be9f0dSKonstantin Belousov 
40686be9f0dSKonstantin Belousov struct dmar_ctx *
407*1abfd355SKonstantin Belousov dmar_get_ctx_for_dev(struct dmar_unit *dmar, device_t dev, uint16_t rid,
408*1abfd355SKonstantin Belousov     bool id_mapped, bool rmrr_init)
40986be9f0dSKonstantin Belousov {
410*1abfd355SKonstantin Belousov 	struct dmar_domain *domain, *domain1;
41186be9f0dSKonstantin Belousov 	struct dmar_ctx *ctx, *ctx1;
41286be9f0dSKonstantin Belousov 	dmar_ctx_entry_t *ctxp;
41386be9f0dSKonstantin Belousov 	struct sf_buf *sf;
414*1abfd355SKonstantin Belousov 	int bus, slot, func, error;
41586be9f0dSKonstantin Belousov 	bool enable;
41686be9f0dSKonstantin Belousov 
41767499354SRyan Stone 	bus = pci_get_bus(dev);
41867499354SRyan Stone 	slot = pci_get_slot(dev);
41967499354SRyan Stone 	func = pci_get_function(dev);
42086be9f0dSKonstantin Belousov 	enable = false;
42186be9f0dSKonstantin Belousov 	TD_PREP_PINNED_ASSERT;
42286be9f0dSKonstantin Belousov 	DMAR_LOCK(dmar);
42367499354SRyan Stone 	ctx = dmar_find_ctx_locked(dmar, rid);
42486be9f0dSKonstantin Belousov 	error = 0;
42586be9f0dSKonstantin Belousov 	if (ctx == NULL) {
42686be9f0dSKonstantin Belousov 		/*
42786be9f0dSKonstantin Belousov 		 * Perform the allocations which require sleep or have
42886be9f0dSKonstantin Belousov 		 * higher chance to succeed if the sleep is allowed.
42986be9f0dSKonstantin Belousov 		 */
43086be9f0dSKonstantin Belousov 		DMAR_UNLOCK(dmar);
431b29d186cSKonstantin Belousov 		dmar_ensure_ctx_page(dmar, PCI_RID2BUS(rid));
432*1abfd355SKonstantin Belousov 		domain1 = dmar_domain_alloc(dmar, id_mapped);
433*1abfd355SKonstantin Belousov 		if (domain1 == NULL) {
43486be9f0dSKonstantin Belousov 			TD_PINNED_ASSERT;
43586be9f0dSKonstantin Belousov 			return (NULL);
43686be9f0dSKonstantin Belousov 		}
437*1abfd355SKonstantin Belousov 		error = domain_init_rmrr(domain1, dev);
43886be9f0dSKonstantin Belousov 		if (error != 0) {
439*1abfd355SKonstantin Belousov 			dmar_domain_destroy(domain1);
44086be9f0dSKonstantin Belousov 			TD_PINNED_ASSERT;
44186be9f0dSKonstantin Belousov 			return (NULL);
44286be9f0dSKonstantin Belousov 		}
443*1abfd355SKonstantin Belousov 		ctx1 = dmar_ctx_alloc(domain1, rid);
44486be9f0dSKonstantin Belousov 		ctxp = dmar_map_ctx_entry(ctx1, &sf);
44586be9f0dSKonstantin Belousov 		DMAR_LOCK(dmar);
44686be9f0dSKonstantin Belousov 
44786be9f0dSKonstantin Belousov 		/*
44886be9f0dSKonstantin Belousov 		 * Recheck the contexts, other thread might have
44986be9f0dSKonstantin Belousov 		 * already allocated needed one.
45086be9f0dSKonstantin Belousov 		 */
45167499354SRyan Stone 		ctx = dmar_find_ctx_locked(dmar, rid);
45286be9f0dSKonstantin Belousov 		if (ctx == NULL) {
453*1abfd355SKonstantin Belousov 			domain = domain1;
45486be9f0dSKonstantin Belousov 			ctx = ctx1;
455*1abfd355SKonstantin Belousov 			dmar_ctx_link(ctx);
4569d0bc6d8SKonstantin Belousov 			ctx->ctx_tag.owner = dev;
45767499354SRyan Stone 			ctx_tag_init(ctx, dev);
45886be9f0dSKonstantin Belousov 
45986be9f0dSKonstantin Belousov 			/*
46086be9f0dSKonstantin Belousov 			 * This is the first activated context for the
46186be9f0dSKonstantin Belousov 			 * DMAR unit.  Enable the translation after
46286be9f0dSKonstantin Belousov 			 * everything is set up.
46386be9f0dSKonstantin Belousov 			 */
464*1abfd355SKonstantin Belousov 			if (LIST_EMPTY(&dmar->domains))
46586be9f0dSKonstantin Belousov 				enable = true;
466*1abfd355SKonstantin Belousov 			LIST_INSERT_HEAD(&dmar->domains, domain, link);
467*1abfd355SKonstantin Belousov 			ctx_id_entry_init(ctx, ctxp, false);
46886be9f0dSKonstantin Belousov 			device_printf(dev,
46934e8337bSKonstantin Belousov 			    "dmar%d pci%d:%d:%d:%d rid %x domain %d mgaw %d "
4709d0bc6d8SKonstantin Belousov 			    "agaw %d %s-mapped\n",
47186be9f0dSKonstantin Belousov 			    dmar->unit, dmar->segment, bus, slot,
472*1abfd355SKonstantin Belousov 			    func, rid, domain->domain, domain->mgaw,
473*1abfd355SKonstantin Belousov 			    domain->agaw, id_mapped ? "id" : "re");
47486be9f0dSKonstantin Belousov 		} else {
475*1abfd355SKonstantin Belousov 			/* Nothing needs to be done to destroy ctx1. */
476*1abfd355SKonstantin Belousov 			dmar_domain_destroy(domain1);
477*1abfd355SKonstantin Belousov 			domain = ctx->domain;
478*1abfd355SKonstantin Belousov 			ctx->refs++; /* tag referenced us */
47986be9f0dSKonstantin Belousov 		}
4806b7c46afSKonstantin Belousov 		dmar_unmap_pgtbl(sf);
48168eeb96aSKonstantin Belousov 	} else {
482*1abfd355SKonstantin Belousov 		domain = ctx->domain;
483*1abfd355SKonstantin Belousov 		ctx->refs++; /* tag referenced us */
484*1abfd355SKonstantin Belousov 	}
485*1abfd355SKonstantin Belousov 
486*1abfd355SKonstantin Belousov 	error = dmar_flush_for_ctx_entry(dmar, enable);
48786be9f0dSKonstantin Belousov 	if (error != 0) {
48886be9f0dSKonstantin Belousov 		dmar_free_ctx_locked(dmar, ctx);
48986be9f0dSKonstantin Belousov 		TD_PINNED_ASSERT;
49086be9f0dSKonstantin Belousov 		return (NULL);
49186be9f0dSKonstantin Belousov 	}
49268eeb96aSKonstantin Belousov 
49368eeb96aSKonstantin Belousov 	/*
49468eeb96aSKonstantin Belousov 	 * The dmar lock was potentially dropped between check for the
49568eeb96aSKonstantin Belousov 	 * empty context list and now.  Recheck the state of GCMD_TE
49668eeb96aSKonstantin Belousov 	 * to avoid unneeded command.
49768eeb96aSKonstantin Belousov 	 */
49868eeb96aSKonstantin Belousov 	if (enable && !rmrr_init && (dmar->hw_gcmd & DMAR_GCMD_TE) == 0) {
49986be9f0dSKonstantin Belousov 		error = dmar_enable_translation(dmar);
50086be9f0dSKonstantin Belousov 		if (error != 0) {
50186be9f0dSKonstantin Belousov 			dmar_free_ctx_locked(dmar, ctx);
50286be9f0dSKonstantin Belousov 			TD_PINNED_ASSERT;
50386be9f0dSKonstantin Belousov 			return (NULL);
50486be9f0dSKonstantin Belousov 		}
50586be9f0dSKonstantin Belousov 	}
50686be9f0dSKonstantin Belousov 	DMAR_UNLOCK(dmar);
50786be9f0dSKonstantin Belousov 	TD_PINNED_ASSERT;
50886be9f0dSKonstantin Belousov 	return (ctx);
50986be9f0dSKonstantin Belousov }
51086be9f0dSKonstantin Belousov 
511*1abfd355SKonstantin Belousov int
512*1abfd355SKonstantin Belousov dmar_move_ctx_to_domain(struct dmar_domain *domain, struct dmar_ctx *ctx)
513*1abfd355SKonstantin Belousov {
514*1abfd355SKonstantin Belousov 	struct dmar_unit *dmar;
515*1abfd355SKonstantin Belousov 	struct dmar_domain *old_domain;
516*1abfd355SKonstantin Belousov 	dmar_ctx_entry_t *ctxp;
517*1abfd355SKonstantin Belousov 	struct sf_buf *sf;
518*1abfd355SKonstantin Belousov 	int error;
519*1abfd355SKonstantin Belousov 
520*1abfd355SKonstantin Belousov 	dmar = domain->dmar;
521*1abfd355SKonstantin Belousov 	old_domain = ctx->domain;
522*1abfd355SKonstantin Belousov 	if (domain == old_domain)
523*1abfd355SKonstantin Belousov 		return (0);
524*1abfd355SKonstantin Belousov 	KASSERT(old_domain->dmar == dmar,
525*1abfd355SKonstantin Belousov 	    ("domain %p %u moving between dmars %u %u", domain,
526*1abfd355SKonstantin Belousov 	    domain->domain, old_domain->dmar->unit, domain->dmar->unit));
527*1abfd355SKonstantin Belousov 	TD_PREP_PINNED_ASSERT;
528*1abfd355SKonstantin Belousov 
529*1abfd355SKonstantin Belousov 	ctxp = dmar_map_ctx_entry(ctx, &sf);
530*1abfd355SKonstantin Belousov 	DMAR_LOCK(dmar);
531*1abfd355SKonstantin Belousov 	dmar_ctx_unlink(ctx);
532*1abfd355SKonstantin Belousov 	ctx->domain = domain;
533*1abfd355SKonstantin Belousov 	dmar_ctx_link(ctx);
534*1abfd355SKonstantin Belousov 	ctx_id_entry_init(ctx, ctxp, true);
535*1abfd355SKonstantin Belousov 	dmar_unmap_pgtbl(sf);
536*1abfd355SKonstantin Belousov 	error = dmar_flush_for_ctx_entry(dmar, true);
537*1abfd355SKonstantin Belousov 	/* If flush failed, rolling back would not work as well. */
538*1abfd355SKonstantin Belousov 	printf("dmar%d rid %x domain %d->%d %s-mapped\n",
539*1abfd355SKonstantin Belousov 	    dmar->unit, ctx->rid, old_domain->domain, domain->domain,
540*1abfd355SKonstantin Belousov 	    (domain->flags & DMAR_DOMAIN_IDMAP) != 0 ? "id" : "re");
541*1abfd355SKonstantin Belousov 	dmar_unref_domain_locked(dmar, old_domain);
542*1abfd355SKonstantin Belousov 	TD_PINNED_ASSERT;
543*1abfd355SKonstantin Belousov 	return (error);
544*1abfd355SKonstantin Belousov }
545*1abfd355SKonstantin Belousov 
546*1abfd355SKonstantin Belousov static void
547*1abfd355SKonstantin Belousov dmar_unref_domain_locked(struct dmar_unit *dmar, struct dmar_domain *domain)
548*1abfd355SKonstantin Belousov {
549*1abfd355SKonstantin Belousov 
550*1abfd355SKonstantin Belousov 	DMAR_ASSERT_LOCKED(dmar);
551*1abfd355SKonstantin Belousov 	KASSERT(domain->refs >= 1,
552*1abfd355SKonstantin Belousov 	    ("dmar %d domain %p refs %u", dmar->unit, domain, domain->refs));
553*1abfd355SKonstantin Belousov 	KASSERT(domain->refs > domain->ctx_cnt,
554*1abfd355SKonstantin Belousov 	    ("dmar %d domain %p refs %d ctx_cnt %d", dmar->unit, domain,
555*1abfd355SKonstantin Belousov 	    domain->refs, domain->ctx_cnt));
556*1abfd355SKonstantin Belousov 
557*1abfd355SKonstantin Belousov 	if (domain->refs > 1) {
558*1abfd355SKonstantin Belousov 		domain->refs--;
559*1abfd355SKonstantin Belousov 		DMAR_UNLOCK(dmar);
560*1abfd355SKonstantin Belousov 		return;
561*1abfd355SKonstantin Belousov 	}
562*1abfd355SKonstantin Belousov 
563*1abfd355SKonstantin Belousov 	KASSERT((domain->flags & DMAR_DOMAIN_RMRR) == 0,
564*1abfd355SKonstantin Belousov 	    ("lost ref on RMRR domain %p", domain));
565*1abfd355SKonstantin Belousov 
566*1abfd355SKonstantin Belousov 	LIST_REMOVE(domain, link);
567*1abfd355SKonstantin Belousov 	DMAR_UNLOCK(dmar);
568*1abfd355SKonstantin Belousov 
569*1abfd355SKonstantin Belousov 	taskqueue_drain(dmar->delayed_taskqueue, &domain->unload_task);
570*1abfd355SKonstantin Belousov 	dmar_domain_destroy(domain);
571*1abfd355SKonstantin Belousov }
572*1abfd355SKonstantin Belousov 
57386be9f0dSKonstantin Belousov void
57486be9f0dSKonstantin Belousov dmar_free_ctx_locked(struct dmar_unit *dmar, struct dmar_ctx *ctx)
57586be9f0dSKonstantin Belousov {
57686be9f0dSKonstantin Belousov 	struct sf_buf *sf;
57786be9f0dSKonstantin Belousov 	dmar_ctx_entry_t *ctxp;
578*1abfd355SKonstantin Belousov 	struct dmar_domain *domain;
57986be9f0dSKonstantin Belousov 
58086be9f0dSKonstantin Belousov 	DMAR_ASSERT_LOCKED(dmar);
58186be9f0dSKonstantin Belousov 	KASSERT(ctx->refs >= 1,
58286be9f0dSKonstantin Belousov 	    ("dmar %p ctx %p refs %u", dmar, ctx, ctx->refs));
58386be9f0dSKonstantin Belousov 
58486be9f0dSKonstantin Belousov 	/*
58586be9f0dSKonstantin Belousov 	 * If our reference is not last, only the dereference should
58686be9f0dSKonstantin Belousov 	 * be performed.
58786be9f0dSKonstantin Belousov 	 */
58886be9f0dSKonstantin Belousov 	if (ctx->refs > 1) {
58986be9f0dSKonstantin Belousov 		ctx->refs--;
59086be9f0dSKonstantin Belousov 		DMAR_UNLOCK(dmar);
59186be9f0dSKonstantin Belousov 		return;
59286be9f0dSKonstantin Belousov 	}
59386be9f0dSKonstantin Belousov 
59486be9f0dSKonstantin Belousov 	KASSERT((ctx->flags & DMAR_CTX_DISABLED) == 0,
59586be9f0dSKonstantin Belousov 	    ("lost ref on disabled ctx %p", ctx));
59686be9f0dSKonstantin Belousov 
59786be9f0dSKonstantin Belousov 	/*
59886be9f0dSKonstantin Belousov 	 * Otherwise, the context entry must be cleared before the
59986be9f0dSKonstantin Belousov 	 * page table is destroyed.  The mapping of the context
60086be9f0dSKonstantin Belousov 	 * entries page could require sleep, unlock the dmar.
60186be9f0dSKonstantin Belousov 	 */
60286be9f0dSKonstantin Belousov 	DMAR_UNLOCK(dmar);
60386be9f0dSKonstantin Belousov 	TD_PREP_PINNED_ASSERT;
60486be9f0dSKonstantin Belousov 	ctxp = dmar_map_ctx_entry(ctx, &sf);
60586be9f0dSKonstantin Belousov 	DMAR_LOCK(dmar);
60686be9f0dSKonstantin Belousov 	KASSERT(ctx->refs >= 1,
60786be9f0dSKonstantin Belousov 	    ("dmar %p ctx %p refs %u", dmar, ctx, ctx->refs));
60886be9f0dSKonstantin Belousov 
60986be9f0dSKonstantin Belousov 	/*
61086be9f0dSKonstantin Belousov 	 * Other thread might have referenced the context, in which
61186be9f0dSKonstantin Belousov 	 * case again only the dereference should be performed.
61286be9f0dSKonstantin Belousov 	 */
61386be9f0dSKonstantin Belousov 	if (ctx->refs > 1) {
61486be9f0dSKonstantin Belousov 		ctx->refs--;
61586be9f0dSKonstantin Belousov 		DMAR_UNLOCK(dmar);
6166b7c46afSKonstantin Belousov 		dmar_unmap_pgtbl(sf);
61786be9f0dSKonstantin Belousov 		TD_PINNED_ASSERT;
61886be9f0dSKonstantin Belousov 		return;
61986be9f0dSKonstantin Belousov 	}
62086be9f0dSKonstantin Belousov 
62186be9f0dSKonstantin Belousov 	KASSERT((ctx->flags & DMAR_CTX_DISABLED) == 0,
62286be9f0dSKonstantin Belousov 	    ("lost ref on disabled ctx %p", ctx));
62386be9f0dSKonstantin Belousov 
62486be9f0dSKonstantin Belousov 	/*
62586be9f0dSKonstantin Belousov 	 * Clear the context pointer and flush the caches.
62686be9f0dSKonstantin Belousov 	 * XXXKIB: cannot do this if any RMRR entries are still present.
62786be9f0dSKonstantin Belousov 	 */
62886be9f0dSKonstantin Belousov 	dmar_pte_clear(&ctxp->ctx1);
62986be9f0dSKonstantin Belousov 	ctxp->ctx2 = 0;
6306b7c46afSKonstantin Belousov 	dmar_flush_ctx_to_ram(dmar, ctxp);
63186be9f0dSKonstantin Belousov 	dmar_inv_ctx_glob(dmar);
63268eeb96aSKonstantin Belousov 	if ((dmar->hw_ecap & DMAR_ECAP_DI) != 0) {
63368eeb96aSKonstantin Belousov 		if (dmar->qi_enabled)
63468eeb96aSKonstantin Belousov 			dmar_qi_invalidate_iotlb_glob_locked(dmar);
63568eeb96aSKonstantin Belousov 		else
63686be9f0dSKonstantin Belousov 			dmar_inv_iotlb_glob(dmar);
63768eeb96aSKonstantin Belousov 	}
6386b7c46afSKonstantin Belousov 	dmar_unmap_pgtbl(sf);
639*1abfd355SKonstantin Belousov 	domain = ctx->domain;
640*1abfd355SKonstantin Belousov 	dmar_ctx_unlink(ctx);
641*1abfd355SKonstantin Belousov 	free(ctx, M_DMAR_CTX);
642*1abfd355SKonstantin Belousov 	dmar_unref_domain_locked(dmar, domain);
64386be9f0dSKonstantin Belousov 	TD_PINNED_ASSERT;
64486be9f0dSKonstantin Belousov }
64586be9f0dSKonstantin Belousov 
64686be9f0dSKonstantin Belousov void
64786be9f0dSKonstantin Belousov dmar_free_ctx(struct dmar_ctx *ctx)
64886be9f0dSKonstantin Belousov {
64986be9f0dSKonstantin Belousov 	struct dmar_unit *dmar;
65086be9f0dSKonstantin Belousov 
651*1abfd355SKonstantin Belousov 	dmar = ctx->domain->dmar;
65286be9f0dSKonstantin Belousov 	DMAR_LOCK(dmar);
65386be9f0dSKonstantin Belousov 	dmar_free_ctx_locked(dmar, ctx);
65486be9f0dSKonstantin Belousov }
65586be9f0dSKonstantin Belousov 
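/*
 * Looks up the context with the given rid among all domains of the
 * dmar unit.  The dmar unit lock must be held by the caller (it is
 * asserted); no lock is acquired or released here, so the unit lock
 * is still held on return.  Returns NULL if no context matches.
 */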
65986be9f0dSKonstantin Belousov struct dmar_ctx *
66067499354SRyan Stone dmar_find_ctx_locked(struct dmar_unit *dmar, uint16_t rid)
66186be9f0dSKonstantin Belousov {
662*1abfd355SKonstantin Belousov 	struct dmar_domain *domain;
66386be9f0dSKonstantin Belousov 	struct dmar_ctx *ctx;
66486be9f0dSKonstantin Belousov 
66586be9f0dSKonstantin Belousov 	DMAR_ASSERT_LOCKED(dmar);
66686be9f0dSKonstantin Belousov 
667*1abfd355SKonstantin Belousov 	LIST_FOREACH(domain, &dmar->domains, link) {
668*1abfd355SKonstantin Belousov 		LIST_FOREACH(ctx, &domain->contexts, link) {
66967499354SRyan Stone 			if (ctx->rid == rid)
67086be9f0dSKonstantin Belousov 				return (ctx);
67186be9f0dSKonstantin Belousov 		}
672*1abfd355SKonstantin Belousov 	}
67386be9f0dSKonstantin Belousov 	return (NULL);
67486be9f0dSKonstantin Belousov }
67586be9f0dSKonstantin Belousov 
67686be9f0dSKonstantin Belousov void
677*1abfd355SKonstantin Belousov dmar_domain_free_entry(struct dmar_map_entry *entry, bool free)
67868eeb96aSKonstantin Belousov {
679*1abfd355SKonstantin Belousov 	struct dmar_domain *domain;
68068eeb96aSKonstantin Belousov 
681*1abfd355SKonstantin Belousov 	domain = entry->domain;
682*1abfd355SKonstantin Belousov 	DMAR_DOMAIN_LOCK(domain);
68368eeb96aSKonstantin Belousov 	if ((entry->flags & DMAR_MAP_ENTRY_RMRR) != 0)
684*1abfd355SKonstantin Belousov 		dmar_gas_free_region(domain, entry);
68568eeb96aSKonstantin Belousov 	else
686*1abfd355SKonstantin Belousov 		dmar_gas_free_space(domain, entry);
687*1abfd355SKonstantin Belousov 	DMAR_DOMAIN_UNLOCK(domain);
68868eeb96aSKonstantin Belousov 	if (free)
689*1abfd355SKonstantin Belousov 		dmar_gas_free_entry(domain, entry);
69068eeb96aSKonstantin Belousov 	else
69168eeb96aSKonstantin Belousov 		entry->flags = 0;
69268eeb96aSKonstantin Belousov }
69368eeb96aSKonstantin Belousov 
69468eeb96aSKonstantin Belousov void
695*1abfd355SKonstantin Belousov dmar_domain_unload_entry(struct dmar_map_entry *entry, bool free)
69668eeb96aSKonstantin Belousov {
69768eeb96aSKonstantin Belousov 	struct dmar_unit *unit;
69868eeb96aSKonstantin Belousov 
699*1abfd355SKonstantin Belousov 	unit = entry->domain->dmar;
70068eeb96aSKonstantin Belousov 	if (unit->qi_enabled) {
70168eeb96aSKonstantin Belousov 		DMAR_LOCK(unit);
702*1abfd355SKonstantin Belousov 		dmar_qi_invalidate_locked(entry->domain, entry->start,
70368eeb96aSKonstantin Belousov 		    entry->end - entry->start, &entry->gseq);
70468eeb96aSKonstantin Belousov 		if (!free)
70568eeb96aSKonstantin Belousov 			entry->flags |= DMAR_MAP_ENTRY_QI_NF;
70668eeb96aSKonstantin Belousov 		TAILQ_INSERT_TAIL(&unit->tlb_flush_entries, entry, dmamap_link);
70768eeb96aSKonstantin Belousov 		DMAR_UNLOCK(unit);
70868eeb96aSKonstantin Belousov 	} else {
709*1abfd355SKonstantin Belousov 		domain_flush_iotlb_sync(entry->domain, entry->start,
710*1abfd355SKonstantin Belousov 		    entry->end - entry->start);
711*1abfd355SKonstantin Belousov 		dmar_domain_free_entry(entry, free);
71268eeb96aSKonstantin Belousov 	}
71368eeb96aSKonstantin Belousov }
71468eeb96aSKonstantin Belousov 
71568eeb96aSKonstantin Belousov void
716*1abfd355SKonstantin Belousov dmar_domain_unload(struct dmar_domain *domain,
717*1abfd355SKonstantin Belousov     struct dmar_map_entries_tailq *entries, bool cansleep)
71886be9f0dSKonstantin Belousov {
71968eeb96aSKonstantin Belousov 	struct dmar_unit *unit;
72068eeb96aSKonstantin Belousov 	struct dmar_map_entry *entry, *entry1;
72168eeb96aSKonstantin Belousov 	struct dmar_qi_genseq gseq;
72286be9f0dSKonstantin Belousov 	int error;
72386be9f0dSKonstantin Belousov 
724*1abfd355SKonstantin Belousov 	unit = domain->dmar;
72568eeb96aSKonstantin Belousov 
72668eeb96aSKonstantin Belousov 	TAILQ_FOREACH_SAFE(entry, entries, dmamap_link, entry1) {
72786be9f0dSKonstantin Belousov 		KASSERT((entry->flags & DMAR_MAP_ENTRY_MAP) != 0,
728*1abfd355SKonstantin Belousov 		    ("not mapped entry %p %p", domain, entry));
729*1abfd355SKonstantin Belousov 		error = domain_unmap_buf(domain, entry->start, entry->end -
73086be9f0dSKonstantin Belousov 		    entry->start, cansleep ? DMAR_PGF_WAITOK : 0);
731*1abfd355SKonstantin Belousov 		KASSERT(error == 0, ("unmap %p error %d", domain, error));
73268eeb96aSKonstantin Belousov 		if (!unit->qi_enabled) {
733*1abfd355SKonstantin Belousov 			domain_flush_iotlb_sync(domain, entry->start,
73468eeb96aSKonstantin Belousov 			    entry->end - entry->start);
73568eeb96aSKonstantin Belousov 			TAILQ_REMOVE(entries, entry, dmamap_link);
736*1abfd355SKonstantin Belousov 			dmar_domain_free_entry(entry, true);
73786be9f0dSKonstantin Belousov 		}
73886be9f0dSKonstantin Belousov 	}
73968eeb96aSKonstantin Belousov 	if (TAILQ_EMPTY(entries))
74068eeb96aSKonstantin Belousov 		return;
74168eeb96aSKonstantin Belousov 
74268eeb96aSKonstantin Belousov 	KASSERT(unit->qi_enabled, ("loaded entry left"));
74368eeb96aSKonstantin Belousov 	DMAR_LOCK(unit);
74468eeb96aSKonstantin Belousov 	TAILQ_FOREACH(entry, entries, dmamap_link) {
74568eeb96aSKonstantin Belousov 		entry->gseq.gen = 0;
74668eeb96aSKonstantin Belousov 		entry->gseq.seq = 0;
747*1abfd355SKonstantin Belousov 		dmar_qi_invalidate_locked(domain, entry->start, entry->end -
74868eeb96aSKonstantin Belousov 		    entry->start, TAILQ_NEXT(entry, dmamap_link) == NULL ?
74968eeb96aSKonstantin Belousov 		    &gseq : NULL);
75068eeb96aSKonstantin Belousov 	}
75168eeb96aSKonstantin Belousov 	TAILQ_FOREACH_SAFE(entry, entries, dmamap_link, entry1) {
75268eeb96aSKonstantin Belousov 		entry->gseq = gseq;
75368eeb96aSKonstantin Belousov 		TAILQ_REMOVE(entries, entry, dmamap_link);
75468eeb96aSKonstantin Belousov 		TAILQ_INSERT_TAIL(&unit->tlb_flush_entries, entry, dmamap_link);
75568eeb96aSKonstantin Belousov 	}
75668eeb96aSKonstantin Belousov 	DMAR_UNLOCK(unit);
75768eeb96aSKonstantin Belousov }
75886be9f0dSKonstantin Belousov 
75986be9f0dSKonstantin Belousov static void
760*1abfd355SKonstantin Belousov dmar_domain_unload_task(void *arg, int pending)
76186be9f0dSKonstantin Belousov {
762*1abfd355SKonstantin Belousov 	struct dmar_domain *domain;
76386be9f0dSKonstantin Belousov 	struct dmar_map_entries_tailq entries;
76486be9f0dSKonstantin Belousov 
765*1abfd355SKonstantin Belousov 	domain = arg;
76686be9f0dSKonstantin Belousov 	TAILQ_INIT(&entries);
76786be9f0dSKonstantin Belousov 
76886be9f0dSKonstantin Belousov 	for (;;) {
769*1abfd355SKonstantin Belousov 		DMAR_DOMAIN_LOCK(domain);
770*1abfd355SKonstantin Belousov 		TAILQ_SWAP(&domain->unload_entries, &entries, dmar_map_entry,
77186be9f0dSKonstantin Belousov 		    dmamap_link);
772*1abfd355SKonstantin Belousov 		DMAR_DOMAIN_UNLOCK(domain);
77386be9f0dSKonstantin Belousov 		if (TAILQ_EMPTY(&entries))
77486be9f0dSKonstantin Belousov 			break;
775*1abfd355SKonstantin Belousov 		dmar_domain_unload(domain, &entries, true);
77686be9f0dSKonstantin Belousov 	}
77786be9f0dSKonstantin Belousov }
778