xref: /freebsd/sys/x86/iommu/intel_ctx.c (revision 3d47c58b98e4757a13be1fb1ae3911b5635162be)
186be9f0dSKonstantin Belousov /*-
286be9f0dSKonstantin Belousov  * Copyright (c) 2013 The FreeBSD Foundation
386be9f0dSKonstantin Belousov  * All rights reserved.
486be9f0dSKonstantin Belousov  *
586be9f0dSKonstantin Belousov  * This software was developed by Konstantin Belousov <kib@FreeBSD.org>
686be9f0dSKonstantin Belousov  * under sponsorship from the FreeBSD Foundation.
786be9f0dSKonstantin Belousov  *
886be9f0dSKonstantin Belousov  * Redistribution and use in source and binary forms, with or without
986be9f0dSKonstantin Belousov  * modification, are permitted provided that the following conditions
1086be9f0dSKonstantin Belousov  * are met:
1186be9f0dSKonstantin Belousov  * 1. Redistributions of source code must retain the above copyright
1286be9f0dSKonstantin Belousov  *    notice, this list of conditions and the following disclaimer.
1386be9f0dSKonstantin Belousov  * 2. Redistributions in binary form must reproduce the above copyright
1486be9f0dSKonstantin Belousov  *    notice, this list of conditions and the following disclaimer in the
1586be9f0dSKonstantin Belousov  *    documentation and/or other materials provided with the distribution.
1686be9f0dSKonstantin Belousov  *
1786be9f0dSKonstantin Belousov  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
1886be9f0dSKonstantin Belousov  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
1986be9f0dSKonstantin Belousov  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
2086be9f0dSKonstantin Belousov  * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
2186be9f0dSKonstantin Belousov  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
2286be9f0dSKonstantin Belousov  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
2386be9f0dSKonstantin Belousov  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
2486be9f0dSKonstantin Belousov  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
2586be9f0dSKonstantin Belousov  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
2686be9f0dSKonstantin Belousov  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
2786be9f0dSKonstantin Belousov  * SUCH DAMAGE.
2886be9f0dSKonstantin Belousov  */
2986be9f0dSKonstantin Belousov 
3086be9f0dSKonstantin Belousov #include <sys/cdefs.h>
3186be9f0dSKonstantin Belousov __FBSDID("$FreeBSD$");
3286be9f0dSKonstantin Belousov 
3386be9f0dSKonstantin Belousov #include <sys/param.h>
3486be9f0dSKonstantin Belousov #include <sys/systm.h>
3586be9f0dSKonstantin Belousov #include <sys/malloc.h>
3686be9f0dSKonstantin Belousov #include <sys/bus.h>
3786be9f0dSKonstantin Belousov #include <sys/interrupt.h>
3886be9f0dSKonstantin Belousov #include <sys/kernel.h>
3986be9f0dSKonstantin Belousov #include <sys/ktr.h>
4086be9f0dSKonstantin Belousov #include <sys/limits.h>
4186be9f0dSKonstantin Belousov #include <sys/lock.h>
4286be9f0dSKonstantin Belousov #include <sys/memdesc.h>
4386be9f0dSKonstantin Belousov #include <sys/mutex.h>
4486be9f0dSKonstantin Belousov #include <sys/proc.h>
4586be9f0dSKonstantin Belousov #include <sys/rwlock.h>
4686be9f0dSKonstantin Belousov #include <sys/rman.h>
4786be9f0dSKonstantin Belousov #include <sys/sysctl.h>
4886be9f0dSKonstantin Belousov #include <sys/taskqueue.h>
4986be9f0dSKonstantin Belousov #include <sys/tree.h>
5086be9f0dSKonstantin Belousov #include <sys/uio.h>
510a110d5bSKonstantin Belousov #include <sys/vmem.h>
5286be9f0dSKonstantin Belousov #include <vm/vm.h>
5386be9f0dSKonstantin Belousov #include <vm/vm_extern.h>
5486be9f0dSKonstantin Belousov #include <vm/vm_kern.h>
5586be9f0dSKonstantin Belousov #include <vm/vm_object.h>
5686be9f0dSKonstantin Belousov #include <vm/vm_page.h>
5786be9f0dSKonstantin Belousov #include <vm/vm_pager.h>
5886be9f0dSKonstantin Belousov #include <vm/vm_map.h>
5986be9f0dSKonstantin Belousov #include <machine/atomic.h>
6086be9f0dSKonstantin Belousov #include <machine/bus.h>
6186be9f0dSKonstantin Belousov #include <machine/md_var.h>
6286be9f0dSKonstantin Belousov #include <machine/specialreg.h>
6386be9f0dSKonstantin Belousov #include <x86/include/busdma_impl.h>
6486be9f0dSKonstantin Belousov #include <x86/iommu/intel_reg.h>
6586be9f0dSKonstantin Belousov #include <x86/iommu/busdma_dmar.h>
6686be9f0dSKonstantin Belousov #include <x86/iommu/intel_dmar.h>
6767499354SRyan Stone #include <dev/pci/pcireg.h>
6886be9f0dSKonstantin Belousov #include <dev/pci/pcivar.h>
6986be9f0dSKonstantin Belousov 
7086be9f0dSKonstantin Belousov static MALLOC_DEFINE(M_DMAR_CTX, "dmar_ctx", "Intel DMAR Context");
711abfd355SKonstantin Belousov static MALLOC_DEFINE(M_DMAR_DOMAIN, "dmar_dom", "Intel DMAR Domain");
7286be9f0dSKonstantin Belousov 
731abfd355SKonstantin Belousov static void dmar_domain_unload_task(void *arg, int pending);
741abfd355SKonstantin Belousov static void dmar_unref_domain_locked(struct dmar_unit *dmar,
751abfd355SKonstantin Belousov     struct dmar_domain *domain);
761abfd355SKonstantin Belousov static void dmar_domain_destroy(struct dmar_domain *domain);
7786be9f0dSKonstantin Belousov 
7886be9f0dSKonstantin Belousov static void
7986be9f0dSKonstantin Belousov dmar_ensure_ctx_page(struct dmar_unit *dmar, int bus)
8086be9f0dSKonstantin Belousov {
8186be9f0dSKonstantin Belousov 	struct sf_buf *sf;
8286be9f0dSKonstantin Belousov 	dmar_root_entry_t *re;
8386be9f0dSKonstantin Belousov 	vm_page_t ctxm;
8486be9f0dSKonstantin Belousov 
8586be9f0dSKonstantin Belousov 	/*
8686be9f0dSKonstantin Belousov 	 * Allocated context page must be linked.
8786be9f0dSKonstantin Belousov 	 */
8886be9f0dSKonstantin Belousov 	ctxm = dmar_pgalloc(dmar->ctx_obj, 1 + bus, DMAR_PGF_NOALLOC);
8986be9f0dSKonstantin Belousov 	if (ctxm != NULL)
9086be9f0dSKonstantin Belousov 		return;
9186be9f0dSKonstantin Belousov 
9286be9f0dSKonstantin Belousov 	/*
9386be9f0dSKonstantin Belousov 	 * Page not present, allocate and link.  Note that other
9486be9f0dSKonstantin Belousov 	 * thread might execute this sequence in parallel.  This
9586be9f0dSKonstantin Belousov 	 * should be safe, because the context entries written by both
9686be9f0dSKonstantin Belousov 	 * threads are equal.
9786be9f0dSKonstantin Belousov 	 */
9886be9f0dSKonstantin Belousov 	TD_PREP_PINNED_ASSERT;
9986be9f0dSKonstantin Belousov 	ctxm = dmar_pgalloc(dmar->ctx_obj, 1 + bus, DMAR_PGF_ZERO |
10086be9f0dSKonstantin Belousov 	    DMAR_PGF_WAITOK);
10186be9f0dSKonstantin Belousov 	re = dmar_map_pgtbl(dmar->ctx_obj, 0, DMAR_PGF_NOALLOC, &sf);
10286be9f0dSKonstantin Belousov 	re += bus;
10386be9f0dSKonstantin Belousov 	dmar_pte_store(&re->r1, DMAR_ROOT_R1_P | (DMAR_ROOT_R1_CTP_MASK &
10486be9f0dSKonstantin Belousov 	    VM_PAGE_TO_PHYS(ctxm)));
1056b7c46afSKonstantin Belousov 	dmar_flush_root_to_ram(dmar, re);
1066b7c46afSKonstantin Belousov 	dmar_unmap_pgtbl(sf);
10786be9f0dSKonstantin Belousov 	TD_PINNED_ASSERT;
10886be9f0dSKonstantin Belousov }
10986be9f0dSKonstantin Belousov 
11086be9f0dSKonstantin Belousov static dmar_ctx_entry_t *
11186be9f0dSKonstantin Belousov dmar_map_ctx_entry(struct dmar_ctx *ctx, struct sf_buf **sfp)
11286be9f0dSKonstantin Belousov {
11386be9f0dSKonstantin Belousov 	dmar_ctx_entry_t *ctxp;
11486be9f0dSKonstantin Belousov 
1151abfd355SKonstantin Belousov 	ctxp = dmar_map_pgtbl(ctx->domain->dmar->ctx_obj, 1 +
1161abfd355SKonstantin Belousov 	    PCI_RID2BUS(ctx->rid), DMAR_PGF_NOALLOC | DMAR_PGF_WAITOK, sfp);
11767499354SRyan Stone 	ctxp += ctx->rid & 0xff;
11886be9f0dSKonstantin Belousov 	return (ctxp);
11986be9f0dSKonstantin Belousov }
12086be9f0dSKonstantin Belousov 
12186be9f0dSKonstantin Belousov static void
12267499354SRyan Stone ctx_tag_init(struct dmar_ctx *ctx, device_t dev)
12386be9f0dSKonstantin Belousov {
12486be9f0dSKonstantin Belousov 	bus_addr_t maxaddr;
12586be9f0dSKonstantin Belousov 
1261abfd355SKonstantin Belousov 	maxaddr = MIN(ctx->domain->end, BUS_SPACE_MAXADDR);
12786be9f0dSKonstantin Belousov 	ctx->ctx_tag.common.ref_count = 1; /* Prevent free */
12886be9f0dSKonstantin Belousov 	ctx->ctx_tag.common.impl = &bus_dma_dmar_impl;
12986be9f0dSKonstantin Belousov 	ctx->ctx_tag.common.boundary = PCI_DMA_BOUNDARY;
13086be9f0dSKonstantin Belousov 	ctx->ctx_tag.common.lowaddr = maxaddr;
13186be9f0dSKonstantin Belousov 	ctx->ctx_tag.common.highaddr = maxaddr;
13286be9f0dSKonstantin Belousov 	ctx->ctx_tag.common.maxsize = maxaddr;
13386be9f0dSKonstantin Belousov 	ctx->ctx_tag.common.nsegments = BUS_SPACE_UNRESTRICTED;
13486be9f0dSKonstantin Belousov 	ctx->ctx_tag.common.maxsegsz = maxaddr;
13586be9f0dSKonstantin Belousov 	ctx->ctx_tag.ctx = ctx;
13667499354SRyan Stone 	ctx->ctx_tag.owner = dev;
13786be9f0dSKonstantin Belousov }
13886be9f0dSKonstantin Belousov 
13986be9f0dSKonstantin Belousov static void
1401abfd355SKonstantin Belousov ctx_id_entry_init(struct dmar_ctx *ctx, dmar_ctx_entry_t *ctxp, bool move)
14186be9f0dSKonstantin Belousov {
14286be9f0dSKonstantin Belousov 	struct dmar_unit *unit;
1431abfd355SKonstantin Belousov 	struct dmar_domain *domain;
14486be9f0dSKonstantin Belousov 	vm_page_t ctx_root;
14586be9f0dSKonstantin Belousov 
1461abfd355SKonstantin Belousov 	domain = ctx->domain;
1471abfd355SKonstantin Belousov 	unit = domain->dmar;
1481abfd355SKonstantin Belousov 	KASSERT(move || (ctxp->ctx1 == 0 && ctxp->ctx2 == 0),
14986be9f0dSKonstantin Belousov 	    ("dmar%d: initialized ctx entry %d:%d:%d 0x%jx 0x%jx",
15067499354SRyan Stone 	    unit->unit, pci_get_bus(ctx->ctx_tag.owner),
15167499354SRyan Stone 	    pci_get_slot(ctx->ctx_tag.owner),
15267499354SRyan Stone 	    pci_get_function(ctx->ctx_tag.owner),
1531abfd355SKonstantin Belousov 	    ctxp->ctx1, ctxp->ctx2));
1541abfd355SKonstantin Belousov 	/*
1551abfd355SKonstantin Belousov 	 * For update due to move, the store is not atomic.  It is
1561abfd355SKonstantin Belousov 	 * possible that DMAR read upper doubleword, while low
1571abfd355SKonstantin Belousov 	 * doubleword is not yet updated.  The domain id is stored in
1581abfd355SKonstantin Belousov 	 * the upper doubleword, while the table pointer in the lower.
1591abfd355SKonstantin Belousov 	 *
1601abfd355SKonstantin Belousov 	 * There is no good solution, for the same reason it is wrong
1611abfd355SKonstantin Belousov 	 * to clear P bit in the ctx entry for update.
1621abfd355SKonstantin Belousov 	 */
1631abfd355SKonstantin Belousov 	dmar_pte_store1(&ctxp->ctx2, DMAR_CTX2_DID(domain->domain) |
1641abfd355SKonstantin Belousov 	    domain->awlvl);
1651abfd355SKonstantin Belousov 	if ((domain->flags & DMAR_DOMAIN_IDMAP) != 0 &&
16686be9f0dSKonstantin Belousov 	    (unit->hw_ecap & DMAR_ECAP_PT) != 0) {
1671abfd355SKonstantin Belousov 		KASSERT(domain->pgtbl_obj == NULL,
16886be9f0dSKonstantin Belousov 		    ("ctx %p non-null pgtbl_obj", ctx));
1691abfd355SKonstantin Belousov 		dmar_pte_store1(&ctxp->ctx1, DMAR_CTX1_T_PASS | DMAR_CTX1_P);
17086be9f0dSKonstantin Belousov 	} else {
1711abfd355SKonstantin Belousov 		ctx_root = dmar_pgalloc(domain->pgtbl_obj, 0, DMAR_PGF_NOALLOC);
1721abfd355SKonstantin Belousov 		dmar_pte_store1(&ctxp->ctx1, DMAR_CTX1_T_UNTR |
17386be9f0dSKonstantin Belousov 		    (DMAR_CTX1_ASR_MASK & VM_PAGE_TO_PHYS(ctx_root)) |
17486be9f0dSKonstantin Belousov 		    DMAR_CTX1_P);
17586be9f0dSKonstantin Belousov 	}
1766b7c46afSKonstantin Belousov 	dmar_flush_ctx_to_ram(unit, ctxp);
17786be9f0dSKonstantin Belousov }
17886be9f0dSKonstantin Belousov 
17986be9f0dSKonstantin Belousov static int
1801abfd355SKonstantin Belousov dmar_flush_for_ctx_entry(struct dmar_unit *dmar, bool force)
1811abfd355SKonstantin Belousov {
1821abfd355SKonstantin Belousov 	int error;
1831abfd355SKonstantin Belousov 
1841abfd355SKonstantin Belousov 	/*
1851abfd355SKonstantin Belousov 	 * If dmar declares Caching Mode as Set, follow 11.5 "Caching
1861abfd355SKonstantin Belousov 	 * Mode Consideration" and do the (global) invalidation of the
1871abfd355SKonstantin Belousov 	 * negative TLB entries.
1881abfd355SKonstantin Belousov 	 */
1891abfd355SKonstantin Belousov 	if ((dmar->hw_cap & DMAR_CAP_CM) == 0 && !force)
1901abfd355SKonstantin Belousov 		return (0);
1911abfd355SKonstantin Belousov 	if (dmar->qi_enabled) {
1921abfd355SKonstantin Belousov 		dmar_qi_invalidate_ctx_glob_locked(dmar);
1931abfd355SKonstantin Belousov 		if ((dmar->hw_ecap & DMAR_ECAP_DI) != 0 || force)
1941abfd355SKonstantin Belousov 			dmar_qi_invalidate_iotlb_glob_locked(dmar);
1951abfd355SKonstantin Belousov 		return (0);
1961abfd355SKonstantin Belousov 	}
1971abfd355SKonstantin Belousov 	error = dmar_inv_ctx_glob(dmar);
1981abfd355SKonstantin Belousov 	if (error == 0 && ((dmar->hw_ecap & DMAR_ECAP_DI) != 0 || force))
1991abfd355SKonstantin Belousov 		error = dmar_inv_iotlb_glob(dmar);
2001abfd355SKonstantin Belousov 	return (error);
2011abfd355SKonstantin Belousov }
2021abfd355SKonstantin Belousov 
2031abfd355SKonstantin Belousov static int
2041abfd355SKonstantin Belousov domain_init_rmrr(struct dmar_domain *domain, device_t dev)
20586be9f0dSKonstantin Belousov {
20686be9f0dSKonstantin Belousov 	struct dmar_map_entries_tailq rmrr_entries;
20786be9f0dSKonstantin Belousov 	struct dmar_map_entry *entry, *entry1;
20886be9f0dSKonstantin Belousov 	vm_page_t *ma;
20986be9f0dSKonstantin Belousov 	dmar_gaddr_t start, end;
21086be9f0dSKonstantin Belousov 	vm_pindex_t size, i;
21186be9f0dSKonstantin Belousov 	int error, error1;
21286be9f0dSKonstantin Belousov 
21386be9f0dSKonstantin Belousov 	error = 0;
21486be9f0dSKonstantin Belousov 	TAILQ_INIT(&rmrr_entries);
2151abfd355SKonstantin Belousov 	dmar_dev_parse_rmrr(domain, dev, &rmrr_entries);
21686be9f0dSKonstantin Belousov 	TAILQ_FOREACH_SAFE(entry, &rmrr_entries, unroll_link, entry1) {
21786be9f0dSKonstantin Belousov 		/*
21886be9f0dSKonstantin Belousov 		 * VT-d specification requires that the start of an
21986be9f0dSKonstantin Belousov 		 * RMRR entry is 4k-aligned.  Buggy BIOSes put
22086be9f0dSKonstantin Belousov 		 * anything into the start and end fields.  Truncate
22186be9f0dSKonstantin Belousov 		 * and round as neccesary.
22286be9f0dSKonstantin Belousov 		 *
22386be9f0dSKonstantin Belousov 		 * We also allow the overlapping RMRR entries, see
22486be9f0dSKonstantin Belousov 		 * dmar_gas_alloc_region().
22586be9f0dSKonstantin Belousov 		 */
22686be9f0dSKonstantin Belousov 		start = entry->start;
22786be9f0dSKonstantin Belousov 		end = entry->end;
22886be9f0dSKonstantin Belousov 		entry->start = trunc_page(start);
22986be9f0dSKonstantin Belousov 		entry->end = round_page(end);
230e02b05b3SKonstantin Belousov 		if (entry->start == entry->end) {
231e02b05b3SKonstantin Belousov 			/* Workaround for some AMI (?) BIOSes */
232e02b05b3SKonstantin Belousov 			if (bootverbose) {
233e02b05b3SKonstantin Belousov 				device_printf(dev, "BIOS bug: dmar%d RMRR "
234e02b05b3SKonstantin Belousov 				    "region (%jx, %jx) corrected\n",
2351abfd355SKonstantin Belousov 				    domain->dmar->unit, start, end);
236e02b05b3SKonstantin Belousov 			}
237e02b05b3SKonstantin Belousov 			entry->end += DMAR_PAGE_SIZE * 0x20;
238e02b05b3SKonstantin Belousov 		}
23986be9f0dSKonstantin Belousov 		size = OFF_TO_IDX(entry->end - entry->start);
24086be9f0dSKonstantin Belousov 		ma = malloc(sizeof(vm_page_t) * size, M_TEMP, M_WAITOK);
24186be9f0dSKonstantin Belousov 		for (i = 0; i < size; i++) {
24286be9f0dSKonstantin Belousov 			ma[i] = vm_page_getfake(entry->start + PAGE_SIZE * i,
24386be9f0dSKonstantin Belousov 			    VM_MEMATTR_DEFAULT);
24486be9f0dSKonstantin Belousov 		}
2451abfd355SKonstantin Belousov 		error1 = dmar_gas_map_region(domain, entry,
2461abfd355SKonstantin Belousov 		    DMAR_MAP_ENTRY_READ | DMAR_MAP_ENTRY_WRITE,
2471abfd355SKonstantin Belousov 		    DMAR_GM_CANWAIT, ma);
24886be9f0dSKonstantin Belousov 		/*
24986be9f0dSKonstantin Belousov 		 * Non-failed RMRR entries are owned by context rb
25086be9f0dSKonstantin Belousov 		 * tree.  Get rid of the failed entry, but do not stop
25186be9f0dSKonstantin Belousov 		 * the loop.  Rest of the parsed RMRR entries are
25286be9f0dSKonstantin Belousov 		 * loaded and removed on the context destruction.
25386be9f0dSKonstantin Belousov 		 */
25486be9f0dSKonstantin Belousov 		if (error1 == 0 && entry->end != entry->start) {
2551abfd355SKonstantin Belousov 			DMAR_LOCK(domain->dmar);
2561abfd355SKonstantin Belousov 			domain->refs++; /* XXXKIB prevent free */
2571abfd355SKonstantin Belousov 			domain->flags |= DMAR_DOMAIN_RMRR;
2581abfd355SKonstantin Belousov 			DMAR_UNLOCK(domain->dmar);
25986be9f0dSKonstantin Belousov 		} else {
26086be9f0dSKonstantin Belousov 			if (error1 != 0) {
26186be9f0dSKonstantin Belousov 				device_printf(dev,
26286be9f0dSKonstantin Belousov 			    "dmar%d failed to map RMRR region (%jx, %jx) %d\n",
2631abfd355SKonstantin Belousov 				    domain->dmar->unit, start, end, error1);
26486be9f0dSKonstantin Belousov 				error = error1;
26586be9f0dSKonstantin Belousov 			}
26686be9f0dSKonstantin Belousov 			TAILQ_REMOVE(&rmrr_entries, entry, unroll_link);
2671abfd355SKonstantin Belousov 			dmar_gas_free_entry(domain, entry);
26886be9f0dSKonstantin Belousov 		}
26986be9f0dSKonstantin Belousov 		for (i = 0; i < size; i++)
27086be9f0dSKonstantin Belousov 			vm_page_putfake(ma[i]);
27186be9f0dSKonstantin Belousov 		free(ma, M_TEMP);
27286be9f0dSKonstantin Belousov 	}
27386be9f0dSKonstantin Belousov 	return (error);
27486be9f0dSKonstantin Belousov }
27586be9f0dSKonstantin Belousov 
2761abfd355SKonstantin Belousov static struct dmar_domain *
2771abfd355SKonstantin Belousov dmar_domain_alloc(struct dmar_unit *dmar, bool id_mapped)
2781abfd355SKonstantin Belousov {
2791abfd355SKonstantin Belousov 	struct dmar_domain *domain;
2801abfd355SKonstantin Belousov 	int error, id, mgaw;
2811abfd355SKonstantin Belousov 
2821abfd355SKonstantin Belousov 	id = alloc_unr(dmar->domids);
2831abfd355SKonstantin Belousov 	if (id == -1)
2841abfd355SKonstantin Belousov 		return (NULL);
2851abfd355SKonstantin Belousov 	domain = malloc(sizeof(*domain), M_DMAR_DOMAIN, M_WAITOK | M_ZERO);
2861abfd355SKonstantin Belousov 	domain->domain = id;
2871abfd355SKonstantin Belousov 	LIST_INIT(&domain->contexts);
2881abfd355SKonstantin Belousov 	RB_INIT(&domain->rb_root);
2891abfd355SKonstantin Belousov 	TAILQ_INIT(&domain->unload_entries);
2901abfd355SKonstantin Belousov 	TASK_INIT(&domain->unload_task, 0, dmar_domain_unload_task, domain);
2911abfd355SKonstantin Belousov 	mtx_init(&domain->lock, "dmardom", NULL, MTX_DEF);
2921abfd355SKonstantin Belousov 	domain->dmar = dmar;
2931abfd355SKonstantin Belousov 
2941abfd355SKonstantin Belousov 	/*
2951abfd355SKonstantin Belousov 	 * For now, use the maximal usable physical address of the
2961abfd355SKonstantin Belousov 	 * installed memory to calculate the mgaw on id_mapped domain.
2971abfd355SKonstantin Belousov 	 * It is useful for the identity mapping, and less so for the
2981abfd355SKonstantin Belousov 	 * virtualized bus address space.
2991abfd355SKonstantin Belousov 	 */
3001abfd355SKonstantin Belousov 	domain->end = id_mapped ? ptoa(Maxmem) : BUS_SPACE_MAXADDR;
3011abfd355SKonstantin Belousov 	mgaw = dmar_maxaddr2mgaw(dmar, domain->end, !id_mapped);
3021abfd355SKonstantin Belousov 	error = domain_set_agaw(domain, mgaw);
3031abfd355SKonstantin Belousov 	if (error != 0)
3041abfd355SKonstantin Belousov 		goto fail;
3051abfd355SKonstantin Belousov 	if (!id_mapped)
3061abfd355SKonstantin Belousov 		/* Use all supported address space for remapping. */
3071abfd355SKonstantin Belousov 		domain->end = 1ULL << (domain->agaw - 1);
3081abfd355SKonstantin Belousov 
3091abfd355SKonstantin Belousov 	dmar_gas_init_domain(domain);
3101abfd355SKonstantin Belousov 
3111abfd355SKonstantin Belousov 	if (id_mapped) {
3121abfd355SKonstantin Belousov 		if ((dmar->hw_ecap & DMAR_ECAP_PT) == 0) {
3131abfd355SKonstantin Belousov 			domain->pgtbl_obj = domain_get_idmap_pgtbl(domain,
3141abfd355SKonstantin Belousov 			    domain->end);
3151abfd355SKonstantin Belousov 		}
3161abfd355SKonstantin Belousov 		domain->flags |= DMAR_DOMAIN_IDMAP;
3171abfd355SKonstantin Belousov 	} else {
3181abfd355SKonstantin Belousov 		error = domain_alloc_pgtbl(domain);
3191abfd355SKonstantin Belousov 		if (error != 0)
3201abfd355SKonstantin Belousov 			goto fail;
3211abfd355SKonstantin Belousov 		/* Disable local apic region access */
3221abfd355SKonstantin Belousov 		error = dmar_gas_reserve_region(domain, 0xfee00000,
3231abfd355SKonstantin Belousov 		    0xfeefffff + 1);
3241abfd355SKonstantin Belousov 		if (error != 0)
3251abfd355SKonstantin Belousov 			goto fail;
3261abfd355SKonstantin Belousov 	}
3271abfd355SKonstantin Belousov 	return (domain);
3281abfd355SKonstantin Belousov 
3291abfd355SKonstantin Belousov fail:
3301abfd355SKonstantin Belousov 	dmar_domain_destroy(domain);
3311abfd355SKonstantin Belousov 	return (NULL);
3321abfd355SKonstantin Belousov }
3331abfd355SKonstantin Belousov 
33486be9f0dSKonstantin Belousov static struct dmar_ctx *
3351abfd355SKonstantin Belousov dmar_ctx_alloc(struct dmar_domain *domain, uint16_t rid)
33686be9f0dSKonstantin Belousov {
33786be9f0dSKonstantin Belousov 	struct dmar_ctx *ctx;
33886be9f0dSKonstantin Belousov 
33986be9f0dSKonstantin Belousov 	ctx = malloc(sizeof(*ctx), M_DMAR_CTX, M_WAITOK | M_ZERO);
3401abfd355SKonstantin Belousov 	ctx->domain = domain;
34167499354SRyan Stone 	ctx->rid = rid;
3421abfd355SKonstantin Belousov 	ctx->refs = 1;
34386be9f0dSKonstantin Belousov 	return (ctx);
34486be9f0dSKonstantin Belousov }
34586be9f0dSKonstantin Belousov 
34686be9f0dSKonstantin Belousov static void
3471abfd355SKonstantin Belousov dmar_ctx_link(struct dmar_ctx *ctx)
3481abfd355SKonstantin Belousov {
3491abfd355SKonstantin Belousov 	struct dmar_domain *domain;
3501abfd355SKonstantin Belousov 
3511abfd355SKonstantin Belousov 	domain = ctx->domain;
3521abfd355SKonstantin Belousov 	DMAR_ASSERT_LOCKED(domain->dmar);
3531abfd355SKonstantin Belousov 	KASSERT(domain->refs >= domain->ctx_cnt,
3541abfd355SKonstantin Belousov 	    ("dom %p ref underflow %d %d", domain, domain->refs,
3551abfd355SKonstantin Belousov 	    domain->ctx_cnt));
3561abfd355SKonstantin Belousov 	domain->refs++;
3571abfd355SKonstantin Belousov 	domain->ctx_cnt++;
3581abfd355SKonstantin Belousov 	LIST_INSERT_HEAD(&domain->contexts, ctx, link);
3591abfd355SKonstantin Belousov }
3601abfd355SKonstantin Belousov 
3611abfd355SKonstantin Belousov static void
3621abfd355SKonstantin Belousov dmar_ctx_unlink(struct dmar_ctx *ctx)
3631abfd355SKonstantin Belousov {
3641abfd355SKonstantin Belousov 	struct dmar_domain *domain;
3651abfd355SKonstantin Belousov 
3661abfd355SKonstantin Belousov 	domain = ctx->domain;
3671abfd355SKonstantin Belousov 	DMAR_ASSERT_LOCKED(domain->dmar);
3681abfd355SKonstantin Belousov 	KASSERT(domain->refs > 0,
3691abfd355SKonstantin Belousov 	    ("domain %p ctx dtr refs %d", domain, domain->refs));
3701abfd355SKonstantin Belousov 	KASSERT(domain->ctx_cnt >= domain->refs,
3711abfd355SKonstantin Belousov 	    ("domain %p ctx dtr refs %d ctx_cnt %d", domain,
3721abfd355SKonstantin Belousov 	    domain->refs, domain->ctx_cnt));
3731abfd355SKonstantin Belousov 	domain->refs--;
3741abfd355SKonstantin Belousov 	domain->ctx_cnt--;
3751abfd355SKonstantin Belousov 	LIST_REMOVE(ctx, link);
3761abfd355SKonstantin Belousov }
3771abfd355SKonstantin Belousov 
3781abfd355SKonstantin Belousov static void
3791abfd355SKonstantin Belousov dmar_domain_destroy(struct dmar_domain *domain)
38086be9f0dSKonstantin Belousov {
38186be9f0dSKonstantin Belousov 
3821abfd355SKonstantin Belousov 	KASSERT(TAILQ_EMPTY(&domain->unload_entries),
3831abfd355SKonstantin Belousov 	    ("unfinished unloads %p", domain));
3841abfd355SKonstantin Belousov 	KASSERT(LIST_EMPTY(&domain->contexts),
3851abfd355SKonstantin Belousov 	    ("destroying dom %p with contexts", domain));
3861abfd355SKonstantin Belousov 	KASSERT(domain->ctx_cnt == 0,
3871abfd355SKonstantin Belousov 	    ("destroying dom %p with ctx_cnt %d", domain, domain->ctx_cnt));
3881abfd355SKonstantin Belousov 	KASSERT(domain->refs == 0,
3891abfd355SKonstantin Belousov 	    ("destroying dom %p with refs %d", domain, domain->refs));
3901abfd355SKonstantin Belousov 	if ((domain->flags & DMAR_DOMAIN_GAS_INITED) != 0) {
3911abfd355SKonstantin Belousov 		DMAR_DOMAIN_LOCK(domain);
3921abfd355SKonstantin Belousov 		dmar_gas_fini_domain(domain);
3931abfd355SKonstantin Belousov 		DMAR_DOMAIN_UNLOCK(domain);
39486be9f0dSKonstantin Belousov 	}
3951abfd355SKonstantin Belousov 	if ((domain->flags & DMAR_DOMAIN_PGTBL_INITED) != 0) {
3961abfd355SKonstantin Belousov 		if (domain->pgtbl_obj != NULL)
3971abfd355SKonstantin Belousov 			DMAR_DOMAIN_PGLOCK(domain);
3981abfd355SKonstantin Belousov 		domain_free_pgtbl(domain);
39986be9f0dSKonstantin Belousov 	}
4001abfd355SKonstantin Belousov 	mtx_destroy(&domain->lock);
4011abfd355SKonstantin Belousov 	free_unr(domain->dmar->domids, domain->domain);
4021abfd355SKonstantin Belousov 	free(domain, M_DMAR_DOMAIN);
40386be9f0dSKonstantin Belousov }
40486be9f0dSKonstantin Belousov 
40586be9f0dSKonstantin Belousov struct dmar_ctx *
4061abfd355SKonstantin Belousov dmar_get_ctx_for_dev(struct dmar_unit *dmar, device_t dev, uint16_t rid,
4071abfd355SKonstantin Belousov     bool id_mapped, bool rmrr_init)
40886be9f0dSKonstantin Belousov {
4091abfd355SKonstantin Belousov 	struct dmar_domain *domain, *domain1;
41086be9f0dSKonstantin Belousov 	struct dmar_ctx *ctx, *ctx1;
41186be9f0dSKonstantin Belousov 	dmar_ctx_entry_t *ctxp;
41286be9f0dSKonstantin Belousov 	struct sf_buf *sf;
4131abfd355SKonstantin Belousov 	int bus, slot, func, error;
41486be9f0dSKonstantin Belousov 	bool enable;
41586be9f0dSKonstantin Belousov 
41667499354SRyan Stone 	bus = pci_get_bus(dev);
41767499354SRyan Stone 	slot = pci_get_slot(dev);
41867499354SRyan Stone 	func = pci_get_function(dev);
41986be9f0dSKonstantin Belousov 	enable = false;
42086be9f0dSKonstantin Belousov 	TD_PREP_PINNED_ASSERT;
42186be9f0dSKonstantin Belousov 	DMAR_LOCK(dmar);
42267499354SRyan Stone 	ctx = dmar_find_ctx_locked(dmar, rid);
42386be9f0dSKonstantin Belousov 	error = 0;
42486be9f0dSKonstantin Belousov 	if (ctx == NULL) {
42586be9f0dSKonstantin Belousov 		/*
42686be9f0dSKonstantin Belousov 		 * Perform the allocations which require sleep or have
42786be9f0dSKonstantin Belousov 		 * higher chance to succeed if the sleep is allowed.
42886be9f0dSKonstantin Belousov 		 */
42986be9f0dSKonstantin Belousov 		DMAR_UNLOCK(dmar);
430b29d186cSKonstantin Belousov 		dmar_ensure_ctx_page(dmar, PCI_RID2BUS(rid));
4311abfd355SKonstantin Belousov 		domain1 = dmar_domain_alloc(dmar, id_mapped);
4321abfd355SKonstantin Belousov 		if (domain1 == NULL) {
43386be9f0dSKonstantin Belousov 			TD_PINNED_ASSERT;
43486be9f0dSKonstantin Belousov 			return (NULL);
43586be9f0dSKonstantin Belousov 		}
4365f8e5c7fSKonstantin Belousov 		if (!id_mapped) {
4371abfd355SKonstantin Belousov 			error = domain_init_rmrr(domain1, dev);
43886be9f0dSKonstantin Belousov 			if (error != 0) {
4391abfd355SKonstantin Belousov 				dmar_domain_destroy(domain1);
44086be9f0dSKonstantin Belousov 				TD_PINNED_ASSERT;
44186be9f0dSKonstantin Belousov 				return (NULL);
44286be9f0dSKonstantin Belousov 			}
4435f8e5c7fSKonstantin Belousov 		}
4441abfd355SKonstantin Belousov 		ctx1 = dmar_ctx_alloc(domain1, rid);
44586be9f0dSKonstantin Belousov 		ctxp = dmar_map_ctx_entry(ctx1, &sf);
44686be9f0dSKonstantin Belousov 		DMAR_LOCK(dmar);
44786be9f0dSKonstantin Belousov 
44886be9f0dSKonstantin Belousov 		/*
44986be9f0dSKonstantin Belousov 		 * Recheck the contexts, other thread might have
45086be9f0dSKonstantin Belousov 		 * already allocated needed one.
45186be9f0dSKonstantin Belousov 		 */
45267499354SRyan Stone 		ctx = dmar_find_ctx_locked(dmar, rid);
45386be9f0dSKonstantin Belousov 		if (ctx == NULL) {
4541abfd355SKonstantin Belousov 			domain = domain1;
45586be9f0dSKonstantin Belousov 			ctx = ctx1;
4561abfd355SKonstantin Belousov 			dmar_ctx_link(ctx);
4579d0bc6d8SKonstantin Belousov 			ctx->ctx_tag.owner = dev;
45867499354SRyan Stone 			ctx_tag_init(ctx, dev);
45986be9f0dSKonstantin Belousov 
46086be9f0dSKonstantin Belousov 			/*
46186be9f0dSKonstantin Belousov 			 * This is the first activated context for the
46286be9f0dSKonstantin Belousov 			 * DMAR unit.  Enable the translation after
46386be9f0dSKonstantin Belousov 			 * everything is set up.
46486be9f0dSKonstantin Belousov 			 */
4651abfd355SKonstantin Belousov 			if (LIST_EMPTY(&dmar->domains))
46686be9f0dSKonstantin Belousov 				enable = true;
4671abfd355SKonstantin Belousov 			LIST_INSERT_HEAD(&dmar->domains, domain, link);
4681abfd355SKonstantin Belousov 			ctx_id_entry_init(ctx, ctxp, false);
46986be9f0dSKonstantin Belousov 			device_printf(dev,
47034e8337bSKonstantin Belousov 			    "dmar%d pci%d:%d:%d:%d rid %x domain %d mgaw %d "
4719d0bc6d8SKonstantin Belousov 			    "agaw %d %s-mapped\n",
47286be9f0dSKonstantin Belousov 			    dmar->unit, dmar->segment, bus, slot,
4731abfd355SKonstantin Belousov 			    func, rid, domain->domain, domain->mgaw,
4741abfd355SKonstantin Belousov 			    domain->agaw, id_mapped ? "id" : "re");
475*3d47c58bSKonstantin Belousov 			dmar_unmap_pgtbl(sf);
47686be9f0dSKonstantin Belousov 		} else {
477*3d47c58bSKonstantin Belousov 			dmar_unmap_pgtbl(sf);
4781abfd355SKonstantin Belousov 			dmar_domain_destroy(domain1);
479*3d47c58bSKonstantin Belousov 			/* Nothing needs to be done to destroy ctx1. */
480*3d47c58bSKonstantin Belousov 			free(ctx1, M_DMAR_CTX);
4811abfd355SKonstantin Belousov 			domain = ctx->domain;
4821abfd355SKonstantin Belousov 			ctx->refs++; /* tag referenced us */
48386be9f0dSKonstantin Belousov 		}
48468eeb96aSKonstantin Belousov 	} else {
4851abfd355SKonstantin Belousov 		domain = ctx->domain;
4861abfd355SKonstantin Belousov 		ctx->refs++; /* tag referenced us */
4871abfd355SKonstantin Belousov 	}
4881abfd355SKonstantin Belousov 
4891abfd355SKonstantin Belousov 	error = dmar_flush_for_ctx_entry(dmar, enable);
49086be9f0dSKonstantin Belousov 	if (error != 0) {
49186be9f0dSKonstantin Belousov 		dmar_free_ctx_locked(dmar, ctx);
49286be9f0dSKonstantin Belousov 		TD_PINNED_ASSERT;
49386be9f0dSKonstantin Belousov 		return (NULL);
49486be9f0dSKonstantin Belousov 	}
49568eeb96aSKonstantin Belousov 
49668eeb96aSKonstantin Belousov 	/*
49768eeb96aSKonstantin Belousov 	 * The dmar lock was potentially dropped between check for the
49868eeb96aSKonstantin Belousov 	 * empty context list and now.  Recheck the state of GCMD_TE
49968eeb96aSKonstantin Belousov 	 * to avoid unneeded command.
50068eeb96aSKonstantin Belousov 	 */
50168eeb96aSKonstantin Belousov 	if (enable && !rmrr_init && (dmar->hw_gcmd & DMAR_GCMD_TE) == 0) {
50286be9f0dSKonstantin Belousov 		error = dmar_enable_translation(dmar);
50386be9f0dSKonstantin Belousov 		if (error != 0) {
50486be9f0dSKonstantin Belousov 			dmar_free_ctx_locked(dmar, ctx);
50586be9f0dSKonstantin Belousov 			TD_PINNED_ASSERT;
50686be9f0dSKonstantin Belousov 			return (NULL);
50786be9f0dSKonstantin Belousov 		}
50886be9f0dSKonstantin Belousov 	}
50986be9f0dSKonstantin Belousov 	DMAR_UNLOCK(dmar);
51086be9f0dSKonstantin Belousov 	TD_PINNED_ASSERT;
51186be9f0dSKonstantin Belousov 	return (ctx);
51286be9f0dSKonstantin Belousov }
51386be9f0dSKonstantin Belousov 
5141abfd355SKonstantin Belousov int
5151abfd355SKonstantin Belousov dmar_move_ctx_to_domain(struct dmar_domain *domain, struct dmar_ctx *ctx)
5161abfd355SKonstantin Belousov {
5171abfd355SKonstantin Belousov 	struct dmar_unit *dmar;
5181abfd355SKonstantin Belousov 	struct dmar_domain *old_domain;
5191abfd355SKonstantin Belousov 	dmar_ctx_entry_t *ctxp;
5201abfd355SKonstantin Belousov 	struct sf_buf *sf;
5211abfd355SKonstantin Belousov 	int error;
5221abfd355SKonstantin Belousov 
5231abfd355SKonstantin Belousov 	dmar = domain->dmar;
5241abfd355SKonstantin Belousov 	old_domain = ctx->domain;
5251abfd355SKonstantin Belousov 	if (domain == old_domain)
5261abfd355SKonstantin Belousov 		return (0);
5271abfd355SKonstantin Belousov 	KASSERT(old_domain->dmar == dmar,
5281abfd355SKonstantin Belousov 	    ("domain %p %u moving between dmars %u %u", domain,
5291abfd355SKonstantin Belousov 	    domain->domain, old_domain->dmar->unit, domain->dmar->unit));
5301abfd355SKonstantin Belousov 	TD_PREP_PINNED_ASSERT;
5311abfd355SKonstantin Belousov 
5321abfd355SKonstantin Belousov 	ctxp = dmar_map_ctx_entry(ctx, &sf);
5331abfd355SKonstantin Belousov 	DMAR_LOCK(dmar);
5341abfd355SKonstantin Belousov 	dmar_ctx_unlink(ctx);
5351abfd355SKonstantin Belousov 	ctx->domain = domain;
5361abfd355SKonstantin Belousov 	dmar_ctx_link(ctx);
5371abfd355SKonstantin Belousov 	ctx_id_entry_init(ctx, ctxp, true);
5381abfd355SKonstantin Belousov 	dmar_unmap_pgtbl(sf);
5391abfd355SKonstantin Belousov 	error = dmar_flush_for_ctx_entry(dmar, true);
5401abfd355SKonstantin Belousov 	/* If flush failed, rolling back would not work as well. */
5411abfd355SKonstantin Belousov 	printf("dmar%d rid %x domain %d->%d %s-mapped\n",
5421abfd355SKonstantin Belousov 	    dmar->unit, ctx->rid, old_domain->domain, domain->domain,
5431abfd355SKonstantin Belousov 	    (domain->flags & DMAR_DOMAIN_IDMAP) != 0 ? "id" : "re");
5441abfd355SKonstantin Belousov 	dmar_unref_domain_locked(dmar, old_domain);
5451abfd355SKonstantin Belousov 	TD_PINNED_ASSERT;
5461abfd355SKonstantin Belousov 	return (error);
5471abfd355SKonstantin Belousov }
5481abfd355SKonstantin Belousov 
5491abfd355SKonstantin Belousov static void
5501abfd355SKonstantin Belousov dmar_unref_domain_locked(struct dmar_unit *dmar, struct dmar_domain *domain)
5511abfd355SKonstantin Belousov {
5521abfd355SKonstantin Belousov 
5531abfd355SKonstantin Belousov 	DMAR_ASSERT_LOCKED(dmar);
5541abfd355SKonstantin Belousov 	KASSERT(domain->refs >= 1,
5551abfd355SKonstantin Belousov 	    ("dmar %d domain %p refs %u", dmar->unit, domain, domain->refs));
5561abfd355SKonstantin Belousov 	KASSERT(domain->refs > domain->ctx_cnt,
5571abfd355SKonstantin Belousov 	    ("dmar %d domain %p refs %d ctx_cnt %d", dmar->unit, domain,
5581abfd355SKonstantin Belousov 	    domain->refs, domain->ctx_cnt));
5591abfd355SKonstantin Belousov 
5601abfd355SKonstantin Belousov 	if (domain->refs > 1) {
5611abfd355SKonstantin Belousov 		domain->refs--;
5621abfd355SKonstantin Belousov 		DMAR_UNLOCK(dmar);
5631abfd355SKonstantin Belousov 		return;
5641abfd355SKonstantin Belousov 	}
5651abfd355SKonstantin Belousov 
5661abfd355SKonstantin Belousov 	KASSERT((domain->flags & DMAR_DOMAIN_RMRR) == 0,
5671abfd355SKonstantin Belousov 	    ("lost ref on RMRR domain %p", domain));
5681abfd355SKonstantin Belousov 
5691abfd355SKonstantin Belousov 	LIST_REMOVE(domain, link);
5701abfd355SKonstantin Belousov 	DMAR_UNLOCK(dmar);
5711abfd355SKonstantin Belousov 
5721abfd355SKonstantin Belousov 	taskqueue_drain(dmar->delayed_taskqueue, &domain->unload_task);
5731abfd355SKonstantin Belousov 	dmar_domain_destroy(domain);
5741abfd355SKonstantin Belousov }
5751abfd355SKonstantin Belousov 
57686be9f0dSKonstantin Belousov void
57786be9f0dSKonstantin Belousov dmar_free_ctx_locked(struct dmar_unit *dmar, struct dmar_ctx *ctx)
57886be9f0dSKonstantin Belousov {
57986be9f0dSKonstantin Belousov 	struct sf_buf *sf;
58086be9f0dSKonstantin Belousov 	dmar_ctx_entry_t *ctxp;
5811abfd355SKonstantin Belousov 	struct dmar_domain *domain;
58286be9f0dSKonstantin Belousov 
58386be9f0dSKonstantin Belousov 	DMAR_ASSERT_LOCKED(dmar);
58486be9f0dSKonstantin Belousov 	KASSERT(ctx->refs >= 1,
58586be9f0dSKonstantin Belousov 	    ("dmar %p ctx %p refs %u", dmar, ctx, ctx->refs));
58686be9f0dSKonstantin Belousov 
58786be9f0dSKonstantin Belousov 	/*
58886be9f0dSKonstantin Belousov 	 * If our reference is not last, only the dereference should
58986be9f0dSKonstantin Belousov 	 * be performed.
59086be9f0dSKonstantin Belousov 	 */
59186be9f0dSKonstantin Belousov 	if (ctx->refs > 1) {
59286be9f0dSKonstantin Belousov 		ctx->refs--;
59386be9f0dSKonstantin Belousov 		DMAR_UNLOCK(dmar);
59486be9f0dSKonstantin Belousov 		return;
59586be9f0dSKonstantin Belousov 	}
59686be9f0dSKonstantin Belousov 
59786be9f0dSKonstantin Belousov 	KASSERT((ctx->flags & DMAR_CTX_DISABLED) == 0,
59886be9f0dSKonstantin Belousov 	    ("lost ref on disabled ctx %p", ctx));
59986be9f0dSKonstantin Belousov 
60086be9f0dSKonstantin Belousov 	/*
60186be9f0dSKonstantin Belousov 	 * Otherwise, the context entry must be cleared before the
60286be9f0dSKonstantin Belousov 	 * page table is destroyed.  The mapping of the context
60386be9f0dSKonstantin Belousov 	 * entries page could require sleep, unlock the dmar.
60486be9f0dSKonstantin Belousov 	 */
60586be9f0dSKonstantin Belousov 	DMAR_UNLOCK(dmar);
60686be9f0dSKonstantin Belousov 	TD_PREP_PINNED_ASSERT;
60786be9f0dSKonstantin Belousov 	ctxp = dmar_map_ctx_entry(ctx, &sf);
60886be9f0dSKonstantin Belousov 	DMAR_LOCK(dmar);
60986be9f0dSKonstantin Belousov 	KASSERT(ctx->refs >= 1,
61086be9f0dSKonstantin Belousov 	    ("dmar %p ctx %p refs %u", dmar, ctx, ctx->refs));
61186be9f0dSKonstantin Belousov 
61286be9f0dSKonstantin Belousov 	/*
61386be9f0dSKonstantin Belousov 	 * Other thread might have referenced the context, in which
61486be9f0dSKonstantin Belousov 	 * case again only the dereference should be performed.
61586be9f0dSKonstantin Belousov 	 */
61686be9f0dSKonstantin Belousov 	if (ctx->refs > 1) {
61786be9f0dSKonstantin Belousov 		ctx->refs--;
61886be9f0dSKonstantin Belousov 		DMAR_UNLOCK(dmar);
6196b7c46afSKonstantin Belousov 		dmar_unmap_pgtbl(sf);
62086be9f0dSKonstantin Belousov 		TD_PINNED_ASSERT;
62186be9f0dSKonstantin Belousov 		return;
62286be9f0dSKonstantin Belousov 	}
62386be9f0dSKonstantin Belousov 
62486be9f0dSKonstantin Belousov 	KASSERT((ctx->flags & DMAR_CTX_DISABLED) == 0,
62586be9f0dSKonstantin Belousov 	    ("lost ref on disabled ctx %p", ctx));
62686be9f0dSKonstantin Belousov 
62786be9f0dSKonstantin Belousov 	/*
62886be9f0dSKonstantin Belousov 	 * Clear the context pointer and flush the caches.
62986be9f0dSKonstantin Belousov 	 * XXXKIB: cannot do this if any RMRR entries are still present.
63086be9f0dSKonstantin Belousov 	 */
63186be9f0dSKonstantin Belousov 	dmar_pte_clear(&ctxp->ctx1);
63286be9f0dSKonstantin Belousov 	ctxp->ctx2 = 0;
6336b7c46afSKonstantin Belousov 	dmar_flush_ctx_to_ram(dmar, ctxp);
63486be9f0dSKonstantin Belousov 	dmar_inv_ctx_glob(dmar);
63568eeb96aSKonstantin Belousov 	if ((dmar->hw_ecap & DMAR_ECAP_DI) != 0) {
63668eeb96aSKonstantin Belousov 		if (dmar->qi_enabled)
63768eeb96aSKonstantin Belousov 			dmar_qi_invalidate_iotlb_glob_locked(dmar);
63868eeb96aSKonstantin Belousov 		else
63986be9f0dSKonstantin Belousov 			dmar_inv_iotlb_glob(dmar);
64068eeb96aSKonstantin Belousov 	}
6416b7c46afSKonstantin Belousov 	dmar_unmap_pgtbl(sf);
6421abfd355SKonstantin Belousov 	domain = ctx->domain;
6431abfd355SKonstantin Belousov 	dmar_ctx_unlink(ctx);
6441abfd355SKonstantin Belousov 	free(ctx, M_DMAR_CTX);
6451abfd355SKonstantin Belousov 	dmar_unref_domain_locked(dmar, domain);
64686be9f0dSKonstantin Belousov 	TD_PINNED_ASSERT;
64786be9f0dSKonstantin Belousov }
64886be9f0dSKonstantin Belousov 
64986be9f0dSKonstantin Belousov void
65086be9f0dSKonstantin Belousov dmar_free_ctx(struct dmar_ctx *ctx)
65186be9f0dSKonstantin Belousov {
65286be9f0dSKonstantin Belousov 	struct dmar_unit *dmar;
65386be9f0dSKonstantin Belousov 
6541abfd355SKonstantin Belousov 	dmar = ctx->domain->dmar;
65586be9f0dSKonstantin Belousov 	DMAR_LOCK(dmar);
65686be9f0dSKonstantin Belousov 	dmar_free_ctx_locked(dmar, ctx);
65786be9f0dSKonstantin Belousov }
65886be9f0dSKonstantin Belousov 
6591abfd355SKonstantin Belousov /*
6601abfd355SKonstantin Belousov  * Returns with the domain locked.
6611abfd355SKonstantin Belousov  */
66286be9f0dSKonstantin Belousov struct dmar_ctx *
66367499354SRyan Stone dmar_find_ctx_locked(struct dmar_unit *dmar, uint16_t rid)
66486be9f0dSKonstantin Belousov {
6651abfd355SKonstantin Belousov 	struct dmar_domain *domain;
66686be9f0dSKonstantin Belousov 	struct dmar_ctx *ctx;
66786be9f0dSKonstantin Belousov 
66886be9f0dSKonstantin Belousov 	DMAR_ASSERT_LOCKED(dmar);
66986be9f0dSKonstantin Belousov 
6701abfd355SKonstantin Belousov 	LIST_FOREACH(domain, &dmar->domains, link) {
6711abfd355SKonstantin Belousov 		LIST_FOREACH(ctx, &domain->contexts, link) {
67267499354SRyan Stone 			if (ctx->rid == rid)
67386be9f0dSKonstantin Belousov 				return (ctx);
67486be9f0dSKonstantin Belousov 		}
6751abfd355SKonstantin Belousov 	}
67686be9f0dSKonstantin Belousov 	return (NULL);
67786be9f0dSKonstantin Belousov }
67886be9f0dSKonstantin Belousov 
67986be9f0dSKonstantin Belousov void
6801abfd355SKonstantin Belousov dmar_domain_free_entry(struct dmar_map_entry *entry, bool free)
68168eeb96aSKonstantin Belousov {
6821abfd355SKonstantin Belousov 	struct dmar_domain *domain;
68368eeb96aSKonstantin Belousov 
6841abfd355SKonstantin Belousov 	domain = entry->domain;
6851abfd355SKonstantin Belousov 	DMAR_DOMAIN_LOCK(domain);
68668eeb96aSKonstantin Belousov 	if ((entry->flags & DMAR_MAP_ENTRY_RMRR) != 0)
6871abfd355SKonstantin Belousov 		dmar_gas_free_region(domain, entry);
68868eeb96aSKonstantin Belousov 	else
6891abfd355SKonstantin Belousov 		dmar_gas_free_space(domain, entry);
6901abfd355SKonstantin Belousov 	DMAR_DOMAIN_UNLOCK(domain);
69168eeb96aSKonstantin Belousov 	if (free)
6921abfd355SKonstantin Belousov 		dmar_gas_free_entry(domain, entry);
69368eeb96aSKonstantin Belousov 	else
69468eeb96aSKonstantin Belousov 		entry->flags = 0;
69568eeb96aSKonstantin Belousov }
69668eeb96aSKonstantin Belousov 
69768eeb96aSKonstantin Belousov void
6981abfd355SKonstantin Belousov dmar_domain_unload_entry(struct dmar_map_entry *entry, bool free)
69968eeb96aSKonstantin Belousov {
70068eeb96aSKonstantin Belousov 	struct dmar_unit *unit;
70168eeb96aSKonstantin Belousov 
7021abfd355SKonstantin Belousov 	unit = entry->domain->dmar;
70368eeb96aSKonstantin Belousov 	if (unit->qi_enabled) {
70468eeb96aSKonstantin Belousov 		DMAR_LOCK(unit);
7051abfd355SKonstantin Belousov 		dmar_qi_invalidate_locked(entry->domain, entry->start,
70668eeb96aSKonstantin Belousov 		    entry->end - entry->start, &entry->gseq);
70768eeb96aSKonstantin Belousov 		if (!free)
70868eeb96aSKonstantin Belousov 			entry->flags |= DMAR_MAP_ENTRY_QI_NF;
70968eeb96aSKonstantin Belousov 		TAILQ_INSERT_TAIL(&unit->tlb_flush_entries, entry, dmamap_link);
71068eeb96aSKonstantin Belousov 		DMAR_UNLOCK(unit);
71168eeb96aSKonstantin Belousov 	} else {
7121abfd355SKonstantin Belousov 		domain_flush_iotlb_sync(entry->domain, entry->start,
7131abfd355SKonstantin Belousov 		    entry->end - entry->start);
7141abfd355SKonstantin Belousov 		dmar_domain_free_entry(entry, free);
71568eeb96aSKonstantin Belousov 	}
71668eeb96aSKonstantin Belousov }
71768eeb96aSKonstantin Belousov 
718e164cafcSKonstantin Belousov static struct dmar_qi_genseq *
719e164cafcSKonstantin Belousov dmar_domain_unload_gseq(struct dmar_domain *domain,
720e164cafcSKonstantin Belousov     struct dmar_map_entry *entry, struct dmar_qi_genseq *gseq)
721e164cafcSKonstantin Belousov {
722e164cafcSKonstantin Belousov 
723e164cafcSKonstantin Belousov 	if (TAILQ_NEXT(entry, dmamap_link) != NULL)
724e164cafcSKonstantin Belousov 		return (NULL);
725e164cafcSKonstantin Belousov 	if (domain->batch_no++ % dmar_batch_coalesce != 0)
726e164cafcSKonstantin Belousov 		return (NULL);
727e164cafcSKonstantin Belousov 	return (gseq);
728e164cafcSKonstantin Belousov }
729e164cafcSKonstantin Belousov 
73068eeb96aSKonstantin Belousov void
7311abfd355SKonstantin Belousov dmar_domain_unload(struct dmar_domain *domain,
7321abfd355SKonstantin Belousov     struct dmar_map_entries_tailq *entries, bool cansleep)
73386be9f0dSKonstantin Belousov {
73468eeb96aSKonstantin Belousov 	struct dmar_unit *unit;
73568eeb96aSKonstantin Belousov 	struct dmar_map_entry *entry, *entry1;
73668eeb96aSKonstantin Belousov 	struct dmar_qi_genseq gseq;
73786be9f0dSKonstantin Belousov 	int error;
73886be9f0dSKonstantin Belousov 
7391abfd355SKonstantin Belousov 	unit = domain->dmar;
74068eeb96aSKonstantin Belousov 
74168eeb96aSKonstantin Belousov 	TAILQ_FOREACH_SAFE(entry, entries, dmamap_link, entry1) {
74286be9f0dSKonstantin Belousov 		KASSERT((entry->flags & DMAR_MAP_ENTRY_MAP) != 0,
7431abfd355SKonstantin Belousov 		    ("not mapped entry %p %p", domain, entry));
7441abfd355SKonstantin Belousov 		error = domain_unmap_buf(domain, entry->start, entry->end -
74586be9f0dSKonstantin Belousov 		    entry->start, cansleep ? DMAR_PGF_WAITOK : 0);
7461abfd355SKonstantin Belousov 		KASSERT(error == 0, ("unmap %p error %d", domain, error));
74768eeb96aSKonstantin Belousov 		if (!unit->qi_enabled) {
7481abfd355SKonstantin Belousov 			domain_flush_iotlb_sync(domain, entry->start,
74968eeb96aSKonstantin Belousov 			    entry->end - entry->start);
75068eeb96aSKonstantin Belousov 			TAILQ_REMOVE(entries, entry, dmamap_link);
7511abfd355SKonstantin Belousov 			dmar_domain_free_entry(entry, true);
75286be9f0dSKonstantin Belousov 		}
75386be9f0dSKonstantin Belousov 	}
75468eeb96aSKonstantin Belousov 	if (TAILQ_EMPTY(entries))
75568eeb96aSKonstantin Belousov 		return;
75668eeb96aSKonstantin Belousov 
75768eeb96aSKonstantin Belousov 	KASSERT(unit->qi_enabled, ("loaded entry left"));
75868eeb96aSKonstantin Belousov 	DMAR_LOCK(unit);
75968eeb96aSKonstantin Belousov 	TAILQ_FOREACH(entry, entries, dmamap_link) {
76068eeb96aSKonstantin Belousov 		entry->gseq.gen = 0;
76168eeb96aSKonstantin Belousov 		entry->gseq.seq = 0;
7621abfd355SKonstantin Belousov 		dmar_qi_invalidate_locked(domain, entry->start, entry->end -
763e164cafcSKonstantin Belousov 		    entry->start, dmar_domain_unload_gseq(domain, entry,
764e164cafcSKonstantin Belousov 		    &gseq));
76568eeb96aSKonstantin Belousov 	}
76668eeb96aSKonstantin Belousov 	TAILQ_FOREACH_SAFE(entry, entries, dmamap_link, entry1) {
76768eeb96aSKonstantin Belousov 		entry->gseq = gseq;
76868eeb96aSKonstantin Belousov 		TAILQ_REMOVE(entries, entry, dmamap_link);
76968eeb96aSKonstantin Belousov 		TAILQ_INSERT_TAIL(&unit->tlb_flush_entries, entry, dmamap_link);
77068eeb96aSKonstantin Belousov 	}
77168eeb96aSKonstantin Belousov 	DMAR_UNLOCK(unit);
77268eeb96aSKonstantin Belousov }
77386be9f0dSKonstantin Belousov 
77486be9f0dSKonstantin Belousov static void
7751abfd355SKonstantin Belousov dmar_domain_unload_task(void *arg, int pending)
77686be9f0dSKonstantin Belousov {
7771abfd355SKonstantin Belousov 	struct dmar_domain *domain;
77886be9f0dSKonstantin Belousov 	struct dmar_map_entries_tailq entries;
77986be9f0dSKonstantin Belousov 
7801abfd355SKonstantin Belousov 	domain = arg;
78186be9f0dSKonstantin Belousov 	TAILQ_INIT(&entries);
78286be9f0dSKonstantin Belousov 
78386be9f0dSKonstantin Belousov 	for (;;) {
7841abfd355SKonstantin Belousov 		DMAR_DOMAIN_LOCK(domain);
7851abfd355SKonstantin Belousov 		TAILQ_SWAP(&domain->unload_entries, &entries, dmar_map_entry,
78686be9f0dSKonstantin Belousov 		    dmamap_link);
7871abfd355SKonstantin Belousov 		DMAR_DOMAIN_UNLOCK(domain);
78886be9f0dSKonstantin Belousov 		if (TAILQ_EMPTY(&entries))
78986be9f0dSKonstantin Belousov 			break;
7901abfd355SKonstantin Belousov 		dmar_domain_unload(domain, &entries, true);
79186be9f0dSKonstantin Belousov 	}
79286be9f0dSKonstantin Belousov }
793