xref: /freebsd/sys/x86/iommu/intel_ctx.c (revision e164cafc699818f27dd1f24776a19bea4fd0b6f4)
186be9f0dSKonstantin Belousov /*-
286be9f0dSKonstantin Belousov  * Copyright (c) 2013 The FreeBSD Foundation
386be9f0dSKonstantin Belousov  * All rights reserved.
486be9f0dSKonstantin Belousov  *
586be9f0dSKonstantin Belousov  * This software was developed by Konstantin Belousov <kib@FreeBSD.org>
686be9f0dSKonstantin Belousov  * under sponsorship from the FreeBSD Foundation.
786be9f0dSKonstantin Belousov  *
886be9f0dSKonstantin Belousov  * Redistribution and use in source and binary forms, with or without
986be9f0dSKonstantin Belousov  * modification, are permitted provided that the following conditions
1086be9f0dSKonstantin Belousov  * are met:
1186be9f0dSKonstantin Belousov  * 1. Redistributions of source code must retain the above copyright
1286be9f0dSKonstantin Belousov  *    notice, this list of conditions and the following disclaimer.
1386be9f0dSKonstantin Belousov  * 2. Redistributions in binary form must reproduce the above copyright
1486be9f0dSKonstantin Belousov  *    notice, this list of conditions and the following disclaimer in the
1586be9f0dSKonstantin Belousov  *    documentation and/or other materials provided with the distribution.
1686be9f0dSKonstantin Belousov  *
1786be9f0dSKonstantin Belousov  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
1886be9f0dSKonstantin Belousov  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
1986be9f0dSKonstantin Belousov  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
2086be9f0dSKonstantin Belousov  * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
2186be9f0dSKonstantin Belousov  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
2286be9f0dSKonstantin Belousov  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
2386be9f0dSKonstantin Belousov  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
2486be9f0dSKonstantin Belousov  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
2586be9f0dSKonstantin Belousov  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
2686be9f0dSKonstantin Belousov  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
2786be9f0dSKonstantin Belousov  * SUCH DAMAGE.
2886be9f0dSKonstantin Belousov  */
2986be9f0dSKonstantin Belousov 
3086be9f0dSKonstantin Belousov #include <sys/cdefs.h>
3186be9f0dSKonstantin Belousov __FBSDID("$FreeBSD$");
3286be9f0dSKonstantin Belousov 
3386be9f0dSKonstantin Belousov #include <sys/param.h>
3486be9f0dSKonstantin Belousov #include <sys/systm.h>
3586be9f0dSKonstantin Belousov #include <sys/malloc.h>
3686be9f0dSKonstantin Belousov #include <sys/bus.h>
3786be9f0dSKonstantin Belousov #include <sys/interrupt.h>
3886be9f0dSKonstantin Belousov #include <sys/kernel.h>
3986be9f0dSKonstantin Belousov #include <sys/ktr.h>
4086be9f0dSKonstantin Belousov #include <sys/limits.h>
4186be9f0dSKonstantin Belousov #include <sys/lock.h>
4286be9f0dSKonstantin Belousov #include <sys/memdesc.h>
4386be9f0dSKonstantin Belousov #include <sys/mutex.h>
4486be9f0dSKonstantin Belousov #include <sys/proc.h>
4586be9f0dSKonstantin Belousov #include <sys/rwlock.h>
4686be9f0dSKonstantin Belousov #include <sys/rman.h>
4786be9f0dSKonstantin Belousov #include <sys/sysctl.h>
4886be9f0dSKonstantin Belousov #include <sys/taskqueue.h>
4986be9f0dSKonstantin Belousov #include <sys/tree.h>
5086be9f0dSKonstantin Belousov #include <sys/uio.h>
510a110d5bSKonstantin Belousov #include <sys/vmem.h>
5286be9f0dSKonstantin Belousov #include <vm/vm.h>
5386be9f0dSKonstantin Belousov #include <vm/vm_extern.h>
5486be9f0dSKonstantin Belousov #include <vm/vm_kern.h>
5586be9f0dSKonstantin Belousov #include <vm/vm_object.h>
5686be9f0dSKonstantin Belousov #include <vm/vm_page.h>
5786be9f0dSKonstantin Belousov #include <vm/vm_pager.h>
5886be9f0dSKonstantin Belousov #include <vm/vm_map.h>
5986be9f0dSKonstantin Belousov #include <machine/atomic.h>
6086be9f0dSKonstantin Belousov #include <machine/bus.h>
6186be9f0dSKonstantin Belousov #include <machine/md_var.h>
6286be9f0dSKonstantin Belousov #include <machine/specialreg.h>
6386be9f0dSKonstantin Belousov #include <x86/include/busdma_impl.h>
6486be9f0dSKonstantin Belousov #include <x86/iommu/intel_reg.h>
6586be9f0dSKonstantin Belousov #include <x86/iommu/busdma_dmar.h>
6686be9f0dSKonstantin Belousov #include <x86/iommu/intel_dmar.h>
6767499354SRyan Stone #include <dev/pci/pcireg.h>
6886be9f0dSKonstantin Belousov #include <dev/pci/pcivar.h>
6986be9f0dSKonstantin Belousov 
7086be9f0dSKonstantin Belousov static MALLOC_DEFINE(M_DMAR_CTX, "dmar_ctx", "Intel DMAR Context");
711abfd355SKonstantin Belousov static MALLOC_DEFINE(M_DMAR_DOMAIN, "dmar_dom", "Intel DMAR Domain");
7286be9f0dSKonstantin Belousov 
731abfd355SKonstantin Belousov static void dmar_domain_unload_task(void *arg, int pending);
741abfd355SKonstantin Belousov static void dmar_unref_domain_locked(struct dmar_unit *dmar,
751abfd355SKonstantin Belousov     struct dmar_domain *domain);
761abfd355SKonstantin Belousov static void dmar_domain_destroy(struct dmar_domain *domain);
7786be9f0dSKonstantin Belousov 
7886be9f0dSKonstantin Belousov static void
7986be9f0dSKonstantin Belousov dmar_ensure_ctx_page(struct dmar_unit *dmar, int bus)
8086be9f0dSKonstantin Belousov {
8186be9f0dSKonstantin Belousov 	struct sf_buf *sf;
8286be9f0dSKonstantin Belousov 	dmar_root_entry_t *re;
8386be9f0dSKonstantin Belousov 	vm_page_t ctxm;
8486be9f0dSKonstantin Belousov 
8586be9f0dSKonstantin Belousov 	/*
8686be9f0dSKonstantin Belousov 	 * Allocated context page must be linked.
8786be9f0dSKonstantin Belousov 	 */
8886be9f0dSKonstantin Belousov 	ctxm = dmar_pgalloc(dmar->ctx_obj, 1 + bus, DMAR_PGF_NOALLOC);
8986be9f0dSKonstantin Belousov 	if (ctxm != NULL)
9086be9f0dSKonstantin Belousov 		return;
9186be9f0dSKonstantin Belousov 
9286be9f0dSKonstantin Belousov 	/*
9386be9f0dSKonstantin Belousov 	 * Page not present, allocate and link.  Note that other
9486be9f0dSKonstantin Belousov 	 * thread might execute this sequence in parallel.  This
9586be9f0dSKonstantin Belousov 	 * should be safe, because the context entries written by both
9686be9f0dSKonstantin Belousov 	 * threads are equal.
9786be9f0dSKonstantin Belousov 	 */
9886be9f0dSKonstantin Belousov 	TD_PREP_PINNED_ASSERT;
9986be9f0dSKonstantin Belousov 	ctxm = dmar_pgalloc(dmar->ctx_obj, 1 + bus, DMAR_PGF_ZERO |
10086be9f0dSKonstantin Belousov 	    DMAR_PGF_WAITOK);
10186be9f0dSKonstantin Belousov 	re = dmar_map_pgtbl(dmar->ctx_obj, 0, DMAR_PGF_NOALLOC, &sf);
10286be9f0dSKonstantin Belousov 	re += bus;
10386be9f0dSKonstantin Belousov 	dmar_pte_store(&re->r1, DMAR_ROOT_R1_P | (DMAR_ROOT_R1_CTP_MASK &
10486be9f0dSKonstantin Belousov 	    VM_PAGE_TO_PHYS(ctxm)));
1056b7c46afSKonstantin Belousov 	dmar_flush_root_to_ram(dmar, re);
1066b7c46afSKonstantin Belousov 	dmar_unmap_pgtbl(sf);
10786be9f0dSKonstantin Belousov 	TD_PINNED_ASSERT;
10886be9f0dSKonstantin Belousov }
10986be9f0dSKonstantin Belousov 
11086be9f0dSKonstantin Belousov static dmar_ctx_entry_t *
11186be9f0dSKonstantin Belousov dmar_map_ctx_entry(struct dmar_ctx *ctx, struct sf_buf **sfp)
11286be9f0dSKonstantin Belousov {
11386be9f0dSKonstantin Belousov 	dmar_ctx_entry_t *ctxp;
11486be9f0dSKonstantin Belousov 
1151abfd355SKonstantin Belousov 	ctxp = dmar_map_pgtbl(ctx->domain->dmar->ctx_obj, 1 +
1161abfd355SKonstantin Belousov 	    PCI_RID2BUS(ctx->rid), DMAR_PGF_NOALLOC | DMAR_PGF_WAITOK, sfp);
11767499354SRyan Stone 	ctxp += ctx->rid & 0xff;
11886be9f0dSKonstantin Belousov 	return (ctxp);
11986be9f0dSKonstantin Belousov }
12086be9f0dSKonstantin Belousov 
12186be9f0dSKonstantin Belousov static void
12267499354SRyan Stone ctx_tag_init(struct dmar_ctx *ctx, device_t dev)
12386be9f0dSKonstantin Belousov {
12486be9f0dSKonstantin Belousov 	bus_addr_t maxaddr;
12586be9f0dSKonstantin Belousov 
1261abfd355SKonstantin Belousov 	maxaddr = MIN(ctx->domain->end, BUS_SPACE_MAXADDR);
12786be9f0dSKonstantin Belousov 	ctx->ctx_tag.common.ref_count = 1; /* Prevent free */
12886be9f0dSKonstantin Belousov 	ctx->ctx_tag.common.impl = &bus_dma_dmar_impl;
12986be9f0dSKonstantin Belousov 	ctx->ctx_tag.common.boundary = PCI_DMA_BOUNDARY;
13086be9f0dSKonstantin Belousov 	ctx->ctx_tag.common.lowaddr = maxaddr;
13186be9f0dSKonstantin Belousov 	ctx->ctx_tag.common.highaddr = maxaddr;
13286be9f0dSKonstantin Belousov 	ctx->ctx_tag.common.maxsize = maxaddr;
13386be9f0dSKonstantin Belousov 	ctx->ctx_tag.common.nsegments = BUS_SPACE_UNRESTRICTED;
13486be9f0dSKonstantin Belousov 	ctx->ctx_tag.common.maxsegsz = maxaddr;
13586be9f0dSKonstantin Belousov 	ctx->ctx_tag.ctx = ctx;
13667499354SRyan Stone 	ctx->ctx_tag.owner = dev;
13786be9f0dSKonstantin Belousov }
13886be9f0dSKonstantin Belousov 
13986be9f0dSKonstantin Belousov static void
1401abfd355SKonstantin Belousov ctx_id_entry_init(struct dmar_ctx *ctx, dmar_ctx_entry_t *ctxp, bool move)
14186be9f0dSKonstantin Belousov {
14286be9f0dSKonstantin Belousov 	struct dmar_unit *unit;
1431abfd355SKonstantin Belousov 	struct dmar_domain *domain;
14486be9f0dSKonstantin Belousov 	vm_page_t ctx_root;
14586be9f0dSKonstantin Belousov 
1461abfd355SKonstantin Belousov 	domain = ctx->domain;
1471abfd355SKonstantin Belousov 	unit = domain->dmar;
1481abfd355SKonstantin Belousov 	KASSERT(move || (ctxp->ctx1 == 0 && ctxp->ctx2 == 0),
14986be9f0dSKonstantin Belousov 	    ("dmar%d: initialized ctx entry %d:%d:%d 0x%jx 0x%jx",
15067499354SRyan Stone 	    unit->unit, pci_get_bus(ctx->ctx_tag.owner),
15167499354SRyan Stone 	    pci_get_slot(ctx->ctx_tag.owner),
15267499354SRyan Stone 	    pci_get_function(ctx->ctx_tag.owner),
1531abfd355SKonstantin Belousov 	    ctxp->ctx1, ctxp->ctx2));
1541abfd355SKonstantin Belousov 	/*
1551abfd355SKonstantin Belousov 	 * For update due to move, the store is not atomic.  It is
1561abfd355SKonstantin Belousov 	 * possible that DMAR read upper doubleword, while low
1571abfd355SKonstantin Belousov 	 * doubleword is not yet updated.  The domain id is stored in
1581abfd355SKonstantin Belousov 	 * the upper doubleword, while the table pointer in the lower.
1591abfd355SKonstantin Belousov 	 *
1601abfd355SKonstantin Belousov 	 * There is no good solution, for the same reason it is wrong
1611abfd355SKonstantin Belousov 	 * to clear P bit in the ctx entry for update.
1621abfd355SKonstantin Belousov 	 */
1631abfd355SKonstantin Belousov 	dmar_pte_store1(&ctxp->ctx2, DMAR_CTX2_DID(domain->domain) |
1641abfd355SKonstantin Belousov 	    domain->awlvl);
1651abfd355SKonstantin Belousov 	if ((domain->flags & DMAR_DOMAIN_IDMAP) != 0 &&
16686be9f0dSKonstantin Belousov 	    (unit->hw_ecap & DMAR_ECAP_PT) != 0) {
1671abfd355SKonstantin Belousov 		KASSERT(domain->pgtbl_obj == NULL,
16886be9f0dSKonstantin Belousov 		    ("ctx %p non-null pgtbl_obj", ctx));
1691abfd355SKonstantin Belousov 		dmar_pte_store1(&ctxp->ctx1, DMAR_CTX1_T_PASS | DMAR_CTX1_P);
17086be9f0dSKonstantin Belousov 	} else {
1711abfd355SKonstantin Belousov 		ctx_root = dmar_pgalloc(domain->pgtbl_obj, 0, DMAR_PGF_NOALLOC);
1721abfd355SKonstantin Belousov 		dmar_pte_store1(&ctxp->ctx1, DMAR_CTX1_T_UNTR |
17386be9f0dSKonstantin Belousov 		    (DMAR_CTX1_ASR_MASK & VM_PAGE_TO_PHYS(ctx_root)) |
17486be9f0dSKonstantin Belousov 		    DMAR_CTX1_P);
17586be9f0dSKonstantin Belousov 	}
1766b7c46afSKonstantin Belousov 	dmar_flush_ctx_to_ram(unit, ctxp);
17786be9f0dSKonstantin Belousov }
17886be9f0dSKonstantin Belousov 
17986be9f0dSKonstantin Belousov static int
1801abfd355SKonstantin Belousov dmar_flush_for_ctx_entry(struct dmar_unit *dmar, bool force)
1811abfd355SKonstantin Belousov {
1821abfd355SKonstantin Belousov 	int error;
1831abfd355SKonstantin Belousov 
1841abfd355SKonstantin Belousov 	/*
1851abfd355SKonstantin Belousov 	 * If dmar declares Caching Mode as Set, follow 11.5 "Caching
1861abfd355SKonstantin Belousov 	 * Mode Consideration" and do the (global) invalidation of the
1871abfd355SKonstantin Belousov 	 * negative TLB entries.
1881abfd355SKonstantin Belousov 	 */
1891abfd355SKonstantin Belousov 	if ((dmar->hw_cap & DMAR_CAP_CM) == 0 && !force)
1901abfd355SKonstantin Belousov 		return (0);
1911abfd355SKonstantin Belousov 	if (dmar->qi_enabled) {
1921abfd355SKonstantin Belousov 		dmar_qi_invalidate_ctx_glob_locked(dmar);
1931abfd355SKonstantin Belousov 		if ((dmar->hw_ecap & DMAR_ECAP_DI) != 0 || force)
1941abfd355SKonstantin Belousov 			dmar_qi_invalidate_iotlb_glob_locked(dmar);
1951abfd355SKonstantin Belousov 		return (0);
1961abfd355SKonstantin Belousov 	}
1971abfd355SKonstantin Belousov 	error = dmar_inv_ctx_glob(dmar);
1981abfd355SKonstantin Belousov 	if (error == 0 && ((dmar->hw_ecap & DMAR_ECAP_DI) != 0 || force))
1991abfd355SKonstantin Belousov 		error = dmar_inv_iotlb_glob(dmar);
2001abfd355SKonstantin Belousov 	return (error);
2011abfd355SKonstantin Belousov }
2021abfd355SKonstantin Belousov 
2031abfd355SKonstantin Belousov static int
2041abfd355SKonstantin Belousov domain_init_rmrr(struct dmar_domain *domain, device_t dev)
20586be9f0dSKonstantin Belousov {
20686be9f0dSKonstantin Belousov 	struct dmar_map_entries_tailq rmrr_entries;
20786be9f0dSKonstantin Belousov 	struct dmar_map_entry *entry, *entry1;
20886be9f0dSKonstantin Belousov 	vm_page_t *ma;
20986be9f0dSKonstantin Belousov 	dmar_gaddr_t start, end;
21086be9f0dSKonstantin Belousov 	vm_pindex_t size, i;
21186be9f0dSKonstantin Belousov 	int error, error1;
21286be9f0dSKonstantin Belousov 
21386be9f0dSKonstantin Belousov 	error = 0;
21486be9f0dSKonstantin Belousov 	TAILQ_INIT(&rmrr_entries);
2151abfd355SKonstantin Belousov 	dmar_dev_parse_rmrr(domain, dev, &rmrr_entries);
21686be9f0dSKonstantin Belousov 	TAILQ_FOREACH_SAFE(entry, &rmrr_entries, unroll_link, entry1) {
21786be9f0dSKonstantin Belousov 		/*
21886be9f0dSKonstantin Belousov 		 * VT-d specification requires that the start of an
21986be9f0dSKonstantin Belousov 		 * RMRR entry is 4k-aligned.  Buggy BIOSes put
22086be9f0dSKonstantin Belousov 		 * anything into the start and end fields.  Truncate
22186be9f0dSKonstantin Belousov 		 * and round as neccesary.
22286be9f0dSKonstantin Belousov 		 *
22386be9f0dSKonstantin Belousov 		 * We also allow the overlapping RMRR entries, see
22486be9f0dSKonstantin Belousov 		 * dmar_gas_alloc_region().
22586be9f0dSKonstantin Belousov 		 */
22686be9f0dSKonstantin Belousov 		start = entry->start;
22786be9f0dSKonstantin Belousov 		end = entry->end;
22886be9f0dSKonstantin Belousov 		entry->start = trunc_page(start);
22986be9f0dSKonstantin Belousov 		entry->end = round_page(end);
230e02b05b3SKonstantin Belousov 		if (entry->start == entry->end) {
231e02b05b3SKonstantin Belousov 			/* Workaround for some AMI (?) BIOSes */
232e02b05b3SKonstantin Belousov 			if (bootverbose) {
233e02b05b3SKonstantin Belousov 				device_printf(dev, "BIOS bug: dmar%d RMRR "
234e02b05b3SKonstantin Belousov 				    "region (%jx, %jx) corrected\n",
2351abfd355SKonstantin Belousov 				    domain->dmar->unit, start, end);
236e02b05b3SKonstantin Belousov 			}
237e02b05b3SKonstantin Belousov 			entry->end += DMAR_PAGE_SIZE * 0x20;
238e02b05b3SKonstantin Belousov 		}
23986be9f0dSKonstantin Belousov 		size = OFF_TO_IDX(entry->end - entry->start);
24086be9f0dSKonstantin Belousov 		ma = malloc(sizeof(vm_page_t) * size, M_TEMP, M_WAITOK);
24186be9f0dSKonstantin Belousov 		for (i = 0; i < size; i++) {
24286be9f0dSKonstantin Belousov 			ma[i] = vm_page_getfake(entry->start + PAGE_SIZE * i,
24386be9f0dSKonstantin Belousov 			    VM_MEMATTR_DEFAULT);
24486be9f0dSKonstantin Belousov 		}
2451abfd355SKonstantin Belousov 		error1 = dmar_gas_map_region(domain, entry,
2461abfd355SKonstantin Belousov 		    DMAR_MAP_ENTRY_READ | DMAR_MAP_ENTRY_WRITE,
2471abfd355SKonstantin Belousov 		    DMAR_GM_CANWAIT, ma);
24886be9f0dSKonstantin Belousov 		/*
24986be9f0dSKonstantin Belousov 		 * Non-failed RMRR entries are owned by context rb
25086be9f0dSKonstantin Belousov 		 * tree.  Get rid of the failed entry, but do not stop
25186be9f0dSKonstantin Belousov 		 * the loop.  Rest of the parsed RMRR entries are
25286be9f0dSKonstantin Belousov 		 * loaded and removed on the context destruction.
25386be9f0dSKonstantin Belousov 		 */
25486be9f0dSKonstantin Belousov 		if (error1 == 0 && entry->end != entry->start) {
2551abfd355SKonstantin Belousov 			DMAR_LOCK(domain->dmar);
2561abfd355SKonstantin Belousov 			domain->refs++; /* XXXKIB prevent free */
2571abfd355SKonstantin Belousov 			domain->flags |= DMAR_DOMAIN_RMRR;
2581abfd355SKonstantin Belousov 			DMAR_UNLOCK(domain->dmar);
25986be9f0dSKonstantin Belousov 		} else {
26086be9f0dSKonstantin Belousov 			if (error1 != 0) {
26186be9f0dSKonstantin Belousov 				device_printf(dev,
26286be9f0dSKonstantin Belousov 			    "dmar%d failed to map RMRR region (%jx, %jx) %d\n",
2631abfd355SKonstantin Belousov 				    domain->dmar->unit, start, end, error1);
26486be9f0dSKonstantin Belousov 				error = error1;
26586be9f0dSKonstantin Belousov 			}
26686be9f0dSKonstantin Belousov 			TAILQ_REMOVE(&rmrr_entries, entry, unroll_link);
2671abfd355SKonstantin Belousov 			dmar_gas_free_entry(domain, entry);
26886be9f0dSKonstantin Belousov 		}
26986be9f0dSKonstantin Belousov 		for (i = 0; i < size; i++)
27086be9f0dSKonstantin Belousov 			vm_page_putfake(ma[i]);
27186be9f0dSKonstantin Belousov 		free(ma, M_TEMP);
27286be9f0dSKonstantin Belousov 	}
27386be9f0dSKonstantin Belousov 	return (error);
27486be9f0dSKonstantin Belousov }
27586be9f0dSKonstantin Belousov 
2761abfd355SKonstantin Belousov static struct dmar_domain *
2771abfd355SKonstantin Belousov dmar_domain_alloc(struct dmar_unit *dmar, bool id_mapped)
2781abfd355SKonstantin Belousov {
2791abfd355SKonstantin Belousov 	struct dmar_domain *domain;
2801abfd355SKonstantin Belousov 	int error, id, mgaw;
2811abfd355SKonstantin Belousov 
2821abfd355SKonstantin Belousov 	id = alloc_unr(dmar->domids);
2831abfd355SKonstantin Belousov 	if (id == -1)
2841abfd355SKonstantin Belousov 		return (NULL);
2851abfd355SKonstantin Belousov 	domain = malloc(sizeof(*domain), M_DMAR_DOMAIN, M_WAITOK | M_ZERO);
2861abfd355SKonstantin Belousov 	domain->domain = id;
2871abfd355SKonstantin Belousov 	LIST_INIT(&domain->contexts);
2881abfd355SKonstantin Belousov 	RB_INIT(&domain->rb_root);
2891abfd355SKonstantin Belousov 	TAILQ_INIT(&domain->unload_entries);
2901abfd355SKonstantin Belousov 	TASK_INIT(&domain->unload_task, 0, dmar_domain_unload_task, domain);
2911abfd355SKonstantin Belousov 	mtx_init(&domain->lock, "dmardom", NULL, MTX_DEF);
2921abfd355SKonstantin Belousov 	domain->dmar = dmar;
2931abfd355SKonstantin Belousov 
2941abfd355SKonstantin Belousov 	/*
2951abfd355SKonstantin Belousov 	 * For now, use the maximal usable physical address of the
2961abfd355SKonstantin Belousov 	 * installed memory to calculate the mgaw on id_mapped domain.
2971abfd355SKonstantin Belousov 	 * It is useful for the identity mapping, and less so for the
2981abfd355SKonstantin Belousov 	 * virtualized bus address space.
2991abfd355SKonstantin Belousov 	 */
3001abfd355SKonstantin Belousov 	domain->end = id_mapped ? ptoa(Maxmem) : BUS_SPACE_MAXADDR;
3011abfd355SKonstantin Belousov 	mgaw = dmar_maxaddr2mgaw(dmar, domain->end, !id_mapped);
3021abfd355SKonstantin Belousov 	error = domain_set_agaw(domain, mgaw);
3031abfd355SKonstantin Belousov 	if (error != 0)
3041abfd355SKonstantin Belousov 		goto fail;
3051abfd355SKonstantin Belousov 	if (!id_mapped)
3061abfd355SKonstantin Belousov 		/* Use all supported address space for remapping. */
3071abfd355SKonstantin Belousov 		domain->end = 1ULL << (domain->agaw - 1);
3081abfd355SKonstantin Belousov 
3091abfd355SKonstantin Belousov 	dmar_gas_init_domain(domain);
3101abfd355SKonstantin Belousov 
3111abfd355SKonstantin Belousov 	if (id_mapped) {
3121abfd355SKonstantin Belousov 		if ((dmar->hw_ecap & DMAR_ECAP_PT) == 0) {
3131abfd355SKonstantin Belousov 			domain->pgtbl_obj = domain_get_idmap_pgtbl(domain,
3141abfd355SKonstantin Belousov 			    domain->end);
3151abfd355SKonstantin Belousov 		}
3161abfd355SKonstantin Belousov 		domain->flags |= DMAR_DOMAIN_IDMAP;
3171abfd355SKonstantin Belousov 	} else {
3181abfd355SKonstantin Belousov 		error = domain_alloc_pgtbl(domain);
3191abfd355SKonstantin Belousov 		if (error != 0)
3201abfd355SKonstantin Belousov 			goto fail;
3211abfd355SKonstantin Belousov 		/* Disable local apic region access */
3221abfd355SKonstantin Belousov 		error = dmar_gas_reserve_region(domain, 0xfee00000,
3231abfd355SKonstantin Belousov 		    0xfeefffff + 1);
3241abfd355SKonstantin Belousov 		if (error != 0)
3251abfd355SKonstantin Belousov 			goto fail;
3261abfd355SKonstantin Belousov 	}
3271abfd355SKonstantin Belousov 	return (domain);
3281abfd355SKonstantin Belousov 
3291abfd355SKonstantin Belousov fail:
3301abfd355SKonstantin Belousov 	dmar_domain_destroy(domain);
3311abfd355SKonstantin Belousov 	return (NULL);
3321abfd355SKonstantin Belousov }
3331abfd355SKonstantin Belousov 
33486be9f0dSKonstantin Belousov static struct dmar_ctx *
3351abfd355SKonstantin Belousov dmar_ctx_alloc(struct dmar_domain *domain, uint16_t rid)
33686be9f0dSKonstantin Belousov {
33786be9f0dSKonstantin Belousov 	struct dmar_ctx *ctx;
33886be9f0dSKonstantin Belousov 
33986be9f0dSKonstantin Belousov 	ctx = malloc(sizeof(*ctx), M_DMAR_CTX, M_WAITOK | M_ZERO);
3401abfd355SKonstantin Belousov 	ctx->domain = domain;
34167499354SRyan Stone 	ctx->rid = rid;
3421abfd355SKonstantin Belousov 	ctx->refs = 1;
34386be9f0dSKonstantin Belousov 	return (ctx);
34486be9f0dSKonstantin Belousov }
34586be9f0dSKonstantin Belousov 
34686be9f0dSKonstantin Belousov static void
3471abfd355SKonstantin Belousov dmar_ctx_link(struct dmar_ctx *ctx)
3481abfd355SKonstantin Belousov {
3491abfd355SKonstantin Belousov 	struct dmar_domain *domain;
3501abfd355SKonstantin Belousov 
3511abfd355SKonstantin Belousov 	domain = ctx->domain;
3521abfd355SKonstantin Belousov 	DMAR_ASSERT_LOCKED(domain->dmar);
3531abfd355SKonstantin Belousov 	KASSERT(domain->refs >= domain->ctx_cnt,
3541abfd355SKonstantin Belousov 	    ("dom %p ref underflow %d %d", domain, domain->refs,
3551abfd355SKonstantin Belousov 	    domain->ctx_cnt));
3561abfd355SKonstantin Belousov 	domain->refs++;
3571abfd355SKonstantin Belousov 	domain->ctx_cnt++;
3581abfd355SKonstantin Belousov 	LIST_INSERT_HEAD(&domain->contexts, ctx, link);
3591abfd355SKonstantin Belousov }
3601abfd355SKonstantin Belousov 
3611abfd355SKonstantin Belousov static void
3621abfd355SKonstantin Belousov dmar_ctx_unlink(struct dmar_ctx *ctx)
3631abfd355SKonstantin Belousov {
3641abfd355SKonstantin Belousov 	struct dmar_domain *domain;
3651abfd355SKonstantin Belousov 
3661abfd355SKonstantin Belousov 	domain = ctx->domain;
3671abfd355SKonstantin Belousov 	DMAR_ASSERT_LOCKED(domain->dmar);
3681abfd355SKonstantin Belousov 	KASSERT(domain->refs > 0,
3691abfd355SKonstantin Belousov 	    ("domain %p ctx dtr refs %d", domain, domain->refs));
3701abfd355SKonstantin Belousov 	KASSERT(domain->ctx_cnt >= domain->refs,
3711abfd355SKonstantin Belousov 	    ("domain %p ctx dtr refs %d ctx_cnt %d", domain,
3721abfd355SKonstantin Belousov 	    domain->refs, domain->ctx_cnt));
3731abfd355SKonstantin Belousov 	domain->refs--;
3741abfd355SKonstantin Belousov 	domain->ctx_cnt--;
3751abfd355SKonstantin Belousov 	LIST_REMOVE(ctx, link);
3761abfd355SKonstantin Belousov }
3771abfd355SKonstantin Belousov 
3781abfd355SKonstantin Belousov static void
3791abfd355SKonstantin Belousov dmar_domain_destroy(struct dmar_domain *domain)
38086be9f0dSKonstantin Belousov {
38186be9f0dSKonstantin Belousov 
3821abfd355SKonstantin Belousov 	KASSERT(TAILQ_EMPTY(&domain->unload_entries),
3831abfd355SKonstantin Belousov 	    ("unfinished unloads %p", domain));
3841abfd355SKonstantin Belousov 	KASSERT(LIST_EMPTY(&domain->contexts),
3851abfd355SKonstantin Belousov 	    ("destroying dom %p with contexts", domain));
3861abfd355SKonstantin Belousov 	KASSERT(domain->ctx_cnt == 0,
3871abfd355SKonstantin Belousov 	    ("destroying dom %p with ctx_cnt %d", domain, domain->ctx_cnt));
3881abfd355SKonstantin Belousov 	KASSERT(domain->refs == 0,
3891abfd355SKonstantin Belousov 	    ("destroying dom %p with refs %d", domain, domain->refs));
3901abfd355SKonstantin Belousov 	if ((domain->flags & DMAR_DOMAIN_GAS_INITED) != 0) {
3911abfd355SKonstantin Belousov 		DMAR_DOMAIN_LOCK(domain);
3921abfd355SKonstantin Belousov 		dmar_gas_fini_domain(domain);
3931abfd355SKonstantin Belousov 		DMAR_DOMAIN_UNLOCK(domain);
39486be9f0dSKonstantin Belousov 	}
3951abfd355SKonstantin Belousov 	if ((domain->flags & DMAR_DOMAIN_PGTBL_INITED) != 0) {
3961abfd355SKonstantin Belousov 		if (domain->pgtbl_obj != NULL)
3971abfd355SKonstantin Belousov 			DMAR_DOMAIN_PGLOCK(domain);
3981abfd355SKonstantin Belousov 		domain_free_pgtbl(domain);
39986be9f0dSKonstantin Belousov 	}
4001abfd355SKonstantin Belousov 	mtx_destroy(&domain->lock);
4011abfd355SKonstantin Belousov 	free_unr(domain->dmar->domids, domain->domain);
4021abfd355SKonstantin Belousov 	free(domain, M_DMAR_DOMAIN);
40386be9f0dSKonstantin Belousov }
40486be9f0dSKonstantin Belousov 
40586be9f0dSKonstantin Belousov struct dmar_ctx *
4061abfd355SKonstantin Belousov dmar_get_ctx_for_dev(struct dmar_unit *dmar, device_t dev, uint16_t rid,
4071abfd355SKonstantin Belousov     bool id_mapped, bool rmrr_init)
40886be9f0dSKonstantin Belousov {
4091abfd355SKonstantin Belousov 	struct dmar_domain *domain, *domain1;
41086be9f0dSKonstantin Belousov 	struct dmar_ctx *ctx, *ctx1;
41186be9f0dSKonstantin Belousov 	dmar_ctx_entry_t *ctxp;
41286be9f0dSKonstantin Belousov 	struct sf_buf *sf;
4131abfd355SKonstantin Belousov 	int bus, slot, func, error;
41486be9f0dSKonstantin Belousov 	bool enable;
41586be9f0dSKonstantin Belousov 
41667499354SRyan Stone 	bus = pci_get_bus(dev);
41767499354SRyan Stone 	slot = pci_get_slot(dev);
41867499354SRyan Stone 	func = pci_get_function(dev);
41986be9f0dSKonstantin Belousov 	enable = false;
42086be9f0dSKonstantin Belousov 	TD_PREP_PINNED_ASSERT;
42186be9f0dSKonstantin Belousov 	DMAR_LOCK(dmar);
42267499354SRyan Stone 	ctx = dmar_find_ctx_locked(dmar, rid);
42386be9f0dSKonstantin Belousov 	error = 0;
42486be9f0dSKonstantin Belousov 	if (ctx == NULL) {
42586be9f0dSKonstantin Belousov 		/*
42686be9f0dSKonstantin Belousov 		 * Perform the allocations which require sleep or have
42786be9f0dSKonstantin Belousov 		 * higher chance to succeed if the sleep is allowed.
42886be9f0dSKonstantin Belousov 		 */
42986be9f0dSKonstantin Belousov 		DMAR_UNLOCK(dmar);
430b29d186cSKonstantin Belousov 		dmar_ensure_ctx_page(dmar, PCI_RID2BUS(rid));
4311abfd355SKonstantin Belousov 		domain1 = dmar_domain_alloc(dmar, id_mapped);
4321abfd355SKonstantin Belousov 		if (domain1 == NULL) {
43386be9f0dSKonstantin Belousov 			TD_PINNED_ASSERT;
43486be9f0dSKonstantin Belousov 			return (NULL);
43586be9f0dSKonstantin Belousov 		}
4361abfd355SKonstantin Belousov 		error = domain_init_rmrr(domain1, dev);
43786be9f0dSKonstantin Belousov 		if (error != 0) {
4381abfd355SKonstantin Belousov 			dmar_domain_destroy(domain1);
43986be9f0dSKonstantin Belousov 			TD_PINNED_ASSERT;
44086be9f0dSKonstantin Belousov 			return (NULL);
44186be9f0dSKonstantin Belousov 		}
4421abfd355SKonstantin Belousov 		ctx1 = dmar_ctx_alloc(domain1, rid);
44386be9f0dSKonstantin Belousov 		ctxp = dmar_map_ctx_entry(ctx1, &sf);
44486be9f0dSKonstantin Belousov 		DMAR_LOCK(dmar);
44586be9f0dSKonstantin Belousov 
44686be9f0dSKonstantin Belousov 		/*
44786be9f0dSKonstantin Belousov 		 * Recheck the contexts, other thread might have
44886be9f0dSKonstantin Belousov 		 * already allocated needed one.
44986be9f0dSKonstantin Belousov 		 */
45067499354SRyan Stone 		ctx = dmar_find_ctx_locked(dmar, rid);
45186be9f0dSKonstantin Belousov 		if (ctx == NULL) {
4521abfd355SKonstantin Belousov 			domain = domain1;
45386be9f0dSKonstantin Belousov 			ctx = ctx1;
4541abfd355SKonstantin Belousov 			dmar_ctx_link(ctx);
4559d0bc6d8SKonstantin Belousov 			ctx->ctx_tag.owner = dev;
45667499354SRyan Stone 			ctx_tag_init(ctx, dev);
45786be9f0dSKonstantin Belousov 
45886be9f0dSKonstantin Belousov 			/*
45986be9f0dSKonstantin Belousov 			 * This is the first activated context for the
46086be9f0dSKonstantin Belousov 			 * DMAR unit.  Enable the translation after
46186be9f0dSKonstantin Belousov 			 * everything is set up.
46286be9f0dSKonstantin Belousov 			 */
4631abfd355SKonstantin Belousov 			if (LIST_EMPTY(&dmar->domains))
46486be9f0dSKonstantin Belousov 				enable = true;
4651abfd355SKonstantin Belousov 			LIST_INSERT_HEAD(&dmar->domains, domain, link);
4661abfd355SKonstantin Belousov 			ctx_id_entry_init(ctx, ctxp, false);
46786be9f0dSKonstantin Belousov 			device_printf(dev,
46834e8337bSKonstantin Belousov 			    "dmar%d pci%d:%d:%d:%d rid %x domain %d mgaw %d "
4699d0bc6d8SKonstantin Belousov 			    "agaw %d %s-mapped\n",
47086be9f0dSKonstantin Belousov 			    dmar->unit, dmar->segment, bus, slot,
4711abfd355SKonstantin Belousov 			    func, rid, domain->domain, domain->mgaw,
4721abfd355SKonstantin Belousov 			    domain->agaw, id_mapped ? "id" : "re");
47386be9f0dSKonstantin Belousov 		} else {
4741abfd355SKonstantin Belousov 			/* Nothing needs to be done to destroy ctx1. */
4751abfd355SKonstantin Belousov 			dmar_domain_destroy(domain1);
4761abfd355SKonstantin Belousov 			domain = ctx->domain;
4771abfd355SKonstantin Belousov 			ctx->refs++; /* tag referenced us */
47886be9f0dSKonstantin Belousov 		}
4796b7c46afSKonstantin Belousov 		dmar_unmap_pgtbl(sf);
48068eeb96aSKonstantin Belousov 	} else {
4811abfd355SKonstantin Belousov 		domain = ctx->domain;
4821abfd355SKonstantin Belousov 		ctx->refs++; /* tag referenced us */
4831abfd355SKonstantin Belousov 	}
4841abfd355SKonstantin Belousov 
4851abfd355SKonstantin Belousov 	error = dmar_flush_for_ctx_entry(dmar, enable);
48686be9f0dSKonstantin Belousov 	if (error != 0) {
48786be9f0dSKonstantin Belousov 		dmar_free_ctx_locked(dmar, ctx);
48886be9f0dSKonstantin Belousov 		TD_PINNED_ASSERT;
48986be9f0dSKonstantin Belousov 		return (NULL);
49086be9f0dSKonstantin Belousov 	}
49168eeb96aSKonstantin Belousov 
49268eeb96aSKonstantin Belousov 	/*
49368eeb96aSKonstantin Belousov 	 * The dmar lock was potentially dropped between check for the
49468eeb96aSKonstantin Belousov 	 * empty context list and now.  Recheck the state of GCMD_TE
49568eeb96aSKonstantin Belousov 	 * to avoid unneeded command.
49668eeb96aSKonstantin Belousov 	 */
49768eeb96aSKonstantin Belousov 	if (enable && !rmrr_init && (dmar->hw_gcmd & DMAR_GCMD_TE) == 0) {
49886be9f0dSKonstantin Belousov 		error = dmar_enable_translation(dmar);
49986be9f0dSKonstantin Belousov 		if (error != 0) {
50086be9f0dSKonstantin Belousov 			dmar_free_ctx_locked(dmar, ctx);
50186be9f0dSKonstantin Belousov 			TD_PINNED_ASSERT;
50286be9f0dSKonstantin Belousov 			return (NULL);
50386be9f0dSKonstantin Belousov 		}
50486be9f0dSKonstantin Belousov 	}
50586be9f0dSKonstantin Belousov 	DMAR_UNLOCK(dmar);
50686be9f0dSKonstantin Belousov 	TD_PINNED_ASSERT;
50786be9f0dSKonstantin Belousov 	return (ctx);
50886be9f0dSKonstantin Belousov }
50986be9f0dSKonstantin Belousov 
5101abfd355SKonstantin Belousov int
5111abfd355SKonstantin Belousov dmar_move_ctx_to_domain(struct dmar_domain *domain, struct dmar_ctx *ctx)
5121abfd355SKonstantin Belousov {
5131abfd355SKonstantin Belousov 	struct dmar_unit *dmar;
5141abfd355SKonstantin Belousov 	struct dmar_domain *old_domain;
5151abfd355SKonstantin Belousov 	dmar_ctx_entry_t *ctxp;
5161abfd355SKonstantin Belousov 	struct sf_buf *sf;
5171abfd355SKonstantin Belousov 	int error;
5181abfd355SKonstantin Belousov 
5191abfd355SKonstantin Belousov 	dmar = domain->dmar;
5201abfd355SKonstantin Belousov 	old_domain = ctx->domain;
5211abfd355SKonstantin Belousov 	if (domain == old_domain)
5221abfd355SKonstantin Belousov 		return (0);
5231abfd355SKonstantin Belousov 	KASSERT(old_domain->dmar == dmar,
5241abfd355SKonstantin Belousov 	    ("domain %p %u moving between dmars %u %u", domain,
5251abfd355SKonstantin Belousov 	    domain->domain, old_domain->dmar->unit, domain->dmar->unit));
5261abfd355SKonstantin Belousov 	TD_PREP_PINNED_ASSERT;
5271abfd355SKonstantin Belousov 
5281abfd355SKonstantin Belousov 	ctxp = dmar_map_ctx_entry(ctx, &sf);
5291abfd355SKonstantin Belousov 	DMAR_LOCK(dmar);
5301abfd355SKonstantin Belousov 	dmar_ctx_unlink(ctx);
5311abfd355SKonstantin Belousov 	ctx->domain = domain;
5321abfd355SKonstantin Belousov 	dmar_ctx_link(ctx);
5331abfd355SKonstantin Belousov 	ctx_id_entry_init(ctx, ctxp, true);
5341abfd355SKonstantin Belousov 	dmar_unmap_pgtbl(sf);
5351abfd355SKonstantin Belousov 	error = dmar_flush_for_ctx_entry(dmar, true);
5361abfd355SKonstantin Belousov 	/* If flush failed, rolling back would not work as well. */
5371abfd355SKonstantin Belousov 	printf("dmar%d rid %x domain %d->%d %s-mapped\n",
5381abfd355SKonstantin Belousov 	    dmar->unit, ctx->rid, old_domain->domain, domain->domain,
5391abfd355SKonstantin Belousov 	    (domain->flags & DMAR_DOMAIN_IDMAP) != 0 ? "id" : "re");
5401abfd355SKonstantin Belousov 	dmar_unref_domain_locked(dmar, old_domain);
5411abfd355SKonstantin Belousov 	TD_PINNED_ASSERT;
5421abfd355SKonstantin Belousov 	return (error);
5431abfd355SKonstantin Belousov }
5441abfd355SKonstantin Belousov 
5451abfd355SKonstantin Belousov static void
5461abfd355SKonstantin Belousov dmar_unref_domain_locked(struct dmar_unit *dmar, struct dmar_domain *domain)
5471abfd355SKonstantin Belousov {
5481abfd355SKonstantin Belousov 
5491abfd355SKonstantin Belousov 	DMAR_ASSERT_LOCKED(dmar);
5501abfd355SKonstantin Belousov 	KASSERT(domain->refs >= 1,
5511abfd355SKonstantin Belousov 	    ("dmar %d domain %p refs %u", dmar->unit, domain, domain->refs));
5521abfd355SKonstantin Belousov 	KASSERT(domain->refs > domain->ctx_cnt,
5531abfd355SKonstantin Belousov 	    ("dmar %d domain %p refs %d ctx_cnt %d", dmar->unit, domain,
5541abfd355SKonstantin Belousov 	    domain->refs, domain->ctx_cnt));
5551abfd355SKonstantin Belousov 
5561abfd355SKonstantin Belousov 	if (domain->refs > 1) {
5571abfd355SKonstantin Belousov 		domain->refs--;
5581abfd355SKonstantin Belousov 		DMAR_UNLOCK(dmar);
5591abfd355SKonstantin Belousov 		return;
5601abfd355SKonstantin Belousov 	}
5611abfd355SKonstantin Belousov 
5621abfd355SKonstantin Belousov 	KASSERT((domain->flags & DMAR_DOMAIN_RMRR) == 0,
5631abfd355SKonstantin Belousov 	    ("lost ref on RMRR domain %p", domain));
5641abfd355SKonstantin Belousov 
5651abfd355SKonstantin Belousov 	LIST_REMOVE(domain, link);
5661abfd355SKonstantin Belousov 	DMAR_UNLOCK(dmar);
5671abfd355SKonstantin Belousov 
5681abfd355SKonstantin Belousov 	taskqueue_drain(dmar->delayed_taskqueue, &domain->unload_task);
5691abfd355SKonstantin Belousov 	dmar_domain_destroy(domain);
5701abfd355SKonstantin Belousov }
5711abfd355SKonstantin Belousov 
57286be9f0dSKonstantin Belousov void
57386be9f0dSKonstantin Belousov dmar_free_ctx_locked(struct dmar_unit *dmar, struct dmar_ctx *ctx)
57486be9f0dSKonstantin Belousov {
57586be9f0dSKonstantin Belousov 	struct sf_buf *sf;
57686be9f0dSKonstantin Belousov 	dmar_ctx_entry_t *ctxp;
5771abfd355SKonstantin Belousov 	struct dmar_domain *domain;
57886be9f0dSKonstantin Belousov 
57986be9f0dSKonstantin Belousov 	DMAR_ASSERT_LOCKED(dmar);
58086be9f0dSKonstantin Belousov 	KASSERT(ctx->refs >= 1,
58186be9f0dSKonstantin Belousov 	    ("dmar %p ctx %p refs %u", dmar, ctx, ctx->refs));
58286be9f0dSKonstantin Belousov 
58386be9f0dSKonstantin Belousov 	/*
58486be9f0dSKonstantin Belousov 	 * If our reference is not last, only the dereference should
58586be9f0dSKonstantin Belousov 	 * be performed.
58686be9f0dSKonstantin Belousov 	 */
58786be9f0dSKonstantin Belousov 	if (ctx->refs > 1) {
58886be9f0dSKonstantin Belousov 		ctx->refs--;
58986be9f0dSKonstantin Belousov 		DMAR_UNLOCK(dmar);
59086be9f0dSKonstantin Belousov 		return;
59186be9f0dSKonstantin Belousov 	}
59286be9f0dSKonstantin Belousov 
59386be9f0dSKonstantin Belousov 	KASSERT((ctx->flags & DMAR_CTX_DISABLED) == 0,
59486be9f0dSKonstantin Belousov 	    ("lost ref on disabled ctx %p", ctx));
59586be9f0dSKonstantin Belousov 
59686be9f0dSKonstantin Belousov 	/*
59786be9f0dSKonstantin Belousov 	 * Otherwise, the context entry must be cleared before the
59886be9f0dSKonstantin Belousov 	 * page table is destroyed.  The mapping of the context
59986be9f0dSKonstantin Belousov 	 * entries page could require sleep, unlock the dmar.
60086be9f0dSKonstantin Belousov 	 */
60186be9f0dSKonstantin Belousov 	DMAR_UNLOCK(dmar);
60286be9f0dSKonstantin Belousov 	TD_PREP_PINNED_ASSERT;
60386be9f0dSKonstantin Belousov 	ctxp = dmar_map_ctx_entry(ctx, &sf);
60486be9f0dSKonstantin Belousov 	DMAR_LOCK(dmar);
60586be9f0dSKonstantin Belousov 	KASSERT(ctx->refs >= 1,
60686be9f0dSKonstantin Belousov 	    ("dmar %p ctx %p refs %u", dmar, ctx, ctx->refs));
60786be9f0dSKonstantin Belousov 
60886be9f0dSKonstantin Belousov 	/*
60986be9f0dSKonstantin Belousov 	 * Other thread might have referenced the context, in which
61086be9f0dSKonstantin Belousov 	 * case again only the dereference should be performed.
61186be9f0dSKonstantin Belousov 	 */
61286be9f0dSKonstantin Belousov 	if (ctx->refs > 1) {
61386be9f0dSKonstantin Belousov 		ctx->refs--;
61486be9f0dSKonstantin Belousov 		DMAR_UNLOCK(dmar);
6156b7c46afSKonstantin Belousov 		dmar_unmap_pgtbl(sf);
61686be9f0dSKonstantin Belousov 		TD_PINNED_ASSERT;
61786be9f0dSKonstantin Belousov 		return;
61886be9f0dSKonstantin Belousov 	}
61986be9f0dSKonstantin Belousov 
62086be9f0dSKonstantin Belousov 	KASSERT((ctx->flags & DMAR_CTX_DISABLED) == 0,
62186be9f0dSKonstantin Belousov 	    ("lost ref on disabled ctx %p", ctx));
62286be9f0dSKonstantin Belousov 
62386be9f0dSKonstantin Belousov 	/*
62486be9f0dSKonstantin Belousov 	 * Clear the context pointer and flush the caches.
62586be9f0dSKonstantin Belousov 	 * XXXKIB: cannot do this if any RMRR entries are still present.
62686be9f0dSKonstantin Belousov 	 */
62786be9f0dSKonstantin Belousov 	dmar_pte_clear(&ctxp->ctx1);
62886be9f0dSKonstantin Belousov 	ctxp->ctx2 = 0;
6296b7c46afSKonstantin Belousov 	dmar_flush_ctx_to_ram(dmar, ctxp);
63086be9f0dSKonstantin Belousov 	dmar_inv_ctx_glob(dmar);
63168eeb96aSKonstantin Belousov 	if ((dmar->hw_ecap & DMAR_ECAP_DI) != 0) {
63268eeb96aSKonstantin Belousov 		if (dmar->qi_enabled)
63368eeb96aSKonstantin Belousov 			dmar_qi_invalidate_iotlb_glob_locked(dmar);
63468eeb96aSKonstantin Belousov 		else
63586be9f0dSKonstantin Belousov 			dmar_inv_iotlb_glob(dmar);
63668eeb96aSKonstantin Belousov 	}
6376b7c46afSKonstantin Belousov 	dmar_unmap_pgtbl(sf);
6381abfd355SKonstantin Belousov 	domain = ctx->domain;
6391abfd355SKonstantin Belousov 	dmar_ctx_unlink(ctx);
6401abfd355SKonstantin Belousov 	free(ctx, M_DMAR_CTX);
6411abfd355SKonstantin Belousov 	dmar_unref_domain_locked(dmar, domain);
64286be9f0dSKonstantin Belousov 	TD_PINNED_ASSERT;
64386be9f0dSKonstantin Belousov }
64486be9f0dSKonstantin Belousov 
64586be9f0dSKonstantin Belousov void
64686be9f0dSKonstantin Belousov dmar_free_ctx(struct dmar_ctx *ctx)
64786be9f0dSKonstantin Belousov {
64886be9f0dSKonstantin Belousov 	struct dmar_unit *dmar;
64986be9f0dSKonstantin Belousov 
6501abfd355SKonstantin Belousov 	dmar = ctx->domain->dmar;
65186be9f0dSKonstantin Belousov 	DMAR_LOCK(dmar);
65286be9f0dSKonstantin Belousov 	dmar_free_ctx_locked(dmar, ctx);
65386be9f0dSKonstantin Belousov }
65486be9f0dSKonstantin Belousov 
6551abfd355SKonstantin Belousov /*
6561abfd355SKonstantin Belousov  * Returns with the domain locked.
6571abfd355SKonstantin Belousov  */
65886be9f0dSKonstantin Belousov struct dmar_ctx *
65967499354SRyan Stone dmar_find_ctx_locked(struct dmar_unit *dmar, uint16_t rid)
66086be9f0dSKonstantin Belousov {
6611abfd355SKonstantin Belousov 	struct dmar_domain *domain;
66286be9f0dSKonstantin Belousov 	struct dmar_ctx *ctx;
66386be9f0dSKonstantin Belousov 
66486be9f0dSKonstantin Belousov 	DMAR_ASSERT_LOCKED(dmar);
66586be9f0dSKonstantin Belousov 
6661abfd355SKonstantin Belousov 	LIST_FOREACH(domain, &dmar->domains, link) {
6671abfd355SKonstantin Belousov 		LIST_FOREACH(ctx, &domain->contexts, link) {
66867499354SRyan Stone 			if (ctx->rid == rid)
66986be9f0dSKonstantin Belousov 				return (ctx);
67086be9f0dSKonstantin Belousov 		}
6711abfd355SKonstantin Belousov 	}
67286be9f0dSKonstantin Belousov 	return (NULL);
67386be9f0dSKonstantin Belousov }
67486be9f0dSKonstantin Belousov 
67586be9f0dSKonstantin Belousov void
6761abfd355SKonstantin Belousov dmar_domain_free_entry(struct dmar_map_entry *entry, bool free)
67768eeb96aSKonstantin Belousov {
6781abfd355SKonstantin Belousov 	struct dmar_domain *domain;
67968eeb96aSKonstantin Belousov 
6801abfd355SKonstantin Belousov 	domain = entry->domain;
6811abfd355SKonstantin Belousov 	DMAR_DOMAIN_LOCK(domain);
68268eeb96aSKonstantin Belousov 	if ((entry->flags & DMAR_MAP_ENTRY_RMRR) != 0)
6831abfd355SKonstantin Belousov 		dmar_gas_free_region(domain, entry);
68468eeb96aSKonstantin Belousov 	else
6851abfd355SKonstantin Belousov 		dmar_gas_free_space(domain, entry);
6861abfd355SKonstantin Belousov 	DMAR_DOMAIN_UNLOCK(domain);
68768eeb96aSKonstantin Belousov 	if (free)
6881abfd355SKonstantin Belousov 		dmar_gas_free_entry(domain, entry);
68968eeb96aSKonstantin Belousov 	else
69068eeb96aSKonstantin Belousov 		entry->flags = 0;
69168eeb96aSKonstantin Belousov }
69268eeb96aSKonstantin Belousov 
69368eeb96aSKonstantin Belousov void
6941abfd355SKonstantin Belousov dmar_domain_unload_entry(struct dmar_map_entry *entry, bool free)
69568eeb96aSKonstantin Belousov {
69668eeb96aSKonstantin Belousov 	struct dmar_unit *unit;
69768eeb96aSKonstantin Belousov 
6981abfd355SKonstantin Belousov 	unit = entry->domain->dmar;
69968eeb96aSKonstantin Belousov 	if (unit->qi_enabled) {
70068eeb96aSKonstantin Belousov 		DMAR_LOCK(unit);
7011abfd355SKonstantin Belousov 		dmar_qi_invalidate_locked(entry->domain, entry->start,
70268eeb96aSKonstantin Belousov 		    entry->end - entry->start, &entry->gseq);
70368eeb96aSKonstantin Belousov 		if (!free)
70468eeb96aSKonstantin Belousov 			entry->flags |= DMAR_MAP_ENTRY_QI_NF;
70568eeb96aSKonstantin Belousov 		TAILQ_INSERT_TAIL(&unit->tlb_flush_entries, entry, dmamap_link);
70668eeb96aSKonstantin Belousov 		DMAR_UNLOCK(unit);
70768eeb96aSKonstantin Belousov 	} else {
7081abfd355SKonstantin Belousov 		domain_flush_iotlb_sync(entry->domain, entry->start,
7091abfd355SKonstantin Belousov 		    entry->end - entry->start);
7101abfd355SKonstantin Belousov 		dmar_domain_free_entry(entry, free);
71168eeb96aSKonstantin Belousov 	}
71268eeb96aSKonstantin Belousov }
71368eeb96aSKonstantin Belousov 
714*e164cafcSKonstantin Belousov static struct dmar_qi_genseq *
715*e164cafcSKonstantin Belousov dmar_domain_unload_gseq(struct dmar_domain *domain,
716*e164cafcSKonstantin Belousov     struct dmar_map_entry *entry, struct dmar_qi_genseq *gseq)
717*e164cafcSKonstantin Belousov {
718*e164cafcSKonstantin Belousov 
719*e164cafcSKonstantin Belousov 	if (TAILQ_NEXT(entry, dmamap_link) != NULL)
720*e164cafcSKonstantin Belousov 		return (NULL);
721*e164cafcSKonstantin Belousov 	if (domain->batch_no++ % dmar_batch_coalesce != 0)
722*e164cafcSKonstantin Belousov 		return (NULL);
723*e164cafcSKonstantin Belousov 	return (gseq);
724*e164cafcSKonstantin Belousov }
725*e164cafcSKonstantin Belousov 
72668eeb96aSKonstantin Belousov void
7271abfd355SKonstantin Belousov dmar_domain_unload(struct dmar_domain *domain,
7281abfd355SKonstantin Belousov     struct dmar_map_entries_tailq *entries, bool cansleep)
72986be9f0dSKonstantin Belousov {
73068eeb96aSKonstantin Belousov 	struct dmar_unit *unit;
73168eeb96aSKonstantin Belousov 	struct dmar_map_entry *entry, *entry1;
73268eeb96aSKonstantin Belousov 	struct dmar_qi_genseq gseq;
73386be9f0dSKonstantin Belousov 	int error;
73486be9f0dSKonstantin Belousov 
7351abfd355SKonstantin Belousov 	unit = domain->dmar;
73668eeb96aSKonstantin Belousov 
73768eeb96aSKonstantin Belousov 	TAILQ_FOREACH_SAFE(entry, entries, dmamap_link, entry1) {
73886be9f0dSKonstantin Belousov 		KASSERT((entry->flags & DMAR_MAP_ENTRY_MAP) != 0,
7391abfd355SKonstantin Belousov 		    ("not mapped entry %p %p", domain, entry));
7401abfd355SKonstantin Belousov 		error = domain_unmap_buf(domain, entry->start, entry->end -
74186be9f0dSKonstantin Belousov 		    entry->start, cansleep ? DMAR_PGF_WAITOK : 0);
7421abfd355SKonstantin Belousov 		KASSERT(error == 0, ("unmap %p error %d", domain, error));
74368eeb96aSKonstantin Belousov 		if (!unit->qi_enabled) {
7441abfd355SKonstantin Belousov 			domain_flush_iotlb_sync(domain, entry->start,
74568eeb96aSKonstantin Belousov 			    entry->end - entry->start);
74668eeb96aSKonstantin Belousov 			TAILQ_REMOVE(entries, entry, dmamap_link);
7471abfd355SKonstantin Belousov 			dmar_domain_free_entry(entry, true);
74886be9f0dSKonstantin Belousov 		}
74986be9f0dSKonstantin Belousov 	}
75068eeb96aSKonstantin Belousov 	if (TAILQ_EMPTY(entries))
75168eeb96aSKonstantin Belousov 		return;
75268eeb96aSKonstantin Belousov 
75368eeb96aSKonstantin Belousov 	KASSERT(unit->qi_enabled, ("loaded entry left"));
75468eeb96aSKonstantin Belousov 	DMAR_LOCK(unit);
75568eeb96aSKonstantin Belousov 	TAILQ_FOREACH(entry, entries, dmamap_link) {
75668eeb96aSKonstantin Belousov 		entry->gseq.gen = 0;
75768eeb96aSKonstantin Belousov 		entry->gseq.seq = 0;
7581abfd355SKonstantin Belousov 		dmar_qi_invalidate_locked(domain, entry->start, entry->end -
759*e164cafcSKonstantin Belousov 		    entry->start, dmar_domain_unload_gseq(domain, entry,
760*e164cafcSKonstantin Belousov 		    &gseq));
76168eeb96aSKonstantin Belousov 	}
76268eeb96aSKonstantin Belousov 	TAILQ_FOREACH_SAFE(entry, entries, dmamap_link, entry1) {
76368eeb96aSKonstantin Belousov 		entry->gseq = gseq;
76468eeb96aSKonstantin Belousov 		TAILQ_REMOVE(entries, entry, dmamap_link);
76568eeb96aSKonstantin Belousov 		TAILQ_INSERT_TAIL(&unit->tlb_flush_entries, entry, dmamap_link);
76668eeb96aSKonstantin Belousov 	}
76768eeb96aSKonstantin Belousov 	DMAR_UNLOCK(unit);
76868eeb96aSKonstantin Belousov }
76986be9f0dSKonstantin Belousov 
77086be9f0dSKonstantin Belousov static void
7711abfd355SKonstantin Belousov dmar_domain_unload_task(void *arg, int pending)
77286be9f0dSKonstantin Belousov {
7731abfd355SKonstantin Belousov 	struct dmar_domain *domain;
77486be9f0dSKonstantin Belousov 	struct dmar_map_entries_tailq entries;
77586be9f0dSKonstantin Belousov 
7761abfd355SKonstantin Belousov 	domain = arg;
77786be9f0dSKonstantin Belousov 	TAILQ_INIT(&entries);
77886be9f0dSKonstantin Belousov 
77986be9f0dSKonstantin Belousov 	for (;;) {
7801abfd355SKonstantin Belousov 		DMAR_DOMAIN_LOCK(domain);
7811abfd355SKonstantin Belousov 		TAILQ_SWAP(&domain->unload_entries, &entries, dmar_map_entry,
78286be9f0dSKonstantin Belousov 		    dmamap_link);
7831abfd355SKonstantin Belousov 		DMAR_DOMAIN_UNLOCK(domain);
78486be9f0dSKonstantin Belousov 		if (TAILQ_EMPTY(&entries))
78586be9f0dSKonstantin Belousov 			break;
7861abfd355SKonstantin Belousov 		dmar_domain_unload(domain, &entries, true);
78786be9f0dSKonstantin Belousov 	}
78886be9f0dSKonstantin Belousov }
789