xref: /freebsd/sys/x86/iommu/intel_ctx.c (revision cb9050dd21b28f6e735649556ca63d09c4ba4efb)
186be9f0dSKonstantin Belousov /*-
2ebf5747bSPedro F. Giffuni  * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
3ebf5747bSPedro F. Giffuni  *
486be9f0dSKonstantin Belousov  * Copyright (c) 2013 The FreeBSD Foundation
586be9f0dSKonstantin Belousov  * All rights reserved.
686be9f0dSKonstantin Belousov  *
786be9f0dSKonstantin Belousov  * This software was developed by Konstantin Belousov <kib@FreeBSD.org>
886be9f0dSKonstantin Belousov  * under sponsorship from the FreeBSD Foundation.
986be9f0dSKonstantin Belousov  *
1086be9f0dSKonstantin Belousov  * Redistribution and use in source and binary forms, with or without
1186be9f0dSKonstantin Belousov  * modification, are permitted provided that the following conditions
1286be9f0dSKonstantin Belousov  * are met:
1386be9f0dSKonstantin Belousov  * 1. Redistributions of source code must retain the above copyright
1486be9f0dSKonstantin Belousov  *    notice, this list of conditions and the following disclaimer.
1586be9f0dSKonstantin Belousov  * 2. Redistributions in binary form must reproduce the above copyright
1686be9f0dSKonstantin Belousov  *    notice, this list of conditions and the following disclaimer in the
1786be9f0dSKonstantin Belousov  *    documentation and/or other materials provided with the distribution.
1886be9f0dSKonstantin Belousov  *
1986be9f0dSKonstantin Belousov  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
2086be9f0dSKonstantin Belousov  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
2186be9f0dSKonstantin Belousov  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
2286be9f0dSKonstantin Belousov  * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
2386be9f0dSKonstantin Belousov  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
2486be9f0dSKonstantin Belousov  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
2586be9f0dSKonstantin Belousov  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
2686be9f0dSKonstantin Belousov  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
2786be9f0dSKonstantin Belousov  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
2886be9f0dSKonstantin Belousov  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
2986be9f0dSKonstantin Belousov  * SUCH DAMAGE.
3086be9f0dSKonstantin Belousov  */
3186be9f0dSKonstantin Belousov 
3286be9f0dSKonstantin Belousov #include <sys/cdefs.h>
3386be9f0dSKonstantin Belousov __FBSDID("$FreeBSD$");
3486be9f0dSKonstantin Belousov 
3586be9f0dSKonstantin Belousov #include <sys/param.h>
3686be9f0dSKonstantin Belousov #include <sys/systm.h>
3786be9f0dSKonstantin Belousov #include <sys/malloc.h>
3886be9f0dSKonstantin Belousov #include <sys/bus.h>
3986be9f0dSKonstantin Belousov #include <sys/interrupt.h>
4086be9f0dSKonstantin Belousov #include <sys/kernel.h>
4186be9f0dSKonstantin Belousov #include <sys/ktr.h>
4286be9f0dSKonstantin Belousov #include <sys/limits.h>
4386be9f0dSKonstantin Belousov #include <sys/lock.h>
4486be9f0dSKonstantin Belousov #include <sys/memdesc.h>
4586be9f0dSKonstantin Belousov #include <sys/mutex.h>
4686be9f0dSKonstantin Belousov #include <sys/proc.h>
4786be9f0dSKonstantin Belousov #include <sys/rwlock.h>
4886be9f0dSKonstantin Belousov #include <sys/rman.h>
4986be9f0dSKonstantin Belousov #include <sys/sysctl.h>
5086be9f0dSKonstantin Belousov #include <sys/taskqueue.h>
5186be9f0dSKonstantin Belousov #include <sys/tree.h>
5286be9f0dSKonstantin Belousov #include <sys/uio.h>
530a110d5bSKonstantin Belousov #include <sys/vmem.h>
5486be9f0dSKonstantin Belousov #include <vm/vm.h>
5586be9f0dSKonstantin Belousov #include <vm/vm_extern.h>
5686be9f0dSKonstantin Belousov #include <vm/vm_kern.h>
5786be9f0dSKonstantin Belousov #include <vm/vm_object.h>
5886be9f0dSKonstantin Belousov #include <vm/vm_page.h>
5986be9f0dSKonstantin Belousov #include <vm/vm_pager.h>
6086be9f0dSKonstantin Belousov #include <vm/vm_map.h>
61c8597a1fSRuslan Bukin #include <contrib/dev/acpica/include/acpi.h>
62c8597a1fSRuslan Bukin #include <contrib/dev/acpica/include/accommon.h>
63c8597a1fSRuslan Bukin #include <dev/pci/pcireg.h>
64c8597a1fSRuslan Bukin #include <dev/pci/pcivar.h>
6586be9f0dSKonstantin Belousov #include <machine/atomic.h>
6686be9f0dSKonstantin Belousov #include <machine/bus.h>
6786be9f0dSKonstantin Belousov #include <machine/md_var.h>
6886be9f0dSKonstantin Belousov #include <machine/specialreg.h>
6986be9f0dSKonstantin Belousov #include <x86/include/busdma_impl.h>
70f2b2f317SRuslan Bukin #include <dev/iommu/busdma_iommu.h>
71c8597a1fSRuslan Bukin #include <x86/iommu/intel_reg.h>
72685666aaSKonstantin Belousov #include <x86/iommu/intel_dmar.h>
7386be9f0dSKonstantin Belousov 
7486be9f0dSKonstantin Belousov static MALLOC_DEFINE(M_DMAR_CTX, "dmar_ctx", "Intel DMAR Context");
751abfd355SKonstantin Belousov static MALLOC_DEFINE(M_DMAR_DOMAIN, "dmar_dom", "Intel DMAR Domain");
7686be9f0dSKonstantin Belousov 
771abfd355SKonstantin Belousov static void dmar_unref_domain_locked(struct dmar_unit *dmar,
781abfd355SKonstantin Belousov     struct dmar_domain *domain);
791abfd355SKonstantin Belousov static void dmar_domain_destroy(struct dmar_domain *domain);
8086be9f0dSKonstantin Belousov 
8186be9f0dSKonstantin Belousov static void
8286be9f0dSKonstantin Belousov dmar_ensure_ctx_page(struct dmar_unit *dmar, int bus)
8386be9f0dSKonstantin Belousov {
8486be9f0dSKonstantin Belousov 	struct sf_buf *sf;
8586be9f0dSKonstantin Belousov 	dmar_root_entry_t *re;
8686be9f0dSKonstantin Belousov 	vm_page_t ctxm;
8786be9f0dSKonstantin Belousov 
8886be9f0dSKonstantin Belousov 	/*
8986be9f0dSKonstantin Belousov 	 * Allocated context page must be linked.
9086be9f0dSKonstantin Belousov 	 */
9115f6baf4SRuslan Bukin 	ctxm = dmar_pgalloc(dmar->ctx_obj, 1 + bus, IOMMU_PGF_NOALLOC);
9286be9f0dSKonstantin Belousov 	if (ctxm != NULL)
9386be9f0dSKonstantin Belousov 		return;
9486be9f0dSKonstantin Belousov 
9586be9f0dSKonstantin Belousov 	/*
9686be9f0dSKonstantin Belousov 	 * Page not present, allocate and link.  Note that other
9786be9f0dSKonstantin Belousov 	 * thread might execute this sequence in parallel.  This
9886be9f0dSKonstantin Belousov 	 * should be safe, because the context entries written by both
9986be9f0dSKonstantin Belousov 	 * threads are equal.
10086be9f0dSKonstantin Belousov 	 */
10186be9f0dSKonstantin Belousov 	TD_PREP_PINNED_ASSERT;
10215f6baf4SRuslan Bukin 	ctxm = dmar_pgalloc(dmar->ctx_obj, 1 + bus, IOMMU_PGF_ZERO |
10315f6baf4SRuslan Bukin 	    IOMMU_PGF_WAITOK);
10415f6baf4SRuslan Bukin 	re = dmar_map_pgtbl(dmar->ctx_obj, 0, IOMMU_PGF_NOALLOC, &sf);
10586be9f0dSKonstantin Belousov 	re += bus;
10686be9f0dSKonstantin Belousov 	dmar_pte_store(&re->r1, DMAR_ROOT_R1_P | (DMAR_ROOT_R1_CTP_MASK &
10786be9f0dSKonstantin Belousov 	    VM_PAGE_TO_PHYS(ctxm)));
1086b7c46afSKonstantin Belousov 	dmar_flush_root_to_ram(dmar, re);
1096b7c46afSKonstantin Belousov 	dmar_unmap_pgtbl(sf);
11086be9f0dSKonstantin Belousov 	TD_PINNED_ASSERT;
11186be9f0dSKonstantin Belousov }
11286be9f0dSKonstantin Belousov 
11386be9f0dSKonstantin Belousov static dmar_ctx_entry_t *
11486be9f0dSKonstantin Belousov dmar_map_ctx_entry(struct dmar_ctx *ctx, struct sf_buf **sfp)
11586be9f0dSKonstantin Belousov {
11659e37c8aSRuslan Bukin 	struct dmar_unit *dmar;
11786be9f0dSKonstantin Belousov 	dmar_ctx_entry_t *ctxp;
11886be9f0dSKonstantin Belousov 
11978b51754SRuslan Bukin 	dmar = CTX2DMAR(ctx);
12059e37c8aSRuslan Bukin 
121*cb9050ddSRuslan Bukin 	ctxp = dmar_map_pgtbl(dmar->ctx_obj, 1 + PCI_RID2BUS(ctx->context.rid),
122*cb9050ddSRuslan Bukin 	    IOMMU_PGF_NOALLOC | IOMMU_PGF_WAITOK, sfp);
123*cb9050ddSRuslan Bukin 	ctxp += ctx->context.rid & 0xff;
12486be9f0dSKonstantin Belousov 	return (ctxp);
12586be9f0dSKonstantin Belousov }
12686be9f0dSKonstantin Belousov 
12786be9f0dSKonstantin Belousov static void
12859e37c8aSRuslan Bukin device_tag_init(struct dmar_ctx *ctx, device_t dev)
12986be9f0dSKonstantin Belousov {
13059e37c8aSRuslan Bukin 	struct dmar_domain *domain;
13186be9f0dSKonstantin Belousov 	bus_addr_t maxaddr;
13286be9f0dSKonstantin Belousov 
13378b51754SRuslan Bukin 	domain = CTX2DOM(ctx);
13462ad310cSRuslan Bukin 	maxaddr = MIN(domain->iodom.end, BUS_SPACE_MAXADDR);
13559e37c8aSRuslan Bukin 	ctx->context.tag->common.ref_count = 1; /* Prevent free */
13659e37c8aSRuslan Bukin 	ctx->context.tag->common.impl = &bus_dma_iommu_impl;
13759e37c8aSRuslan Bukin 	ctx->context.tag->common.boundary = 0;
13859e37c8aSRuslan Bukin 	ctx->context.tag->common.lowaddr = maxaddr;
13959e37c8aSRuslan Bukin 	ctx->context.tag->common.highaddr = maxaddr;
14059e37c8aSRuslan Bukin 	ctx->context.tag->common.maxsize = maxaddr;
14159e37c8aSRuslan Bukin 	ctx->context.tag->common.nsegments = BUS_SPACE_UNRESTRICTED;
14259e37c8aSRuslan Bukin 	ctx->context.tag->common.maxsegsz = maxaddr;
14378b51754SRuslan Bukin 	ctx->context.tag->ctx = CTX2IOCTX(ctx);
14459e37c8aSRuslan Bukin 	ctx->context.tag->owner = dev;
14586be9f0dSKonstantin Belousov }
14686be9f0dSKonstantin Belousov 
14786be9f0dSKonstantin Belousov static void
148685666aaSKonstantin Belousov ctx_id_entry_init_one(dmar_ctx_entry_t *ctxp, struct dmar_domain *domain,
149685666aaSKonstantin Belousov     vm_page_t ctx_root)
15086be9f0dSKonstantin Belousov {
1511abfd355SKonstantin Belousov 	/*
1521abfd355SKonstantin Belousov 	 * For update due to move, the store is not atomic.  It is
1531abfd355SKonstantin Belousov 	 * possible that DMAR read upper doubleword, while low
1541abfd355SKonstantin Belousov 	 * doubleword is not yet updated.  The domain id is stored in
1551abfd355SKonstantin Belousov 	 * the upper doubleword, while the table pointer in the lower.
1561abfd355SKonstantin Belousov 	 *
1571abfd355SKonstantin Belousov 	 * There is no good solution, for the same reason it is wrong
1581abfd355SKonstantin Belousov 	 * to clear P bit in the ctx entry for update.
1591abfd355SKonstantin Belousov 	 */
1601abfd355SKonstantin Belousov 	dmar_pte_store1(&ctxp->ctx2, DMAR_CTX2_DID(domain->domain) |
1611abfd355SKonstantin Belousov 	    domain->awlvl);
162685666aaSKonstantin Belousov 	if (ctx_root == NULL) {
163685666aaSKonstantin Belousov 		dmar_pte_store1(&ctxp->ctx1, DMAR_CTX1_T_PASS | DMAR_CTX1_P);
164685666aaSKonstantin Belousov 	} else {
165685666aaSKonstantin Belousov 		dmar_pte_store1(&ctxp->ctx1, DMAR_CTX1_T_UNTR |
166685666aaSKonstantin Belousov 		    (DMAR_CTX1_ASR_MASK & VM_PAGE_TO_PHYS(ctx_root)) |
167685666aaSKonstantin Belousov 		    DMAR_CTX1_P);
168685666aaSKonstantin Belousov 	}
169685666aaSKonstantin Belousov }
170685666aaSKonstantin Belousov 
171685666aaSKonstantin Belousov static void
172685666aaSKonstantin Belousov ctx_id_entry_init(struct dmar_ctx *ctx, dmar_ctx_entry_t *ctxp, bool move,
173685666aaSKonstantin Belousov     int busno)
174685666aaSKonstantin Belousov {
175685666aaSKonstantin Belousov 	struct dmar_unit *unit;
176685666aaSKonstantin Belousov 	struct dmar_domain *domain;
177685666aaSKonstantin Belousov 	vm_page_t ctx_root;
178685666aaSKonstantin Belousov 	int i;
179685666aaSKonstantin Belousov 
18078b51754SRuslan Bukin 	domain = CTX2DOM(ctx);
18178b51754SRuslan Bukin 	unit = DOM2DMAR(domain);
182685666aaSKonstantin Belousov 	KASSERT(move || (ctxp->ctx1 == 0 && ctxp->ctx2 == 0),
183685666aaSKonstantin Belousov 	    ("dmar%d: initialized ctx entry %d:%d:%d 0x%jx 0x%jx",
18459e37c8aSRuslan Bukin 	    unit->iommu.unit, busno, pci_get_slot(ctx->context.tag->owner),
18559e37c8aSRuslan Bukin 	    pci_get_function(ctx->context.tag->owner),
186685666aaSKonstantin Belousov 	    ctxp->ctx1, ctxp->ctx2));
187685666aaSKonstantin Belousov 
18815f6baf4SRuslan Bukin 	if ((domain->iodom.flags & IOMMU_DOMAIN_IDMAP) != 0 &&
18986be9f0dSKonstantin Belousov 	    (unit->hw_ecap & DMAR_ECAP_PT) != 0) {
1901abfd355SKonstantin Belousov 		KASSERT(domain->pgtbl_obj == NULL,
19186be9f0dSKonstantin Belousov 		    ("ctx %p non-null pgtbl_obj", ctx));
192685666aaSKonstantin Belousov 		ctx_root = NULL;
19386be9f0dSKonstantin Belousov 	} else {
19415f6baf4SRuslan Bukin 		ctx_root = dmar_pgalloc(domain->pgtbl_obj, 0,
19515f6baf4SRuslan Bukin 		    IOMMU_PGF_NOALLOC);
196685666aaSKonstantin Belousov 	}
197685666aaSKonstantin Belousov 
19878b51754SRuslan Bukin 	if (iommu_is_buswide_ctx(DMAR2IOMMU(unit), busno)) {
199685666aaSKonstantin Belousov 		MPASS(!move);
200685666aaSKonstantin Belousov 		for (i = 0; i <= PCI_BUSMAX; i++) {
201685666aaSKonstantin Belousov 			ctx_id_entry_init_one(&ctxp[i], domain, ctx_root);
202685666aaSKonstantin Belousov 		}
203685666aaSKonstantin Belousov 	} else {
204685666aaSKonstantin Belousov 		ctx_id_entry_init_one(ctxp, domain, ctx_root);
20586be9f0dSKonstantin Belousov 	}
2066b7c46afSKonstantin Belousov 	dmar_flush_ctx_to_ram(unit, ctxp);
20786be9f0dSKonstantin Belousov }
20886be9f0dSKonstantin Belousov 
20986be9f0dSKonstantin Belousov static int
2101abfd355SKonstantin Belousov dmar_flush_for_ctx_entry(struct dmar_unit *dmar, bool force)
2111abfd355SKonstantin Belousov {
2121abfd355SKonstantin Belousov 	int error;
2131abfd355SKonstantin Belousov 
2141abfd355SKonstantin Belousov 	/*
2151abfd355SKonstantin Belousov 	 * If dmar declares Caching Mode as Set, follow 11.5 "Caching
2161abfd355SKonstantin Belousov 	 * Mode Consideration" and do the (global) invalidation of the
2171abfd355SKonstantin Belousov 	 * negative TLB entries.
2181abfd355SKonstantin Belousov 	 */
2191abfd355SKonstantin Belousov 	if ((dmar->hw_cap & DMAR_CAP_CM) == 0 && !force)
2201abfd355SKonstantin Belousov 		return (0);
2211abfd355SKonstantin Belousov 	if (dmar->qi_enabled) {
2221abfd355SKonstantin Belousov 		dmar_qi_invalidate_ctx_glob_locked(dmar);
2231abfd355SKonstantin Belousov 		if ((dmar->hw_ecap & DMAR_ECAP_DI) != 0 || force)
2241abfd355SKonstantin Belousov 			dmar_qi_invalidate_iotlb_glob_locked(dmar);
2251abfd355SKonstantin Belousov 		return (0);
2261abfd355SKonstantin Belousov 	}
2271abfd355SKonstantin Belousov 	error = dmar_inv_ctx_glob(dmar);
2281abfd355SKonstantin Belousov 	if (error == 0 && ((dmar->hw_ecap & DMAR_ECAP_DI) != 0 || force))
2291abfd355SKonstantin Belousov 		error = dmar_inv_iotlb_glob(dmar);
2301abfd355SKonstantin Belousov 	return (error);
2311abfd355SKonstantin Belousov }
2321abfd355SKonstantin Belousov 
2331abfd355SKonstantin Belousov static int
234f9feb091SKonstantin Belousov domain_init_rmrr(struct dmar_domain *domain, device_t dev, int bus,
235f9feb091SKonstantin Belousov     int slot, int func, int dev_domain, int dev_busno,
236f9feb091SKonstantin Belousov     const void *dev_path, int dev_path_len)
23786be9f0dSKonstantin Belousov {
23859e37c8aSRuslan Bukin 	struct iommu_map_entries_tailq rmrr_entries;
23959e37c8aSRuslan Bukin 	struct iommu_map_entry *entry, *entry1;
24086be9f0dSKonstantin Belousov 	vm_page_t *ma;
24159e37c8aSRuslan Bukin 	iommu_gaddr_t start, end;
24286be9f0dSKonstantin Belousov 	vm_pindex_t size, i;
24386be9f0dSKonstantin Belousov 	int error, error1;
24486be9f0dSKonstantin Belousov 
24586be9f0dSKonstantin Belousov 	error = 0;
24686be9f0dSKonstantin Belousov 	TAILQ_INIT(&rmrr_entries);
247f9feb091SKonstantin Belousov 	dmar_dev_parse_rmrr(domain, dev_domain, dev_busno, dev_path,
248f9feb091SKonstantin Belousov 	    dev_path_len, &rmrr_entries);
24986be9f0dSKonstantin Belousov 	TAILQ_FOREACH_SAFE(entry, &rmrr_entries, unroll_link, entry1) {
25086be9f0dSKonstantin Belousov 		/*
25186be9f0dSKonstantin Belousov 		 * VT-d specification requires that the start of an
25286be9f0dSKonstantin Belousov 		 * RMRR entry is 4k-aligned.  Buggy BIOSes put
25386be9f0dSKonstantin Belousov 		 * anything into the start and end fields.  Truncate
25486be9f0dSKonstantin Belousov 		 * and round as neccesary.
25586be9f0dSKonstantin Belousov 		 *
25686be9f0dSKonstantin Belousov 		 * We also allow the overlapping RMRR entries, see
25762ad310cSRuslan Bukin 		 * iommu_gas_alloc_region().
25886be9f0dSKonstantin Belousov 		 */
25986be9f0dSKonstantin Belousov 		start = entry->start;
26086be9f0dSKonstantin Belousov 		end = entry->end;
261f9feb091SKonstantin Belousov 		if (bootverbose)
262f9feb091SKonstantin Belousov 			printf("dmar%d ctx pci%d:%d:%d RMRR [%#jx, %#jx]\n",
26359e37c8aSRuslan Bukin 			    domain->iodom.iommu->unit, bus, slot, func,
264f9feb091SKonstantin Belousov 			    (uintmax_t)start, (uintmax_t)end);
26586be9f0dSKonstantin Belousov 		entry->start = trunc_page(start);
26686be9f0dSKonstantin Belousov 		entry->end = round_page(end);
267e02b05b3SKonstantin Belousov 		if (entry->start == entry->end) {
268e02b05b3SKonstantin Belousov 			/* Workaround for some AMI (?) BIOSes */
269e02b05b3SKonstantin Belousov 			if (bootverbose) {
270f9feb091SKonstantin Belousov 				if (dev != NULL)
271f9feb091SKonstantin Belousov 					device_printf(dev, "");
272f9feb091SKonstantin Belousov 				printf("pci%d:%d:%d ", bus, slot, func);
273f9feb091SKonstantin Belousov 				printf("BIOS bug: dmar%d RMRR "
274e02b05b3SKonstantin Belousov 				    "region (%jx, %jx) corrected\n",
27559e37c8aSRuslan Bukin 				    domain->iodom.iommu->unit, start, end);
276e02b05b3SKonstantin Belousov 			}
277e02b05b3SKonstantin Belousov 			entry->end += DMAR_PAGE_SIZE * 0x20;
278e02b05b3SKonstantin Belousov 		}
27986be9f0dSKonstantin Belousov 		size = OFF_TO_IDX(entry->end - entry->start);
28086be9f0dSKonstantin Belousov 		ma = malloc(sizeof(vm_page_t) * size, M_TEMP, M_WAITOK);
28186be9f0dSKonstantin Belousov 		for (i = 0; i < size; i++) {
28286be9f0dSKonstantin Belousov 			ma[i] = vm_page_getfake(entry->start + PAGE_SIZE * i,
28386be9f0dSKonstantin Belousov 			    VM_MEMATTR_DEFAULT);
28486be9f0dSKonstantin Belousov 		}
28578b51754SRuslan Bukin 		error1 = iommu_gas_map_region(DOM2IODOM(domain), entry,
28659e37c8aSRuslan Bukin 		    IOMMU_MAP_ENTRY_READ | IOMMU_MAP_ENTRY_WRITE,
28759e37c8aSRuslan Bukin 		    IOMMU_MF_CANWAIT | IOMMU_MF_RMRR, ma);
28886be9f0dSKonstantin Belousov 		/*
28986be9f0dSKonstantin Belousov 		 * Non-failed RMRR entries are owned by context rb
29086be9f0dSKonstantin Belousov 		 * tree.  Get rid of the failed entry, but do not stop
29186be9f0dSKonstantin Belousov 		 * the loop.  Rest of the parsed RMRR entries are
29286be9f0dSKonstantin Belousov 		 * loaded and removed on the context destruction.
29386be9f0dSKonstantin Belousov 		 */
29486be9f0dSKonstantin Belousov 		if (error1 == 0 && entry->end != entry->start) {
29559e37c8aSRuslan Bukin 			IOMMU_LOCK(domain->iodom.iommu);
2961abfd355SKonstantin Belousov 			domain->refs++; /* XXXKIB prevent free */
29715f6baf4SRuslan Bukin 			domain->iodom.flags |= IOMMU_DOMAIN_RMRR;
29859e37c8aSRuslan Bukin 			IOMMU_UNLOCK(domain->iodom.iommu);
29986be9f0dSKonstantin Belousov 		} else {
30086be9f0dSKonstantin Belousov 			if (error1 != 0) {
301f9feb091SKonstantin Belousov 				if (dev != NULL)
302f9feb091SKonstantin Belousov 					device_printf(dev, "");
303f9feb091SKonstantin Belousov 				printf("pci%d:%d:%d ", bus, slot, func);
304f9feb091SKonstantin Belousov 				printf(
30586be9f0dSKonstantin Belousov 			    "dmar%d failed to map RMRR region (%jx, %jx) %d\n",
30659e37c8aSRuslan Bukin 				    domain->iodom.iommu->unit, start, end,
307f9feb091SKonstantin Belousov 				    error1);
30886be9f0dSKonstantin Belousov 				error = error1;
30986be9f0dSKonstantin Belousov 			}
31086be9f0dSKonstantin Belousov 			TAILQ_REMOVE(&rmrr_entries, entry, unroll_link);
31178b51754SRuslan Bukin 			iommu_gas_free_entry(DOM2IODOM(domain), entry);
31286be9f0dSKonstantin Belousov 		}
31386be9f0dSKonstantin Belousov 		for (i = 0; i < size; i++)
31486be9f0dSKonstantin Belousov 			vm_page_putfake(ma[i]);
31586be9f0dSKonstantin Belousov 		free(ma, M_TEMP);
31686be9f0dSKonstantin Belousov 	}
31786be9f0dSKonstantin Belousov 	return (error);
31886be9f0dSKonstantin Belousov }
31986be9f0dSKonstantin Belousov 
3201abfd355SKonstantin Belousov static struct dmar_domain *
3211abfd355SKonstantin Belousov dmar_domain_alloc(struct dmar_unit *dmar, bool id_mapped)
3221abfd355SKonstantin Belousov {
32362ad310cSRuslan Bukin 	struct iommu_domain *iodom;
32416696f60SRuslan Bukin 	struct iommu_unit *unit;
3251abfd355SKonstantin Belousov 	struct dmar_domain *domain;
3261abfd355SKonstantin Belousov 	int error, id, mgaw;
3271abfd355SKonstantin Belousov 
3281abfd355SKonstantin Belousov 	id = alloc_unr(dmar->domids);
3291abfd355SKonstantin Belousov 	if (id == -1)
3301abfd355SKonstantin Belousov 		return (NULL);
3311abfd355SKonstantin Belousov 	domain = malloc(sizeof(*domain), M_DMAR_DOMAIN, M_WAITOK | M_ZERO);
33278b51754SRuslan Bukin 	iodom = DOM2IODOM(domain);
33316696f60SRuslan Bukin 	unit = DMAR2IOMMU(dmar);
3341abfd355SKonstantin Belousov 	domain->domain = id;
3351abfd355SKonstantin Belousov 	LIST_INIT(&domain->contexts);
33616696f60SRuslan Bukin 	iommu_domain_init(unit, iodom, &dmar_domain_map_ops);
33716696f60SRuslan Bukin 
3381abfd355SKonstantin Belousov 	domain->dmar = dmar;
3391abfd355SKonstantin Belousov 
3401abfd355SKonstantin Belousov 	/*
3411abfd355SKonstantin Belousov 	 * For now, use the maximal usable physical address of the
3421abfd355SKonstantin Belousov 	 * installed memory to calculate the mgaw on id_mapped domain.
3431abfd355SKonstantin Belousov 	 * It is useful for the identity mapping, and less so for the
3441abfd355SKonstantin Belousov 	 * virtualized bus address space.
3451abfd355SKonstantin Belousov 	 */
34662ad310cSRuslan Bukin 	domain->iodom.end = id_mapped ? ptoa(Maxmem) : BUS_SPACE_MAXADDR;
34762ad310cSRuslan Bukin 	mgaw = dmar_maxaddr2mgaw(dmar, domain->iodom.end, !id_mapped);
3481abfd355SKonstantin Belousov 	error = domain_set_agaw(domain, mgaw);
3491abfd355SKonstantin Belousov 	if (error != 0)
3501abfd355SKonstantin Belousov 		goto fail;
3511abfd355SKonstantin Belousov 	if (!id_mapped)
3521abfd355SKonstantin Belousov 		/* Use all supported address space for remapping. */
35362ad310cSRuslan Bukin 		domain->iodom.end = 1ULL << (domain->agaw - 1);
3541abfd355SKonstantin Belousov 
35578b51754SRuslan Bukin 	iommu_gas_init_domain(DOM2IODOM(domain));
3561abfd355SKonstantin Belousov 
3571abfd355SKonstantin Belousov 	if (id_mapped) {
3581abfd355SKonstantin Belousov 		if ((dmar->hw_ecap & DMAR_ECAP_PT) == 0) {
3591abfd355SKonstantin Belousov 			domain->pgtbl_obj = domain_get_idmap_pgtbl(domain,
36062ad310cSRuslan Bukin 			    domain->iodom.end);
3611abfd355SKonstantin Belousov 		}
36215f6baf4SRuslan Bukin 		domain->iodom.flags |= IOMMU_DOMAIN_IDMAP;
3631abfd355SKonstantin Belousov 	} else {
3641abfd355SKonstantin Belousov 		error = domain_alloc_pgtbl(domain);
3651abfd355SKonstantin Belousov 		if (error != 0)
3661abfd355SKonstantin Belousov 			goto fail;
3671abfd355SKonstantin Belousov 		/* Disable local apic region access */
36862ad310cSRuslan Bukin 		error = iommu_gas_reserve_region(iodom, 0xfee00000,
3691abfd355SKonstantin Belousov 		    0xfeefffff + 1);
3701abfd355SKonstantin Belousov 		if (error != 0)
3711abfd355SKonstantin Belousov 			goto fail;
3721abfd355SKonstantin Belousov 	}
3731abfd355SKonstantin Belousov 	return (domain);
3741abfd355SKonstantin Belousov 
3751abfd355SKonstantin Belousov fail:
3761abfd355SKonstantin Belousov 	dmar_domain_destroy(domain);
3771abfd355SKonstantin Belousov 	return (NULL);
3781abfd355SKonstantin Belousov }
3791abfd355SKonstantin Belousov 
38086be9f0dSKonstantin Belousov static struct dmar_ctx *
3811abfd355SKonstantin Belousov dmar_ctx_alloc(struct dmar_domain *domain, uint16_t rid)
38286be9f0dSKonstantin Belousov {
38386be9f0dSKonstantin Belousov 	struct dmar_ctx *ctx;
38486be9f0dSKonstantin Belousov 
38586be9f0dSKonstantin Belousov 	ctx = malloc(sizeof(*ctx), M_DMAR_CTX, M_WAITOK | M_ZERO);
38678b51754SRuslan Bukin 	ctx->context.domain = DOM2IODOM(domain);
38759e37c8aSRuslan Bukin 	ctx->context.tag = malloc(sizeof(struct bus_dma_tag_iommu),
38859e37c8aSRuslan Bukin 	    M_DMAR_CTX, M_WAITOK | M_ZERO);
389*cb9050ddSRuslan Bukin 	ctx->context.rid = rid;
3901abfd355SKonstantin Belousov 	ctx->refs = 1;
39186be9f0dSKonstantin Belousov 	return (ctx);
39286be9f0dSKonstantin Belousov }
39386be9f0dSKonstantin Belousov 
39486be9f0dSKonstantin Belousov static void
3951abfd355SKonstantin Belousov dmar_ctx_link(struct dmar_ctx *ctx)
3961abfd355SKonstantin Belousov {
3971abfd355SKonstantin Belousov 	struct dmar_domain *domain;
3981abfd355SKonstantin Belousov 
39978b51754SRuslan Bukin 	domain = CTX2DOM(ctx);
40059e37c8aSRuslan Bukin 	IOMMU_ASSERT_LOCKED(domain->iodom.iommu);
4011abfd355SKonstantin Belousov 	KASSERT(domain->refs >= domain->ctx_cnt,
4021abfd355SKonstantin Belousov 	    ("dom %p ref underflow %d %d", domain, domain->refs,
4031abfd355SKonstantin Belousov 	    domain->ctx_cnt));
4041abfd355SKonstantin Belousov 	domain->refs++;
4051abfd355SKonstantin Belousov 	domain->ctx_cnt++;
4061abfd355SKonstantin Belousov 	LIST_INSERT_HEAD(&domain->contexts, ctx, link);
4071abfd355SKonstantin Belousov }
4081abfd355SKonstantin Belousov 
4091abfd355SKonstantin Belousov static void
4101abfd355SKonstantin Belousov dmar_ctx_unlink(struct dmar_ctx *ctx)
4111abfd355SKonstantin Belousov {
4121abfd355SKonstantin Belousov 	struct dmar_domain *domain;
4131abfd355SKonstantin Belousov 
41478b51754SRuslan Bukin 	domain = CTX2DOM(ctx);
41559e37c8aSRuslan Bukin 	IOMMU_ASSERT_LOCKED(domain->iodom.iommu);
4161abfd355SKonstantin Belousov 	KASSERT(domain->refs > 0,
4171abfd355SKonstantin Belousov 	    ("domain %p ctx dtr refs %d", domain, domain->refs));
4181abfd355SKonstantin Belousov 	KASSERT(domain->ctx_cnt >= domain->refs,
4191abfd355SKonstantin Belousov 	    ("domain %p ctx dtr refs %d ctx_cnt %d", domain,
4201abfd355SKonstantin Belousov 	    domain->refs, domain->ctx_cnt));
4211abfd355SKonstantin Belousov 	domain->refs--;
4221abfd355SKonstantin Belousov 	domain->ctx_cnt--;
4231abfd355SKonstantin Belousov 	LIST_REMOVE(ctx, link);
4241abfd355SKonstantin Belousov }
4251abfd355SKonstantin Belousov 
4261abfd355SKonstantin Belousov static void
4271abfd355SKonstantin Belousov dmar_domain_destroy(struct dmar_domain *domain)
42886be9f0dSKonstantin Belousov {
42916696f60SRuslan Bukin 	struct iommu_domain *iodom;
43059e37c8aSRuslan Bukin 	struct dmar_unit *dmar;
43186be9f0dSKonstantin Belousov 
43216696f60SRuslan Bukin 	iodom = DOM2IODOM(domain);
43316696f60SRuslan Bukin 
43459e37c8aSRuslan Bukin 	KASSERT(TAILQ_EMPTY(&domain->iodom.unload_entries),
4351abfd355SKonstantin Belousov 	    ("unfinished unloads %p", domain));
4361abfd355SKonstantin Belousov 	KASSERT(LIST_EMPTY(&domain->contexts),
4371abfd355SKonstantin Belousov 	    ("destroying dom %p with contexts", domain));
4381abfd355SKonstantin Belousov 	KASSERT(domain->ctx_cnt == 0,
4391abfd355SKonstantin Belousov 	    ("destroying dom %p with ctx_cnt %d", domain, domain->ctx_cnt));
4401abfd355SKonstantin Belousov 	KASSERT(domain->refs == 0,
4411abfd355SKonstantin Belousov 	    ("destroying dom %p with refs %d", domain, domain->refs));
44215f6baf4SRuslan Bukin 	if ((domain->iodom.flags & IOMMU_DOMAIN_GAS_INITED) != 0) {
4431abfd355SKonstantin Belousov 		DMAR_DOMAIN_LOCK(domain);
44416696f60SRuslan Bukin 		iommu_gas_fini_domain(iodom);
4451abfd355SKonstantin Belousov 		DMAR_DOMAIN_UNLOCK(domain);
44686be9f0dSKonstantin Belousov 	}
44715f6baf4SRuslan Bukin 	if ((domain->iodom.flags & IOMMU_DOMAIN_PGTBL_INITED) != 0) {
4481abfd355SKonstantin Belousov 		if (domain->pgtbl_obj != NULL)
4491abfd355SKonstantin Belousov 			DMAR_DOMAIN_PGLOCK(domain);
4501abfd355SKonstantin Belousov 		domain_free_pgtbl(domain);
45186be9f0dSKonstantin Belousov 	}
45216696f60SRuslan Bukin 	iommu_domain_fini(iodom);
45378b51754SRuslan Bukin 	dmar = DOM2DMAR(domain);
45459e37c8aSRuslan Bukin 	free_unr(dmar->domids, domain->domain);
4551abfd355SKonstantin Belousov 	free(domain, M_DMAR_DOMAIN);
45686be9f0dSKonstantin Belousov }
45786be9f0dSKonstantin Belousov 
458f9feb091SKonstantin Belousov static struct dmar_ctx *
459f9feb091SKonstantin Belousov dmar_get_ctx_for_dev1(struct dmar_unit *dmar, device_t dev, uint16_t rid,
460f9feb091SKonstantin Belousov     int dev_domain, int dev_busno, const void *dev_path, int dev_path_len,
4611abfd355SKonstantin Belousov     bool id_mapped, bool rmrr_init)
46286be9f0dSKonstantin Belousov {
4631abfd355SKonstantin Belousov 	struct dmar_domain *domain, *domain1;
46486be9f0dSKonstantin Belousov 	struct dmar_ctx *ctx, *ctx1;
465ea4c0115SRuslan Bukin 	struct iommu_unit *unit;
46686be9f0dSKonstantin Belousov 	dmar_ctx_entry_t *ctxp;
46786be9f0dSKonstantin Belousov 	struct sf_buf *sf;
4681abfd355SKonstantin Belousov 	int bus, slot, func, error;
46986be9f0dSKonstantin Belousov 	bool enable;
47086be9f0dSKonstantin Belousov 
471f9feb091SKonstantin Belousov 	if (dev != NULL) {
47267499354SRyan Stone 		bus = pci_get_bus(dev);
47367499354SRyan Stone 		slot = pci_get_slot(dev);
47467499354SRyan Stone 		func = pci_get_function(dev);
475f9feb091SKonstantin Belousov 	} else {
476f9feb091SKonstantin Belousov 		bus = PCI_RID2BUS(rid);
477f9feb091SKonstantin Belousov 		slot = PCI_RID2SLOT(rid);
478f9feb091SKonstantin Belousov 		func = PCI_RID2FUNC(rid);
479f9feb091SKonstantin Belousov 	}
48086be9f0dSKonstantin Belousov 	enable = false;
48186be9f0dSKonstantin Belousov 	TD_PREP_PINNED_ASSERT;
48278b51754SRuslan Bukin 	unit = DMAR2IOMMU(dmar);
48386be9f0dSKonstantin Belousov 	DMAR_LOCK(dmar);
484ea4c0115SRuslan Bukin 	KASSERT(!iommu_is_buswide_ctx(unit, bus) || (slot == 0 && func == 0),
485ea4c0115SRuslan Bukin 	    ("iommu%d pci%d:%d:%d get_ctx for buswide", dmar->iommu.unit, bus,
486685666aaSKonstantin Belousov 	    slot, func));
48767499354SRyan Stone 	ctx = dmar_find_ctx_locked(dmar, rid);
48886be9f0dSKonstantin Belousov 	error = 0;
48986be9f0dSKonstantin Belousov 	if (ctx == NULL) {
49086be9f0dSKonstantin Belousov 		/*
49186be9f0dSKonstantin Belousov 		 * Perform the allocations which require sleep or have
49286be9f0dSKonstantin Belousov 		 * higher chance to succeed if the sleep is allowed.
49386be9f0dSKonstantin Belousov 		 */
49486be9f0dSKonstantin Belousov 		DMAR_UNLOCK(dmar);
495b29d186cSKonstantin Belousov 		dmar_ensure_ctx_page(dmar, PCI_RID2BUS(rid));
4961abfd355SKonstantin Belousov 		domain1 = dmar_domain_alloc(dmar, id_mapped);
4971abfd355SKonstantin Belousov 		if (domain1 == NULL) {
49886be9f0dSKonstantin Belousov 			TD_PINNED_ASSERT;
49986be9f0dSKonstantin Belousov 			return (NULL);
50086be9f0dSKonstantin Belousov 		}
5015f8e5c7fSKonstantin Belousov 		if (!id_mapped) {
502f9feb091SKonstantin Belousov 			error = domain_init_rmrr(domain1, dev, bus,
503f9feb091SKonstantin Belousov 			    slot, func, dev_domain, dev_busno, dev_path,
504f9feb091SKonstantin Belousov 			    dev_path_len);
50586be9f0dSKonstantin Belousov 			if (error != 0) {
5061abfd355SKonstantin Belousov 				dmar_domain_destroy(domain1);
50786be9f0dSKonstantin Belousov 				TD_PINNED_ASSERT;
50886be9f0dSKonstantin Belousov 				return (NULL);
50986be9f0dSKonstantin Belousov 			}
5105f8e5c7fSKonstantin Belousov 		}
5111abfd355SKonstantin Belousov 		ctx1 = dmar_ctx_alloc(domain1, rid);
51286be9f0dSKonstantin Belousov 		ctxp = dmar_map_ctx_entry(ctx1, &sf);
51386be9f0dSKonstantin Belousov 		DMAR_LOCK(dmar);
51486be9f0dSKonstantin Belousov 
51586be9f0dSKonstantin Belousov 		/*
51686be9f0dSKonstantin Belousov 		 * Recheck the contexts, other thread might have
51786be9f0dSKonstantin Belousov 		 * already allocated needed one.
51886be9f0dSKonstantin Belousov 		 */
51967499354SRyan Stone 		ctx = dmar_find_ctx_locked(dmar, rid);
52086be9f0dSKonstantin Belousov 		if (ctx == NULL) {
5211abfd355SKonstantin Belousov 			domain = domain1;
52286be9f0dSKonstantin Belousov 			ctx = ctx1;
5231abfd355SKonstantin Belousov 			dmar_ctx_link(ctx);
52459e37c8aSRuslan Bukin 			ctx->context.tag->owner = dev;
52559e37c8aSRuslan Bukin 			device_tag_init(ctx, dev);
52686be9f0dSKonstantin Belousov 
52786be9f0dSKonstantin Belousov 			/*
52886be9f0dSKonstantin Belousov 			 * This is the first activated context for the
52986be9f0dSKonstantin Belousov 			 * DMAR unit.  Enable the translation after
53086be9f0dSKonstantin Belousov 			 * everything is set up.
53186be9f0dSKonstantin Belousov 			 */
5321abfd355SKonstantin Belousov 			if (LIST_EMPTY(&dmar->domains))
53386be9f0dSKonstantin Belousov 				enable = true;
5341abfd355SKonstantin Belousov 			LIST_INSERT_HEAD(&dmar->domains, domain, link);
535685666aaSKonstantin Belousov 			ctx_id_entry_init(ctx, ctxp, false, bus);
536f9feb091SKonstantin Belousov 			if (dev != NULL) {
53786be9f0dSKonstantin Belousov 				device_printf(dev,
53834e8337bSKonstantin Belousov 			    "dmar%d pci%d:%d:%d:%d rid %x domain %d mgaw %d "
5399d0bc6d8SKonstantin Belousov 				    "agaw %d %s-mapped\n",
54059e37c8aSRuslan Bukin 				    dmar->iommu.unit, dmar->segment, bus, slot,
5411abfd355SKonstantin Belousov 				    func, rid, domain->domain, domain->mgaw,
5421abfd355SKonstantin Belousov 				    domain->agaw, id_mapped ? "id" : "re");
543f9feb091SKonstantin Belousov 			}
5443d47c58bSKonstantin Belousov 			dmar_unmap_pgtbl(sf);
54586be9f0dSKonstantin Belousov 		} else {
5463d47c58bSKonstantin Belousov 			dmar_unmap_pgtbl(sf);
5471abfd355SKonstantin Belousov 			dmar_domain_destroy(domain1);
5483d47c58bSKonstantin Belousov 			/* Nothing needs to be done to destroy ctx1. */
5493d47c58bSKonstantin Belousov 			free(ctx1, M_DMAR_CTX);
55078b51754SRuslan Bukin 			domain = CTX2DOM(ctx);
5511abfd355SKonstantin Belousov 			ctx->refs++; /* tag referenced us */
55286be9f0dSKonstantin Belousov 		}
55368eeb96aSKonstantin Belousov 	} else {
55478b51754SRuslan Bukin 		domain = CTX2DOM(ctx);
55559e37c8aSRuslan Bukin 		if (ctx->context.tag->owner == NULL)
55659e37c8aSRuslan Bukin 			ctx->context.tag->owner = dev;
5571abfd355SKonstantin Belousov 		ctx->refs++; /* tag referenced us */
5581abfd355SKonstantin Belousov 	}
5591abfd355SKonstantin Belousov 
5601abfd355SKonstantin Belousov 	error = dmar_flush_for_ctx_entry(dmar, enable);
56186be9f0dSKonstantin Belousov 	if (error != 0) {
56286be9f0dSKonstantin Belousov 		dmar_free_ctx_locked(dmar, ctx);
56386be9f0dSKonstantin Belousov 		TD_PINNED_ASSERT;
56486be9f0dSKonstantin Belousov 		return (NULL);
56586be9f0dSKonstantin Belousov 	}
56668eeb96aSKonstantin Belousov 
56768eeb96aSKonstantin Belousov 	/*
56868eeb96aSKonstantin Belousov 	 * The dmar lock was potentially dropped between check for the
56968eeb96aSKonstantin Belousov 	 * empty context list and now.  Recheck the state of GCMD_TE
57068eeb96aSKonstantin Belousov 	 * to avoid unneeded command.
57168eeb96aSKonstantin Belousov 	 */
57268eeb96aSKonstantin Belousov 	if (enable && !rmrr_init && (dmar->hw_gcmd & DMAR_GCMD_TE) == 0) {
57386be9f0dSKonstantin Belousov 		error = dmar_enable_translation(dmar);
574f9feb091SKonstantin Belousov 		if (error == 0) {
575f9feb091SKonstantin Belousov 			if (bootverbose) {
576f9feb091SKonstantin Belousov 				printf("dmar%d: enabled translation\n",
57759e37c8aSRuslan Bukin 				    dmar->iommu.unit);
578f9feb091SKonstantin Belousov 			}
579f9feb091SKonstantin Belousov 		} else {
580f9feb091SKonstantin Belousov 			printf("dmar%d: enabling translation failed, "
58159e37c8aSRuslan Bukin 			    "error %d\n", dmar->iommu.unit, error);
58286be9f0dSKonstantin Belousov 			dmar_free_ctx_locked(dmar, ctx);
58386be9f0dSKonstantin Belousov 			TD_PINNED_ASSERT;
58486be9f0dSKonstantin Belousov 			return (NULL);
58586be9f0dSKonstantin Belousov 		}
58686be9f0dSKonstantin Belousov 	}
58786be9f0dSKonstantin Belousov 	DMAR_UNLOCK(dmar);
58886be9f0dSKonstantin Belousov 	TD_PINNED_ASSERT;
58986be9f0dSKonstantin Belousov 	return (ctx);
59086be9f0dSKonstantin Belousov }
59186be9f0dSKonstantin Belousov 
592f9feb091SKonstantin Belousov struct dmar_ctx *
593f9feb091SKonstantin Belousov dmar_get_ctx_for_dev(struct dmar_unit *dmar, device_t dev, uint16_t rid,
594f9feb091SKonstantin Belousov     bool id_mapped, bool rmrr_init)
595f9feb091SKonstantin Belousov {
596f9feb091SKonstantin Belousov 	int dev_domain, dev_path_len, dev_busno;
597f9feb091SKonstantin Belousov 
598f9feb091SKonstantin Belousov 	dev_domain = pci_get_domain(dev);
599f9feb091SKonstantin Belousov 	dev_path_len = dmar_dev_depth(dev);
600f9feb091SKonstantin Belousov 	ACPI_DMAR_PCI_PATH dev_path[dev_path_len];
601f9feb091SKonstantin Belousov 	dmar_dev_path(dev, &dev_busno, dev_path, dev_path_len);
602f9feb091SKonstantin Belousov 	return (dmar_get_ctx_for_dev1(dmar, dev, rid, dev_domain, dev_busno,
603f9feb091SKonstantin Belousov 	    dev_path, dev_path_len, id_mapped, rmrr_init));
604f9feb091SKonstantin Belousov }
605f9feb091SKonstantin Belousov 
606f9feb091SKonstantin Belousov struct dmar_ctx *
607f9feb091SKonstantin Belousov dmar_get_ctx_for_devpath(struct dmar_unit *dmar, uint16_t rid,
608f9feb091SKonstantin Belousov     int dev_domain, int dev_busno,
609f9feb091SKonstantin Belousov     const void *dev_path, int dev_path_len,
610f9feb091SKonstantin Belousov     bool id_mapped, bool rmrr_init)
611f9feb091SKonstantin Belousov {
612f9feb091SKonstantin Belousov 
613f9feb091SKonstantin Belousov 	return (dmar_get_ctx_for_dev1(dmar, NULL, rid, dev_domain, dev_busno,
614f9feb091SKonstantin Belousov 	    dev_path, dev_path_len, id_mapped, rmrr_init));
615f9feb091SKonstantin Belousov }
616f9feb091SKonstantin Belousov 
6171abfd355SKonstantin Belousov int
6181abfd355SKonstantin Belousov dmar_move_ctx_to_domain(struct dmar_domain *domain, struct dmar_ctx *ctx)
6191abfd355SKonstantin Belousov {
6201abfd355SKonstantin Belousov 	struct dmar_unit *dmar;
6211abfd355SKonstantin Belousov 	struct dmar_domain *old_domain;
6221abfd355SKonstantin Belousov 	dmar_ctx_entry_t *ctxp;
6231abfd355SKonstantin Belousov 	struct sf_buf *sf;
6241abfd355SKonstantin Belousov 	int error;
6251abfd355SKonstantin Belousov 
6261abfd355SKonstantin Belousov 	dmar = domain->dmar;
62778b51754SRuslan Bukin 	old_domain = CTX2DOM(ctx);
6281abfd355SKonstantin Belousov 	if (domain == old_domain)
6291abfd355SKonstantin Belousov 		return (0);
63059e37c8aSRuslan Bukin 	KASSERT(old_domain->iodom.iommu == domain->iodom.iommu,
6311abfd355SKonstantin Belousov 	    ("domain %p %u moving between dmars %u %u", domain,
63259e37c8aSRuslan Bukin 	    domain->domain, old_domain->iodom.iommu->unit,
63359e37c8aSRuslan Bukin 	    domain->iodom.iommu->unit));
6341abfd355SKonstantin Belousov 	TD_PREP_PINNED_ASSERT;
6351abfd355SKonstantin Belousov 
6361abfd355SKonstantin Belousov 	ctxp = dmar_map_ctx_entry(ctx, &sf);
6371abfd355SKonstantin Belousov 	DMAR_LOCK(dmar);
6381abfd355SKonstantin Belousov 	dmar_ctx_unlink(ctx);
63959e37c8aSRuslan Bukin 	ctx->context.domain = &domain->iodom;
6401abfd355SKonstantin Belousov 	dmar_ctx_link(ctx);
641685666aaSKonstantin Belousov 	ctx_id_entry_init(ctx, ctxp, true, PCI_BUSMAX + 100);
6421abfd355SKonstantin Belousov 	dmar_unmap_pgtbl(sf);
6431abfd355SKonstantin Belousov 	error = dmar_flush_for_ctx_entry(dmar, true);
6441abfd355SKonstantin Belousov 	/* If flush failed, rolling back would not work as well. */
6451abfd355SKonstantin Belousov 	printf("dmar%d rid %x domain %d->%d %s-mapped\n",
646*cb9050ddSRuslan Bukin 	    dmar->iommu.unit, ctx->context.rid, old_domain->domain,
647*cb9050ddSRuslan Bukin 	    domain->domain, (domain->iodom.flags & IOMMU_DOMAIN_IDMAP) != 0 ?
648*cb9050ddSRuslan Bukin 	    "id" : "re");
6491abfd355SKonstantin Belousov 	dmar_unref_domain_locked(dmar, old_domain);
6501abfd355SKonstantin Belousov 	TD_PINNED_ASSERT;
6511abfd355SKonstantin Belousov 	return (error);
6521abfd355SKonstantin Belousov }
6531abfd355SKonstantin Belousov 
6541abfd355SKonstantin Belousov static void
6551abfd355SKonstantin Belousov dmar_unref_domain_locked(struct dmar_unit *dmar, struct dmar_domain *domain)
6561abfd355SKonstantin Belousov {
6571abfd355SKonstantin Belousov 
6581abfd355SKonstantin Belousov 	DMAR_ASSERT_LOCKED(dmar);
6591abfd355SKonstantin Belousov 	KASSERT(domain->refs >= 1,
66059e37c8aSRuslan Bukin 	    ("dmar %d domain %p refs %u", dmar->iommu.unit, domain,
66159e37c8aSRuslan Bukin 	    domain->refs));
6621abfd355SKonstantin Belousov 	KASSERT(domain->refs > domain->ctx_cnt,
66359e37c8aSRuslan Bukin 	    ("dmar %d domain %p refs %d ctx_cnt %d", dmar->iommu.unit, domain,
6641abfd355SKonstantin Belousov 	    domain->refs, domain->ctx_cnt));
6651abfd355SKonstantin Belousov 
6661abfd355SKonstantin Belousov 	if (domain->refs > 1) {
6671abfd355SKonstantin Belousov 		domain->refs--;
6681abfd355SKonstantin Belousov 		DMAR_UNLOCK(dmar);
6691abfd355SKonstantin Belousov 		return;
6701abfd355SKonstantin Belousov 	}
6711abfd355SKonstantin Belousov 
67215f6baf4SRuslan Bukin 	KASSERT((domain->iodom.flags & IOMMU_DOMAIN_RMRR) == 0,
6731abfd355SKonstantin Belousov 	    ("lost ref on RMRR domain %p", domain));
6741abfd355SKonstantin Belousov 
6751abfd355SKonstantin Belousov 	LIST_REMOVE(domain, link);
6761abfd355SKonstantin Belousov 	DMAR_UNLOCK(dmar);
6771abfd355SKonstantin Belousov 
67859e37c8aSRuslan Bukin 	taskqueue_drain(dmar->iommu.delayed_taskqueue,
67959e37c8aSRuslan Bukin 	    &domain->iodom.unload_task);
6801abfd355SKonstantin Belousov 	dmar_domain_destroy(domain);
6811abfd355SKonstantin Belousov }
6821abfd355SKonstantin Belousov 
68386be9f0dSKonstantin Belousov void
68486be9f0dSKonstantin Belousov dmar_free_ctx_locked(struct dmar_unit *dmar, struct dmar_ctx *ctx)
68586be9f0dSKonstantin Belousov {
68686be9f0dSKonstantin Belousov 	struct sf_buf *sf;
68786be9f0dSKonstantin Belousov 	dmar_ctx_entry_t *ctxp;
6881abfd355SKonstantin Belousov 	struct dmar_domain *domain;
68986be9f0dSKonstantin Belousov 
69086be9f0dSKonstantin Belousov 	DMAR_ASSERT_LOCKED(dmar);
69186be9f0dSKonstantin Belousov 	KASSERT(ctx->refs >= 1,
69286be9f0dSKonstantin Belousov 	    ("dmar %p ctx %p refs %u", dmar, ctx, ctx->refs));
69386be9f0dSKonstantin Belousov 
69486be9f0dSKonstantin Belousov 	/*
69586be9f0dSKonstantin Belousov 	 * If our reference is not last, only the dereference should
69686be9f0dSKonstantin Belousov 	 * be performed.
69786be9f0dSKonstantin Belousov 	 */
69886be9f0dSKonstantin Belousov 	if (ctx->refs > 1) {
69986be9f0dSKonstantin Belousov 		ctx->refs--;
70086be9f0dSKonstantin Belousov 		DMAR_UNLOCK(dmar);
70186be9f0dSKonstantin Belousov 		return;
70286be9f0dSKonstantin Belousov 	}
70386be9f0dSKonstantin Belousov 
70459e37c8aSRuslan Bukin 	KASSERT((ctx->context.flags & IOMMU_CTX_DISABLED) == 0,
70586be9f0dSKonstantin Belousov 	    ("lost ref on disabled ctx %p", ctx));
70686be9f0dSKonstantin Belousov 
70786be9f0dSKonstantin Belousov 	/*
70886be9f0dSKonstantin Belousov 	 * Otherwise, the context entry must be cleared before the
70986be9f0dSKonstantin Belousov 	 * page table is destroyed.  The mapping of the context
71086be9f0dSKonstantin Belousov 	 * entries page could require sleep, unlock the dmar.
71186be9f0dSKonstantin Belousov 	 */
71286be9f0dSKonstantin Belousov 	DMAR_UNLOCK(dmar);
71386be9f0dSKonstantin Belousov 	TD_PREP_PINNED_ASSERT;
71486be9f0dSKonstantin Belousov 	ctxp = dmar_map_ctx_entry(ctx, &sf);
71586be9f0dSKonstantin Belousov 	DMAR_LOCK(dmar);
71686be9f0dSKonstantin Belousov 	KASSERT(ctx->refs >= 1,
71786be9f0dSKonstantin Belousov 	    ("dmar %p ctx %p refs %u", dmar, ctx, ctx->refs));
71886be9f0dSKonstantin Belousov 
71986be9f0dSKonstantin Belousov 	/*
72086be9f0dSKonstantin Belousov 	 * Other thread might have referenced the context, in which
72186be9f0dSKonstantin Belousov 	 * case again only the dereference should be performed.
72286be9f0dSKonstantin Belousov 	 */
72386be9f0dSKonstantin Belousov 	if (ctx->refs > 1) {
72486be9f0dSKonstantin Belousov 		ctx->refs--;
72586be9f0dSKonstantin Belousov 		DMAR_UNLOCK(dmar);
7266b7c46afSKonstantin Belousov 		dmar_unmap_pgtbl(sf);
72786be9f0dSKonstantin Belousov 		TD_PINNED_ASSERT;
72886be9f0dSKonstantin Belousov 		return;
72986be9f0dSKonstantin Belousov 	}
73086be9f0dSKonstantin Belousov 
73159e37c8aSRuslan Bukin 	KASSERT((ctx->context.flags & IOMMU_CTX_DISABLED) == 0,
73286be9f0dSKonstantin Belousov 	    ("lost ref on disabled ctx %p", ctx));
73386be9f0dSKonstantin Belousov 
73486be9f0dSKonstantin Belousov 	/*
73586be9f0dSKonstantin Belousov 	 * Clear the context pointer and flush the caches.
73686be9f0dSKonstantin Belousov 	 * XXXKIB: cannot do this if any RMRR entries are still present.
73786be9f0dSKonstantin Belousov 	 */
73886be9f0dSKonstantin Belousov 	dmar_pte_clear(&ctxp->ctx1);
73986be9f0dSKonstantin Belousov 	ctxp->ctx2 = 0;
7406b7c46afSKonstantin Belousov 	dmar_flush_ctx_to_ram(dmar, ctxp);
74186be9f0dSKonstantin Belousov 	dmar_inv_ctx_glob(dmar);
74268eeb96aSKonstantin Belousov 	if ((dmar->hw_ecap & DMAR_ECAP_DI) != 0) {
74368eeb96aSKonstantin Belousov 		if (dmar->qi_enabled)
74468eeb96aSKonstantin Belousov 			dmar_qi_invalidate_iotlb_glob_locked(dmar);
74568eeb96aSKonstantin Belousov 		else
74686be9f0dSKonstantin Belousov 			dmar_inv_iotlb_glob(dmar);
74768eeb96aSKonstantin Belousov 	}
7486b7c46afSKonstantin Belousov 	dmar_unmap_pgtbl(sf);
74978b51754SRuslan Bukin 	domain = CTX2DOM(ctx);
7501abfd355SKonstantin Belousov 	dmar_ctx_unlink(ctx);
75159e37c8aSRuslan Bukin 	free(ctx->context.tag, M_DMAR_CTX);
7521abfd355SKonstantin Belousov 	free(ctx, M_DMAR_CTX);
7531abfd355SKonstantin Belousov 	dmar_unref_domain_locked(dmar, domain);
75486be9f0dSKonstantin Belousov 	TD_PINNED_ASSERT;
75586be9f0dSKonstantin Belousov }
75686be9f0dSKonstantin Belousov 
75786be9f0dSKonstantin Belousov void
75886be9f0dSKonstantin Belousov dmar_free_ctx(struct dmar_ctx *ctx)
75986be9f0dSKonstantin Belousov {
76086be9f0dSKonstantin Belousov 	struct dmar_unit *dmar;
76186be9f0dSKonstantin Belousov 
76278b51754SRuslan Bukin 	dmar = CTX2DMAR(ctx);
76386be9f0dSKonstantin Belousov 	DMAR_LOCK(dmar);
76486be9f0dSKonstantin Belousov 	dmar_free_ctx_locked(dmar, ctx);
76586be9f0dSKonstantin Belousov }
76686be9f0dSKonstantin Belousov 
7671abfd355SKonstantin Belousov /*
7681abfd355SKonstantin Belousov  * Returns with the domain locked.
7691abfd355SKonstantin Belousov  */
77086be9f0dSKonstantin Belousov struct dmar_ctx *
77167499354SRyan Stone dmar_find_ctx_locked(struct dmar_unit *dmar, uint16_t rid)
77286be9f0dSKonstantin Belousov {
7731abfd355SKonstantin Belousov 	struct dmar_domain *domain;
77486be9f0dSKonstantin Belousov 	struct dmar_ctx *ctx;
77586be9f0dSKonstantin Belousov 
77686be9f0dSKonstantin Belousov 	DMAR_ASSERT_LOCKED(dmar);
77786be9f0dSKonstantin Belousov 
7781abfd355SKonstantin Belousov 	LIST_FOREACH(domain, &dmar->domains, link) {
7791abfd355SKonstantin Belousov 		LIST_FOREACH(ctx, &domain->contexts, link) {
780*cb9050ddSRuslan Bukin 			if (ctx->context.rid == rid)
78186be9f0dSKonstantin Belousov 				return (ctx);
78286be9f0dSKonstantin Belousov 		}
7831abfd355SKonstantin Belousov 	}
78486be9f0dSKonstantin Belousov 	return (NULL);
78586be9f0dSKonstantin Belousov }
78686be9f0dSKonstantin Belousov 
78786be9f0dSKonstantin Belousov void
78859e37c8aSRuslan Bukin dmar_domain_free_entry(struct iommu_map_entry *entry, bool free)
78968eeb96aSKonstantin Belousov {
79062ad310cSRuslan Bukin 	struct iommu_domain *domain;
79168eeb96aSKonstantin Belousov 
79262ad310cSRuslan Bukin 	domain = entry->domain;
79362ad310cSRuslan Bukin 	IOMMU_DOMAIN_LOCK(domain);
79459e37c8aSRuslan Bukin 	if ((entry->flags & IOMMU_MAP_ENTRY_RMRR) != 0)
79562ad310cSRuslan Bukin 		iommu_gas_free_region(domain, entry);
79668eeb96aSKonstantin Belousov 	else
79762ad310cSRuslan Bukin 		iommu_gas_free_space(domain, entry);
79862ad310cSRuslan Bukin 	IOMMU_DOMAIN_UNLOCK(domain);
79968eeb96aSKonstantin Belousov 	if (free)
80062ad310cSRuslan Bukin 		iommu_gas_free_entry(domain, entry);
80168eeb96aSKonstantin Belousov 	else
80268eeb96aSKonstantin Belousov 		entry->flags = 0;
80368eeb96aSKonstantin Belousov }
80468eeb96aSKonstantin Belousov 
80568eeb96aSKonstantin Belousov void
80659e37c8aSRuslan Bukin dmar_domain_unload_entry(struct iommu_map_entry *entry, bool free)
80768eeb96aSKonstantin Belousov {
80859e37c8aSRuslan Bukin 	struct dmar_domain *domain;
80968eeb96aSKonstantin Belousov 	struct dmar_unit *unit;
81068eeb96aSKonstantin Belousov 
81178b51754SRuslan Bukin 	domain = IODOM2DOM(entry->domain);
81278b51754SRuslan Bukin 	unit = DOM2DMAR(domain);
81368eeb96aSKonstantin Belousov 	if (unit->qi_enabled) {
81468eeb96aSKonstantin Belousov 		DMAR_LOCK(unit);
81578b51754SRuslan Bukin 		dmar_qi_invalidate_locked(IODOM2DOM(entry->domain),
81659e37c8aSRuslan Bukin 		    entry->start, entry->end - entry->start, &entry->gseq,
81759e37c8aSRuslan Bukin 		    true);
81868eeb96aSKonstantin Belousov 		if (!free)
81959e37c8aSRuslan Bukin 			entry->flags |= IOMMU_MAP_ENTRY_QI_NF;
82068eeb96aSKonstantin Belousov 		TAILQ_INSERT_TAIL(&unit->tlb_flush_entries, entry, dmamap_link);
82168eeb96aSKonstantin Belousov 		DMAR_UNLOCK(unit);
82268eeb96aSKonstantin Belousov 	} else {
82378b51754SRuslan Bukin 		domain_flush_iotlb_sync(IODOM2DOM(entry->domain),
82459e37c8aSRuslan Bukin 		    entry->start, entry->end - entry->start);
8251abfd355SKonstantin Belousov 		dmar_domain_free_entry(entry, free);
82668eeb96aSKonstantin Belousov 	}
82768eeb96aSKonstantin Belousov }
82868eeb96aSKonstantin Belousov 
829cf619a92SKonstantin Belousov static bool
830cf619a92SKonstantin Belousov dmar_domain_unload_emit_wait(struct dmar_domain *domain,
83159e37c8aSRuslan Bukin     struct iommu_map_entry *entry)
832e164cafcSKonstantin Belousov {
833e164cafcSKonstantin Belousov 
834cf619a92SKonstantin Belousov 	if (TAILQ_NEXT(entry, dmamap_link) == NULL)
835cf619a92SKonstantin Belousov 		return (true);
836cf619a92SKonstantin Belousov 	return (domain->batch_no++ % dmar_batch_coalesce == 0);
837e164cafcSKonstantin Belousov }
838e164cafcSKonstantin Belousov 
83968eeb96aSKonstantin Belousov void
8401abfd355SKonstantin Belousov dmar_domain_unload(struct dmar_domain *domain,
84159e37c8aSRuslan Bukin     struct iommu_map_entries_tailq *entries, bool cansleep)
84286be9f0dSKonstantin Belousov {
84368eeb96aSKonstantin Belousov 	struct dmar_unit *unit;
8440eed04c8SRuslan Bukin 	struct iommu_domain *iodom;
84559e37c8aSRuslan Bukin 	struct iommu_map_entry *entry, *entry1;
84686be9f0dSKonstantin Belousov 	int error;
84786be9f0dSKonstantin Belousov 
84878b51754SRuslan Bukin 	iodom = DOM2IODOM(domain);
84978b51754SRuslan Bukin 	unit = DOM2DMAR(domain);
85068eeb96aSKonstantin Belousov 
85168eeb96aSKonstantin Belousov 	TAILQ_FOREACH_SAFE(entry, entries, dmamap_link, entry1) {
85259e37c8aSRuslan Bukin 		KASSERT((entry->flags & IOMMU_MAP_ENTRY_MAP) != 0,
8531abfd355SKonstantin Belousov 		    ("not mapped entry %p %p", domain, entry));
8540eed04c8SRuslan Bukin 		error = iodom->ops->unmap(iodom, entry->start, entry->end -
85515f6baf4SRuslan Bukin 		    entry->start, cansleep ? IOMMU_PGF_WAITOK : 0);
8561abfd355SKonstantin Belousov 		KASSERT(error == 0, ("unmap %p error %d", domain, error));
85768eeb96aSKonstantin Belousov 		if (!unit->qi_enabled) {
8581abfd355SKonstantin Belousov 			domain_flush_iotlb_sync(domain, entry->start,
85968eeb96aSKonstantin Belousov 			    entry->end - entry->start);
86068eeb96aSKonstantin Belousov 			TAILQ_REMOVE(entries, entry, dmamap_link);
8611abfd355SKonstantin Belousov 			dmar_domain_free_entry(entry, true);
86286be9f0dSKonstantin Belousov 		}
86386be9f0dSKonstantin Belousov 	}
86468eeb96aSKonstantin Belousov 	if (TAILQ_EMPTY(entries))
86568eeb96aSKonstantin Belousov 		return;
86668eeb96aSKonstantin Belousov 
86768eeb96aSKonstantin Belousov 	KASSERT(unit->qi_enabled, ("loaded entry left"));
86868eeb96aSKonstantin Belousov 	DMAR_LOCK(unit);
86968eeb96aSKonstantin Belousov 	TAILQ_FOREACH(entry, entries, dmamap_link) {
8701abfd355SKonstantin Belousov 		dmar_qi_invalidate_locked(domain, entry->start, entry->end -
871cf619a92SKonstantin Belousov 		    entry->start, &entry->gseq,
872cf619a92SKonstantin Belousov 		    dmar_domain_unload_emit_wait(domain, entry));
87368eeb96aSKonstantin Belousov 	}
874cf619a92SKonstantin Belousov 	TAILQ_CONCAT(&unit->tlb_flush_entries, entries, dmamap_link);
87568eeb96aSKonstantin Belousov 	DMAR_UNLOCK(unit);
87668eeb96aSKonstantin Belousov }
87786be9f0dSKonstantin Belousov 
87859e37c8aSRuslan Bukin struct iommu_ctx *
87959e37c8aSRuslan Bukin iommu_get_ctx(struct iommu_unit *iommu, device_t dev, uint16_t rid,
88059e37c8aSRuslan Bukin     bool id_mapped, bool rmrr_init)
88159e37c8aSRuslan Bukin {
88259e37c8aSRuslan Bukin 	struct dmar_unit *dmar;
88359e37c8aSRuslan Bukin 	struct dmar_ctx *ret;
88459e37c8aSRuslan Bukin 
88578b51754SRuslan Bukin 	dmar = IOMMU2DMAR(iommu);
88659e37c8aSRuslan Bukin 
88759e37c8aSRuslan Bukin 	ret = dmar_get_ctx_for_dev(dmar, dev, rid, id_mapped, rmrr_init);
88859e37c8aSRuslan Bukin 
88978b51754SRuslan Bukin 	return (CTX2IOCTX(ret));
89059e37c8aSRuslan Bukin }
89159e37c8aSRuslan Bukin 
89259e37c8aSRuslan Bukin void
89359e37c8aSRuslan Bukin iommu_free_ctx_locked(struct iommu_unit *iommu, struct iommu_ctx *context)
89459e37c8aSRuslan Bukin {
89559e37c8aSRuslan Bukin 	struct dmar_unit *dmar;
89659e37c8aSRuslan Bukin 	struct dmar_ctx *ctx;
89759e37c8aSRuslan Bukin 
89878b51754SRuslan Bukin 	dmar = IOMMU2DMAR(iommu);
89978b51754SRuslan Bukin 	ctx = IOCTX2CTX(context);
90059e37c8aSRuslan Bukin 
90159e37c8aSRuslan Bukin 	dmar_free_ctx_locked(dmar, ctx);
90259e37c8aSRuslan Bukin }
90359e37c8aSRuslan Bukin 
90459e37c8aSRuslan Bukin void
90559e37c8aSRuslan Bukin iommu_free_ctx(struct iommu_ctx *context)
90659e37c8aSRuslan Bukin {
90759e37c8aSRuslan Bukin 	struct dmar_ctx *ctx;
90859e37c8aSRuslan Bukin 
90978b51754SRuslan Bukin 	ctx = IOCTX2CTX(context);
91059e37c8aSRuslan Bukin 
91159e37c8aSRuslan Bukin 	dmar_free_ctx(ctx);
91259e37c8aSRuslan Bukin }
91359e37c8aSRuslan Bukin 
91459e37c8aSRuslan Bukin void
91559e37c8aSRuslan Bukin iommu_domain_unload_entry(struct iommu_map_entry *entry, bool free)
91659e37c8aSRuslan Bukin {
91759e37c8aSRuslan Bukin 
91859e37c8aSRuslan Bukin 	dmar_domain_unload_entry(entry, free);
91959e37c8aSRuslan Bukin }
92059e37c8aSRuslan Bukin 
92159e37c8aSRuslan Bukin void
92259e37c8aSRuslan Bukin iommu_domain_unload(struct iommu_domain *iodom,
92359e37c8aSRuslan Bukin     struct iommu_map_entries_tailq *entries, bool cansleep)
92459e37c8aSRuslan Bukin {
92559e37c8aSRuslan Bukin 	struct dmar_domain *domain;
92659e37c8aSRuslan Bukin 
92778b51754SRuslan Bukin 	domain = IODOM2DOM(iodom);
92859e37c8aSRuslan Bukin 
92959e37c8aSRuslan Bukin 	dmar_domain_unload(domain, entries, cansleep);
93059e37c8aSRuslan Bukin }
931