186be9f0dSKonstantin Belousov /*- 24d846d26SWarner Losh * SPDX-License-Identifier: BSD-2-Clause 3ebf5747bSPedro F. Giffuni * 486be9f0dSKonstantin Belousov * Copyright (c) 2013 The FreeBSD Foundation 586be9f0dSKonstantin Belousov * 686be9f0dSKonstantin Belousov * This software was developed by Konstantin Belousov <kib@FreeBSD.org> 786be9f0dSKonstantin Belousov * under sponsorship from the FreeBSD Foundation. 886be9f0dSKonstantin Belousov * 986be9f0dSKonstantin Belousov * Redistribution and use in source and binary forms, with or without 1086be9f0dSKonstantin Belousov * modification, are permitted provided that the following conditions 1186be9f0dSKonstantin Belousov * are met: 1286be9f0dSKonstantin Belousov * 1. Redistributions of source code must retain the above copyright 1386be9f0dSKonstantin Belousov * notice, this list of conditions and the following disclaimer. 1486be9f0dSKonstantin Belousov * 2. Redistributions in binary form must reproduce the above copyright 1586be9f0dSKonstantin Belousov * notice, this list of conditions and the following disclaimer in the 1686be9f0dSKonstantin Belousov * documentation and/or other materials provided with the distribution. 1786be9f0dSKonstantin Belousov * 1886be9f0dSKonstantin Belousov * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 1986be9f0dSKonstantin Belousov * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 2086be9f0dSKonstantin Belousov * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 2186be9f0dSKonstantin Belousov * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 2286be9f0dSKonstantin Belousov * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 2386be9f0dSKonstantin Belousov * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 2486be9f0dSKonstantin Belousov * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 2586be9f0dSKonstantin Belousov * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 2686be9f0dSKonstantin Belousov * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 2786be9f0dSKonstantin Belousov * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 2886be9f0dSKonstantin Belousov * SUCH DAMAGE. 2986be9f0dSKonstantin Belousov */ 3086be9f0dSKonstantin Belousov 3186be9f0dSKonstantin Belousov #include <sys/param.h> 3286be9f0dSKonstantin Belousov #include <sys/systm.h> 3386be9f0dSKonstantin Belousov #include <sys/malloc.h> 3486be9f0dSKonstantin Belousov #include <sys/bus.h> 3586be9f0dSKonstantin Belousov #include <sys/interrupt.h> 3686be9f0dSKonstantin Belousov #include <sys/kernel.h> 3786be9f0dSKonstantin Belousov #include <sys/ktr.h> 3886be9f0dSKonstantin Belousov #include <sys/limits.h> 3986be9f0dSKonstantin Belousov #include <sys/lock.h> 4086be9f0dSKonstantin Belousov #include <sys/memdesc.h> 4186be9f0dSKonstantin Belousov #include <sys/mutex.h> 4286be9f0dSKonstantin Belousov #include <sys/proc.h> 4386be9f0dSKonstantin Belousov #include <sys/rwlock.h> 4486be9f0dSKonstantin Belousov #include <sys/rman.h> 4586be9f0dSKonstantin Belousov #include <sys/sysctl.h> 4686be9f0dSKonstantin Belousov #include <sys/taskqueue.h> 4786be9f0dSKonstantin Belousov #include <sys/tree.h> 4886be9f0dSKonstantin Belousov #include <sys/uio.h> 490a110d5bSKonstantin Belousov #include <sys/vmem.h> 5086be9f0dSKonstantin Belousov #include <vm/vm.h> 5186be9f0dSKonstantin Belousov #include <vm/vm_extern.h> 5286be9f0dSKonstantin Belousov #include <vm/vm_kern.h> 5386be9f0dSKonstantin Belousov #include <vm/vm_object.h> 5486be9f0dSKonstantin Belousov #include <vm/vm_page.h> 5586be9f0dSKonstantin Belousov #include <vm/vm_pager.h> 5686be9f0dSKonstantin Belousov #include <vm/vm_map.h> 57c8597a1fSRuslan Bukin #include <contrib/dev/acpica/include/acpi.h> 58c8597a1fSRuslan Bukin #include <contrib/dev/acpica/include/accommon.h> 59c8597a1fSRuslan Bukin #include <dev/pci/pcireg.h> 60c8597a1fSRuslan Bukin #include <dev/pci/pcivar.h> 6186be9f0dSKonstantin Belousov #include <machine/atomic.h> 6286be9f0dSKonstantin Belousov #include <machine/bus.h> 6386be9f0dSKonstantin Belousov #include <machine/md_var.h> 6486be9f0dSKonstantin Belousov #include <machine/specialreg.h> 6586be9f0dSKonstantin Belousov #include <x86/include/busdma_impl.h> 66f2b2f317SRuslan Bukin #include <dev/iommu/busdma_iommu.h> 67c8597a1fSRuslan Bukin #include <x86/iommu/intel_reg.h> 6840d951bcSKonstantin Belousov #include <x86/iommu/x86_iommu.h> 69685666aaSKonstantin Belousov #include <x86/iommu/intel_dmar.h> 7086be9f0dSKonstantin Belousov 7186be9f0dSKonstantin Belousov static MALLOC_DEFINE(M_DMAR_CTX, "dmar_ctx", "Intel DMAR Context"); 721abfd355SKonstantin Belousov static MALLOC_DEFINE(M_DMAR_DOMAIN, "dmar_dom", "Intel DMAR Domain"); 7386be9f0dSKonstantin Belousov 741abfd355SKonstantin Belousov static void dmar_unref_domain_locked(struct dmar_unit *dmar, 751abfd355SKonstantin Belousov struct dmar_domain *domain); 761abfd355SKonstantin Belousov static void dmar_domain_destroy(struct dmar_domain *domain); 7786be9f0dSKonstantin Belousov 78*65b133e5SKonstantin Belousov static void dmar_free_ctx_locked(struct dmar_unit *dmar, struct dmar_ctx *ctx); 79*65b133e5SKonstantin Belousov static void dmar_free_ctx(struct dmar_ctx *ctx); 80*65b133e5SKonstantin Belousov 8186be9f0dSKonstantin Belousov static void 8286be9f0dSKonstantin Belousov dmar_ensure_ctx_page(struct dmar_unit *dmar, int bus) 8386be9f0dSKonstantin Belousov { 8486be9f0dSKonstantin Belousov struct sf_buf *sf; 8586be9f0dSKonstantin Belousov dmar_root_entry_t *re; 8686be9f0dSKonstantin Belousov vm_page_t ctxm; 8786be9f0dSKonstantin Belousov 8886be9f0dSKonstantin Belousov /* 8986be9f0dSKonstantin Belousov * Allocated context page must be linked. 9086be9f0dSKonstantin Belousov */ 9140d951bcSKonstantin Belousov ctxm = iommu_pgalloc(dmar->ctx_obj, 1 + bus, IOMMU_PGF_NOALLOC); 9286be9f0dSKonstantin Belousov if (ctxm != NULL) 9386be9f0dSKonstantin Belousov return; 9486be9f0dSKonstantin Belousov 9586be9f0dSKonstantin Belousov /* 9686be9f0dSKonstantin Belousov * Page not present, allocate and link. Note that other 9786be9f0dSKonstantin Belousov * thread might execute this sequence in parallel. This 9886be9f0dSKonstantin Belousov * should be safe, because the context entries written by both 9986be9f0dSKonstantin Belousov * threads are equal. 10086be9f0dSKonstantin Belousov */ 10186be9f0dSKonstantin Belousov TD_PREP_PINNED_ASSERT; 10240d951bcSKonstantin Belousov ctxm = iommu_pgalloc(dmar->ctx_obj, 1 + bus, IOMMU_PGF_ZERO | 10315f6baf4SRuslan Bukin IOMMU_PGF_WAITOK); 10440d951bcSKonstantin Belousov re = iommu_map_pgtbl(dmar->ctx_obj, 0, IOMMU_PGF_NOALLOC, &sf); 10586be9f0dSKonstantin Belousov re += bus; 10686be9f0dSKonstantin Belousov dmar_pte_store(&re->r1, DMAR_ROOT_R1_P | (DMAR_ROOT_R1_CTP_MASK & 10786be9f0dSKonstantin Belousov VM_PAGE_TO_PHYS(ctxm))); 1086b7c46afSKonstantin Belousov dmar_flush_root_to_ram(dmar, re); 10940d951bcSKonstantin Belousov iommu_unmap_pgtbl(sf); 11086be9f0dSKonstantin Belousov TD_PINNED_ASSERT; 11186be9f0dSKonstantin Belousov } 11286be9f0dSKonstantin Belousov 11386be9f0dSKonstantin Belousov static dmar_ctx_entry_t * 11486be9f0dSKonstantin Belousov dmar_map_ctx_entry(struct dmar_ctx *ctx, struct sf_buf **sfp) 11586be9f0dSKonstantin Belousov { 11659e37c8aSRuslan Bukin struct dmar_unit *dmar; 11786be9f0dSKonstantin Belousov dmar_ctx_entry_t *ctxp; 11886be9f0dSKonstantin Belousov 11978b51754SRuslan Bukin dmar = CTX2DMAR(ctx); 12059e37c8aSRuslan Bukin 12140d951bcSKonstantin Belousov ctxp = iommu_map_pgtbl(dmar->ctx_obj, 1 + PCI_RID2BUS(ctx->context.rid), 122cb9050ddSRuslan Bukin IOMMU_PGF_NOALLOC | IOMMU_PGF_WAITOK, sfp); 123cb9050ddSRuslan Bukin ctxp += ctx->context.rid & 0xff; 12486be9f0dSKonstantin Belousov return (ctxp); 12586be9f0dSKonstantin Belousov } 12686be9f0dSKonstantin Belousov 12786be9f0dSKonstantin Belousov static void 12859e37c8aSRuslan Bukin device_tag_init(struct dmar_ctx *ctx, device_t dev) 12986be9f0dSKonstantin Belousov { 13059e37c8aSRuslan Bukin struct dmar_domain *domain; 13186be9f0dSKonstantin Belousov bus_addr_t maxaddr; 13286be9f0dSKonstantin Belousov 13378b51754SRuslan Bukin domain = CTX2DOM(ctx); 13462ad310cSRuslan Bukin maxaddr = MIN(domain->iodom.end, BUS_SPACE_MAXADDR); 13559e37c8aSRuslan Bukin ctx->context.tag->common.impl = &bus_dma_iommu_impl; 13659e37c8aSRuslan Bukin ctx->context.tag->common.boundary = 0; 13759e37c8aSRuslan Bukin ctx->context.tag->common.lowaddr = maxaddr; 13859e37c8aSRuslan Bukin ctx->context.tag->common.highaddr = maxaddr; 13959e37c8aSRuslan Bukin ctx->context.tag->common.maxsize = maxaddr; 14059e37c8aSRuslan Bukin ctx->context.tag->common.nsegments = BUS_SPACE_UNRESTRICTED; 14159e37c8aSRuslan Bukin ctx->context.tag->common.maxsegsz = maxaddr; 14278b51754SRuslan Bukin ctx->context.tag->ctx = CTX2IOCTX(ctx); 14359e37c8aSRuslan Bukin ctx->context.tag->owner = dev; 14486be9f0dSKonstantin Belousov } 14586be9f0dSKonstantin Belousov 14686be9f0dSKonstantin Belousov static void 147685666aaSKonstantin Belousov ctx_id_entry_init_one(dmar_ctx_entry_t *ctxp, struct dmar_domain *domain, 148685666aaSKonstantin Belousov vm_page_t ctx_root) 14986be9f0dSKonstantin Belousov { 1501abfd355SKonstantin Belousov /* 1511abfd355SKonstantin Belousov * For update due to move, the store is not atomic. It is 1521abfd355SKonstantin Belousov * possible that DMAR read upper doubleword, while low 1531abfd355SKonstantin Belousov * doubleword is not yet updated. The domain id is stored in 1541abfd355SKonstantin Belousov * the upper doubleword, while the table pointer in the lower. 1551abfd355SKonstantin Belousov * 1561abfd355SKonstantin Belousov * There is no good solution, for the same reason it is wrong 1571abfd355SKonstantin Belousov * to clear P bit in the ctx entry for update. 1581abfd355SKonstantin Belousov */ 1591abfd355SKonstantin Belousov dmar_pte_store1(&ctxp->ctx2, DMAR_CTX2_DID(domain->domain) | 1601abfd355SKonstantin Belousov domain->awlvl); 161685666aaSKonstantin Belousov if (ctx_root == NULL) { 162685666aaSKonstantin Belousov dmar_pte_store1(&ctxp->ctx1, DMAR_CTX1_T_PASS | DMAR_CTX1_P); 163685666aaSKonstantin Belousov } else { 164685666aaSKonstantin Belousov dmar_pte_store1(&ctxp->ctx1, DMAR_CTX1_T_UNTR | 165685666aaSKonstantin Belousov (DMAR_CTX1_ASR_MASK & VM_PAGE_TO_PHYS(ctx_root)) | 166685666aaSKonstantin Belousov DMAR_CTX1_P); 167685666aaSKonstantin Belousov } 168685666aaSKonstantin Belousov } 169685666aaSKonstantin Belousov 170685666aaSKonstantin Belousov static void 171685666aaSKonstantin Belousov ctx_id_entry_init(struct dmar_ctx *ctx, dmar_ctx_entry_t *ctxp, bool move, 172685666aaSKonstantin Belousov int busno) 173685666aaSKonstantin Belousov { 174685666aaSKonstantin Belousov struct dmar_unit *unit; 175685666aaSKonstantin Belousov struct dmar_domain *domain; 176685666aaSKonstantin Belousov vm_page_t ctx_root; 177685666aaSKonstantin Belousov int i; 178685666aaSKonstantin Belousov 17978b51754SRuslan Bukin domain = CTX2DOM(ctx); 18078b51754SRuslan Bukin unit = DOM2DMAR(domain); 181685666aaSKonstantin Belousov KASSERT(move || (ctxp->ctx1 == 0 && ctxp->ctx2 == 0), 182685666aaSKonstantin Belousov ("dmar%d: initialized ctx entry %d:%d:%d 0x%jx 0x%jx", 18359e37c8aSRuslan Bukin unit->iommu.unit, busno, pci_get_slot(ctx->context.tag->owner), 18459e37c8aSRuslan Bukin pci_get_function(ctx->context.tag->owner), 185685666aaSKonstantin Belousov ctxp->ctx1, ctxp->ctx2)); 186685666aaSKonstantin Belousov 18715f6baf4SRuslan Bukin if ((domain->iodom.flags & IOMMU_DOMAIN_IDMAP) != 0 && 18886be9f0dSKonstantin Belousov (unit->hw_ecap & DMAR_ECAP_PT) != 0) { 1891abfd355SKonstantin Belousov KASSERT(domain->pgtbl_obj == NULL, 19086be9f0dSKonstantin Belousov ("ctx %p non-null pgtbl_obj", ctx)); 191685666aaSKonstantin Belousov ctx_root = NULL; 19286be9f0dSKonstantin Belousov } else { 19340d951bcSKonstantin Belousov ctx_root = iommu_pgalloc(domain->pgtbl_obj, 0, 19415f6baf4SRuslan Bukin IOMMU_PGF_NOALLOC); 195685666aaSKonstantin Belousov } 196685666aaSKonstantin Belousov 19778b51754SRuslan Bukin if (iommu_is_buswide_ctx(DMAR2IOMMU(unit), busno)) { 198685666aaSKonstantin Belousov MPASS(!move); 199685666aaSKonstantin Belousov for (i = 0; i <= PCI_BUSMAX; i++) { 200685666aaSKonstantin Belousov ctx_id_entry_init_one(&ctxp[i], domain, ctx_root); 201685666aaSKonstantin Belousov } 202685666aaSKonstantin Belousov } else { 203685666aaSKonstantin Belousov ctx_id_entry_init_one(ctxp, domain, ctx_root); 20486be9f0dSKonstantin Belousov } 2056b7c46afSKonstantin Belousov dmar_flush_ctx_to_ram(unit, ctxp); 20686be9f0dSKonstantin Belousov } 20786be9f0dSKonstantin Belousov 20886be9f0dSKonstantin Belousov static int 2091abfd355SKonstantin Belousov dmar_flush_for_ctx_entry(struct dmar_unit *dmar, bool force) 2101abfd355SKonstantin Belousov { 2111abfd355SKonstantin Belousov int error; 2121abfd355SKonstantin Belousov 2131abfd355SKonstantin Belousov /* 2141abfd355SKonstantin Belousov * If dmar declares Caching Mode as Set, follow 11.5 "Caching 2151abfd355SKonstantin Belousov * Mode Consideration" and do the (global) invalidation of the 2161abfd355SKonstantin Belousov * negative TLB entries. 2171abfd355SKonstantin Belousov */ 2181abfd355SKonstantin Belousov if ((dmar->hw_cap & DMAR_CAP_CM) == 0 && !force) 2191abfd355SKonstantin Belousov return (0); 2201abfd355SKonstantin Belousov if (dmar->qi_enabled) { 2211abfd355SKonstantin Belousov dmar_qi_invalidate_ctx_glob_locked(dmar); 2221abfd355SKonstantin Belousov if ((dmar->hw_ecap & DMAR_ECAP_DI) != 0 || force) 2231abfd355SKonstantin Belousov dmar_qi_invalidate_iotlb_glob_locked(dmar); 2241abfd355SKonstantin Belousov return (0); 2251abfd355SKonstantin Belousov } 2261abfd355SKonstantin Belousov error = dmar_inv_ctx_glob(dmar); 2271abfd355SKonstantin Belousov if (error == 0 && ((dmar->hw_ecap & DMAR_ECAP_DI) != 0 || force)) 2281abfd355SKonstantin Belousov error = dmar_inv_iotlb_glob(dmar); 2291abfd355SKonstantin Belousov return (error); 2301abfd355SKonstantin Belousov } 2311abfd355SKonstantin Belousov 2321abfd355SKonstantin Belousov static int 233f9feb091SKonstantin Belousov domain_init_rmrr(struct dmar_domain *domain, device_t dev, int bus, 234f9feb091SKonstantin Belousov int slot, int func, int dev_domain, int dev_busno, 235f9feb091SKonstantin Belousov const void *dev_path, int dev_path_len) 23686be9f0dSKonstantin Belousov { 23759e37c8aSRuslan Bukin struct iommu_map_entries_tailq rmrr_entries; 23859e37c8aSRuslan Bukin struct iommu_map_entry *entry, *entry1; 23986be9f0dSKonstantin Belousov vm_page_t *ma; 24059e37c8aSRuslan Bukin iommu_gaddr_t start, end; 24186be9f0dSKonstantin Belousov vm_pindex_t size, i; 24286be9f0dSKonstantin Belousov int error, error1; 24386be9f0dSKonstantin Belousov 24424e38af6SKonstantin Belousov if (!dmar_rmrr_enable) 24524e38af6SKonstantin Belousov return (0); 24624e38af6SKonstantin Belousov 24786be9f0dSKonstantin Belousov error = 0; 24886be9f0dSKonstantin Belousov TAILQ_INIT(&rmrr_entries); 249f9feb091SKonstantin Belousov dmar_dev_parse_rmrr(domain, dev_domain, dev_busno, dev_path, 250f9feb091SKonstantin Belousov dev_path_len, &rmrr_entries); 251db0110a5SAlan Cox TAILQ_FOREACH_SAFE(entry, &rmrr_entries, dmamap_link, entry1) { 25286be9f0dSKonstantin Belousov /* 25386be9f0dSKonstantin Belousov * VT-d specification requires that the start of an 25486be9f0dSKonstantin Belousov * RMRR entry is 4k-aligned. Buggy BIOSes put 25586be9f0dSKonstantin Belousov * anything into the start and end fields. Truncate 25686be9f0dSKonstantin Belousov * and round as neccesary. 25786be9f0dSKonstantin Belousov * 25886be9f0dSKonstantin Belousov * We also allow the overlapping RMRR entries, see 25962ad310cSRuslan Bukin * iommu_gas_alloc_region(). 26086be9f0dSKonstantin Belousov */ 26186be9f0dSKonstantin Belousov start = entry->start; 26286be9f0dSKonstantin Belousov end = entry->end; 263f9feb091SKonstantin Belousov if (bootverbose) 264f9feb091SKonstantin Belousov printf("dmar%d ctx pci%d:%d:%d RMRR [%#jx, %#jx]\n", 26559e37c8aSRuslan Bukin domain->iodom.iommu->unit, bus, slot, func, 266f9feb091SKonstantin Belousov (uintmax_t)start, (uintmax_t)end); 26786be9f0dSKonstantin Belousov entry->start = trunc_page(start); 26886be9f0dSKonstantin Belousov entry->end = round_page(end); 269e02b05b3SKonstantin Belousov if (entry->start == entry->end) { 270e02b05b3SKonstantin Belousov /* Workaround for some AMI (?) BIOSes */ 271e02b05b3SKonstantin Belousov if (bootverbose) { 272f9feb091SKonstantin Belousov if (dev != NULL) 273f9feb091SKonstantin Belousov device_printf(dev, ""); 274f9feb091SKonstantin Belousov printf("pci%d:%d:%d ", bus, slot, func); 275f9feb091SKonstantin Belousov printf("BIOS bug: dmar%d RMRR " 276e02b05b3SKonstantin Belousov "region (%jx, %jx) corrected\n", 27759e37c8aSRuslan Bukin domain->iodom.iommu->unit, start, end); 278e02b05b3SKonstantin Belousov } 27940d951bcSKonstantin Belousov entry->end += IOMMU_PAGE_SIZE * 0x20; 280e02b05b3SKonstantin Belousov } 28186be9f0dSKonstantin Belousov size = OFF_TO_IDX(entry->end - entry->start); 28286be9f0dSKonstantin Belousov ma = malloc(sizeof(vm_page_t) * size, M_TEMP, M_WAITOK); 28386be9f0dSKonstantin Belousov for (i = 0; i < size; i++) { 28486be9f0dSKonstantin Belousov ma[i] = vm_page_getfake(entry->start + PAGE_SIZE * i, 28586be9f0dSKonstantin Belousov VM_MEMATTR_DEFAULT); 28686be9f0dSKonstantin Belousov } 28778b51754SRuslan Bukin error1 = iommu_gas_map_region(DOM2IODOM(domain), entry, 28859e37c8aSRuslan Bukin IOMMU_MAP_ENTRY_READ | IOMMU_MAP_ENTRY_WRITE, 28959e37c8aSRuslan Bukin IOMMU_MF_CANWAIT | IOMMU_MF_RMRR, ma); 29086be9f0dSKonstantin Belousov /* 29186be9f0dSKonstantin Belousov * Non-failed RMRR entries are owned by context rb 29286be9f0dSKonstantin Belousov * tree. Get rid of the failed entry, but do not stop 29386be9f0dSKonstantin Belousov * the loop. Rest of the parsed RMRR entries are 29486be9f0dSKonstantin Belousov * loaded and removed on the context destruction. 29586be9f0dSKonstantin Belousov */ 29686be9f0dSKonstantin Belousov if (error1 == 0 && entry->end != entry->start) { 29759e37c8aSRuslan Bukin IOMMU_LOCK(domain->iodom.iommu); 2981abfd355SKonstantin Belousov domain->refs++; /* XXXKIB prevent free */ 29915f6baf4SRuslan Bukin domain->iodom.flags |= IOMMU_DOMAIN_RMRR; 30059e37c8aSRuslan Bukin IOMMU_UNLOCK(domain->iodom.iommu); 30186be9f0dSKonstantin Belousov } else { 30286be9f0dSKonstantin Belousov if (error1 != 0) { 303f9feb091SKonstantin Belousov if (dev != NULL) 304f9feb091SKonstantin Belousov device_printf(dev, ""); 305f9feb091SKonstantin Belousov printf("pci%d:%d:%d ", bus, slot, func); 306f9feb091SKonstantin Belousov printf( 30786be9f0dSKonstantin Belousov "dmar%d failed to map RMRR region (%jx, %jx) %d\n", 30859e37c8aSRuslan Bukin domain->iodom.iommu->unit, start, end, 309f9feb091SKonstantin Belousov error1); 31086be9f0dSKonstantin Belousov error = error1; 31186be9f0dSKonstantin Belousov } 312db0110a5SAlan Cox TAILQ_REMOVE(&rmrr_entries, entry, dmamap_link); 3134670f908SAlan Cox iommu_gas_free_entry(entry); 31486be9f0dSKonstantin Belousov } 31586be9f0dSKonstantin Belousov for (i = 0; i < size; i++) 31686be9f0dSKonstantin Belousov vm_page_putfake(ma[i]); 31786be9f0dSKonstantin Belousov free(ma, M_TEMP); 31886be9f0dSKonstantin Belousov } 31986be9f0dSKonstantin Belousov return (error); 32086be9f0dSKonstantin Belousov } 32186be9f0dSKonstantin Belousov 322ee47a12aSRyan Libby /* 323ee47a12aSRyan Libby * PCI memory address space is shared between memory-mapped devices (MMIO) and 324ee47a12aSRyan Libby * host memory (which may be remapped by an IOMMU). Device accesses to an 325ee47a12aSRyan Libby * address within a memory aperture in a PCIe root port will be treated as 326ee47a12aSRyan Libby * peer-to-peer and not forwarded to an IOMMU. To avoid this, reserve the 327ee47a12aSRyan Libby * address space of the root port's memory apertures in the address space used 328ee47a12aSRyan Libby * by the IOMMU for remapping. 329ee47a12aSRyan Libby */ 330ee47a12aSRyan Libby static int 331ee47a12aSRyan Libby dmar_reserve_pci_regions(struct dmar_domain *domain, device_t dev) 332ee47a12aSRyan Libby { 333ee47a12aSRyan Libby struct iommu_domain *iodom; 334ee47a12aSRyan Libby device_t root; 335ee47a12aSRyan Libby uint32_t val; 336ee47a12aSRyan Libby uint64_t base, limit; 337ee47a12aSRyan Libby int error; 338ee47a12aSRyan Libby 339ee47a12aSRyan Libby iodom = DOM2IODOM(domain); 340ee47a12aSRyan Libby 341ee47a12aSRyan Libby root = pci_find_pcie_root_port(dev); 342ee47a12aSRyan Libby if (root == NULL) 343ee47a12aSRyan Libby return (0); 344ee47a12aSRyan Libby 345ee47a12aSRyan Libby /* Disable downstream memory */ 346ee47a12aSRyan Libby base = PCI_PPBMEMBASE(0, pci_read_config(root, PCIR_MEMBASE_1, 2)); 347ee47a12aSRyan Libby limit = PCI_PPBMEMLIMIT(0, pci_read_config(root, PCIR_MEMLIMIT_1, 2)); 348ee47a12aSRyan Libby error = iommu_gas_reserve_region_extend(iodom, base, limit + 1); 349ee47a12aSRyan Libby if (bootverbose || error != 0) 350ee47a12aSRyan Libby device_printf(dev, "DMAR reserve [%#jx-%#jx] (error %d)\n", 351ee47a12aSRyan Libby base, limit + 1, error); 352ee47a12aSRyan Libby if (error != 0) 353ee47a12aSRyan Libby return (error); 354ee47a12aSRyan Libby 355ee47a12aSRyan Libby /* Disable downstream prefetchable memory */ 356ee47a12aSRyan Libby val = pci_read_config(root, PCIR_PMBASEL_1, 2); 357ee47a12aSRyan Libby if (val != 0 || pci_read_config(root, PCIR_PMLIMITL_1, 2) != 0) { 358ee47a12aSRyan Libby if ((val & PCIM_BRPM_MASK) == PCIM_BRPM_64) { 359ee47a12aSRyan Libby base = PCI_PPBMEMBASE( 360ee47a12aSRyan Libby pci_read_config(root, PCIR_PMBASEH_1, 4), 361ee47a12aSRyan Libby val); 362ee47a12aSRyan Libby limit = PCI_PPBMEMLIMIT( 363ee47a12aSRyan Libby pci_read_config(root, PCIR_PMLIMITH_1, 4), 364ee47a12aSRyan Libby pci_read_config(root, PCIR_PMLIMITL_1, 2)); 365ee47a12aSRyan Libby } else { 366ee47a12aSRyan Libby base = PCI_PPBMEMBASE(0, val); 367ee47a12aSRyan Libby limit = PCI_PPBMEMLIMIT(0, 368ee47a12aSRyan Libby pci_read_config(root, PCIR_PMLIMITL_1, 2)); 369ee47a12aSRyan Libby } 370ee47a12aSRyan Libby error = iommu_gas_reserve_region_extend(iodom, base, 371ee47a12aSRyan Libby limit + 1); 372ee47a12aSRyan Libby if (bootverbose || error != 0) 373ee47a12aSRyan Libby device_printf(dev, "DMAR reserve [%#jx-%#jx] " 374ee47a12aSRyan Libby "(error %d)\n", base, limit + 1, error); 375ee47a12aSRyan Libby if (error != 0) 376ee47a12aSRyan Libby return (error); 377ee47a12aSRyan Libby } 378ee47a12aSRyan Libby 379ee47a12aSRyan Libby return (error); 380ee47a12aSRyan Libby } 381ee47a12aSRyan Libby 3821abfd355SKonstantin Belousov static struct dmar_domain * 3831abfd355SKonstantin Belousov dmar_domain_alloc(struct dmar_unit *dmar, bool id_mapped) 3841abfd355SKonstantin Belousov { 38562ad310cSRuslan Bukin struct iommu_domain *iodom; 38616696f60SRuslan Bukin struct iommu_unit *unit; 3871abfd355SKonstantin Belousov struct dmar_domain *domain; 3881abfd355SKonstantin Belousov int error, id, mgaw; 3891abfd355SKonstantin Belousov 3901abfd355SKonstantin Belousov id = alloc_unr(dmar->domids); 3911abfd355SKonstantin Belousov if (id == -1) 3921abfd355SKonstantin Belousov return (NULL); 3931abfd355SKonstantin Belousov domain = malloc(sizeof(*domain), M_DMAR_DOMAIN, M_WAITOK | M_ZERO); 39478b51754SRuslan Bukin iodom = DOM2IODOM(domain); 39516696f60SRuslan Bukin unit = DMAR2IOMMU(dmar); 3961abfd355SKonstantin Belousov domain->domain = id; 3971abfd355SKonstantin Belousov LIST_INIT(&domain->contexts); 39816696f60SRuslan Bukin iommu_domain_init(unit, iodom, &dmar_domain_map_ops); 39916696f60SRuslan Bukin 4001abfd355SKonstantin Belousov domain->dmar = dmar; 4011abfd355SKonstantin Belousov 4021abfd355SKonstantin Belousov /* 4031abfd355SKonstantin Belousov * For now, use the maximal usable physical address of the 4041abfd355SKonstantin Belousov * installed memory to calculate the mgaw on id_mapped domain. 4051abfd355SKonstantin Belousov * It is useful for the identity mapping, and less so for the 4061abfd355SKonstantin Belousov * virtualized bus address space. 4071abfd355SKonstantin Belousov */ 40862ad310cSRuslan Bukin domain->iodom.end = id_mapped ? ptoa(Maxmem) : BUS_SPACE_MAXADDR; 40962ad310cSRuslan Bukin mgaw = dmar_maxaddr2mgaw(dmar, domain->iodom.end, !id_mapped); 4101abfd355SKonstantin Belousov error = domain_set_agaw(domain, mgaw); 4111abfd355SKonstantin Belousov if (error != 0) 4121abfd355SKonstantin Belousov goto fail; 4131abfd355SKonstantin Belousov if (!id_mapped) 4141abfd355SKonstantin Belousov /* Use all supported address space for remapping. */ 41562ad310cSRuslan Bukin domain->iodom.end = 1ULL << (domain->agaw - 1); 4161abfd355SKonstantin Belousov 41778b51754SRuslan Bukin iommu_gas_init_domain(DOM2IODOM(domain)); 4181abfd355SKonstantin Belousov 4191abfd355SKonstantin Belousov if (id_mapped) { 4201abfd355SKonstantin Belousov if ((dmar->hw_ecap & DMAR_ECAP_PT) == 0) { 4211abfd355SKonstantin Belousov domain->pgtbl_obj = domain_get_idmap_pgtbl(domain, 42262ad310cSRuslan Bukin domain->iodom.end); 4231abfd355SKonstantin Belousov } 42415f6baf4SRuslan Bukin domain->iodom.flags |= IOMMU_DOMAIN_IDMAP; 4251abfd355SKonstantin Belousov } else { 4261abfd355SKonstantin Belousov error = domain_alloc_pgtbl(domain); 4271abfd355SKonstantin Belousov if (error != 0) 4281abfd355SKonstantin Belousov goto fail; 4291abfd355SKonstantin Belousov /* Disable local apic region access */ 43062ad310cSRuslan Bukin error = iommu_gas_reserve_region(iodom, 0xfee00000, 43194dfb28eSRuslan Bukin 0xfeefffff + 1, &iodom->msi_entry); 4321abfd355SKonstantin Belousov if (error != 0) 4331abfd355SKonstantin Belousov goto fail; 4341abfd355SKonstantin Belousov } 4351abfd355SKonstantin Belousov return (domain); 4361abfd355SKonstantin Belousov 4371abfd355SKonstantin Belousov fail: 4381abfd355SKonstantin Belousov dmar_domain_destroy(domain); 4391abfd355SKonstantin Belousov return (NULL); 4401abfd355SKonstantin Belousov } 4411abfd355SKonstantin Belousov 44286be9f0dSKonstantin Belousov static struct dmar_ctx * 4431abfd355SKonstantin Belousov dmar_ctx_alloc(struct dmar_domain *domain, uint16_t rid) 44486be9f0dSKonstantin Belousov { 44586be9f0dSKonstantin Belousov struct dmar_ctx *ctx; 44686be9f0dSKonstantin Belousov 44786be9f0dSKonstantin Belousov ctx = malloc(sizeof(*ctx), M_DMAR_CTX, M_WAITOK | M_ZERO); 44878b51754SRuslan Bukin ctx->context.domain = DOM2IODOM(domain); 44959e37c8aSRuslan Bukin ctx->context.tag = malloc(sizeof(struct bus_dma_tag_iommu), 45059e37c8aSRuslan Bukin M_DMAR_CTX, M_WAITOK | M_ZERO); 451cb9050ddSRuslan Bukin ctx->context.rid = rid; 4521abfd355SKonstantin Belousov ctx->refs = 1; 45386be9f0dSKonstantin Belousov return (ctx); 45486be9f0dSKonstantin Belousov } 45586be9f0dSKonstantin Belousov 45686be9f0dSKonstantin Belousov static void 4571abfd355SKonstantin Belousov dmar_ctx_link(struct dmar_ctx *ctx) 4581abfd355SKonstantin Belousov { 4591abfd355SKonstantin Belousov struct dmar_domain *domain; 4601abfd355SKonstantin Belousov 46178b51754SRuslan Bukin domain = CTX2DOM(ctx); 46259e37c8aSRuslan Bukin IOMMU_ASSERT_LOCKED(domain->iodom.iommu); 4631abfd355SKonstantin Belousov KASSERT(domain->refs >= domain->ctx_cnt, 4641abfd355SKonstantin Belousov ("dom %p ref underflow %d %d", domain, domain->refs, 4651abfd355SKonstantin Belousov domain->ctx_cnt)); 4661abfd355SKonstantin Belousov domain->refs++; 4671abfd355SKonstantin Belousov domain->ctx_cnt++; 4681abfd355SKonstantin Belousov LIST_INSERT_HEAD(&domain->contexts, ctx, link); 4691abfd355SKonstantin Belousov } 4701abfd355SKonstantin Belousov 4711abfd355SKonstantin Belousov static void 4721abfd355SKonstantin Belousov dmar_ctx_unlink(struct dmar_ctx *ctx) 4731abfd355SKonstantin Belousov { 4741abfd355SKonstantin Belousov struct dmar_domain *domain; 4751abfd355SKonstantin Belousov 47678b51754SRuslan Bukin domain = CTX2DOM(ctx); 47759e37c8aSRuslan Bukin IOMMU_ASSERT_LOCKED(domain->iodom.iommu); 4781abfd355SKonstantin Belousov KASSERT(domain->refs > 0, 4791abfd355SKonstantin Belousov ("domain %p ctx dtr refs %d", domain, domain->refs)); 4801abfd355SKonstantin Belousov KASSERT(domain->ctx_cnt >= domain->refs, 4811abfd355SKonstantin Belousov ("domain %p ctx dtr refs %d ctx_cnt %d", domain, 4821abfd355SKonstantin Belousov domain->refs, domain->ctx_cnt)); 4831abfd355SKonstantin Belousov domain->refs--; 4841abfd355SKonstantin Belousov domain->ctx_cnt--; 4851abfd355SKonstantin Belousov LIST_REMOVE(ctx, link); 4861abfd355SKonstantin Belousov } 4871abfd355SKonstantin Belousov 4881abfd355SKonstantin Belousov static void 4891abfd355SKonstantin Belousov dmar_domain_destroy(struct dmar_domain *domain) 49086be9f0dSKonstantin Belousov { 49116696f60SRuslan Bukin struct iommu_domain *iodom; 49259e37c8aSRuslan Bukin struct dmar_unit *dmar; 49386be9f0dSKonstantin Belousov 49416696f60SRuslan Bukin iodom = DOM2IODOM(domain); 49516696f60SRuslan Bukin 49659e37c8aSRuslan Bukin KASSERT(TAILQ_EMPTY(&domain->iodom.unload_entries), 4971abfd355SKonstantin Belousov ("unfinished unloads %p", domain)); 4981abfd355SKonstantin Belousov KASSERT(LIST_EMPTY(&domain->contexts), 4991abfd355SKonstantin Belousov ("destroying dom %p with contexts", domain)); 5001abfd355SKonstantin Belousov KASSERT(domain->ctx_cnt == 0, 5011abfd355SKonstantin Belousov ("destroying dom %p with ctx_cnt %d", domain, domain->ctx_cnt)); 5021abfd355SKonstantin Belousov KASSERT(domain->refs == 0, 5031abfd355SKonstantin Belousov ("destroying dom %p with refs %d", domain, domain->refs)); 50415f6baf4SRuslan Bukin if ((domain->iodom.flags & IOMMU_DOMAIN_GAS_INITED) != 0) { 5051abfd355SKonstantin Belousov DMAR_DOMAIN_LOCK(domain); 50616696f60SRuslan Bukin iommu_gas_fini_domain(iodom); 5071abfd355SKonstantin Belousov DMAR_DOMAIN_UNLOCK(domain); 50886be9f0dSKonstantin Belousov } 50915f6baf4SRuslan Bukin if ((domain->iodom.flags & IOMMU_DOMAIN_PGTBL_INITED) != 0) { 5101abfd355SKonstantin Belousov if (domain->pgtbl_obj != NULL) 5111abfd355SKonstantin Belousov DMAR_DOMAIN_PGLOCK(domain); 5121abfd355SKonstantin Belousov domain_free_pgtbl(domain); 51386be9f0dSKonstantin Belousov } 51416696f60SRuslan Bukin iommu_domain_fini(iodom); 51578b51754SRuslan Bukin dmar = DOM2DMAR(domain); 51659e37c8aSRuslan Bukin free_unr(dmar->domids, domain->domain); 5171abfd355SKonstantin Belousov free(domain, M_DMAR_DOMAIN); 51886be9f0dSKonstantin Belousov } 51986be9f0dSKonstantin Belousov 520f9feb091SKonstantin Belousov static struct dmar_ctx * 521f9feb091SKonstantin Belousov dmar_get_ctx_for_dev1(struct dmar_unit *dmar, device_t dev, uint16_t rid, 522f9feb091SKonstantin Belousov int dev_domain, int dev_busno, const void *dev_path, int dev_path_len, 5231abfd355SKonstantin Belousov bool id_mapped, bool rmrr_init) 52486be9f0dSKonstantin Belousov { 5251abfd355SKonstantin Belousov struct dmar_domain *domain, *domain1; 52686be9f0dSKonstantin Belousov struct dmar_ctx *ctx, *ctx1; 527661bd70bSKonstantin Belousov struct iommu_unit *unit __diagused; 52886be9f0dSKonstantin Belousov dmar_ctx_entry_t *ctxp; 52986be9f0dSKonstantin Belousov struct sf_buf *sf; 5301abfd355SKonstantin Belousov int bus, slot, func, error; 53186be9f0dSKonstantin Belousov bool enable; 53286be9f0dSKonstantin Belousov 533f9feb091SKonstantin Belousov if (dev != NULL) { 53467499354SRyan Stone bus = pci_get_bus(dev); 53567499354SRyan Stone slot = pci_get_slot(dev); 53667499354SRyan Stone func = pci_get_function(dev); 537f9feb091SKonstantin Belousov } else { 538f9feb091SKonstantin Belousov bus = PCI_RID2BUS(rid); 539f9feb091SKonstantin Belousov slot = PCI_RID2SLOT(rid); 540f9feb091SKonstantin Belousov func = PCI_RID2FUNC(rid); 541f9feb091SKonstantin Belousov } 54286be9f0dSKonstantin Belousov enable = false; 54386be9f0dSKonstantin Belousov TD_PREP_PINNED_ASSERT; 54478b51754SRuslan Bukin unit = DMAR2IOMMU(dmar); 54586be9f0dSKonstantin Belousov DMAR_LOCK(dmar); 546ea4c0115SRuslan Bukin KASSERT(!iommu_is_buswide_ctx(unit, bus) || (slot == 0 && func == 0), 547ea4c0115SRuslan Bukin ("iommu%d pci%d:%d:%d get_ctx for buswide", dmar->iommu.unit, bus, 548685666aaSKonstantin Belousov slot, func)); 54967499354SRyan Stone ctx = dmar_find_ctx_locked(dmar, rid); 55086be9f0dSKonstantin Belousov error = 0; 55186be9f0dSKonstantin Belousov if (ctx == NULL) { 55286be9f0dSKonstantin Belousov /* 55386be9f0dSKonstantin Belousov * Perform the allocations which require sleep or have 55486be9f0dSKonstantin Belousov * higher chance to succeed if the sleep is allowed. 55586be9f0dSKonstantin Belousov */ 55686be9f0dSKonstantin Belousov DMAR_UNLOCK(dmar); 557b29d186cSKonstantin Belousov dmar_ensure_ctx_page(dmar, PCI_RID2BUS(rid)); 5581abfd355SKonstantin Belousov domain1 = dmar_domain_alloc(dmar, id_mapped); 5591abfd355SKonstantin Belousov if (domain1 == NULL) { 56086be9f0dSKonstantin Belousov TD_PINNED_ASSERT; 56186be9f0dSKonstantin Belousov return (NULL); 56286be9f0dSKonstantin Belousov } 5635f8e5c7fSKonstantin Belousov if (!id_mapped) { 564f9feb091SKonstantin Belousov error = domain_init_rmrr(domain1, dev, bus, 565f9feb091SKonstantin Belousov slot, func, dev_domain, dev_busno, dev_path, 566f9feb091SKonstantin Belousov dev_path_len); 5673c02da80SKornel Duleba if (error == 0 && dev != NULL) 568ee47a12aSRyan Libby error = dmar_reserve_pci_regions(domain1, dev); 56986be9f0dSKonstantin Belousov if (error != 0) { 5701abfd355SKonstantin Belousov dmar_domain_destroy(domain1); 57186be9f0dSKonstantin Belousov TD_PINNED_ASSERT; 57286be9f0dSKonstantin Belousov return (NULL); 57386be9f0dSKonstantin Belousov } 5745f8e5c7fSKonstantin Belousov } 5751abfd355SKonstantin Belousov ctx1 = dmar_ctx_alloc(domain1, rid); 57686be9f0dSKonstantin Belousov ctxp = dmar_map_ctx_entry(ctx1, &sf); 57786be9f0dSKonstantin Belousov DMAR_LOCK(dmar); 57886be9f0dSKonstantin Belousov 57986be9f0dSKonstantin Belousov /* 58086be9f0dSKonstantin Belousov * Recheck the contexts, other thread might have 58186be9f0dSKonstantin Belousov * already allocated needed one. 58286be9f0dSKonstantin Belousov */ 58367499354SRyan Stone ctx = dmar_find_ctx_locked(dmar, rid); 58486be9f0dSKonstantin Belousov if (ctx == NULL) { 5851abfd355SKonstantin Belousov domain = domain1; 58686be9f0dSKonstantin Belousov ctx = ctx1; 5871abfd355SKonstantin Belousov dmar_ctx_link(ctx); 58859e37c8aSRuslan Bukin ctx->context.tag->owner = dev; 58959e37c8aSRuslan Bukin device_tag_init(ctx, dev); 59086be9f0dSKonstantin Belousov 59186be9f0dSKonstantin Belousov /* 59286be9f0dSKonstantin Belousov * This is the first activated context for the 59386be9f0dSKonstantin Belousov * DMAR unit. Enable the translation after 59486be9f0dSKonstantin Belousov * everything is set up. 59586be9f0dSKonstantin Belousov */ 5961abfd355SKonstantin Belousov if (LIST_EMPTY(&dmar->domains)) 59786be9f0dSKonstantin Belousov enable = true; 5981abfd355SKonstantin Belousov LIST_INSERT_HEAD(&dmar->domains, domain, link); 599685666aaSKonstantin Belousov ctx_id_entry_init(ctx, ctxp, false, bus); 600f9feb091SKonstantin Belousov if (dev != NULL) { 60186be9f0dSKonstantin Belousov device_printf(dev, 60234e8337bSKonstantin Belousov "dmar%d pci%d:%d:%d:%d rid %x domain %d mgaw %d " 6039d0bc6d8SKonstantin Belousov "agaw %d %s-mapped\n", 60459e37c8aSRuslan Bukin dmar->iommu.unit, dmar->segment, bus, slot, 6051abfd355SKonstantin Belousov func, rid, domain->domain, domain->mgaw, 6061abfd355SKonstantin Belousov domain->agaw, id_mapped ? "id" : "re"); 607f9feb091SKonstantin Belousov } 60840d951bcSKonstantin Belousov iommu_unmap_pgtbl(sf); 60986be9f0dSKonstantin Belousov } else { 61040d951bcSKonstantin Belousov iommu_unmap_pgtbl(sf); 6111abfd355SKonstantin Belousov dmar_domain_destroy(domain1); 6123d47c58bSKonstantin Belousov /* Nothing needs to be done to destroy ctx1. */ 6133d47c58bSKonstantin Belousov free(ctx1, M_DMAR_CTX); 61478b51754SRuslan Bukin domain = CTX2DOM(ctx); 6151abfd355SKonstantin Belousov ctx->refs++; /* tag referenced us */ 61686be9f0dSKonstantin Belousov } 61768eeb96aSKonstantin Belousov } else { 61878b51754SRuslan Bukin domain = CTX2DOM(ctx); 61959e37c8aSRuslan Bukin if (ctx->context.tag->owner == NULL) 62059e37c8aSRuslan Bukin ctx->context.tag->owner = dev; 6211abfd355SKonstantin Belousov ctx->refs++; /* tag referenced us */ 6221abfd355SKonstantin Belousov } 6231abfd355SKonstantin Belousov 6241abfd355SKonstantin Belousov error = dmar_flush_for_ctx_entry(dmar, enable); 62586be9f0dSKonstantin Belousov if (error != 0) { 62686be9f0dSKonstantin Belousov dmar_free_ctx_locked(dmar, ctx); 62786be9f0dSKonstantin Belousov TD_PINNED_ASSERT; 62886be9f0dSKonstantin Belousov return (NULL); 62986be9f0dSKonstantin Belousov } 63068eeb96aSKonstantin Belousov 63168eeb96aSKonstantin Belousov /* 63268eeb96aSKonstantin Belousov * The dmar lock was potentially dropped between check for the 63368eeb96aSKonstantin Belousov * empty context list and now. Recheck the state of GCMD_TE 63468eeb96aSKonstantin Belousov * to avoid unneeded command. 63568eeb96aSKonstantin Belousov */ 63668eeb96aSKonstantin Belousov if (enable && !rmrr_init && (dmar->hw_gcmd & DMAR_GCMD_TE) == 0) { 63706e6ca6dSKornel Duleba error = dmar_disable_protected_regions(dmar); 63806e6ca6dSKornel Duleba if (error != 0) 63906e6ca6dSKornel Duleba printf("dmar%d: Failed to disable protected regions\n", 64006e6ca6dSKornel Duleba dmar->iommu.unit); 64186be9f0dSKonstantin Belousov error = dmar_enable_translation(dmar); 642f9feb091SKonstantin Belousov if (error == 0) { 643f9feb091SKonstantin Belousov if (bootverbose) { 644f9feb091SKonstantin Belousov printf("dmar%d: enabled translation\n", 64559e37c8aSRuslan Bukin dmar->iommu.unit); 646f9feb091SKonstantin Belousov } 647f9feb091SKonstantin Belousov } else { 648f9feb091SKonstantin Belousov printf("dmar%d: enabling translation failed, " 64959e37c8aSRuslan Bukin "error %d\n", dmar->iommu.unit, error); 65086be9f0dSKonstantin Belousov dmar_free_ctx_locked(dmar, ctx); 65186be9f0dSKonstantin Belousov TD_PINNED_ASSERT; 65286be9f0dSKonstantin Belousov return (NULL); 65386be9f0dSKonstantin Belousov } 65486be9f0dSKonstantin Belousov } 65586be9f0dSKonstantin Belousov DMAR_UNLOCK(dmar); 65686be9f0dSKonstantin Belousov TD_PINNED_ASSERT; 65786be9f0dSKonstantin Belousov return (ctx); 65886be9f0dSKonstantin Belousov } 65986be9f0dSKonstantin Belousov 660f9feb091SKonstantin Belousov struct dmar_ctx * 661f9feb091SKonstantin Belousov dmar_get_ctx_for_dev(struct dmar_unit *dmar, device_t dev, uint16_t rid, 662f9feb091SKonstantin Belousov bool id_mapped, bool rmrr_init) 663f9feb091SKonstantin Belousov { 664f9feb091SKonstantin Belousov int dev_domain, dev_path_len, dev_busno; 665f9feb091SKonstantin Belousov 666f9feb091SKonstantin Belousov dev_domain = pci_get_domain(dev); 667f9feb091SKonstantin Belousov dev_path_len = dmar_dev_depth(dev); 668f9feb091SKonstantin Belousov ACPI_DMAR_PCI_PATH dev_path[dev_path_len]; 669f9feb091SKonstantin Belousov dmar_dev_path(dev, &dev_busno, dev_path, dev_path_len); 670f9feb091SKonstantin Belousov return (dmar_get_ctx_for_dev1(dmar, dev, rid, dev_domain, dev_busno, 671f9feb091SKonstantin Belousov dev_path, dev_path_len, id_mapped, rmrr_init)); 672f9feb091SKonstantin Belousov } 673f9feb091SKonstantin Belousov 674f9feb091SKonstantin Belousov struct dmar_ctx * 675f9feb091SKonstantin Belousov dmar_get_ctx_for_devpath(struct dmar_unit *dmar, uint16_t rid, 676f9feb091SKonstantin Belousov int dev_domain, int dev_busno, 677f9feb091SKonstantin Belousov const void *dev_path, int dev_path_len, 678f9feb091SKonstantin Belousov bool id_mapped, bool rmrr_init) 679f9feb091SKonstantin Belousov { 680f9feb091SKonstantin Belousov 681f9feb091SKonstantin Belousov return (dmar_get_ctx_for_dev1(dmar, NULL, rid, dev_domain, dev_busno, 682f9feb091SKonstantin Belousov dev_path, dev_path_len, id_mapped, rmrr_init)); 683f9feb091SKonstantin Belousov } 684f9feb091SKonstantin Belousov 6851abfd355SKonstantin Belousov int 6861abfd355SKonstantin Belousov dmar_move_ctx_to_domain(struct dmar_domain *domain, struct dmar_ctx *ctx) 6871abfd355SKonstantin Belousov { 6881abfd355SKonstantin Belousov struct dmar_unit *dmar; 6891abfd355SKonstantin Belousov struct dmar_domain *old_domain; 6901abfd355SKonstantin Belousov dmar_ctx_entry_t *ctxp; 6911abfd355SKonstantin Belousov struct sf_buf *sf; 6921abfd355SKonstantin Belousov int error; 6931abfd355SKonstantin Belousov 6941abfd355SKonstantin Belousov dmar = domain->dmar; 69578b51754SRuslan Bukin old_domain = CTX2DOM(ctx); 6961abfd355SKonstantin Belousov if (domain == old_domain) 6971abfd355SKonstantin Belousov return (0); 69859e37c8aSRuslan Bukin KASSERT(old_domain->iodom.iommu == domain->iodom.iommu, 6991abfd355SKonstantin Belousov ("domain %p %u moving between dmars %u %u", domain, 70059e37c8aSRuslan Bukin domain->domain, old_domain->iodom.iommu->unit, 70159e37c8aSRuslan Bukin domain->iodom.iommu->unit)); 7021abfd355SKonstantin Belousov TD_PREP_PINNED_ASSERT; 7031abfd355SKonstantin Belousov 7041abfd355SKonstantin Belousov ctxp = dmar_map_ctx_entry(ctx, &sf); 7051abfd355SKonstantin Belousov DMAR_LOCK(dmar); 7061abfd355SKonstantin Belousov dmar_ctx_unlink(ctx); 70759e37c8aSRuslan Bukin ctx->context.domain = &domain->iodom; 7081abfd355SKonstantin Belousov dmar_ctx_link(ctx); 709685666aaSKonstantin Belousov ctx_id_entry_init(ctx, ctxp, true, PCI_BUSMAX + 100); 71040d951bcSKonstantin Belousov iommu_unmap_pgtbl(sf); 7111abfd355SKonstantin Belousov error = dmar_flush_for_ctx_entry(dmar, true); 7121abfd355SKonstantin Belousov /* If flush failed, rolling back would not work as well. */ 7131abfd355SKonstantin Belousov printf("dmar%d rid %x domain %d->%d %s-mapped\n", 714cb9050ddSRuslan Bukin dmar->iommu.unit, ctx->context.rid, old_domain->domain, 715cb9050ddSRuslan Bukin domain->domain, (domain->iodom.flags & IOMMU_DOMAIN_IDMAP) != 0 ? 716cb9050ddSRuslan Bukin "id" : "re"); 7171abfd355SKonstantin Belousov dmar_unref_domain_locked(dmar, old_domain); 7181abfd355SKonstantin Belousov TD_PINNED_ASSERT; 7191abfd355SKonstantin Belousov return (error); 7201abfd355SKonstantin Belousov } 7211abfd355SKonstantin Belousov 7221abfd355SKonstantin Belousov static void 7231abfd355SKonstantin Belousov dmar_unref_domain_locked(struct dmar_unit *dmar, struct dmar_domain *domain) 7241abfd355SKonstantin Belousov { 7251abfd355SKonstantin Belousov 7261abfd355SKonstantin Belousov DMAR_ASSERT_LOCKED(dmar); 7271abfd355SKonstantin Belousov KASSERT(domain->refs >= 1, 72859e37c8aSRuslan Bukin ("dmar %d domain %p refs %u", dmar->iommu.unit, domain, 72959e37c8aSRuslan Bukin domain->refs)); 7301abfd355SKonstantin Belousov KASSERT(domain->refs > domain->ctx_cnt, 73159e37c8aSRuslan Bukin ("dmar %d domain %p refs %d ctx_cnt %d", dmar->iommu.unit, domain, 7321abfd355SKonstantin Belousov domain->refs, domain->ctx_cnt)); 7331abfd355SKonstantin Belousov 7341abfd355SKonstantin Belousov if (domain->refs > 1) { 7351abfd355SKonstantin Belousov domain->refs--; 7361abfd355SKonstantin Belousov DMAR_UNLOCK(dmar); 7371abfd355SKonstantin Belousov return; 7381abfd355SKonstantin Belousov } 7391abfd355SKonstantin Belousov 74015f6baf4SRuslan Bukin KASSERT((domain->iodom.flags & IOMMU_DOMAIN_RMRR) == 0, 7411abfd355SKonstantin Belousov ("lost ref on RMRR domain %p", domain)); 7421abfd355SKonstantin Belousov 7431abfd355SKonstantin Belousov LIST_REMOVE(domain, link); 7441abfd355SKonstantin Belousov DMAR_UNLOCK(dmar); 7451abfd355SKonstantin Belousov 74659e37c8aSRuslan Bukin taskqueue_drain(dmar->iommu.delayed_taskqueue, 74759e37c8aSRuslan Bukin &domain->iodom.unload_task); 7481abfd355SKonstantin Belousov dmar_domain_destroy(domain); 7491abfd355SKonstantin Belousov } 7501abfd355SKonstantin Belousov 751*65b133e5SKonstantin Belousov static void 75286be9f0dSKonstantin Belousov dmar_free_ctx_locked(struct dmar_unit *dmar, struct dmar_ctx *ctx) 75386be9f0dSKonstantin Belousov { 75486be9f0dSKonstantin Belousov struct sf_buf *sf; 75586be9f0dSKonstantin Belousov dmar_ctx_entry_t *ctxp; 7561abfd355SKonstantin Belousov struct dmar_domain *domain; 75786be9f0dSKonstantin Belousov 75886be9f0dSKonstantin Belousov DMAR_ASSERT_LOCKED(dmar); 75986be9f0dSKonstantin Belousov KASSERT(ctx->refs >= 1, 76086be9f0dSKonstantin Belousov ("dmar %p ctx %p refs %u", dmar, ctx, ctx->refs)); 76186be9f0dSKonstantin Belousov 76286be9f0dSKonstantin Belousov /* 76386be9f0dSKonstantin Belousov * If our reference is not last, only the dereference should 76486be9f0dSKonstantin Belousov * be performed. 76586be9f0dSKonstantin Belousov */ 76686be9f0dSKonstantin Belousov if (ctx->refs > 1) { 76786be9f0dSKonstantin Belousov ctx->refs--; 76886be9f0dSKonstantin Belousov DMAR_UNLOCK(dmar); 76986be9f0dSKonstantin Belousov return; 77086be9f0dSKonstantin Belousov } 77186be9f0dSKonstantin Belousov 77259e37c8aSRuslan Bukin KASSERT((ctx->context.flags & IOMMU_CTX_DISABLED) == 0, 77386be9f0dSKonstantin Belousov ("lost ref on disabled ctx %p", ctx)); 77486be9f0dSKonstantin Belousov 77586be9f0dSKonstantin Belousov /* 77686be9f0dSKonstantin Belousov * Otherwise, the context entry must be cleared before the 77786be9f0dSKonstantin Belousov * page table is destroyed. The mapping of the context 77886be9f0dSKonstantin Belousov * entries page could require sleep, unlock the dmar. 77986be9f0dSKonstantin Belousov */ 78086be9f0dSKonstantin Belousov DMAR_UNLOCK(dmar); 78186be9f0dSKonstantin Belousov TD_PREP_PINNED_ASSERT; 78286be9f0dSKonstantin Belousov ctxp = dmar_map_ctx_entry(ctx, &sf); 78386be9f0dSKonstantin Belousov DMAR_LOCK(dmar); 78486be9f0dSKonstantin Belousov KASSERT(ctx->refs >= 1, 78586be9f0dSKonstantin Belousov ("dmar %p ctx %p refs %u", dmar, ctx, ctx->refs)); 78686be9f0dSKonstantin Belousov 78786be9f0dSKonstantin Belousov /* 78886be9f0dSKonstantin Belousov * Other thread might have referenced the context, in which 78986be9f0dSKonstantin Belousov * case again only the dereference should be performed. 79086be9f0dSKonstantin Belousov */ 79186be9f0dSKonstantin Belousov if (ctx->refs > 1) { 79286be9f0dSKonstantin Belousov ctx->refs--; 79386be9f0dSKonstantin Belousov DMAR_UNLOCK(dmar); 79440d951bcSKonstantin Belousov iommu_unmap_pgtbl(sf); 79586be9f0dSKonstantin Belousov TD_PINNED_ASSERT; 79686be9f0dSKonstantin Belousov return; 79786be9f0dSKonstantin Belousov } 79886be9f0dSKonstantin Belousov 79959e37c8aSRuslan Bukin KASSERT((ctx->context.flags & IOMMU_CTX_DISABLED) == 0, 80086be9f0dSKonstantin Belousov ("lost ref on disabled ctx %p", ctx)); 80186be9f0dSKonstantin Belousov 80286be9f0dSKonstantin Belousov /* 80386be9f0dSKonstantin Belousov * Clear the context pointer and flush the caches. 80486be9f0dSKonstantin Belousov * XXXKIB: cannot do this if any RMRR entries are still present. 80586be9f0dSKonstantin Belousov */ 80686be9f0dSKonstantin Belousov dmar_pte_clear(&ctxp->ctx1); 80786be9f0dSKonstantin Belousov ctxp->ctx2 = 0; 8086b7c46afSKonstantin Belousov dmar_flush_ctx_to_ram(dmar, ctxp); 80986be9f0dSKonstantin Belousov dmar_inv_ctx_glob(dmar); 81068eeb96aSKonstantin Belousov if ((dmar->hw_ecap & DMAR_ECAP_DI) != 0) { 81168eeb96aSKonstantin Belousov if (dmar->qi_enabled) 81268eeb96aSKonstantin Belousov dmar_qi_invalidate_iotlb_glob_locked(dmar); 81368eeb96aSKonstantin Belousov else 81486be9f0dSKonstantin Belousov dmar_inv_iotlb_glob(dmar); 81568eeb96aSKonstantin Belousov } 81640d951bcSKonstantin Belousov iommu_unmap_pgtbl(sf); 81778b51754SRuslan Bukin domain = CTX2DOM(ctx); 8181abfd355SKonstantin Belousov dmar_ctx_unlink(ctx); 81959e37c8aSRuslan Bukin free(ctx->context.tag, M_DMAR_CTX); 8201abfd355SKonstantin Belousov free(ctx, M_DMAR_CTX); 8211abfd355SKonstantin Belousov dmar_unref_domain_locked(dmar, domain); 82286be9f0dSKonstantin Belousov TD_PINNED_ASSERT; 82386be9f0dSKonstantin Belousov } 82486be9f0dSKonstantin Belousov 825*65b133e5SKonstantin Belousov static void 82686be9f0dSKonstantin Belousov dmar_free_ctx(struct dmar_ctx *ctx) 82786be9f0dSKonstantin Belousov { 82886be9f0dSKonstantin Belousov struct dmar_unit *dmar; 82986be9f0dSKonstantin Belousov 83078b51754SRuslan Bukin dmar = CTX2DMAR(ctx); 83186be9f0dSKonstantin Belousov DMAR_LOCK(dmar); 83286be9f0dSKonstantin Belousov dmar_free_ctx_locked(dmar, ctx); 83386be9f0dSKonstantin Belousov } 83486be9f0dSKonstantin Belousov 8351abfd355SKonstantin Belousov /* 8361abfd355SKonstantin Belousov * Returns with the domain locked. 8371abfd355SKonstantin Belousov */ 83886be9f0dSKonstantin Belousov struct dmar_ctx * 83967499354SRyan Stone dmar_find_ctx_locked(struct dmar_unit *dmar, uint16_t rid) 84086be9f0dSKonstantin Belousov { 8411abfd355SKonstantin Belousov struct dmar_domain *domain; 84286be9f0dSKonstantin Belousov struct dmar_ctx *ctx; 84386be9f0dSKonstantin Belousov 84486be9f0dSKonstantin Belousov DMAR_ASSERT_LOCKED(dmar); 84586be9f0dSKonstantin Belousov 8461abfd355SKonstantin Belousov LIST_FOREACH(domain, &dmar->domains, link) { 8471abfd355SKonstantin Belousov LIST_FOREACH(ctx, &domain->contexts, link) { 848cb9050ddSRuslan Bukin if (ctx->context.rid == rid) 84986be9f0dSKonstantin Belousov return (ctx); 85086be9f0dSKonstantin Belousov } 8511abfd355SKonstantin Belousov } 85286be9f0dSKonstantin Belousov return (NULL); 85386be9f0dSKonstantin Belousov } 85486be9f0dSKonstantin Belousov 85586be9f0dSKonstantin Belousov void 85659e37c8aSRuslan Bukin dmar_domain_free_entry(struct iommu_map_entry *entry, bool free) 85768eeb96aSKonstantin Belousov { 85859e37c8aSRuslan Bukin if ((entry->flags & IOMMU_MAP_ENTRY_RMRR) != 0) 8594670f908SAlan Cox iommu_gas_free_region(entry); 86068eeb96aSKonstantin Belousov else 8614670f908SAlan Cox iommu_gas_free_space(entry); 86268eeb96aSKonstantin Belousov if (free) 8634670f908SAlan Cox iommu_gas_free_entry(entry); 86468eeb96aSKonstantin Belousov else 86568eeb96aSKonstantin Belousov entry->flags = 0; 86668eeb96aSKonstantin Belousov } 86768eeb96aSKonstantin Belousov 86842736dc4SAlan Cox /* 86942736dc4SAlan Cox * If the given value for "free" is true, then the caller must not be using 87042736dc4SAlan Cox * the entry's dmamap_link field. 87142736dc4SAlan Cox */ 87268eeb96aSKonstantin Belousov void 873*65b133e5SKonstantin Belousov dmar_domain_unload_entry(struct iommu_map_entry *entry, bool free, 8748bc36738SAlan Cox bool cansleep) 87568eeb96aSKonstantin Belousov { 87659e37c8aSRuslan Bukin struct dmar_domain *domain; 87768eeb96aSKonstantin Belousov struct dmar_unit *unit; 87868eeb96aSKonstantin Belousov 87978b51754SRuslan Bukin domain = IODOM2DOM(entry->domain); 88078b51754SRuslan Bukin unit = DOM2DMAR(domain); 8818bc36738SAlan Cox 8828bc36738SAlan Cox /* 8838bc36738SAlan Cox * If "free" is false, then the IOTLB invalidation must be performed 8848bc36738SAlan Cox * synchronously. Otherwise, the caller might free the entry before 8858bc36738SAlan Cox * dmar_qi_task() is finished processing it. 8868bc36738SAlan Cox */ 88768eeb96aSKonstantin Belousov if (unit->qi_enabled) { 8888bc36738SAlan Cox if (free) { 889c2515634SAlan Cox DMAR_LOCK(unit); 89042736dc4SAlan Cox dmar_qi_invalidate_locked(domain, entry, true); 89168eeb96aSKonstantin Belousov DMAR_UNLOCK(unit); 89268eeb96aSKonstantin Belousov } else { 893c2515634SAlan Cox dmar_qi_invalidate_sync(domain, entry->start, 894c2515634SAlan Cox entry->end - entry->start, cansleep); 895c2515634SAlan Cox dmar_domain_free_entry(entry, false); 896c2515634SAlan Cox } 897c2515634SAlan Cox } else { 8988bc36738SAlan Cox domain_flush_iotlb_sync(domain, entry->start, entry->end - 8998bc36738SAlan Cox entry->start); 9001abfd355SKonstantin Belousov dmar_domain_free_entry(entry, free); 90168eeb96aSKonstantin Belousov } 90268eeb96aSKonstantin Belousov } 90368eeb96aSKonstantin Belousov 904cf619a92SKonstantin Belousov static bool 905cf619a92SKonstantin Belousov dmar_domain_unload_emit_wait(struct dmar_domain *domain, 90659e37c8aSRuslan Bukin struct iommu_map_entry *entry) 907e164cafcSKonstantin Belousov { 908e164cafcSKonstantin Belousov 909cf619a92SKonstantin Belousov if (TAILQ_NEXT(entry, dmamap_link) == NULL) 910cf619a92SKonstantin Belousov return (true); 911cf619a92SKonstantin Belousov return (domain->batch_no++ % dmar_batch_coalesce == 0); 912e164cafcSKonstantin Belousov } 913e164cafcSKonstantin Belousov 91468eeb96aSKonstantin Belousov void 915*65b133e5SKonstantin Belousov dmar_domain_unload(struct iommu_domain *iodom, 91659e37c8aSRuslan Bukin struct iommu_map_entries_tailq *entries, bool cansleep) 91786be9f0dSKonstantin Belousov { 918da55f86cSAlan Cox struct dmar_domain *domain; 91968eeb96aSKonstantin Belousov struct dmar_unit *unit; 92059e37c8aSRuslan Bukin struct iommu_map_entry *entry, *entry1; 921661bd70bSKonstantin Belousov int error __diagused; 92286be9f0dSKonstantin Belousov 923da55f86cSAlan Cox domain = IODOM2DOM(iodom); 92478b51754SRuslan Bukin unit = DOM2DMAR(domain); 92568eeb96aSKonstantin Belousov 92668eeb96aSKonstantin Belousov TAILQ_FOREACH_SAFE(entry, entries, dmamap_link, entry1) { 92759e37c8aSRuslan Bukin KASSERT((entry->flags & IOMMU_MAP_ENTRY_MAP) != 0, 9281abfd355SKonstantin Belousov ("not mapped entry %p %p", domain, entry)); 9290eed04c8SRuslan Bukin error = iodom->ops->unmap(iodom, entry->start, entry->end - 93015f6baf4SRuslan Bukin entry->start, cansleep ? IOMMU_PGF_WAITOK : 0); 9311abfd355SKonstantin Belousov KASSERT(error == 0, ("unmap %p error %d", domain, error)); 93268eeb96aSKonstantin Belousov if (!unit->qi_enabled) { 9331abfd355SKonstantin Belousov domain_flush_iotlb_sync(domain, entry->start, 93468eeb96aSKonstantin Belousov entry->end - entry->start); 93568eeb96aSKonstantin Belousov TAILQ_REMOVE(entries, entry, dmamap_link); 9361abfd355SKonstantin Belousov dmar_domain_free_entry(entry, true); 93786be9f0dSKonstantin Belousov } 93886be9f0dSKonstantin Belousov } 93968eeb96aSKonstantin Belousov if (TAILQ_EMPTY(entries)) 94068eeb96aSKonstantin Belousov return; 94168eeb96aSKonstantin Belousov 94268eeb96aSKonstantin Belousov KASSERT(unit->qi_enabled, ("loaded entry left")); 94368eeb96aSKonstantin Belousov DMAR_LOCK(unit); 94442736dc4SAlan Cox while ((entry = TAILQ_FIRST(entries)) != NULL) { 94542736dc4SAlan Cox TAILQ_REMOVE(entries, entry, dmamap_link); 94642736dc4SAlan Cox dmar_qi_invalidate_locked(domain, entry, 947cf619a92SKonstantin Belousov dmar_domain_unload_emit_wait(domain, entry)); 94868eeb96aSKonstantin Belousov } 94968eeb96aSKonstantin Belousov DMAR_UNLOCK(unit); 95068eeb96aSKonstantin Belousov } 95186be9f0dSKonstantin Belousov 95259e37c8aSRuslan Bukin struct iommu_ctx * 953*65b133e5SKonstantin Belousov dmar_get_ctx(struct iommu_unit *iommu, device_t dev, uint16_t rid, 95459e37c8aSRuslan Bukin bool id_mapped, bool rmrr_init) 95559e37c8aSRuslan Bukin { 95659e37c8aSRuslan Bukin struct dmar_unit *dmar; 95759e37c8aSRuslan Bukin struct dmar_ctx *ret; 95859e37c8aSRuslan Bukin 95978b51754SRuslan Bukin dmar = IOMMU2DMAR(iommu); 96059e37c8aSRuslan Bukin ret = dmar_get_ctx_for_dev(dmar, dev, rid, id_mapped, rmrr_init); 96178b51754SRuslan Bukin return (CTX2IOCTX(ret)); 96259e37c8aSRuslan Bukin } 96359e37c8aSRuslan Bukin 96459e37c8aSRuslan Bukin void 965*65b133e5SKonstantin Belousov dmar_free_ctx_locked_method(struct iommu_unit *iommu, 966*65b133e5SKonstantin Belousov struct iommu_ctx *context) 96759e37c8aSRuslan Bukin { 96859e37c8aSRuslan Bukin struct dmar_unit *dmar; 96959e37c8aSRuslan Bukin struct dmar_ctx *ctx; 97059e37c8aSRuslan Bukin 97178b51754SRuslan Bukin dmar = IOMMU2DMAR(iommu); 97278b51754SRuslan Bukin ctx = IOCTX2CTX(context); 97359e37c8aSRuslan Bukin dmar_free_ctx_locked(dmar, ctx); 97459e37c8aSRuslan Bukin } 97559e37c8aSRuslan Bukin 97659e37c8aSRuslan Bukin void 977*65b133e5SKonstantin Belousov dmar_free_ctx_method(struct iommu_ctx *context) 97859e37c8aSRuslan Bukin { 97959e37c8aSRuslan Bukin struct dmar_ctx *ctx; 98059e37c8aSRuslan Bukin 98178b51754SRuslan Bukin ctx = IOCTX2CTX(context); 98259e37c8aSRuslan Bukin dmar_free_ctx(ctx); 98359e37c8aSRuslan Bukin } 984