xref: /freebsd/sys/x86/iommu/intel_qi.c (revision b43b8f81578cbb7bddbd6f7b8ebe06a219c88140)
1 /*-
2  * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
3  *
4  * Copyright (c) 2013 The FreeBSD Foundation
5  *
6  * This software was developed by Konstantin Belousov <kib@FreeBSD.org>
7  * under sponsorship from the FreeBSD Foundation.
8  *
9  * Redistribution and use in source and binary forms, with or without
10  * modification, are permitted provided that the following conditions
11  * are met:
12  * 1. Redistributions of source code must retain the above copyright
13  *    notice, this list of conditions and the following disclaimer.
14  * 2. Redistributions in binary form must reproduce the above copyright
15  *    notice, this list of conditions and the following disclaimer in the
16  *    documentation and/or other materials provided with the distribution.
17  *
18  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
19  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
20  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
21  * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
22  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
23  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
24  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
25  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
26  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
27  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
28  * SUCH DAMAGE.
29  */
30 
31 #include <sys/cdefs.h>
32 __FBSDID("$FreeBSD$");
33 
34 #include "opt_acpi.h"
35 
36 #include <sys/param.h>
37 #include <sys/bus.h>
38 #include <sys/kernel.h>
39 #include <sys/malloc.h>
40 #include <sys/memdesc.h>
41 #include <sys/module.h>
42 #include <sys/rman.h>
43 #include <sys/taskqueue.h>
44 #include <sys/time.h>
45 #include <sys/tree.h>
46 #include <sys/vmem.h>
47 #include <vm/vm.h>
48 #include <vm/vm_extern.h>
49 #include <vm/vm_kern.h>
50 #include <vm/vm_page.h>
51 #include <vm/vm_map.h>
52 #include <contrib/dev/acpica/include/acpi.h>
53 #include <contrib/dev/acpica/include/accommon.h>
54 #include <dev/acpica/acpivar.h>
55 #include <dev/pci/pcireg.h>
56 #include <machine/bus.h>
57 #include <machine/cpu.h>
58 #include <x86/include/busdma_impl.h>
59 #include <dev/iommu/busdma_iommu.h>
60 #include <x86/iommu/intel_reg.h>
61 #include <x86/iommu/intel_dmar.h>
62 
63 static bool
64 dmar_qi_seq_processed(const struct dmar_unit *unit,
65     const struct iommu_qi_genseq *pseq)
66 {
67 
68 	return (pseq->gen < unit->inv_waitd_gen ||
69 	    (pseq->gen == unit->inv_waitd_gen &&
70 	     pseq->seq <= unit->inv_waitd_seq_hw));
71 }
72 
73 static int
74 dmar_enable_qi(struct dmar_unit *unit)
75 {
76 	int error;
77 
78 	DMAR_ASSERT_LOCKED(unit);
79 	unit->hw_gcmd |= DMAR_GCMD_QIE;
80 	dmar_write4(unit, DMAR_GCMD_REG, unit->hw_gcmd);
81 	DMAR_WAIT_UNTIL(((dmar_read4(unit, DMAR_GSTS_REG) & DMAR_GSTS_QIES)
82 	    != 0));
83 	return (error);
84 }
85 
86 static int
87 dmar_disable_qi(struct dmar_unit *unit)
88 {
89 	int error;
90 
91 	DMAR_ASSERT_LOCKED(unit);
92 	unit->hw_gcmd &= ~DMAR_GCMD_QIE;
93 	dmar_write4(unit, DMAR_GCMD_REG, unit->hw_gcmd);
94 	DMAR_WAIT_UNTIL(((dmar_read4(unit, DMAR_GSTS_REG) & DMAR_GSTS_QIES)
95 	    == 0));
96 	return (error);
97 }
98 
99 static void
100 dmar_qi_advance_tail(struct dmar_unit *unit)
101 {
102 
103 	DMAR_ASSERT_LOCKED(unit);
104 	dmar_write4(unit, DMAR_IQT_REG, unit->inv_queue_tail);
105 }
106 
107 static void
108 dmar_qi_ensure(struct dmar_unit *unit, int descr_count)
109 {
110 	uint32_t head;
111 	int bytes;
112 
113 	DMAR_ASSERT_LOCKED(unit);
114 	bytes = descr_count << DMAR_IQ_DESCR_SZ_SHIFT;
115 	for (;;) {
116 		if (bytes <= unit->inv_queue_avail)
117 			break;
118 		/* refill */
119 		head = dmar_read4(unit, DMAR_IQH_REG);
120 		head &= DMAR_IQH_MASK;
121 		unit->inv_queue_avail = head - unit->inv_queue_tail -
122 		    DMAR_IQ_DESCR_SZ;
123 		if (head <= unit->inv_queue_tail)
124 			unit->inv_queue_avail += unit->inv_queue_size;
125 		if (bytes <= unit->inv_queue_avail)
126 			break;
127 
128 		/*
129 		 * No space in the queue, do busy wait.  Hardware must
130 		 * make a progress.  But first advance the tail to
131 		 * inform the descriptor streamer about entries we
132 		 * might have already filled, otherwise they could
133 		 * clog the whole queue..
134 		 */
135 		dmar_qi_advance_tail(unit);
136 		unit->inv_queue_full++;
137 		cpu_spinwait();
138 	}
139 	unit->inv_queue_avail -= bytes;
140 }
141 
142 static void
143 dmar_qi_emit(struct dmar_unit *unit, uint64_t data1, uint64_t data2)
144 {
145 
146 	DMAR_ASSERT_LOCKED(unit);
147 	*(volatile uint64_t *)(unit->inv_queue + unit->inv_queue_tail) = data1;
148 	unit->inv_queue_tail += DMAR_IQ_DESCR_SZ / 2;
149 	KASSERT(unit->inv_queue_tail <= unit->inv_queue_size,
150 	    ("tail overflow 0x%x 0x%jx", unit->inv_queue_tail,
151 	    (uintmax_t)unit->inv_queue_size));
152 	unit->inv_queue_tail &= unit->inv_queue_size - 1;
153 	*(volatile uint64_t *)(unit->inv_queue + unit->inv_queue_tail) = data2;
154 	unit->inv_queue_tail += DMAR_IQ_DESCR_SZ / 2;
155 	KASSERT(unit->inv_queue_tail <= unit->inv_queue_size,
156 	    ("tail overflow 0x%x 0x%jx", unit->inv_queue_tail,
157 	    (uintmax_t)unit->inv_queue_size));
158 	unit->inv_queue_tail &= unit->inv_queue_size - 1;
159 }
160 
161 static void
162 dmar_qi_emit_wait_descr(struct dmar_unit *unit, uint32_t seq, bool intr,
163     bool memw, bool fence)
164 {
165 
166 	DMAR_ASSERT_LOCKED(unit);
167 	dmar_qi_emit(unit, DMAR_IQ_DESCR_WAIT_ID |
168 	    (intr ? DMAR_IQ_DESCR_WAIT_IF : 0) |
169 	    (memw ? DMAR_IQ_DESCR_WAIT_SW : 0) |
170 	    (fence ? DMAR_IQ_DESCR_WAIT_FN : 0) |
171 	    (memw ? DMAR_IQ_DESCR_WAIT_SD(seq) : 0),
172 	    memw ? unit->inv_waitd_seq_hw_phys : 0);
173 }
174 
175 static void
176 dmar_qi_emit_wait_seq(struct dmar_unit *unit, struct iommu_qi_genseq *pseq,
177     bool emit_wait)
178 {
179 	struct iommu_qi_genseq gsec;
180 	uint32_t seq;
181 
182 	KASSERT(pseq != NULL, ("wait descriptor with no place for seq"));
183 	DMAR_ASSERT_LOCKED(unit);
184 	if (unit->inv_waitd_seq == 0xffffffff) {
185 		gsec.gen = unit->inv_waitd_gen;
186 		gsec.seq = unit->inv_waitd_seq;
187 		dmar_qi_ensure(unit, 1);
188 		dmar_qi_emit_wait_descr(unit, gsec.seq, false, true, false);
189 		dmar_qi_advance_tail(unit);
190 		while (!dmar_qi_seq_processed(unit, &gsec))
191 			cpu_spinwait();
192 		unit->inv_waitd_gen++;
193 		unit->inv_waitd_seq = 1;
194 	}
195 	seq = unit->inv_waitd_seq++;
196 	pseq->gen = unit->inv_waitd_gen;
197 	pseq->seq = seq;
198 	if (emit_wait) {
199 		dmar_qi_ensure(unit, 1);
200 		dmar_qi_emit_wait_descr(unit, seq, true, true, false);
201 	}
202 }
203 
204 static void
205 dmar_qi_wait_for_seq(struct dmar_unit *unit, const struct iommu_qi_genseq *gseq,
206     bool nowait)
207 {
208 
209 	DMAR_ASSERT_LOCKED(unit);
210 	unit->inv_seq_waiters++;
211 	while (!dmar_qi_seq_processed(unit, gseq)) {
212 		if (cold || nowait) {
213 			cpu_spinwait();
214 		} else {
215 			msleep(&unit->inv_seq_waiters, &unit->iommu.lock, 0,
216 			    "dmarse", hz);
217 		}
218 	}
219 	unit->inv_seq_waiters--;
220 }
221 
222 void
223 dmar_qi_invalidate_locked(struct dmar_domain *domain, iommu_gaddr_t base,
224     iommu_gaddr_t size, struct iommu_qi_genseq *pseq, bool emit_wait)
225 {
226 	struct dmar_unit *unit;
227 	iommu_gaddr_t isize;
228 	int am;
229 
230 	unit = domain->dmar;
231 	DMAR_ASSERT_LOCKED(unit);
232 	for (; size > 0; base += isize, size -= isize) {
233 		am = calc_am(unit, base, size, &isize);
234 		dmar_qi_ensure(unit, 1);
235 		dmar_qi_emit(unit, DMAR_IQ_DESCR_IOTLB_INV |
236 		    DMAR_IQ_DESCR_IOTLB_PAGE | DMAR_IQ_DESCR_IOTLB_DW |
237 		    DMAR_IQ_DESCR_IOTLB_DR |
238 		    DMAR_IQ_DESCR_IOTLB_DID(domain->domain),
239 		    base | am);
240 	}
241 	dmar_qi_emit_wait_seq(unit, pseq, emit_wait);
242 	dmar_qi_advance_tail(unit);
243 }
244 
245 void
246 dmar_qi_invalidate_ctx_glob_locked(struct dmar_unit *unit)
247 {
248 	struct iommu_qi_genseq gseq;
249 
250 	DMAR_ASSERT_LOCKED(unit);
251 	dmar_qi_ensure(unit, 2);
252 	dmar_qi_emit(unit, DMAR_IQ_DESCR_CTX_INV | DMAR_IQ_DESCR_CTX_GLOB, 0);
253 	dmar_qi_emit_wait_seq(unit, &gseq, true);
254 	dmar_qi_advance_tail(unit);
255 	dmar_qi_wait_for_seq(unit, &gseq, false);
256 }
257 
258 void
259 dmar_qi_invalidate_iotlb_glob_locked(struct dmar_unit *unit)
260 {
261 	struct iommu_qi_genseq gseq;
262 
263 	DMAR_ASSERT_LOCKED(unit);
264 	dmar_qi_ensure(unit, 2);
265 	dmar_qi_emit(unit, DMAR_IQ_DESCR_IOTLB_INV | DMAR_IQ_DESCR_IOTLB_GLOB |
266 	    DMAR_IQ_DESCR_IOTLB_DW | DMAR_IQ_DESCR_IOTLB_DR, 0);
267 	dmar_qi_emit_wait_seq(unit, &gseq, true);
268 	dmar_qi_advance_tail(unit);
269 	dmar_qi_wait_for_seq(unit, &gseq, false);
270 }
271 
272 void
273 dmar_qi_invalidate_iec_glob(struct dmar_unit *unit)
274 {
275 	struct iommu_qi_genseq gseq;
276 
277 	DMAR_ASSERT_LOCKED(unit);
278 	dmar_qi_ensure(unit, 2);
279 	dmar_qi_emit(unit, DMAR_IQ_DESCR_IEC_INV, 0);
280 	dmar_qi_emit_wait_seq(unit, &gseq, true);
281 	dmar_qi_advance_tail(unit);
282 	dmar_qi_wait_for_seq(unit, &gseq, false);
283 }
284 
285 void
286 dmar_qi_invalidate_iec(struct dmar_unit *unit, u_int start, u_int cnt)
287 {
288 	struct iommu_qi_genseq gseq;
289 	u_int c, l;
290 
291 	DMAR_ASSERT_LOCKED(unit);
292 	KASSERT(start < unit->irte_cnt && start < start + cnt &&
293 	    start + cnt <= unit->irte_cnt,
294 	    ("inv iec overflow %d %d %d", unit->irte_cnt, start, cnt));
295 	for (; cnt > 0; cnt -= c, start += c) {
296 		l = ffs(start | cnt) - 1;
297 		c = 1 << l;
298 		dmar_qi_ensure(unit, 1);
299 		dmar_qi_emit(unit, DMAR_IQ_DESCR_IEC_INV |
300 		    DMAR_IQ_DESCR_IEC_IDX | DMAR_IQ_DESCR_IEC_IIDX(start) |
301 		    DMAR_IQ_DESCR_IEC_IM(l), 0);
302 	}
303 	dmar_qi_ensure(unit, 1);
304 	dmar_qi_emit_wait_seq(unit, &gseq, true);
305 	dmar_qi_advance_tail(unit);
306 
307 	/*
308 	 * The caller of the function, in particular,
309 	 * dmar_ir_program_irte(), may be called from the context
310 	 * where the sleeping is forbidden (in fact, the
311 	 * intr_table_lock mutex may be held, locked from
312 	 * intr_shuffle_irqs()).  Wait for the invalidation completion
313 	 * using the busy wait.
314 	 *
315 	 * The impact on the interrupt input setup code is small, the
316 	 * expected overhead is comparable with the chipset register
317 	 * read.  It is more harmful for the parallel DMA operations,
318 	 * since we own the dmar unit lock until whole invalidation
319 	 * queue is processed, which includes requests possibly issued
320 	 * before our request.
321 	 */
322 	dmar_qi_wait_for_seq(unit, &gseq, true);
323 }
324 
325 int
326 dmar_qi_intr(void *arg)
327 {
328 	struct dmar_unit *unit;
329 
330 	unit = arg;
331 	KASSERT(unit->qi_enabled, ("dmar%d: QI is not enabled",
332 	    unit->iommu.unit));
333 	taskqueue_enqueue(unit->qi_taskqueue, &unit->qi_task);
334 	return (FILTER_HANDLED);
335 }
336 
337 static void
338 dmar_qi_task(void *arg, int pending __unused)
339 {
340 	struct dmar_unit *unit;
341 	struct iommu_map_entry *entry;
342 	uint32_t ics;
343 
344 	unit = arg;
345 
346 	/*
347 	 * Request an interrupt on the completion of the next invalidation
348 	 * wait descriptor with the IF field set.
349 	 */
350 	ics = dmar_read4(unit, DMAR_ICS_REG);
351 	if ((ics & DMAR_ICS_IWC) != 0) {
352 		ics = DMAR_ICS_IWC;
353 		dmar_write4(unit, DMAR_ICS_REG, ics);
354 	}
355 
356 	DMAR_LOCK(unit);
357 	for (;;) {
358 		entry = TAILQ_FIRST(&unit->tlb_flush_entries);
359 		if (entry == NULL)
360 			break;
361 		if (!dmar_qi_seq_processed(unit, &entry->gseq))
362 			break;
363 		TAILQ_REMOVE(&unit->tlb_flush_entries, entry, dmamap_link);
364 		DMAR_UNLOCK(unit);
365 		dmar_domain_free_entry(entry, (entry->flags &
366 		    IOMMU_MAP_ENTRY_QI_NF) == 0);
367 		DMAR_LOCK(unit);
368 	}
369 	if (unit->inv_seq_waiters > 0)
370 		wakeup(&unit->inv_seq_waiters);
371 	DMAR_UNLOCK(unit);
372 }
373 
374 int
375 dmar_init_qi(struct dmar_unit *unit)
376 {
377 	uint64_t iqa;
378 	uint32_t ics;
379 	int qi_sz;
380 
381 	if (!DMAR_HAS_QI(unit) || (unit->hw_cap & DMAR_CAP_CM) != 0)
382 		return (0);
383 	unit->qi_enabled = 1;
384 	TUNABLE_INT_FETCH("hw.dmar.qi", &unit->qi_enabled);
385 	if (!unit->qi_enabled)
386 		return (0);
387 
388 	TAILQ_INIT(&unit->tlb_flush_entries);
389 	TASK_INIT(&unit->qi_task, 0, dmar_qi_task, unit);
390 	unit->qi_taskqueue = taskqueue_create_fast("dmarqf", M_WAITOK,
391 	    taskqueue_thread_enqueue, &unit->qi_taskqueue);
392 	taskqueue_start_threads(&unit->qi_taskqueue, 1, PI_AV,
393 	    "dmar%d qi taskq", unit->iommu.unit);
394 
395 	unit->inv_waitd_gen = 0;
396 	unit->inv_waitd_seq = 1;
397 
398 	qi_sz = DMAR_IQA_QS_DEF;
399 	TUNABLE_INT_FETCH("hw.dmar.qi_size", &qi_sz);
400 	if (qi_sz > DMAR_IQA_QS_MAX)
401 		qi_sz = DMAR_IQA_QS_MAX;
402 	unit->inv_queue_size = (1ULL << qi_sz) * PAGE_SIZE;
403 	/* Reserve one descriptor to prevent wraparound. */
404 	unit->inv_queue_avail = unit->inv_queue_size - DMAR_IQ_DESCR_SZ;
405 
406 	/* The invalidation queue reads by DMARs are always coherent. */
407 	unit->inv_queue = kmem_alloc_contig(unit->inv_queue_size, M_WAITOK |
408 	    M_ZERO, 0, dmar_high, PAGE_SIZE, 0, VM_MEMATTR_DEFAULT);
409 	unit->inv_waitd_seq_hw_phys = pmap_kextract(
410 	    (vm_offset_t)&unit->inv_waitd_seq_hw);
411 
412 	DMAR_LOCK(unit);
413 	dmar_write8(unit, DMAR_IQT_REG, 0);
414 	iqa = pmap_kextract(unit->inv_queue);
415 	iqa |= qi_sz;
416 	dmar_write8(unit, DMAR_IQA_REG, iqa);
417 	dmar_enable_qi(unit);
418 	ics = dmar_read4(unit, DMAR_ICS_REG);
419 	if ((ics & DMAR_ICS_IWC) != 0) {
420 		ics = DMAR_ICS_IWC;
421 		dmar_write4(unit, DMAR_ICS_REG, ics);
422 	}
423 	dmar_enable_qi_intr(unit);
424 	DMAR_UNLOCK(unit);
425 
426 	return (0);
427 }
428 
429 void
430 dmar_fini_qi(struct dmar_unit *unit)
431 {
432 	struct iommu_qi_genseq gseq;
433 
434 	if (!unit->qi_enabled)
435 		return;
436 	taskqueue_drain(unit->qi_taskqueue, &unit->qi_task);
437 	taskqueue_free(unit->qi_taskqueue);
438 	unit->qi_taskqueue = NULL;
439 
440 	DMAR_LOCK(unit);
441 	/* quisce */
442 	dmar_qi_ensure(unit, 1);
443 	dmar_qi_emit_wait_seq(unit, &gseq, true);
444 	dmar_qi_advance_tail(unit);
445 	dmar_qi_wait_for_seq(unit, &gseq, false);
446 	/* only after the quisce, disable queue */
447 	dmar_disable_qi_intr(unit);
448 	dmar_disable_qi(unit);
449 	KASSERT(unit->inv_seq_waiters == 0,
450 	    ("dmar%d: waiters on disabled queue", unit->iommu.unit));
451 	DMAR_UNLOCK(unit);
452 
453 	kmem_free(unit->inv_queue, unit->inv_queue_size);
454 	unit->inv_queue = 0;
455 	unit->inv_queue_size = 0;
456 	unit->qi_enabled = 0;
457 }
458 
459 void
460 dmar_enable_qi_intr(struct dmar_unit *unit)
461 {
462 	uint32_t iectl;
463 
464 	DMAR_ASSERT_LOCKED(unit);
465 	KASSERT(DMAR_HAS_QI(unit), ("dmar%d: QI is not supported",
466 	    unit->iommu.unit));
467 	iectl = dmar_read4(unit, DMAR_IECTL_REG);
468 	iectl &= ~DMAR_IECTL_IM;
469 	dmar_write4(unit, DMAR_IECTL_REG, iectl);
470 }
471 
472 void
473 dmar_disable_qi_intr(struct dmar_unit *unit)
474 {
475 	uint32_t iectl;
476 
477 	DMAR_ASSERT_LOCKED(unit);
478 	KASSERT(DMAR_HAS_QI(unit), ("dmar%d: QI is not supported",
479 	    unit->iommu.unit));
480 	iectl = dmar_read4(unit, DMAR_IECTL_REG);
481 	dmar_write4(unit, DMAR_IECTL_REG, iectl | DMAR_IECTL_IM);
482 }
483