2 * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
4 * Copyright (c) 2013 The FreeBSD Foundation
7 * This software was developed by Konstantin Belousov <kib@FreeBSD.org>
8 * under sponsorship from the FreeBSD Foundation.
10 * Redistribution and use in source and binary forms, with or without
11 * modification, are permitted provided that the following conditions
13 * 1. Redistributions of source code must retain the above copyright
14 * notice, this list of conditions and the following disclaimer.
15 * 2. Redistributions in binary form must reproduce the above copyright
16 * notice, this list of conditions and the following disclaimer in the
17 * documentation and/or other materials provided with the distribution.
19 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
20 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
21 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
22 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
23 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
24 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
25 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
26 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
27 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
32 #include <sys/cdefs.h>
33 __FBSDID("$FreeBSD$");
37 #include <sys/param.h>
39 #include <sys/kernel.h>
40 #include <sys/malloc.h>
41 #include <sys/memdesc.h>
42 #include <sys/module.h>
44 #include <sys/taskqueue.h>
49 #include <vm/vm_extern.h>
50 #include <vm/vm_kern.h>
51 #include <vm/vm_page.h>
52 #include <vm/vm_map.h>
53 #include <contrib/dev/acpica/include/acpi.h>
54 #include <contrib/dev/acpica/include/accommon.h>
55 #include <dev/acpica/acpivar.h>
56 #include <dev/pci/pcireg.h>
57 #include <machine/bus.h>
58 #include <machine/cpu.h>
59 #include <x86/include/busdma_impl.h>
60 #include <dev/iommu/busdma_iommu.h>
61 #include <x86/iommu/intel_reg.h>
62 #include <x86/iommu/intel_dmar.h>
/*
 * Tell whether the wait descriptor tagged with *pseq has completed.
 * It has when its generation is older than the unit's current
 * inv_waitd_gen, or when the generations are equal and its sequence
 * number does not exceed the value currently held in inv_waitd_seq_hw.
 */
65 dmar_qi_seq_processed(const struct dmar_unit *unit,
66 const struct iommu_qi_genseq *pseq)
69 return (pseq->gen < unit->inv_waitd_gen ||
70 (pseq->gen == unit->inv_waitd_gen &&
71 pseq->seq <= unit->inv_waitd_seq_hw));
/*
 * Switch queued invalidation on for the unit.  The unit lock must be
 * held.  The QIE bit is set in the cached global command word hw_gcmd,
 * which is then written to DMAR_GCMD_REG.
 */
75 dmar_enable_qi(struct dmar_unit *unit)
79 DMAR_ASSERT_LOCKED(unit);
80 unit->hw_gcmd |= DMAR_GCMD_QIE;
81 dmar_write4(unit, DMAR_GCMD_REG, unit->hw_gcmd);
/*
 * Poll the QIES bit of the global status register.
 * NOTE(review): the end of this condition is not visible in this view;
 * presumably it waits for QIES to read back as set -- confirm.
 */
82 DMAR_WAIT_UNTIL(((dmar_read4(unit, DMAR_GSTS_REG) & DMAR_GSTS_QIES)
/*
 * Switch queued invalidation off for the unit.  The unit lock must be
 * held.  The QIE bit is cleared in the cached global command word
 * hw_gcmd, which is then written to DMAR_GCMD_REG.
 */
88 dmar_disable_qi(struct dmar_unit *unit)
92 DMAR_ASSERT_LOCKED(unit);
93 unit->hw_gcmd &= ~DMAR_GCMD_QIE;
94 dmar_write4(unit, DMAR_GCMD_REG, unit->hw_gcmd);
/*
 * Poll the QIES bit of the global status register.
 * NOTE(review): the end of this condition is not visible in this view;
 * presumably it waits for QIES to read back as clear -- confirm.
 */
95 DMAR_WAIT_UNTIL(((dmar_read4(unit, DMAR_GSTS_REG) & DMAR_GSTS_QIES)
/*
 * Publish the software tail offset (inv_queue_tail) by writing it to
 * the DMAR_IQT_REG register.  The unit lock must be held.
 */
101 dmar_qi_advance_tail(struct dmar_unit *unit)
104 DMAR_ASSERT_LOCKED(unit);
105 dmar_write4(unit, DMAR_IQT_REG, unit->inv_queue_tail);
/*
 * Reserve room in the invalidation queue for descr_count descriptors.
 * The unit lock must be held.  The request is converted to bytes and
 * compared with the cached free-space counter inv_queue_avail; when the
 * cached value is too small, it is recomputed from the hardware head
 * register.  Finally the reserved bytes are subtracted from
 * inv_queue_avail.
 * NOTE(review): the looping construct and the exits taken once enough
 * space is found are not visible in this view -- confirm against the
 * full definition.
 */
109 dmar_qi_ensure(struct dmar_unit *unit, int descr_count)
114 DMAR_ASSERT_LOCKED(unit);
/* Convert the descriptor count into a byte count. */
115 bytes = descr_count << DMAR_IQ_DESCR_SZ_SHIFT;
117 if (bytes <= unit->inv_queue_avail)
/* Refresh the free-space estimate from the hardware head offset. */
120 head = dmar_read4(unit, DMAR_IQH_REG);
121 head &= DMAR_IQH_MASK;
122 unit->inv_queue_avail = head - unit->inv_queue_tail -
/* Head at or behind the tail: the free region wraps around the ring. */
124 if (head <= unit->inv_queue_tail)
125 unit->inv_queue_avail += unit->inv_queue_size;
126 if (bytes <= unit->inv_queue_avail)
130 * No space in the queue, do busy wait. Hardware must
131 * make a progress. But first advance the tail to
132 * inform the descriptor streamer about entries we
133 * might have already filled, otherwise they could
134 * clog the whole queue..
136 dmar_qi_advance_tail(unit);
/* Count the occasions on which the queue was found full. */
137 unit->inv_queue_full++;
/* Account for the space handed out to the caller. */
140 unit->inv_queue_avail -= bytes;
/*
 * Store one descriptor, given as the two 64-bit words data1 and data2,
 * into the invalidation queue at the software tail, and move the tail
 * past it.  The unit lock must be held.  The hardware tail register is
 * not touched here.
 */
144 dmar_qi_emit(struct dmar_unit *unit, uint64_t data1, uint64_t data2)
147 DMAR_ASSERT_LOCKED(unit);
/* First half of the descriptor. */
148 *(volatile uint64_t *)(unit->inv_queue + unit->inv_queue_tail) = data1;
149 unit->inv_queue_tail += DMAR_IQ_DESCR_SZ / 2;
150 KASSERT(unit->inv_queue_tail <= unit->inv_queue_size,
151 ("tail overflow 0x%x 0x%jx", unit->inv_queue_tail,
152 (uintmax_t)unit->inv_queue_size));
/* Wrap the tail; the mask relies on inv_queue_size being a power of two. */
153 unit->inv_queue_tail &= unit->inv_queue_size - 1;
/* Second half of the descriptor, handled the same way. */
154 *(volatile uint64_t *)(unit->inv_queue + unit->inv_queue_tail) = data2;
155 unit->inv_queue_tail += DMAR_IQ_DESCR_SZ / 2;
156 KASSERT(unit->inv_queue_tail <= unit->inv_queue_size,
157 ("tail overflow 0x%x 0x%jx", unit->inv_queue_tail,
158 (uintmax_t)unit->inv_queue_size));
159 unit->inv_queue_tail &= unit->inv_queue_size - 1;
/*
 * Queue a wait descriptor.  The unit lock must be held.
 *
 * The first descriptor word is DMAR_IQ_DESCR_WAIT_ID with these
 * additions:
 *   intr  - DMAR_IQ_DESCR_WAIT_IF;
 *   memw  - DMAR_IQ_DESCR_WAIT_SW plus seq encoded with
 *           DMAR_IQ_DESCR_WAIT_SD();
 *   fence - DMAR_IQ_DESCR_WAIT_FN.
 * The second word is inv_waitd_seq_hw_phys when memw is set, otherwise
 * zero.
 */
163 dmar_qi_emit_wait_descr(struct dmar_unit *unit, uint32_t seq, bool intr,
164 bool memw, bool fence)
167 DMAR_ASSERT_LOCKED(unit);
168 dmar_qi_emit(unit, DMAR_IQ_DESCR_WAIT_ID |
169 (intr ? DMAR_IQ_DESCR_WAIT_IF : 0) |
170 (memw ? DMAR_IQ_DESCR_WAIT_SW : 0) |
171 (fence ? DMAR_IQ_DESCR_WAIT_FN : 0) |
172 (memw ? DMAR_IQ_DESCR_WAIT_SD(seq) : 0),
173 memw ? unit->inv_waitd_seq_hw_phys : 0);
/*
 * Allocate the next wait sequence number for the unit and record the
 * current generation in *pseq, which must not be NULL.  The unit lock
 * must be held.
 * NOTE(review): the third parameter, the store to pseq->seq and the
 * condition guarding the final descriptor emission are not visible in
 * this view; callers pass a boolean third argument -- confirm against
 * the full definition.
 */
177 dmar_qi_emit_wait_seq(struct dmar_unit *unit, struct iommu_qi_genseq *pseq,
180 struct iommu_qi_genseq gsec;
183 KASSERT(pseq != NULL, ("wait descriptor with no place for seq"));
184 DMAR_ASSERT_LOCKED(unit);
/*
 * The sequence counter has reached its maximum value.  Queue a wait
 * descriptor for this last value (memory write only, no interrupt),
 * hand it to the hardware and loop until it is processed; then start a
 * new generation with the sequence counter reset to 1.
 */
185 if (unit->inv_waitd_seq == 0xffffffff) {
186 gsec.gen = unit->inv_waitd_gen;
187 gsec.seq = unit->inv_waitd_seq;
188 dmar_qi_ensure(unit, 1);
189 dmar_qi_emit_wait_descr(unit, gsec.seq, false, true, false);
190 dmar_qi_advance_tail(unit);
191 while (!dmar_qi_seq_processed(unit, &gsec))
193 unit->inv_waitd_gen++;
194 unit->inv_waitd_seq = 1;
/* Take the next sequence number and report the generation it belongs to. */
196 seq = unit->inv_waitd_seq++;
197 pseq->gen = unit->inv_waitd_gen;
/* Queue a wait descriptor with both interrupt and memory write requested. */
200 dmar_qi_ensure(unit, 1);
201 dmar_qi_emit_wait_descr(unit, seq, true, true, false);
/*
 * Wait until the wait descriptor identified by *gseq has been
 * processed.  The unit lock must be held.  inv_seq_waiters is
 * incremented for the duration of the wait.
 * NOTE(review): the declaration of nowait and the statements of the
 * (cold || nowait) branch are not visible in this view; callers
 * describe nowait == true as a busy wait -- confirm.
 */
206 dmar_qi_wait_for_seq(struct dmar_unit *unit, const struct iommu_qi_genseq *gseq,
210 DMAR_ASSERT_LOCKED(unit);
211 unit->inv_seq_waiters++;
212 while (!dmar_qi_seq_processed(unit, gseq)) {
213 if (cold || nowait) {
/* Otherwise sleep on inv_seq_waiters, passing the unit lock to msleep(). */
216 msleep(&unit->inv_seq_waiters, &unit->iommu.lock, 0,
220 unit->inv_seq_waiters--;
/*
 * Queue page-selective IOTLB invalidation descriptors covering
 * [base, base + size) for the given domain, then allocate a wait
 * sequence in *pseq and pass the new tail to the hardware.  The unit
 * lock must be held.  This function does not wait for completion.
 * NOTE(review): the assignment of unit and the second descriptor word
 * are not visible in this view.
 */
224 dmar_qi_invalidate_locked(struct dmar_domain *domain, iommu_gaddr_t base,
225 iommu_gaddr_t size, struct iommu_qi_genseq *pseq, bool emit_wait)
227 struct dmar_unit *unit;
230 (no change)
/*
 * Queue a global context-cache invalidation followed by a wait
 * descriptor, pass the new tail to the hardware and wait for the wait
 * descriptor to be processed.  The unit lock must be held.  The wait is
 * requested with nowait == false.
 */
247 dmar_qi_invalidate_ctx_glob_locked(struct dmar_unit *unit)
249 struct iommu_qi_genseq gseq;
251 DMAR_ASSERT_LOCKED(unit);
252 dmar_qi_ensure(unit, 2);
253 dmar_qi_emit(unit, DMAR_IQ_DESCR_CTX_INV | DMAR_IQ_DESCR_CTX_GLOB, 0);
254 dmar_qi_emit_wait_seq(unit, &gseq, true);
255 dmar_qi_advance_tail(unit);
256 dmar_qi_wait_for_seq(unit, &gseq, false);
/*
 * Queue a global IOTLB invalidation (with the DW and DR flags set)
 * followed by a wait descriptor, pass the new tail to the hardware and
 * wait for the wait descriptor to be processed.  The unit lock must be
 * held.  The wait is requested with nowait == false.
 */
260 dmar_qi_invalidate_iotlb_glob_locked(struct dmar_unit *unit)
262 struct iommu_qi_genseq gseq;
264 DMAR_ASSERT_LOCKED(unit);
265 dmar_qi_ensure(unit, 2);
266 dmar_qi_emit(unit, DMAR_IQ_DESCR_IOTLB_INV | DMAR_IQ_DESCR_IOTLB_GLOB |
267 DMAR_IQ_DESCR_IOTLB_DW | DMAR_IQ_DESCR_IOTLB_DR, 0);
268 dmar_qi_emit_wait_seq(unit, &gseq, true);
269 dmar_qi_advance_tail(unit);
270 dmar_qi_wait_for_seq(unit, &gseq, false);
/*
 * Queue an interrupt entry cache invalidation without an index
 * selector, followed by a wait descriptor; pass the new tail to the
 * hardware and wait for the wait descriptor to be processed.  The unit
 * lock must be held.  The wait is requested with nowait == false.
 */
274 dmar_qi_invalidate_iec_glob(struct dmar_unit *unit)
276 struct iommu_qi_genseq gseq;
278 DMAR_ASSERT_LOCKED(unit);
279 dmar_qi_ensure(unit, 2);
280 dmar_qi_emit(unit, DMAR_IQ_DESCR_IEC_INV, 0);
281 dmar_qi_emit_wait_seq(unit, &gseq, true);
282 dmar_qi_advance_tail(unit);
283 dmar_qi_wait_for_seq(unit, &gseq, false);
/*
 * Invalidate the interrupt entry cache for cnt entries beginning at
 * index start.  The unit lock must be held.  The range must be
 * non-empty, must not overflow and must lie within irte_cnt.  The
 * final wait is requested with nowait == true.
 * NOTE(review): the assignment of the per-iteration step c is not
 * visible in this view; presumably it is derived from l -- confirm.
 */
287 dmar_qi_invalidate_iec(struct dmar_unit *unit, u_int start, u_int cnt)
289 struct iommu_qi_genseq gseq;
292 DMAR_ASSERT_LOCKED(unit);
293 KASSERT(start < unit->irte_cnt && start < start + cnt &&
294 start + cnt <= unit->irte_cnt,
295 ("inv iec overflow %d %d %d", unit->irte_cnt, start, cnt));
296 for (; cnt > 0; cnt -= c, start += c) {
/* l is the position of the lowest bit set in either start or cnt. */
297 l = ffs(start | cnt) - 1;
299 dmar_qi_ensure(unit, 1);
/* Index-selective invalidation at start, with l passed as the index mask. */
300 dmar_qi_emit(unit, DMAR_IQ_DESCR_IEC_INV |
301 DMAR_IQ_DESCR_IEC_IDX | DMAR_IQ_DESCR_IEC_IIDX(start) |
302 DMAR_IQ_DESCR_IEC_IM(l), 0);
/* Follow the invalidations with a wait descriptor and start processing. */
304 dmar_qi_ensure(unit, 1);
305 dmar_qi_emit_wait_seq(unit, &gseq, true);
306 dmar_qi_advance_tail(unit);
309 * The caller of the function, in particular,
310 * dmar_ir_program_irte(), may be called from the context
311 * where the sleeping is forbidden (in fact, the
312 * intr_table_lock mutex may be held, locked from
313 * intr_shuffle_irqs()). Wait for the invalidation completion
314 * using the busy wait.
316 * The impact on the interrupt input setup code is small, the
317 * expected overhead is comparable with the chipset register
318 * read. It is more harmful for the parallel DMA operations,
319 * since we own the dmar unit lock until whole invalidation
320 * queue is processed, which includes requests possibly issued
321 * before our request.
323 dmar_qi_wait_for_seq(unit, &gseq, true);
/*
 * Interrupt handler for queued invalidation.  It asserts that QI is
 * enabled, schedules the unit's qi_task on qi_taskqueue and returns
 * FILTER_HANDLED.
 * NOTE(review): the assignment of unit is not visible in this view;
 * presumably it is taken from arg -- confirm.
 */
327 dmar_qi_intr(void *arg)
329 struct dmar_unit *unit;
332 KASSERT(unit->qi_enabled, ("dmar%d: QI is not enabled",
334 taskqueue_enqueue(unit->qi_taskqueue, &unit->qi_task);
335 return (FILTER_HANDLED);
/*
 * Handler of the unit's qi_task.  It releases entries from
 * tlb_flush_entries whose wait sequence has been processed, handles a
 * set IWC bit in the DMAR_ICS_REG register and wakes up threads
 * sleeping on inv_seq_waiters.
 * NOTE(review): the loop construct, the locking and the value assigned
 * to ics before it is written back are not visible in this view.
 */
339 dmar_qi_task(void *arg, int pending __unused)
341 struct dmar_unit *unit;
342 struct iommu_map_entry *entry;
/* Examine the entry at the head of the pending flush list. */
349 entry = TAILQ_FIRST(&unit->tlb_flush_entries);
352 if (!dmar_qi_seq_processed(unit, &entry->gseq))
354 TAILQ_REMOVE(&unit->tlb_flush_entries, entry, dmamap_link);
/* The second argument is true when IOMMU_MAP_ENTRY_QI_NF is not set. */
356 dmar_domain_free_entry(entry, (entry->flags &
357 IOMMU_MAP_ENTRY_QI_NF) == 0);
360 ics = dmar_read4(unit, DMAR_ICS_REG);
361 if ((ics & DMAR_ICS_IWC) != 0) {
363 dmar_write4(unit, DMAR_ICS_REG, ics);
/* Only issue the wakeup when some thread registered itself as a waiter. */
365 if (unit->inv_seq_waiters > 0)
366 wakeup(&unit->inv_seq_waiters);
/*
 * Set up queued invalidation for the unit: create the completion task
 * and its taskqueue, allocate the invalidation queue, program the queue
 * registers, enable QI and unmask its interrupt.
 * NOTE(review): the early-return statements, the locking and one
 * adjustment of iqa before it is written are not visible in this view.
 */
371 dmar_init_qi(struct dmar_unit *unit)
/* QI is not used when the unit lacks QI support or reports DMAR_CAP_CM. */
377 if (!DMAR_HAS_QI(unit) || (unit->hw_cap & DMAR_CAP_CM) != 0)
/* Enabled by default; the hw.dmar.qi tunable can override this. */
379 unit->qi_enabled = 1;
380 TUNABLE_INT_FETCH("hw.dmar.qi", &unit->qi_enabled);
381 if (!unit->qi_enabled)
384 TAILQ_INIT(&unit->tlb_flush_entries);
385 TASK_INIT(&unit->qi_task, 0, dmar_qi_task, unit);
386 unit->qi_taskqueue = taskqueue_create_fast("dmarqf", M_WAITOK,
387 taskqueue_thread_enqueue, &unit->qi_taskqueue);
388 taskqueue_start_threads(&unit->qi_taskqueue, 1, PI_AV,
389 "dmar%d qi taskq", unit->iommu.unit);
/* Wait sequence numbering starts at generation 0, sequence 1. */
391 unit->inv_waitd_gen = 0;
392 unit->inv_waitd_seq = 1;
/*
 * Queue size exponent: default DMAR_IQA_QS_DEF, overridable with the
 * hw.dmar.qi_size tunable and capped at DMAR_IQA_QS_MAX.  The queue
 * occupies (1 << qi_sz) pages.
 */
394 qi_sz = DMAR_IQA_QS_DEF;
395 TUNABLE_INT_FETCH("hw.dmar.qi_size", &qi_sz);
396 if (qi_sz > DMAR_IQA_QS_MAX)
397 qi_sz = DMAR_IQA_QS_MAX;
398 unit->inv_queue_size = (1ULL << qi_sz) * PAGE_SIZE;
399 /* Reserve one descriptor to prevent wraparound. */
400 unit->inv_queue_avail = unit->inv_queue_size - DMAR_IQ_DESCR_SZ;
402 /* The invalidation queue reads by DMARs are always coherent. */
403 unit->inv_queue = kmem_alloc_contig(unit->inv_queue_size, M_WAITOK |
404 M_ZERO, 0, dmar_high, PAGE_SIZE, 0, VM_MEMATTR_DEFAULT);
/* Physical address of inv_waitd_seq_hw, later placed into wait descriptors. */
405 unit->inv_waitd_seq_hw_phys = pmap_kextract(
406 (vm_offset_t)&unit->inv_waitd_seq_hw);
/* Reset the tail register and program the queue's physical address. */
409 dmar_write8(unit, DMAR_IQT_REG, 0);
410 iqa = pmap_kextract(unit->inv_queue);
412 dmar_write8(unit, DMAR_IQA_REG, iqa);
413 dmar_enable_qi(unit);
/* Handle an IWC bit that is already set in DMAR_ICS_REG. */
414 ics = dmar_read4(unit, DMAR_ICS_REG);
415 if ((ics & DMAR_ICS_IWC) != 0) {
417 dmar_write4(unit, DMAR_ICS_REG, ics);
419 dmar_enable_qi_intr(unit);
/*
 * Tear down queued invalidation for the unit: drain and free the
 * taskqueue, wait for the queue to finish outstanding work, mask the
 * interrupt, disable QI and free the queue memory.
 * NOTE(review): the statement taken when QI is not enabled and the
 * locking are not visible in this view.
 */
426 dmar_fini_qi(struct dmar_unit *unit)
428 struct iommu_qi_genseq gseq;
430 if (!unit->qi_enabled)
432 taskqueue_drain(unit->qi_taskqueue, &unit->qi_task);
433 taskqueue_free(unit->qi_taskqueue);
434 unit->qi_taskqueue = NULL;
/* Queue a final wait descriptor and wait until the hardware processes it. */
438 dmar_qi_ensure(unit, 1);
439 dmar_qi_emit_wait_seq(unit, &gseq, true);
440 dmar_qi_advance_tail(unit);
441 dmar_qi_wait_for_seq(unit, &gseq, false);
442 /* Only after the queue has quiesced, disable it. */
443 dmar_disable_qi_intr(unit);
444 dmar_disable_qi(unit);
445 KASSERT(unit->inv_seq_waiters == 0,
446 ("dmar%d: waiters on disabled queue", unit->iommu.unit));
449 kmem_free(unit->inv_queue, unit->inv_queue_size);
/* Mark the queue as gone. */
451 unit->inv_queue_size = 0;
452 unit->qi_enabled = 0;
/*
 * Unmask the QI interrupt by clearing the IM bit in DMAR_IECTL_REG
 * (read-modify-write).  The unit lock must be held and the unit must
 * support QI.
 */
456 dmar_enable_qi_intr(struct dmar_unit *unit)
460 DMAR_ASSERT_LOCKED(unit);
461 KASSERT(DMAR_HAS_QI(unit), ("dmar%d: QI is not supported",
463 iectl = dmar_read4(unit, DMAR_IECTL_REG);
464 iectl &= ~DMAR_IECTL_IM;
465 dmar_write4(unit, DMAR_IECTL_REG, iectl);
/*
 * Mask the QI interrupt by setting the IM bit in DMAR_IECTL_REG
 * (read-modify-write).  The unit lock must be held and the unit must
 * support QI.
 */
469 dmar_disable_qi_intr(struct dmar_unit *unit)
473 DMAR_ASSERT_LOCKED(unit);
474 KASSERT(DMAR_HAS_QI(unit), ("dmar%d: QI is not supported",
476 iectl = dmar_read4(unit, DMAR_IECTL_REG);
477 dmar_write4(unit, DMAR_IECTL_REG, iectl | DMAR_IECTL_IM);