2 * Copyright (c) 2015 The FreeBSD Foundation
5 * This software was developed by Konstantin Belousov <kib@FreeBSD.org>
6 * under sponsorship from the FreeBSD Foundation.
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
11 * 1. Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in the
15 * documentation and/or other materials provided with the distribution.
17 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
18 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
21 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
30 #include <sys/cdefs.h>
31 __FBSDID("$FreeBSD$");
33 #include <sys/param.h>
34 #include <sys/systm.h>
36 #include <sys/kernel.h>
38 #include <sys/malloc.h>
39 #include <sys/memdesc.h>
40 #include <sys/mutex.h>
42 #include <sys/rwlock.h>
43 #include <sys/sysctl.h>
44 #include <sys/taskqueue.h>
48 #include <vm/vm_extern.h>
49 #include <vm/vm_kern.h>
50 #include <vm/vm_object.h>
51 #include <vm/vm_page.h>
52 #include <dev/pci/pcireg.h>
53 #include <dev/pci/pcivar.h>
54 #include <machine/bus.h>
55 #include <machine/intr_machdep.h>
56 #include <x86/include/apicreg.h>
57 #include <x86/include/apicvar.h>
58 #include <x86/include/busdma_impl.h>
59 #include <dev/iommu/busdma_iommu.h>
60 #include <x86/iommu/intel_reg.h>
61 #include <x86/iommu/intel_dmar.h>
62 #include <x86/iommu/iommu_intrmap.h>
/*
 * Prototypes of the file-local (static) helpers.  They are declared up
 * front because the public iommu_ entry points call them before their
 * definitions appear in the file.
 * NOTE(review): the continuation line of the dmar_ir_find() prototype is
 * not visible in this excerpt.
 */
64 static struct dmar_unit *dmar_ir_find(device_t src, uint16_t *rid,
66 static void dmar_ir_program_irte(struct dmar_unit *unit, u_int idx,
67 uint64_t low, uint16_t rid);
68 static int dmar_ir_free_irte(struct dmar_unit *unit, u_int cookie);
/*
 * iommu_alloc_msi_intr: obtain 'count' entries from the unit's irtids
 * vmem arena for MSI interrupts of device 'src'.
 *
 * The unit serving 'src' is looked up with dmar_ir_find().  The request
 * is made as one vmem_alloc() call of size 'count' with M_NOWAIT.
 *
 * NOTE(review): the return type, the local declarations, both loop
 * bodies and the return statements are not visible in this excerpt;
 * presumably the loops store results into cookies[] -- confirm against
 * the full file.
 */
71 iommu_alloc_msi_intr(device_t src, u_int *cookies, u_int count)
73 struct dmar_unit *unit;
78 unit = dmar_ir_find(src, NULL, NULL);
/* No unit was found for the source, or the unit has remapping disabled. */
79 if (unit == NULL || !unit->ir_enabled) {
80 for (i = 0; i < count; i++)
85 error = vmem_alloc(unit->irtids, count, M_FIRSTFIT | M_NOWAIT,
/* EOPNOTSUPP is asserted never to be produced by vmem_alloc() itself. */
88 KASSERT(error != EOPNOTSUPP,
89 ("impossible EOPNOTSUPP from vmem"));
93 for (i = 0; i < count; i++)
/*
 * iommu_map_msi_intr: program the interrupt remapping table entry
 * selected by 'cookie' so that it targets 'cpu' and 'vector', and compute
 * the MSI address to be used by the interrupt source 'src'.
 *
 *   src     device generating the interrupt; resolved by dmar_ir_find(),
 *           which also reports the requester id and whether the source
 *           is a DMAR unit.
 *   cpu     destination cpu id.
 *   vector  interrupt vector to deliver.
 *   cookie  remapping table index; the value -1 (compared after
 *           conversion to u_int) is treated like a missing unit.
 *   addr    out: MSI address.
 *   data    out: NOTE(review): the stores through 'data' are not visible
 *           in this excerpt.
 *
 * NOTE(review): the return type, some local declarations, the branch
 * conditions and the return statements are not visible in this excerpt.
 */
99 iommu_map_msi_intr(device_t src, u_int cpu, u_int vector, u_int cookie,
100 uint64_t *addr, uint32_t *data)
102 struct dmar_unit *unit;
107 unit = dmar_ir_find(src, &rid, &is_dmar);
/*
 * NOTE(review): presumably this part runs only when is_dmar is set, i.e.
 * the interrupt source is a DMAR unit -- the guarding condition is not
 * visible.  In that case no translating unit may have been returned.
 */
109 KASSERT(unit == NULL, ("DMAR cannot translate itself"));
112 * See VT-d specification, 5.1.6 Remapping Hardware -
113 * Interrupt Programming.
/* The low 8 bits of the cpu id are placed in address bits 12-19. */
116 *addr = MSI_INTEL_ADDR_BASE | ((cpu & 0xff) << 12);
/*
 * The cpu id bits 8-31 are placed in address bits 40-63.
 * NOTE(review): presumably done only in x2APIC mode, with the assertion
 * below covering the other case -- the condition is not visible.
 */
118 *addr |= ((uint64_t)cpu & 0xffffff00) << 32;
120 KASSERT(cpu <= 0xff, ("cpu id too big %d", cpu));
/* No usable remapping unit, or the cookie is the -1 sentinel. */
123 if (unit == NULL || !unit->ir_enabled || cookie == -1)
/*
 * Low word of the table entry: destination (x2APIC or xAPIC encoding,
 * chosen by DMAR_X2APIC(unit)), the vector, and the DLM_FM, TM_EDGE,
 * RH_DIRECT, DM_PHYSICAL and P flag bits.
 */
126 low = (DMAR_X2APIC(unit) ? DMAR_IRTE1_DST_x2APIC(cpu) :
127 DMAR_IRTE1_DST_xAPIC(cpu)) | DMAR_IRTE1_V(vector) |
128 DMAR_IRTE1_DLM_FM | DMAR_IRTE1_TM_EDGE | DMAR_IRTE1_RH_DIRECT |
129 DMAR_IRTE1_DM_PHYSICAL | DMAR_IRTE1_P;
130 dmar_ir_program_irte(unit, cookie, low, rid);
134 * See VT-d specification, 5.1.5.2 MSI and MSI-X
135 * Register Programming.
/*
 * Remappable-format address: cookie bits 0-14 go to address bits 5-19,
 * cookie bit 15 goes to address bit 2, and 0x18 sets address bits 4 and 3
 * (interrupt format and SHV in the cited section).  Bit 15 has to be
 * shifted right by 13 to land on bit 2; shifting it left by 2 would put
 * it on bit 17, inside the field that already holds cookie bits 0-14.
 */
137 *addr = MSI_INTEL_ADDR_BASE | ((cookie & 0x7fff) << 5) |
138 ((cookie & 0x8000) >> 13) | 0x18;
/*
 * iommu_unmap_msi_intr: release the remapping table entry 'cookie' used
 * by MSI source 'src'.
 *
 * The unit is looked up with dmar_ir_find() and the work is delegated to
 * dmar_ir_free_irte(), whose result is returned.  dmar_ir_free_irte()
 * asserts that the unit is non-NULL and has remapping enabled.
 *
 * NOTE(review): the lines between the declaration and the lookup are not
 * visible in this excerpt.
 */
145 iommu_unmap_msi_intr(device_t src, u_int cookie)
147 struct dmar_unit *unit;
151 unit = dmar_ir_find(src, NULL, NULL);
152 return (dmar_ir_free_irte(unit, cookie));
/*
 * iommu_map_ioapic_intr: allocate one remapping table entry for a pin of
 * the I/O APIC 'ioapic_id', program it for 'cpu' and 'vector', and build
 * the remappable-format redirection entry value in 'iorte'.
 *
 * The unit and the requester id are obtained from dmar_find_ioapic().
 * 'edge' selects the trigger mode and 'activehi' the polarity.
 *
 * NOTE(review): the return type, several declarations, the logic that
 * selects the delivery mode, and the stores through 'cookie', 'hi' and
 * 'lo' are not visible in this excerpt.
 */
156 iommu_map_ioapic_intr(u_int ioapic_id, u_int cpu, u_int vector, bool edge,
157 bool activehi, int irq, u_int *cookie, uint32_t *hi, uint32_t *lo)
159 struct dmar_unit *unit;
160 vmem_addr_t vmem_res;
166 unit = dmar_find_ioapic(ioapic_id, &rid);
/* No unit serves this I/O APIC, or the unit has remapping disabled. */
167 if (unit == NULL || !unit->ir_enabled) {
/* A single table index is requested, with M_NOWAIT. */
172 error = vmem_alloc(unit->irtids, 1, M_FIRSTFIT | M_NOWAIT, &vmem_res);
174 KASSERT(error != EOPNOTSUPP,
175 ("impossible EOPNOTSUPP from vmem"));
/*
 * NOTE(review): presumably the next four assignments are alternative
 * cases selected by 'irq' (ExtINT, NMI, SMI, otherwise fixed delivery
 * with a vector) -- the selecting statement is not visible.
 */
182 low |= DMAR_IRTE1_DLM_ExtINT;
185 low |= DMAR_IRTE1_DLM_NMI;
188 low |= DMAR_IRTE1_DLM_SMI;
/* The fixed-delivery case requires a non-zero vector. */
191 KASSERT(vector != 0, ("No vector for IRQ %u", irq));
192 low |= DMAR_IRTE1_DLM_FM | DMAR_IRTE1_V(vector);
/*
 * Add the destination (x2APIC or xAPIC encoding, chosen by
 * DMAR_X2APIC(unit)), the trigger mode taken from 'edge', and the
 * RH_DIRECT, DM_PHYSICAL and P flag bits.
 */
195 low |= (DMAR_X2APIC(unit) ? DMAR_IRTE1_DST_x2APIC(cpu) :
196 DMAR_IRTE1_DST_xAPIC(cpu)) |
197 (edge ? DMAR_IRTE1_TM_EDGE : DMAR_IRTE1_TM_LEVEL) |
198 DMAR_IRTE1_RH_DIRECT | DMAR_IRTE1_DM_PHYSICAL | DMAR_IRTE1_P;
199 dmar_ir_program_irte(unit, idx, low, rid);
203 * See VT-d specification, 5.1.5.1 I/OxAPIC
/*
 * Value built here: bit 48 set, idx bits 0-14 in bits 49-63, idx bit 15
 * in bit 11, the trigger mode and polarity flags, IOART_DELFIXED, and
 * the vector in the low bits.
 */
206 iorte = (1ULL << 48) | ((uint64_t)(idx & 0x7fff) << 49) |
207 ((idx & 0x8000) != 0 ? (1 << 11) : 0) |
208 (edge ? IOART_TRGREDG : IOART_TRGRLVL) |
209 (activehi ? IOART_INTAHI : IOART_INTALO) |
210 IOART_DELFIXED | vector;
/*
 * iommu_unmap_ioapic_intr: release the remapping table entry used by a
 * pin of the I/O APIC 'ioapic_id'.
 *
 * The unit is looked up with dmar_find_ioapic(); it is asserted to exist
 * and to have remapping enabled, and the entry 'idx' is then released
 * through dmar_ir_free_irte(), whose result is returned.
 *
 * NOTE(review): the declaration and assignment of 'idx' are not visible
 * in this excerpt; presumably it is taken from *cookie -- confirm.
 */
219 iommu_unmap_ioapic_intr(u_int ioapic_id, u_int *cookie)
221 struct dmar_unit *unit;
228 unit = dmar_find_ioapic(ioapic_id, NULL);
229 KASSERT(unit != NULL && unit->ir_enabled,
230 ("unmap: cookie %d unit %p", idx, unit));
231 return (dmar_ir_free_irte(unit, idx));
/*
 * dmar_ir_find: locate the DMAR unit responsible for interrupts of the
 * device 'src'.
 *
 * The device class of 'src' decides the lookup: class "dmar", class
 * "hpet" (dmar_find_hpet(), which also receives 'rid'), or the generic
 * dmar_find() followed by iommu_get_requester() when a unit was found
 * and the caller asked for the requester id.
 *
 * NOTE(review): the body of the "dmar" branch, the handling of
 * 'is_dmar' and the return statement are not visible in this excerpt.
 */
234 static struct dmar_unit *
235 dmar_ir_find(device_t src, uint16_t *rid, int *is_dmar)
237 devclass_t src_class;
238 struct dmar_unit *unit;
241 * We need to determine if the interrupt source generates FSB
242 * interrupts. If yes, it is either DMAR, in which case
243 * interrupts are not remapped. Or it is HPET, and interrupts
244 * are remapped. For HPET, source id is reported by HPET
245 * record in DMAR ACPI table.
249 src_class = device_get_devclass(src);
250 if (src_class == devclass_find("dmar")) {
254 } else if (src_class == devclass_find("hpet")) {
255 unit = dmar_find_hpet(src, rid);
/*
 * NOTE(review): presumably the remaining lines form the final else
 * branch, taken for every other device class.
 */
257 unit = dmar_find(src, bootverbose);
/* The requester id is fetched only when a unit exists and 'rid' is wanted. */
258 if (unit != NULL && rid != NULL)
259 iommu_get_requester(src, rid);
/*
 * dmar_ir_program_irte: write entry 'idx' of the unit's interrupt
 * remapping table and invalidate that entry through
 * dmar_qi_invalidate_iec().
 *
 *   unit  DMAR unit owning the table (unit->irt).
 *   idx   table index; asserted to be below unit->irte_cnt.
 *   low   value for the irte1 word of the entry.
 *   rid   requester id, encoded into the irte2 word.
 *
 * NOTE(review): the last line of the parameter list, the local
 * declarations, the else keyword and any locking are not visible in
 * this excerpt.
 */
265 dmar_ir_program_irte(struct dmar_unit *unit, u_int idx, uint64_t low,
271 KASSERT(idx < unit->irte_cnt,
272 ("bad cookie %d %d", idx, unit->irte_cnt));
273 irte = &(unit->irt[idx]);
/* The irte2 word is built from the SVT_RID and SQ_RID flags and 'rid'. */
274 high = DMAR_IRTE2_SVT_RID | DMAR_IRTE2_SQ_RID |
275 DMAR_IRTE2_SID_RID(rid);
/* NOTE(review): the condition guarding this diagnostic is not visible. */
277 device_printf(unit->dev,
278 "programming irte[%d] rid %#x high %#jx low %#jx\n",
279 idx, rid, (uintmax_t)high, (uintmax_t)low);
/* The P bit in irte1 tells whether the entry is already in use. */
282 if ((irte->irte1 & DMAR_IRTE1_P) != 0) {
284 * The rte is already valid. Assume that the request
285 * is to remap the interrupt for balancing. Only low
286 * word of rte needs to be changed. Assert that the
287 * high word contains expected value.
289 KASSERT(irte->irte2 == high,
290 ("irte2 mismatch, %jx %jx", (uintmax_t)irte->irte2,
292 dmar_pte_update(&irte->irte1, low);
/*
 * New entry: irte2 is stored first and irte1 second.
 * NOTE(review): presumably so that the word carrying the P bit becomes
 * visible last -- confirm.
 */
294 dmar_pte_store(&irte->irte2, high);
295 dmar_pte_store(&irte->irte1, low);
297 dmar_qi_invalidate_iec(unit, idx, 1);
/*
 * dmar_ir_free_irte: clear entry 'cookie' of the unit's interrupt
 * remapping table and give the index back to the irtids arena.
 *
 * The unit is asserted to be non-NULL with remapping enabled, and the
 * cookie to be below unit->irte_cnt.
 *
 * NOTE(review): the return type, the local declaration, the return
 * statement and any locking are not visible in this excerpt.
 */
303 dmar_ir_free_irte(struct dmar_unit *unit, u_int cookie)
307 KASSERT(unit != NULL && unit->ir_enabled,
308 ("unmap: cookie %d unit %p", cookie, unit));
309 KASSERT(cookie < unit->irte_cnt,
310 ("bad cookie %u %u", cookie, unit->irte_cnt));
311 irte = &(unit->irt[cookie]);
/* irte1 is cleared before irte2. */
312 dmar_pte_clear(&irte->irte1);
313 dmar_pte_clear(&irte->irte2);
/* Invalidate this one entry after it has been cleared. */
315 dmar_qi_invalidate_iec(unit, cookie, 1);
/* Return the single index to the arena. */
317 vmem_free(unit->irtids, cookie, 1);
/*
 * NOTE(review): only this return statement of the enclosing helper is
 * visible; presumably it is the body of clp2(), which dmar_init_irt()
 * calls to size the table.  The expression yields v unchanged when
 * powerof2(v) holds and 1 << fls(v) otherwise.  Behaviour for v == 0 and
 * for values with the top bit set depends on powerof2() and fls(), which
 * are defined outside this excerpt -- confirm.
 */
325 return (powerof2(v) ? v : 1 << fls(v));
/*
 * dmar_init_irt: set up interrupt remapping for a DMAR unit.
 *
 * Steps visible in this function:
 *  - nothing is set up unless the unit advertises DMAR_ECAP_IR;
 *  - remapping defaults to enabled and may be overridden with the
 *    "hw.dmar.ir" tunable;
 *  - remapping is turned off when unit->qi_enabled is not set;
 *  - the table size is clp2(num_io_irqs) entries, allocated zeroed and
 *    contiguous below dmar_high with PAGE_SIZE alignment;
 *  - the irtids arena hands out the indexes [0, irte_cnt);
 *  - the table pointer is loaded, a global invalidation is issued and
 *    remapping is enabled.
 *
 * NOTE(review): the return type, the return statements, any locking and
 * the code that initializes already configured pins are not visible in
 * this excerpt.
 */
329 dmar_init_irt(struct dmar_unit *unit)
332 if ((unit->hw_ecap & DMAR_ECAP_IR) == 0)
334 unit->ir_enabled = 1;
335 TUNABLE_INT_FETCH("hw.dmar.ir", &unit->ir_enabled);
336 if (!unit->ir_enabled)
/* Remapping is forced off when queued invalidation is not enabled. */
338 if (!unit->qi_enabled) {
339 unit->ir_enabled = 0;
341 device_printf(unit->dev,
342 "QI disabled, disabling interrupt remapping\n");
345 unit->irte_cnt = clp2(num_io_irqs);
/*
 * The memory attribute is the default one for units reporting coherency
 * and uncacheable otherwise.
 */
346 unit->irt = (dmar_irte_t *)(uintptr_t)kmem_alloc_contig(
347 unit->irte_cnt * sizeof(dmar_irte_t), M_ZERO | M_WAITOK, 0,
348 dmar_high, PAGE_SIZE, 0, DMAR_IS_COHERENT(unit) ?
349 VM_MEMATTR_DEFAULT : VM_MEMATTR_UNCACHEABLE);
350 if (unit->irt == NULL)
352 unit->irt_phys = pmap_kextract((vm_offset_t)unit->irt);
/*
 * The arena is created with M_WAITOK: no check of the result is visible
 * here, and unit->irtids is later handed to vmem_alloc(), vmem_free() and
 * vmem_destroy(), so a failed no-wait creation must not be possible.
 * Sleeping is already allowed on this path, as the table allocation just
 * above uses M_WAITOK.
 */
353 unit->irtids = vmem_create("dmarirt", 0, unit->irte_cnt, 1, 0,
354 M_FIRSTFIT | M_WAITOK);
356 dmar_load_irt_ptr(unit);
357 dmar_qi_invalidate_iec_glob(unit);
361 * Initialize mappings for already configured interrupt pins.
362 * Required, because otherwise the interrupts fault without
368 dmar_enable_ir(unit);
/*
 * dmar_fini_irt: tear down interrupt remapping for a DMAR unit.
 *
 * Remapping is marked disabled first.  If a table was allocated, the
 * hardware remapping is disabled, a global invalidation is issued, the
 * irtids arena is destroyed and the table memory is freed with the same
 * size expression that dmar_init_irt() used to allocate it.
 *
 * NOTE(review): the return type and the closing lines are not visible in
 * this excerpt; the function may continue past the last line shown.
 */
374 dmar_fini_irt(struct dmar_unit *unit)
377 unit->ir_enabled = 0;
378 if (unit->irt != NULL) {
379 dmar_disable_ir(unit);
380 dmar_qi_invalidate_iec_glob(unit);
381 vmem_destroy(unit->irtids);
382 kmem_free((vm_offset_t)unit->irt, unit->irte_cnt *
383 sizeof(dmar_irte_t));