2 * Copyright 2014 Olivier Houchard <cognet@FreeBSD.org>
3 * Copyright 2014 Svatopluk Kraus <onwahe@gmail.com>
4 * Copyright 2014 Michal Meloun <meloun@miracle.cz>
5 * Copyright 2014 Andrew Turner <andrew@FreeBSD.org>
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
11 * 1. Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in the
15 * documentation and/or other materials provided with the distribution.
17 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
18 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
21 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
30 #include "opt_ktrace.h"
32 #include <sys/cdefs.h>
33 __FBSDID("$FreeBSD$");
35 #include <sys/param.h>
37 #include <sys/systm.h>
39 #include <sys/kernel.h>
41 #include <sys/mutex.h>
42 #include <sys/signalvar.h>
46 #include <sys/ktrace.h>
51 #include <vm/vm_kern.h>
52 #include <vm/vm_map.h>
53 #include <vm/vm_extern.h>
54 #include <vm/vm_param.h>
56 #include <machine/acle-compat.h>
57 #include <machine/cpu.h>
58 #include <machine/frame.h>
59 #include <machine/machdep.h>
60 #include <machine/pcb.h>
64 #include <machine/db_machdep.h>
68 #include <sys/dtrace_bsd.h>
/*
 * Address that abort_handler() compares pcb_onfault against in order to
 * recognize a faulting cache operation; on a match the handler resumes
 * execution there instead of calling vm_fault().
 */
71 extern char cachebailout[];
/* Set by abort_handler() to the FSR value right before vm_fault() is called. */
74 int last_fault_code; /* For the benefit of pmap_fault_fixup() */
/*
 * Common signature of the per-fault abort handlers stored in aborts[].
 * abort_handler() invokes them as
 *     func(tf, idx, fsr, far, prefetch, td, &ksig)
 * i.e. trapframe, fault index, fault status, fault address, prefetch flag,
 * current thread and the signal description to fill in.
 * NOTE(review): a non-zero return value presumably requests delivery of the
 * signal described by ksig -- confirm against the caller.
 */
83 typedef int abort_func_t(struct trapframe *, u_int, u_int, u_int, u_int,
84 struct thread *, struct ksig *);
/* Handlers implemented further down in this file. */
86 static abort_func_t abort_fatal;
87 static abort_func_t abort_align;
88 static abort_func_t abort_icache;
96 * How are the aborts handled?
99 * - Always fatal as we do not know what it means.
100 * Imprecise External Abort:
101 * - Always fatal, but can be handled somehow in the future.
102 * Now, due to PCIe buggy hardware, ignored.
103 * Precise External Abort:
104 * - Always fatal, but who knows in the future???
106 * - Special handling.
107 * External Translation Abort (L1 & L2)
108 * - Always fatal as something is screwed up in page tables or hardware.
109 * Domain Fault (L1 & L2):
110 * - Always fatal as we do not play game with domains.
112 * - Everything should be aligned in kernel with exception of user to kernel
113 * and vice versa data copying, so if pcb_onfault is not set, it's fatal.
114 * We generate signal in case of abort from user mode.
115 * Instruction cache maintenance:
116 * - According to manual, this is translation fault during cache maintenance
117 * operation. So, it could be really complex in SMP case and fuzzy too
118 * for cache operations working on virtual addresses. For now, we will
119 * consider this abort as fatal. In fact, no cache maintenance on
120 * not mapped virtual addresses should be called. As cache maintenance
121 * operation (except DMB, DSB, and Flush Prefetch Buffer) are privileged,
122 * the abort is fatal for user mode as well for now. (This is a good place to
123 * note that cache maintenance on a virtual address fills the TLB.)
124 * Access Bit (L1 & L2):
125 * - Fast hardware emulation for kernel and user mode.
126 * Translation Fault (L1 & L2):
127 * - Standard fault mechanism is held including vm_fault().
128 * Permission Fault (L1 & L2):
129 * - Fast hardware emulation of modify bits and in other cases, standard
130 * fault mechanism is held including vm_fault().
/*
 * Abort dispatch table.  abort_handler() indexes it with the value of
 * FSR_TO_FAULT(fsr).  Each entry pairs an optional handler with the
 * description that abort_fatal() prints.  A NULL handler means that
 * abort_handler() does not dispatch through the table for that fault and
 * continues with its own handling instead.
 */
133 static const struct abort aborts[] = {
134 {abort_fatal, "Undefined Code (0x000)"},
135 {abort_align, "Alignment Fault"},
136 {abort_fatal, "Debug Event"},
137 {NULL, "Access Bit (L1)"},
138 {NULL, "Instruction cache maintenance"},
139 {NULL, "Translation Fault (L1)"},
140 {NULL, "Access Bit (L2)"},
141 {NULL, "Translation Fault (L2)"},
143 {abort_fatal, "External Abort"},
144 {abort_fatal, "Domain Fault (L1)"},
145 {abort_fatal, "Undefined Code (0x00A)"},
146 {abort_fatal, "Domain Fault (L2)"},
147 {abort_fatal, "External Translation Abort (L1)"},
148 {NULL, "Permission Fault (L1)"},
149 {abort_fatal, "External Translation Abort (L2)"},
150 {NULL, "Permission Fault (L2)"},
152 {abort_fatal, "TLB Conflict Abort"},
153 {abort_fatal, "Undefined Code (0x401)"},
154 {abort_fatal, "Undefined Code (0x402)"},
155 {abort_fatal, "Undefined Code (0x403)"},
156 {abort_fatal, "Undefined Code (0x404)"},
157 {abort_fatal, "Undefined Code (0x405)"},
158 {abort_fatal, "Asynchronous External Abort"},
159 {abort_fatal, "Undefined Code (0x407)"},
161 {abort_fatal, "Asynchronous Parity Error on Memory Access"},
162 {abort_fatal, "Parity Error on Memory Access"},
163 {abort_fatal, "Undefined Code (0x40A)"},
164 {abort_fatal, "Undefined Code (0x40B)"},
165 {abort_fatal, "Parity Error on Translation (L1)"},
166 {abort_fatal, "Undefined Code (0x40D)"},
167 {abort_fatal, "Parity Error on Translation (L2)"},
168 {abort_fatal, "Undefined Code (0x40F)"}
/*
 * Post a trap signal to thread 'td': a ksiginfo is initialized with
 * ksiginfo_init_trap(), 'addr' is recorded as the faulting address and the
 * result is handed to trapsignal().  'sig', 'code' and 'addr' are also
 * logged through the KTR_TRAP trace point.
 */
172 call_trapsignal(struct thread *td, int sig, int code, vm_offset_t addr)
176 CTR4(KTR_TRAP, "%s: addr: %#x, sig: %d, code: %d",
177 __func__, addr, sig, code);
180 * TODO: some info would be nice to know
181 * if we are serving data or prefetch abort.
184 ksiginfo_init_trap(&ksi);
187 ksi.ksi_addr = (void *)addr;
188 trapsignal(td, &ksi);
192 * abort_imprecise() handles the following abort:
194 * FAULT_EA_IMPREC - Imprecise External Abort
196 * The imprecise means that we don't know where the abort happened,
197 * thus FAR is undefined. The abort should never fire, but hot
198 * plugging or accidental hardware failure can be the cause of it.
199 * If the abort happens, it can even be on different (thread) context.
200 * Without any additional support, the abort is fatal, as we do not
201 * know what really happened.
203 * QQQ: Some additional functionality, like pcb_onfault but global,
204 * can be implemented. Imprecise handlers could be registered
205 * which tell us if the abort is caused by something they know
206 * about. They should return one of three codes like:
210 * The handlers should be called until one of them returns the
211 * FAULT_IS_MINE value or all of them have been called. If all handlers
212 * return the FAULT_IS_NOT_MINE value, then the abort is fatal.
215 abort_imprecise(struct trapframe *tf, u_int fsr, u_int prefetch, bool usermode)
219 * XXX - We can get an imprecise abort as a result of an access
220 * to not-present PCI/PCIe configuration space.
225 abort_fatal(tf, FAULT_EA_IMPREC, fsr, 0, prefetch, curthread, NULL);
228 * Returning from this function means that we ignore
229 * the abort for good reason. Note that imprecise abort
230 * could fire any time even in user mode.
236 userret(curthread, tf);
241 * abort_debug() handles the following abort:
243 * FAULT_DEBUG - Debug Event
247 abort_debug(struct trapframe *tf, u_int fsr, u_int prefetch, bool usermode,
/* The debug event is reported as SIGTRAP/TRAP_BRKPT at address 'far'. */
255 call_trapsignal(td, SIGTRAP, TRAP_BRKPT, far);
/* kdb is told T_BREAKPOINT for prefetch aborts and T_WATCHPOINT for data aborts. */
259 kdb_trap((prefetch) ? T_BREAKPOINT : T_WATCHPOINT, 0, tf);
/* NOTE(review): presumably the fallback when the kernel has no debugger built in -- confirm. */
261 printf("No debugger in kernel.\n");
269 * FAR, FSR, and everything else that can be lost after enabling
270 * interrupts must be grabbed before interrupts are
271 * enabled. Note that once interrupts are enabled, we
272 * could even migrate to another CPU ...
274 * TODO: move quick cases to ASM
/*
 * abort_handler() - common entry point for data and prefetch aborts.
 *
 * tf:       trapframe of the interrupted context.
 * prefetch: non-zero for a prefetch (instruction) abort, zero for a data
 *           abort; it selects which fault status/address registers are read.
 *
 * Order of processing: imprecise external aborts and debug events first,
 * then pmap_fault() emulation, then the aborts[] dispatch table, and
 * finally vm_fault() for the remaining translation/permission faults.
 * Faults that cannot be resolved end up in abort_fatal() or as a signal
 * posted through call_trapsignal().
 */
277 abort_handler(struct trapframe *tf, int prefetch)
294 PCPU_INC(cnt.v_trap);
297 fsr = (prefetch) ? cp15_ifsr_get() : cp15_dfsr_get();
299 far = (prefetch) ? cp15_ifar_get() : cp15_dfar_get();
301 far = (prefetch) ? TRAPF_PC(tf) : cp15_dfar_get();
304 idx = FSR_TO_FAULT(fsr);
305 usermode = TRAPF_USERMODE(tf); /* Abort came from user mode? */
309 CTR6(KTR_TRAP, "%s: fsr %#x (idx %u) far %#x prefetch %u usermode %d",
310 __func__, fsr, idx, far, prefetch, usermode);
313 * Firstly, handle aborts that are not directly related to mapping.
315 if (__predict_false(idx == FAULT_EA_IMPREC)) {
316 abort_imprecise(tf, fsr, prefetch, usermode);
320 if (__predict_false(idx == FAULT_DEBUG)) {
321 abort_debug(tf, fsr, prefetch, usermode, far);
326 * ARM has a set of unprivileged load and store instructions
327 * (LDRT/LDRBT/STRT/STRBT ...) which are supposed to be used in other
328 * than user mode and OS should recognize their aborts and behave
329 * appropriately. However, there is no reasonable way to do that
330 * in general unless we restrict the handling somehow.
332 * For now, these instructions are used only in copyin()/copyout()
333 * like functions where usermode buffers are checked in advance that
334 * they are not from KVA space. Thus, no action is needed here.
338 * (1) Handle access and R/W hardware emulation aborts.
339 * (2) Check that abort is not on pmap essential address ranges.
340 * There is no way to fix it, so we don't even try.
342 rv = pmap_fault(PCPU_GET(curpmap), far, fsr, idx, usermode);
343 if (rv == KERN_SUCCESS)
351 if (rv == KERN_INVALID_ADDRESS)
354 if (__predict_false((td->td_pflags & TDP_NOFAULTING) != 0)) {
356 * Due to both processor errata and lazy TLB invalidation when
357 * access restrictions are removed from virtual pages, memory
358 * accesses that are allowed by the physical mapping layer may
359 * nonetheless cause one spurious page fault per virtual page.
360 * When the thread is executing a "no faulting" section that
361 * is bracketed by vm_fault_{disable,enable}_pagefaults(),
362 * every page fault is treated as a spurious page fault,
363 * unless it accesses the same virtual address as the most
364 * recent page fault within the same "no faulting" section.
366 if (td->td_md.md_spurflt_addr != far ||
367 (td->td_pflags & TDP_RESETSPUR) != 0) {
368 td->td_md.md_spurflt_addr = far;
369 td->td_pflags &= ~TDP_RESETSPUR;
371 tlb_flush_local(far & ~PAGE_MASK);
376 * If we get a page fault while in a critical section, then
377 * it is most likely a fatal kernel page fault. The kernel
378 * is already going to panic trying to get a sleep lock to
379 * do the VM lookup, so just consider it a fatal trap so the
380 * kernel can print out a useful trap message and even get to the debugger.
383 * If we get a page fault while holding a non-sleepable
384 * lock, then it is most likely a fatal kernel page fault.
385 * If WITNESS is enabled, then it's going to whine about
386 * bogus LORs with various VM locks, so just skip to the
387 * fatal trap handling directly.
389 if (td->td_critnest != 0 ||
390 WITNESS_CHECK(WARN_SLEEPOK | WARN_GIANTOK, NULL,
391 "Kernel page fault") != 0) {
392 abort_fatal(tf, idx, fsr, far, prefetch, td, &ksig);
397 /* Re-enable interrupts if they were enabled previously. */
398 if (td->td_md.md_spinlock_count == 0) {
/* The branch hint must wrap the whole comparison, not just the masked value. */
399 if (__predict_true((tf->tf_spsr & PSR_I) == 0))
400 enable_interrupts(PSR_I);
401 if (__predict_true((tf->tf_spsr & PSR_F) == 0))
402 enable_interrupts(PSR_F);
408 if (td->td_cowgen != p->p_cowgen)
409 thread_cow_update(td);
412 /* Invoke the appropriate handler, if necessary. */
413 if (__predict_false(aborts[idx].func != NULL)) {
414 if ((aborts[idx].func)(tf, idx, fsr, far, prefetch, td, &ksig))
420 * At this point, we're dealing with one of the following aborts:
422 * FAULT_ICACHE - I-cache maintenance
423 * FAULT_TRAN_xx - Translation
424 * FAULT_PERM_xx - Permission
428 * Don't pass faulting cache operation to vm_fault(). We don't want
429 * to handle all vm stuff at this moment.
432 if (__predict_false(pcb->pcb_onfault == cachebailout)) {
433 tf->tf_r0 = far; /* return failing address */
434 tf->tf_pc = (register_t)pcb->pcb_onfault;
438 /* Handle remaining I-cache aborts. */
439 if (idx == FAULT_ICACHE) {
440 if (abort_icache(tf, idx, fsr, far, prefetch, td, &ksig))
445 va = trunc_page(far);
446 if (va >= KERNBASE) {
448 * Don't allow user-mode faults in kernel address space.
456 * This is a fault on non-kernel virtual memory. If curproc
457 * is NULL or curproc->p_vmspace is NULL the fault is fatal.
459 vm = (p != NULL) ? p->p_vmspace : NULL;
464 if (!usermode && (td->td_intr_nesting_level != 0 ||
465 pcb->pcb_onfault == NULL)) {
466 abort_fatal(tf, idx, fsr, far, prefetch, td, &ksig);
471 ftype = (fsr & FSR_WNR) ? VM_PROT_WRITE : VM_PROT_READ;
473 ftype |= VM_PROT_EXECUTE;
476 last_fault_code = fsr;
/* pcb_onfault is cleared for the duration of vm_fault() and restored afterwards. */
480 onfault = pcb->pcb_onfault;
481 pcb->pcb_onfault = NULL;
484 /* Fault in the page. */
485 rv = vm_fault(map, va, ftype, VM_FAULT_NORMAL);
488 pcb->pcb_onfault = onfault;
491 if (__predict_true(rv == KERN_SUCCESS))
495 if (td->td_intr_nesting_level == 0 &&
496 pcb->pcb_onfault != NULL) {
/* Same cast as the cache bailout path above. */
498 tf->tf_pc = (register_t)pcb->pcb_onfault;
501 CTR2(KTR_TRAP, "%s: vm_fault() failed with %d", __func__, rv);
502 abort_fatal(tf, idx, fsr, far, prefetch, td, &ksig);
507 ksig.code = (rv == KERN_PROTECTION_FAILURE) ? SEGV_ACCERR : SEGV_MAPERR;
511 call_trapsignal(td, ksig.sig, ksig.code, ksig.addr);
518 * abort_fatal() handles the following data aborts:
520 * FAULT_DEBUG - Debug Event
521 * FAULT_ACCESS_xx - Access Bit
522 * FAULT_EA_PREC - Precise External Abort
523 * FAULT_DOMAIN_xx - Domain Fault
524 * FAULT_EA_TRAN_xx - External Translation Abort
525 * FAULT_EA_IMPREC - Imprecise External Abort
526 * + all undefined codes for ABORT
528 * We should never see these on a properly functioning system.
530 * This function is also called by the other handlers if they
531 * detect a fatal problem.
533 * Note: A non-zero 'prefetch' argument means we're dealing with a prefetch abort.
/*
 * Report an unrecoverable abort and panic.
 *
 * tf:       trapframe of the faulting context; its registers are dumped.
 * idx:      fault index, used to look up the description in aborts[].
 * fsr/far:  fault status and fault address captured by the caller.
 * prefetch: non-zero for a prefetch abort, zero for a data abort.
 * td, ksig: part of the abort_func_t signature; not referenced in the
 *           statements visible here.
 */
536 abort_fatal(struct trapframe *tf, u_int idx, u_int fsr, u_int far,
537 u_int prefetch, struct thread *td, struct ksig *ksig)
543 usermode = TRAPF_USERMODE(tf);
/* A registered DTrace trap hook gets to look at the fault first. */
546 if (dtrace_trap_func != NULL && (*dtrace_trap_func)(tf, far))
551 mode = usermode ? "user" : "kernel";
552 rw_mode = fsr & FSR_WNR ? "write" : "read";
/* Both PSR_I and PSR_F interrupts are disabled before anything is printed. */
553 disable_interrupts(PSR_I|PSR_F);
556 printf("Fatal %s mode data abort: '%s' on %s\n", mode,
557 aborts[idx].desc, rw_mode);
558 printf("trapframe: %p\nFSR=%08x, FAR=", tf, fsr);
/* FAR is undefined for an imprecise external abort, so it is not printed. */
559 if (idx != FAULT_EA_IMPREC)
560 printf("%08x, ", far);
563 printf("spsr=%08x\n", tf->tf_spsr);
565 printf("Fatal %s mode prefetch abort at 0x%08x\n",
567 printf("trapframe: %p, spsr=%08x\n", tf, tf->tf_spsr);
/* Dump of the general purpose registers saved in the trapframe. */
570 printf("r0 =%08x, r1 =%08x, r2 =%08x, r3 =%08x\n",
571 tf->tf_r0, tf->tf_r1, tf->tf_r2, tf->tf_r3);
572 printf("r4 =%08x, r5 =%08x, r6 =%08x, r7 =%08x\n",
573 tf->tf_r4, tf->tf_r5, tf->tf_r6, tf->tf_r7);
574 printf("r8 =%08x, r9 =%08x, r10=%08x, r11=%08x\n",
575 tf->tf_r8, tf->tf_r9, tf->tf_r10, tf->tf_r11);
576 printf("r12=%08x, ", tf->tf_r12);
579 printf("usp=%08x, ulr=%08x",
580 tf->tf_usr_sp, tf->tf_usr_lr);
582 printf("ssp=%08x, slr=%08x",
583 tf->tf_svc_sp, tf->tf_svc_lr);
584 printf(", pc =%08x\n\n", tf->tf_pc);
/* Enter kdb when it is requested on panic or already active, then panic. */
587 if (debugger_on_panic || kdb_active)
588 kdb_trap(fsr, 0, tf);
590 panic("Fatal abort");
595 * abort_align() handles the following data abort:
597 * FAULT_ALIGN - Alignment fault
599 * Everything should be aligned in kernel with exception of user to kernel
600 * and vice versa data copying, so if pcb_onfault is not set, it's fatal.
601 * We generate signal in case of abort from user mode.
604 abort_align(struct trapframe *tf, u_int idx, u_int fsr, u_int far,
605 u_int prefetch, struct thread *td, struct ksig *ksig)
609 usermode = TRAPF_USERMODE(tf);
/*
 * td must be tested for NULL before it is dereferenced.  When not nested
 * in an interrupt and a pcb_onfault recovery address is registered,
 * execution resumes there; otherwise the fault goes to abort_fatal().
 */
611 if (td != NULL && td->td_intr_nesting_level == 0 &&
612 td->td_pcb->pcb_onfault != NULL) {
614 tf->tf_pc = (int)td->td_pcb->pcb_onfault;
617 abort_fatal(tf, idx, fsr, far, prefetch, td, ksig);
619 /* Deliver a bus error signal to the process */
620 ksig->code = BUS_ADRALN;
627 * abort_icache() handles the following data abort:
629 * FAULT_ICACHE - Instruction cache maintenance
631 * According to manual, FAULT_ICACHE is translation fault during cache
632 * maintenance operation. In fact, no cache maintenance operation on
633 * not mapped virtual addresses should be called. As cache maintenance
634 * operation (except DMB, DSB, and Flush Prefetch Buffer) are privileged,
635 * the abort is considered fatal for now. However, all the matter with
636 * cache maintenance operation on virtual addresses could be really complex
637 * and fuzzy in SMP case, so maybe in future standard fault mechanism
638 * should be held here including vm_fault() calling.
641 abort_icache(struct trapframe *tf, u_int idx, u_int fsr, u_int far,
642 u_int prefetch, struct thread *td, struct ksig *ksig)
/* No recovery is attempted: all arguments are forwarded unchanged to abort_fatal(). */
645 abort_fatal(tf, idx, fsr, far, prefetch, td, ksig);