2 * Copyright (C) 1995, 1996 Wolfgang Solfrank.
3 * Copyright (C) 1995, 1996 TooLs GmbH.
6 * Redistribution and use in source and binary forms, with or without
7 * modification, are permitted provided that the following conditions
9 * 1. Redistributions of source code must retain the above copyright
10 * notice, this list of conditions and the following disclaimer.
11 * 2. Redistributions in binary form must reproduce the above copyright
12 * notice, this list of conditions and the following disclaimer in the
13 * documentation and/or other materials provided with the distribution.
14 * 3. All advertising materials mentioning features or use of this software
15 * must display the following acknowledgement:
16 * This product includes software developed by TooLs GmbH.
17 * 4. The name of TooLs GmbH may not be used to endorse or promote products
18 * derived from this software without specific prior written permission.
20 * THIS SOFTWARE IS PROVIDED BY TOOLS GMBH ``AS IS'' AND ANY EXPRESS OR
21 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
22 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
23 * IN NO EVENT SHALL TOOLS GMBH BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
24 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
25 * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
26 * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
27 * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
28 * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
29 * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
31 * $NetBSD: trap.c,v 1.58 2002/03/04 04:07:35 dbj Exp $
34 #include <sys/cdefs.h>
35 __FBSDID("$FreeBSD$");
37 #include <sys/param.h>
42 #include <sys/mutex.h>
43 #include <sys/pioctl.h>
44 #include <sys/ptrace.h>
45 #include <sys/reboot.h>
46 #include <sys/syscall.h>
47 #include <sys/sysent.h>
48 #include <sys/systm.h>
49 #include <sys/kernel.h>
51 #include <sys/signalvar.h>
52 #include <sys/vmmeter.h>
54 #include <security/audit/audit.h>
58 #include <vm/vm_extern.h>
59 #include <vm/vm_param.h>
60 #include <vm/vm_kern.h>
61 #include <vm/vm_map.h>
62 #include <vm/vm_page.h>
64 #include <machine/_inttypes.h>
65 #include <machine/altivec.h>
66 #include <machine/cpu.h>
67 #include <machine/db_machdep.h>
68 #include <machine/fpu.h>
69 #include <machine/frame.h>
70 #include <machine/pcb.h>
71 #include <machine/psl.h>
72 #include <machine/trap.h>
73 #include <machine/spr.h>
74 #include <machine/sr.h>
76 /* Below matches setjmp.S */
/* Slot in the fault buffer's _jb[] that handle_onfault() loads into srr0. */
77 #define FAULTBUF_LR 21
/* Slot in _jb[] that handle_onfault() restores into frame->cr. */
80 #define FAULTBUF_CR 22
/* First of the 18 _jb[] slots that handle_onfault() copies to fixreg[14..]. */
81 #define FAULTBUF_R14 3
/*
 * Address computed from stack pointer `sp`: sp plus sizeof(struct callframe)
 * minus three register_t slots, cast to caddr_t.  cpu_fetch_syscall_args()
 * passes the result to copyin() as the source of the arguments that were not
 * taken from the trap frame's registers.
 */
83 #define MOREARGS(sp) ((caddr_t)((uintptr_t)(sp) + \
84 sizeof(struct callframe) - 3*sizeof(register_t))) /* more args go here */
86 static void trap_fatal(struct trapframe *frame);
87 static void printtrap(u_int vector, struct trapframe *frame, int isfatal,
89 static int trap_pfault(struct trapframe *frame, int user);
90 static int fix_unaligned(struct thread *td, struct trapframe *frame);
91 static int handle_onfault(struct trapframe *frame);
92 static void syscall(struct trapframe *frame);
94 #if defined(__powerpc64__) && defined(AIM)
95 void handle_kernel_slb_spill(int, register_t, register_t);
96 static int handle_user_slb_spill(pmap_t pm, vm_offset_t addr);
100 extern vm_offset_t __startkernel;
103 int db_trap_glue(struct trapframe *); /* Called from trap_subr.S */
106 struct powerpc_exception {
112 #include <sys/dtrace_bsd.h>
114 int (*dtrace_invop_jump_addr)(struct trapframe *);
/*
 * Table pairing each exception vector with a human-readable name.
 * trapname() walks it linearly and stops at the entry whose vector is
 * EXC_LAST, so the table must end with such an entry.
 */
117 static struct powerpc_exception powerpc_exceptions[] = {
118 { EXC_CRIT, "critical input" },
119 { EXC_RST, "system reset" },
120 { EXC_MCHK, "machine check" },
121 { EXC_DSI, "data storage interrupt" },
122 { EXC_DSE, "data segment exception" },
123 { EXC_ISI, "instruction storage interrupt" },
124 { EXC_ISE, "instruction segment exception" },
125 { EXC_EXI, "external interrupt" },
126 { EXC_ALI, "alignment" },
127 { EXC_PGM, "program" },
128 { EXC_HEA, "hypervisor emulation assistance" },
129 { EXC_FPU, "floating-point unavailable" },
130 { EXC_APU, "auxiliary proc unavailable" },
131 { EXC_DECR, "decrementer" },
132 { EXC_FIT, "fixed-interval timer" },
133 { EXC_WDOG, "watchdog timer" },
134 { EXC_SC, "system call" },
135 { EXC_TRC, "trace" },
136 { EXC_FPA, "floating-point assist" },
137 { EXC_DEBUG, "debug" },
138 { EXC_PERF, "performance monitoring" },
139 { EXC_VEC, "altivec unavailable" },
140 { EXC_VSX, "vsx unavailable" },
141 { EXC_FAC, "facility unavailable" },
142 { EXC_ITMISS, "instruction tlb miss" },
143 { EXC_DLMISS, "data load tlb miss" },
144 { EXC_DSMISS, "data store tlb miss" },
145 { EXC_BPT, "instruction breakpoint" },
146 { EXC_SMI, "system management" },
147 { EXC_VECAST_G4, "altivec assist" },
148 { EXC_THRM, "thermal management" },
149 { EXC_RUNMODETRC, "run mode/trace" },
/*
 * Bit-name string for the Book-E ESR; cpu_printtrap() passes it as the
 * second argument of a "%b" conversion.  Each entry is an octal bit
 * position followed by the name printed when that bit is set.
 */
153 #define ESR_BITMASK \
155 "\040b0\037b1\036b2\035b3\034PIL\033PRR\032PTR\031FP" \
156 "\030ST\027b9\026DLK\025ILK\024b12\023b13\022BO\021PIE" \
157 "\020b16\017b17\016b18\015b19\014b20\013b21\012b22\011b23" \
158 "\010SPE\007EPID\006b26\005b27\004b28\003b29\002b30\001b31"
/* Bit-name string for the MCSR value that cpu_printtrap() prints with "%b". */
159 #define MCSR_BITMASK \
161 "\040MCP\037ICERR\036DCERR\035TLBPERR\034L2MMU_MHIT\033b5\032b6\031b7" \
162 "\030b8\027b9\026b10\025NMI\024MAV\023MEA\022b14\021IF" \
163 "\020LD\017ST\016LDG\015b19\014b20\013b21\012b22\011b23" \
164 "\010b24\007b25\006b26\005b27\004b28\003b29\002TLBSYNC\001BSL2_ERR"
/* Bit-name string for the MSSSR0 value that cpu_printtrap() prints with "%b". */
165 #define MSSSR_BITMASK \
167 "\040b0\037b1\036b2\035b3\034b4\033b5\032b6\031b7" \
168 "\030b8\027b9\026b10\025b11\024b12\023L2TAG\022L2DAT\021L3TAG" \
169 "\020L3DAT\017APE\016DPE\015TEA\014b20\013b21\012b22\011b23" \
170 "\010b24\007b25\006b26\005b27\004b28\003b29\002b30\001b31"
/*
 * Look up the name of exception `vector` by scanning powerpc_exceptions[]
 * from the start.  The scan ends at the entry whose vector is EXC_LAST.
 * Callers in this file print the result with "%s".
 */
174 trapname(u_int vector)
176 struct powerpc_exception *pe;
178 for (pe = powerpc_exceptions; pe->vector != EXC_LAST; pe++) {
179 if (pe->vector == vector)
/*
 * Report whether `frame` was produced by a trap instruction.
 * Two alternative tests are visible: a program exception with EXC_PGM_TRAP
 * set in srr1, or ESR_PTR set in the Book-E ESR.
 * NOTE(review): presumably a preprocessor conditional selects exactly one
 * of the two returns -- confirm against the full file.
 */
187 frame_is_trap_inst(struct trapframe *frame)
/* '&' binds tighter than '&&': exc == EXC_PGM && (srr1 & EXC_PGM_TRAP). */
190 return (frame->exc == EXC_PGM && frame->srr1 & EXC_PGM_TRAP);
192 return ((frame->cpu.booke.esr & ESR_PTR) != 0);
/*
 * Main trap dispatcher.  Classifies the trap by frame->exc and by whether
 * it was taken from user mode (PSL_PR set in the saved srr1), then handles
 * it along the user-mode or kernel-mode path.  When a signal results, it is
 * posted to the current thread with trapsignal().
 */
197 trap(struct trapframe *frame)
/* The trap type and the default signal code both start as the vector. */
221 type = ucode = frame->exc;
/* Non-zero when PSL_PR was set in srr1; reported below as "user". */
223 user = frame->srr1 & PSL_PR;
225 CTR3(KTR_TRAP, "trap: %s type=%s (%s)", td->td_name,
226 trapname(type), user ? "user" : "kernel");
230 * A trap can occur while DTrace executes a probe. Before
231 * executing the probe, DTrace blocks re-scheduling and sets
232 * a flag in its per-cpu flags to indicate that it doesn't
233 * want to fault. On returning from the probe, the no-fault
234 * flag is cleared and finally re-scheduling is enabled.
236 * If the DTrace kernel module has registered a trap handler,
237 * call it and if it returns non-zero, assume that it has
238 * handled the trap and modified the trap frame so that this
239 * function can return normally.
241 if (dtrace_trap_func != NULL && (*dtrace_trap_func)(frame, type) != 0)
/* Record the frame on the thread; cpu_fetch_syscall_args() reads it back. */
247 td->td_frame = frame;
248 if (td->td_cowgen != p->p_cowgen)
249 thread_cow_update(td);
251 /* User Mode Traps */
/* Clear PSL_SE in the saved srr1. */
255 frame->srr1 &= ~PSL_SE;
260 #if defined(__powerpc64__) && defined(AIM)
/* The faulting address is srr0 for EXC_ISE, dar otherwise. */
263 if (handle_user_slb_spill(&p->p_vmspace->vm_pmap,
264 (type == EXC_ISE) ? frame->srr0 : frame->dar) != 0){
/* A non-zero result from trap_pfault() becomes the signal to post. */
272 sig = trap_pfault(frame, 1);
282 KASSERT((td->td_pcb->pcb_flags & PCB_FPU) != PCB_FPU,
283 ("FPU already enabled for thread"));
288 KASSERT((td->td_pcb->pcb_flags & PCB_VEC) != PCB_VEC,
289 ("Altivec already enabled for thread"));
294 KASSERT((td->td_pcb->pcb_flags & PCB_VSX) != PCB_VSX,
295 ("VSX already enabled for thread"));
296 if (!(td->td_pcb->pcb_flags & PCB_VEC))
298 if (!(td->td_pcb->pcb_flags & PCB_FPU))
300 td->td_pcb->pcb_flags |= PCB_VSX;
/* Compare the masked FSCR value against the HTM cause code. */
305 fscr = mfspr(SPR_FSCR);
306 if ((fscr & FSCR_IC_MASK) == FSCR_IC_HTM) {
307 CTR0(KTR_TRAP, "Hardware Transactional Memory subsystem disabled");
321 * We get a VPU assist exception for IEEE mode
322 * vector operations on denormalized floats.
323 * Emulating this is a giant pain, so for now,
324 * just switch off IEEE mode and treat them as
329 td->td_pcb->pcb_vec.vscr |= ALTIVEC_VSCR_NJ;
/* fix_unaligned() returns non-zero when it could not fix up the access. */
334 if (fix_unaligned(td, frame) != 0) {
342 case EXC_DEBUG: /* Single stepping */
/* DBSR is written back with its own value -- presumably write-one-to-clear; confirm. */
343 mtspr(SPR_DBSR, mfspr(SPR_DBSR));
344 frame->srr1 &= ~PSL_DE;
345 frame->cpu.booke.dbcr0 &= ~(DBCR0_IDM | DBCR0_IC);
351 /* Identify the trap reason */
352 if (frame_is_trap_inst(frame)) {
/* Fetch the trapping instruction word from user space at srr0. */
354 inst = fuword32((const void *)frame->srr0);
/* 0x0FFFDDDD is the instruction word that is routed to the DTrace pid-probe hook. */
355 if (inst == 0x0FFFDDDD &&
356 dtrace_pid_probe_ptr != NULL) {
357 (*dtrace_pid_probe_ptr)(frame);
364 sig = ppc_instr_emulate(frame, td->td_pcb);
366 if (frame->srr1 & EXC_PGM_PRIV)
368 else if (frame->srr1 & EXC_PGM_ILLEGAL)
370 } else if (sig == SIGFPE)
371 ucode = FPE_FLTINV; /* Punt for now, invalid operation. */
377 * Note that this may not be recoverable for the user
378 * process, depending on the type of machine check,
379 * but it at least prevents the kernel from dying.
389 /* Kernel Mode Traps */
391 KASSERT(cold || td->td_ucred != NULL,
392 ("kernel trap doesn't have ucred"));
396 if (frame_is_trap_inst(frame)) {
/* The kernel instruction at srr0 is read directly and compared with the DTrace trap word. */
397 if (*(uint32_t *)frame->srr0 == EXC_DTRACE) {
398 if (dtrace_invop_jump_addr != NULL) {
399 dtrace_invop_jump_addr(frame);
406 if (db_trap_glue(frame))
410 #if defined(__powerpc64__) && defined(AIM)
/* Fault on a USER_ADDR segment address while a user VSID is recorded in the PCB. */
412 if (td->td_pcb->pcb_cpu.aim.usr_vsid != 0 &&
413 (frame->dar & SEGMENT_MASK) == USER_ADDR) {
414 __asm __volatile ("slbmte %0, %1" ::
415 "r"(td->td_pcb->pcb_cpu.aim.usr_vsid),
/* A zero result from trap_pfault() means the kernel fault was resolved. */
422 if (trap_pfault(frame, 0) == 0)
426 if (handle_onfault(frame))
/* Let the ABI translate the signal number if it supplies a hook. */
436 if (p->p_sysent->sv_transtrap != NULL)
437 sig = (p->p_sysent->sv_transtrap)(sig, type);
/* Build the siginfo: code is ucode, address is srr0, trap number is type. */
438 ksiginfo_init_trap(&ksi);
440 ksi.ksi_code = (int) ucode; /* XXX, not POSIX */
441 ksi.ksi_addr = (void *)frame->srr0;
442 ksi.ksi_trapno = type;
443 trapsignal(td, &ksi);
/*
 * Report an unrecoverable trap: print the trap details (marked fatal),
 * offer the trap to kdb when debugger_on_trap is set, and panic with the
 * exception's name.
 */
450 trap_fatal(struct trapframe *frame)
456 printtrap(frame->exc, frame, 1, (frame->srr1 & PSL_PR));
458 if (debugger_on_trap) {
/* kdb_why is set only for the duration of the kdb_trap() call. */
459 kdb_why = KDB_WHY_TRAP;
460 handled = kdb_trap(frame->exc, 0, frame);
461 kdb_why = KDB_WHY_UNSET;
466 panic("%s trap", trapname(frame->exc));
/*
 * Print the CPU-specific registers that accompany a trap report: dsisr and
 * msssr0 from the AIM side, mcsr/mcar and esr from the Book-E side.  The
 * "%b" conversions decode bits using the *_BITMASK strings.
 * NOTE(review): which prints run for which vector is decided by lines not
 * visible here.
 */
470 cpu_printtrap(u_int vector, struct trapframe *frame, int isfatal, int user)
479 printf(" dsisr = 0x%lx\n",
480 (u_long)frame->cpu.aim.dsisr);
485 printf(" msssr0 = 0x%b\n",
486 (int)mfspr(SPR_MSSSR0), MSSSR_BITMASK);
/* Combine MCARU (upper 32 bits) and MCAR (lower bits) into one address. */
494 pa = mfspr(SPR_MCARU);
495 pa = (pa << 32) | (u_register_t)mfspr(SPR_MCAR);
496 printf(" mcsr = 0x%b\n",
497 (int)mfspr(SPR_MCSR), MCSR_BITMASK);
498 printf(" mcar = 0x%jx\n", (uintmax_t)pa);
500 printf(" esr = 0x%b\n",
501 (int)frame->cpu.booke.esr, ESR_BITMASK);
/*
 * Print a trap report to the console: whether the trap was fatal or
 * handled and user or kernel, the exception vector and name, a faulting
 * virtual address (dar or srr0), the CPU-specific registers, srr0/srr1,
 * the current MSR, lr, and the current thread with its pid and name.
 */
506 printtrap(u_int vector, struct trapframe *frame, int isfatal, int user)
510 printf("%s %s trap:\n", isfatal ? "fatal" : "handled",
511 user ? "user" : "kernel");
513 printf(" exception = 0x%x (%s)\n", vector, trapname(vector));
518 printf(" virtual address = 0x%" PRIxPTR "\n", frame->dar);
523 printf(" virtual address = 0x%" PRIxPTR "\n", frame->srr0);
528 cpu_printtrap(vector, frame, isfatal, user);
/* srr0 and lr are each printed twice: raw, and minus (__startkernel - KERNBASE). */
529 printf(" srr0 = 0x%" PRIxPTR " (0x%" PRIxPTR ")\n",
530 frame->srr0, frame->srr0 - (register_t)(__startkernel - KERNBASE));
531 printf(" srr1 = 0x%lx\n", (u_long)frame->srr1);
532 printf(" current msr = 0x%" PRIxPTR "\n", mfmsr());
533 printf(" lr = 0x%" PRIxPTR " (0x%" PRIxPTR ")\n",
534 frame->lr, frame->lr - (register_t)(__startkernel - KERNBASE));
535 printf(" curthread = %p\n", curthread);
/* pid and comm are printed only when there is a current thread. */
536 if (curthread != NULL)
537 printf(" pid = %d, comm = %s\n",
538 curthread->td_proc->p_pid, curthread->td_name);
543 * Handles a fatal fault when we have onfault state to recover. Returns
544 * non-zero if there was onfault recovery state available.
/*
 * Rewrite `frame` from the thread's pcb_onfault buffer: srr0, r1, r2, cr
 * and r14 onward come from the buffer's _jb[] slots, r3 is set to 1, and
 * pcb_onfault is cleared so the buffer is used only once.
 */
547 handle_onfault(struct trapframe *frame)
553 fb = td->td_pcb->pcb_onfault;
/* Execution will continue at the address stored in the FAULTBUF_LR slot. */
555 frame->srr0 = (*fb)->_jb[FAULTBUF_LR];
556 frame->fixreg[1] = (*fb)->_jb[FAULTBUF_R1];
557 frame->fixreg[2] = (*fb)->_jb[FAULTBUF_R2];
/* r3 is forced to 1 in the restored frame. */
558 frame->fixreg[3] = 1;
559 frame->cr = (*fb)->_jb[FAULTBUF_CR];
/* Restore the 18 registers r14..r31 in one copy. */
560 bcopy(&(*fb)->_jb[FAULTBUF_R14], &frame->fixreg[14],
561 18 * sizeof(register_t));
562 td->td_pcb->pcb_onfault = NULL; /* Returns twice, not thrice */
/*
 * Decode the system call described by td->td_frame into the thread's
 * syscall_args: the syscall number, the sysent entry, the argument count,
 * and the arguments.  Arguments come from the trap frame's registers
 * first; any remainder is copied in from the user stack.
 */
569 cpu_fetch_syscall_args(struct thread *td)
572 struct trapframe *frame;
573 struct syscall_args *sa;
579 frame = td->td_frame;
/* The syscall number is in r0; arguments start at fixreg[FIRSTARG]. */
582 sa->code = frame->fixreg[0];
583 params = (caddr_t)(frame->fixreg + FIRSTARG);
586 if (sa->code == SYS_syscall) {
588 * code is first argument,
589 * followed by actual args.
591 sa->code = *(register_t *) params;
592 params += sizeof(register_t);
594 } else if (sa->code == SYS___syscall) {
596 * Like syscall, but code is a quad,
597 * so as to maintain quad alignment
598 * for the rest of the args.
600 if (SV_PROC_FLAG(p, SV_ILP32)) {
/* ILP32: skip one register first, then read the code from the next one. */
601 params += sizeof(register_t);
602 sa->code = *(register_t *) params;
603 params += sizeof(register_t);
606 sa->code = *(register_t *) params;
607 params += sizeof(register_t);
/* Apply the ABI's syscall-number mask, if any; an out-of-range code selects sv_table[0]. */
612 if (p->p_sysent->sv_mask)
613 sa->code &= p->p_sysent->sv_mask;
614 if (sa->code >= p->p_sysent->sv_size)
615 sa->callp = &p->p_sysent->sv_table[0];
617 sa->callp = &p->p_sysent->sv_table[sa->code];
619 sa->narg = sa->callp->sy_narg;
621 if (SV_PROC_FLAG(p, SV_ILP32)) {
622 argsz = sizeof(uint32_t);
624 for (i = 0; i < n; i++)
625 sa->args[i] = ((u_register_t *)(params))[i] &
628 argsz = sizeof(uint64_t);
630 for (i = 0; i < n; i++)
631 sa->args[i] = ((u_register_t *)(params))[i];
/* Arguments beyond the first n are read from the user stack; r1 is the stack pointer. */
635 error = copyin(MOREARGS(frame->fixreg[1]), sa->args + n,
636 (sa->narg - n) * argsz);
641 if (SV_PROC_FLAG(p, SV_ILP32) && sa->narg > n) {
642 /* Expand the size of arguments copied from the stack */
/*
 * The 32-bit values packed at &sa->args[n] are widened in place, walking
 * from the highest index down.
 * NOTE(review): the loop starts at i == sa->narg, so it also reads packed
 * slot (narg - n) and writes sa->args[narg], one past the last argument --
 * confirm sa->args has room for that slot or start at narg - 1.
 */
644 for (i = sa->narg; i >= n; i--)
645 sa->args[i] = ((uint32_t *)(&sa->args[n]))[i-n];
/* Preset the return values: retval[0] is 0, retval[1] is the second argument register. */
650 td->td_retval[0] = 0;
651 td->td_retval[1] = frame->fixreg[FIRSTARG + 1];
656 #include "../../kern/subr_syscall.c"
/*
 * System call entry: record the trap frame on the thread, then run the
 * call through syscallenter() and hand its result to syscallret().
 */
659 syscall(struct trapframe *frame)
665 td->td_frame = frame;
667 #if defined(__powerpc64__) && defined(AIM)
669 * Speculatively restore last user SLB segment, which we know is
670 * invalid already, since we are likely to do copyin()/copyout().
/* Only done when the PCB records a non-zero user VSID. */
672 if (td->td_pcb->pcb_cpu.aim.usr_vsid != 0)
673 __asm __volatile ("slbmte %0, %1; isync" ::
674 "r"(td->td_pcb->pcb_cpu.aim.usr_vsid), "r"(USER_SLB_SLBE));
677 error = syscallenter(td);
678 syscallret(td, error);
681 #if defined(__powerpc64__) && defined(AIM)
682 /* Handle kernel SLB faults -- runs in real mode, all seat belts off */
/*
 * Handle a kernel SLB miss by updating the per-CPU SLB cache.
 * The faulting address is srr0 for EXC_ISE and dar for any other type.
 * Cache entries store the SLBE value OR'ed with their own slot index.
 */
684 handle_kernel_slb_spill(int type, register_t dar, register_t srr0)
686 struct slb *slbcache;
691 addr = (type == EXC_ISE) ? srr0 : dar;
692 slbcache = PCPU_GET(aim.slb);
/* Build the SLBE for the faulting segment: shifted ESID plus the valid bit. */
693 esid = (uintptr_t)addr >> ADDR_SR_SHFT;
694 slbe = (esid << SLBE_ESID_SHIFT) | SLBE_VALID;
696 /* See if the hardware flushed this somehow (can happen in LPARs) */
697 for (i = 0; i < n_slbs; i++)
698 if (slbcache[i].slbe == (slbe | (uint64_t)i))
701 /* Not in the map, needs to actually be added */
702 slbv = kernel_va_to_slbv(addr);
/* While the user slot's slbe is still 0, look for an invalid slot other than the user slot. */
703 if (slbcache[USER_SLB_SLOT].slbe == 0) {
704 for (i = 0; i < n_slbs; i++) {
705 if (i == USER_SLB_SLOT)
707 if (!(slbcache[i].slbe & SLBE_VALID))
/* Mark the user slot non-zero so the branch above is not taken again. */
712 slbcache[USER_SLB_SLOT].slbe = 1;
715 /* Sacrifice a random SLB entry that is not the user entry */
717 if (i == USER_SLB_SLOT)
721 /* Write new entry */
722 slbcache[i].slbv = slbv;
723 slbcache[i].slbe = slbe | (uint64_t)i;
725 /* Trap handler will restore from cache on exit */
/*
 * Handle a user-mode SLB miss at `addr` in pmap `pm`.
 * If the pmap has no SLB entry for the address, a VSID is allocated for
 * its ESID; otherwise the entry is inserted into pm->pm_slb unless it is
 * already present there.  trap() treats a non-zero return as failure.
 */
729 handle_user_slb_spill(pmap_t pm, vm_offset_t addr)
731 struct slb *user_entry;
/* A pmap without an SLB array is handled separately from the lookup below. */
735 if (pm->pm_slb == NULL)
738 esid = (uintptr_t)addr >> ADDR_SR_SHFT;
741 user_entry = user_va_to_slb_entry(pm, addr);
743 if (user_entry == NULL) {
744 /* allocate_user_vsid auto-spills it */
745 (void)allocate_user_vsid(pm, esid, 0);
748 * Check that another CPU has not already mapped this.
749 * XXX: Per-thread SLB caches would be better.
751 for (i = 0; i < pm->pm_slb_len; i++)
752 if (pm->pm_slb[i] == user_entry)
/* i reaching pm_slb_len means the entry was not found in pm_slb. */
755 if (i == pm->pm_slb_len)
756 slb_insert_user(pm, user_entry);
/*
 * Resolve a page fault described by `frame` by calling vm_fault() on the
 * page containing the faulting address.  `user` is non-zero for faults
 * taken from user mode.  trap() treats a zero return as "resolved" and
 * uses a non-zero return from the user path as the signal to post.
 */
765 trap_pfault(struct trapframe *frame, int user)
/* Instruction fault: execute access, plus read when SRR1_ISI_PFAULT is set. */
776 if (frame->exc == EXC_ISI) {
778 ftype = VM_PROT_EXECUTE;
779 if (frame->srr1 & SRR1_ISI_PFAULT)
780 ftype |= VM_PROT_READ;
/* Data fault: the store bit (Book-E ESR_ST or AIM DSISR_STORE) selects write, else read. */
784 if (frame->cpu.booke.esr & ESR_ST)
786 if (frame->cpu.aim.dsisr & DSISR_STORE)
788 ftype = VM_PROT_WRITE;
790 ftype = VM_PROT_READ;
794 KASSERT(p->p_vmspace != NULL, ("trap_pfault: vmspace NULL"));
795 map = &p->p_vmspace->vm_map;
/* pmap_decode_kernel_ptr() may rewrite eva and reports whether it is a user address. */
797 rv = pmap_decode_kernel_ptr(eva, &is_user, &eva);
802 map = &p->p_vmspace->vm_map;
806 va = trunc_page(eva);
808 /* Fault in the page. */
809 rv = vm_fault(map, va, ftype, VM_FAULT_NORMAL);
811 * XXXDTRACE: add dtrace_doubletrap_func here?
814 if (rv == KERN_SUCCESS)
/* A failed kernel-mode fault gets one chance at onfault recovery. */
817 if (!user && handle_onfault(frame))
824 * For now, this only deals with the particular unaligned access case
825 * that gcc tends to generate. Eventually it should handle all of the
826 * possibilities that can happen on a 32-bit PowerPC in big-endian mode.
/*
 * Emulate a misaligned double-sized load or store for thread `td`.
 * Two paths are visible.  The SPE path (ESR_SPE set) fetches the faulting
 * instruction from srr0 to find the register, then moves sizeof(double)
 * bytes between pcb_vec.vr[reg] and user memory at dar, with ESR_ST
 * choosing store over load.  The other path decodes the operation and
 * register from the AIM dsisr and moves sizeof(double) bytes between
 * pcb_fpu.fpr[reg] and user memory at dar; EXC_ALI_LFD is the load case.
 * trap() treats a non-zero return as failure.
 */
830 fix_unaligned(struct thread *td, struct trapframe *frame)
832 struct thread *fputhread;
840 indicator = (frame->cpu.booke.esr & (ESR_ST|ESR_SPE));
841 if (indicator & ESR_SPE) {
842 if (copyin((void *)frame->srr0, &inst, sizeof(inst)) != 0)
844 reg = EXC_ALI_SPE_REG(inst);
845 fpr = (double *)td->td_pcb->pcb_vec.vr[reg];
846 fputhread = PCPU_GET(vecthread);
848 /* Juggle the SPE to ensure that we've initialized
849 * the registers, and that their current state is in
852 if (fputhread != td) {
859 if (!(indicator & ESR_ST)) {
860 if (copyin((void *)frame->dar, fpr,
861 sizeof(double)) != 0)
863 frame->fixreg[reg] = td->td_pcb->pcb_vec.vr[reg][1];
866 td->td_pcb->pcb_vec.vr[reg][1] = frame->fixreg[reg];
867 if (copyout(fpr, (void *)frame->dar,
868 sizeof(double)) != 0)
874 indicator = EXC_ALI_OPCODE_INDICATOR(frame->cpu.aim.dsisr);
879 reg = EXC_ALI_RST(frame->cpu.aim.dsisr);
880 fpr = &td->td_pcb->pcb_fpu.fpr[reg].fpr;
881 fputhread = PCPU_GET(fputhread);
883 /* Juggle the FPU to ensure that we've initialized
884 * the FPRs, and that their current state is in
887 if (fputhread != td) {
894 if (indicator == EXC_ALI_LFD) {
895 if (copyin((void *)frame->dar, fpr,
896 sizeof(double)) != 0)
900 if (copyout(fpr, (void *)frame->dar,
901 sizeof(double)) != 0)
/*
 * Debugger entry glue.  For a kernel-mode frame (PSL_PR clear in srr1)
 * whose exception is a trace, run-mode trace, trap instruction,
 * breakpoint, debug or DSI exception, pass the trap to kdb_trap() and
 * return its result.  DTrace trap instructions are filtered out first.
 */
914 db_trap_glue(struct trapframe *frame)
917 if (!(frame->srr1 & PSL_PR)
918 && (frame->exc == EXC_TRC || frame->exc == EXC_RUNMODETRC
919 || frame_is_trap_inst(frame)
920 || frame->exc == EXC_BPT
921 || frame->exc == EXC_DEBUG
922 || frame->exc == EXC_DSI)) {
923 int type = frame->exc;
925 /* Ignore DTrace traps. */
926 if (*(uint32_t *)frame->srr0 == EXC_DTRACE)
928 if (frame_is_trap_inst(frame)) {
931 return (kdb_trap(type, 0, frame));