2 * Copyright (c) 2014 Andrew Turner
3 * Copyright (c) 2015-2017 Ruslan Bukin <br@bsdpad.com>
6 * Portions of this software were developed by SRI International and the
7 * University of Cambridge Computer Laboratory under DARPA/AFRL contract
8 * FA8750-10-C-0237 ("CTSRD"), as part of the DARPA CRASH research programme.
10 * Portions of this software were developed by the University of Cambridge
11 * Computer Laboratory as part of the CTSRD Project, with support from the
12 * UK Higher Education Innovation Fund (HEIF).
14 * Redistribution and use in source and binary forms, with or without
15 * modification, are permitted provided that the following conditions
17 * 1. Redistributions of source code must retain the above copyright
18 * notice, this list of conditions and the following disclaimer.
19 * 2. Redistributions in binary form must reproduce the above copyright
20 * notice, this list of conditions and the following disclaimer in the
21 * documentation and/or other materials provided with the distribution.
23 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
24 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
25 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
26 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
27 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
28 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
29 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
30 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
31 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
32 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
36 #include "opt_platform.h"
38 #include <sys/cdefs.h>
39 __FBSDID("$FreeBSD$");
41 #include <sys/param.h>
42 #include <sys/systm.h>
48 #include <sys/imgact.h>
50 #include <sys/kernel.h>
51 #include <sys/limits.h>
52 #include <sys/linker.h>
53 #include <sys/msgbuf.h>
56 #include <sys/ptrace.h>
57 #include <sys/reboot.h>
58 #include <sys/rwlock.h>
59 #include <sys/sched.h>
60 #include <sys/signalvar.h>
61 #include <sys/syscallsubr.h>
62 #include <sys/sysent.h>
63 #include <sys/sysproto.h>
64 #include <sys/ucontext.h>
67 #include <vm/vm_kern.h>
68 #include <vm/vm_object.h>
69 #include <vm/vm_page.h>
71 #include <vm/vm_map.h>
72 #include <vm/vm_pager.h>
74 #include <machine/riscvreg.h>
75 #include <machine/cpu.h>
76 #include <machine/kdb.h>
77 #include <machine/machdep.h>
78 #include <machine/pcb.h>
79 #include <machine/reg.h>
80 #include <machine/trap.h>
81 #include <machine/vmparam.h>
82 #include <machine/intr.h>
83 #include <machine/sbi.h>
85 #include <machine/asm.h>
88 #include <machine/fpe.h>
92 #include <dev/fdt/fdt_common.h>
93 #include <dev/ofw/openfirm.h>
96 struct pcpu __pcpu[MAXCPU];
98 static struct trapframe proc0_tf;
100 vm_paddr_t phys_avail[PHYS_AVAIL_SIZE + 2];
101 vm_paddr_t dump_avail[PHYS_AVAIL_SIZE + 2];
108 #define DTB_SIZE_MAX (1024 * 1024)
110 #define PHYSMAP_SIZE (2 * (VM_PHYSSEG_MAX - 1))
111 vm_paddr_t physmap[PHYSMAP_SIZE];
114 struct kva_md_info kmi;
116 int64_t dcache_line_size; /* The minimum D cache line size */
117 int64_t icache_line_size; /* The minimum I cache line size */
118 int64_t idcache_line_size; /* The minimum cache line size */
121 extern int *initstack_end;
125 uintptr_t mcall_trap(uintptr_t mcause, uintptr_t* regs);
128 mcall_trap(uintptr_t mcause, uintptr_t* regs)
135 cpu_startup(void *dummy)
140 vm_ksubmap_init(&kmi);
142 vm_pager_bufferinit();
145 SYSINIT(cpu, SI_SUB_CPU, SI_ORDER_FIRST, cpu_startup, NULL);
148 cpu_idle_wakeup(int cpu)
155 fill_regs(struct thread *td, struct reg *regs)
157 struct trapframe *frame;
159 frame = td->td_frame;
160 regs->sepc = frame->tf_sepc;
161 regs->sstatus = frame->tf_sstatus;
162 regs->ra = frame->tf_ra;
163 regs->sp = frame->tf_sp;
164 regs->gp = frame->tf_gp;
165 regs->tp = frame->tf_tp;
167 memcpy(regs->t, frame->tf_t, sizeof(regs->t));
168 memcpy(regs->s, frame->tf_s, sizeof(regs->s));
169 memcpy(regs->a, frame->tf_a, sizeof(regs->a));
175 set_regs(struct thread *td, struct reg *regs)
177 struct trapframe *frame;
179 frame = td->td_frame;
180 frame->tf_sepc = regs->sepc;
181 frame->tf_sstatus = regs->sstatus;
182 frame->tf_ra = regs->ra;
183 frame->tf_sp = regs->sp;
184 frame->tf_gp = regs->gp;
185 frame->tf_tp = regs->tp;
187 memcpy(frame->tf_t, regs->t, sizeof(frame->tf_t));
188 memcpy(frame->tf_s, regs->s, sizeof(frame->tf_s));
189 memcpy(frame->tf_a, regs->a, sizeof(frame->tf_a));
195 fill_fpregs(struct thread *td, struct fpreg *regs)
202 if ((pcb->pcb_fpflags & PCB_FP_STARTED) != 0) {
204 * If we have just been running FPE instructions we will
205 * need to save the state to memcpy it below.
209 memcpy(regs->fp_x, pcb->pcb_x, sizeof(regs->fp_x));
210 regs->fp_fcsr = pcb->pcb_fcsr;
213 memset(regs->fp_x, 0, sizeof(regs->fp_x));
219 set_fpregs(struct thread *td, struct fpreg *regs)
226 memcpy(pcb->pcb_x, regs->fp_x, sizeof(regs->fp_x));
227 pcb->pcb_fcsr = regs->fp_fcsr;
234 fill_dbregs(struct thread *td, struct dbreg *regs)
237 panic("fill_dbregs");
241 set_dbregs(struct thread *td, struct dbreg *regs)
248 ptrace_set_pc(struct thread *td, u_long addr)
251 panic("ptrace_set_pc");
256 ptrace_single_step(struct thread *td)
264 ptrace_clear_single_step(struct thread *td)
272 exec_setregs(struct thread *td, struct image_params *imgp, u_long stack)
274 struct trapframe *tf;
280 memset(tf, 0, sizeof(struct trapframe));
283 tf->tf_sp = STACKALIGN(stack);
284 tf->tf_ra = imgp->entry_addr;
285 tf->tf_sepc = imgp->entry_addr;
287 pcb->pcb_fpflags &= ~PCB_FP_STARTED;
290 /* Sanity check these are the same size, they will be memcpy'd to and fro */
291 CTASSERT(sizeof(((struct trapframe *)0)->tf_a) ==
292 sizeof((struct gpregs *)0)->gp_a);
293 CTASSERT(sizeof(((struct trapframe *)0)->tf_s) ==
294 sizeof((struct gpregs *)0)->gp_s);
295 CTASSERT(sizeof(((struct trapframe *)0)->tf_t) ==
296 sizeof((struct gpregs *)0)->gp_t);
297 CTASSERT(sizeof(((struct trapframe *)0)->tf_a) ==
298 sizeof((struct reg *)0)->a);
299 CTASSERT(sizeof(((struct trapframe *)0)->tf_s) ==
300 sizeof((struct reg *)0)->s);
301 CTASSERT(sizeof(((struct trapframe *)0)->tf_t) ==
302 sizeof((struct reg *)0)->t);
304 /* Support for FDT configurations only. */
308 get_mcontext(struct thread *td, mcontext_t *mcp, int clear_ret)
310 struct trapframe *tf = td->td_frame;
312 memcpy(mcp->mc_gpregs.gp_t, tf->tf_t, sizeof(mcp->mc_gpregs.gp_t));
313 memcpy(mcp->mc_gpregs.gp_s, tf->tf_s, sizeof(mcp->mc_gpregs.gp_s));
314 memcpy(mcp->mc_gpregs.gp_a, tf->tf_a, sizeof(mcp->mc_gpregs.gp_a));
316 if (clear_ret & GET_MC_CLEAR_RET) {
317 mcp->mc_gpregs.gp_a[0] = 0;
318 mcp->mc_gpregs.gp_t[0] = 0; /* clear syscall error */
321 mcp->mc_gpregs.gp_ra = tf->tf_ra;
322 mcp->mc_gpregs.gp_sp = tf->tf_sp;
323 mcp->mc_gpregs.gp_gp = tf->tf_gp;
324 mcp->mc_gpregs.gp_tp = tf->tf_tp;
325 mcp->mc_gpregs.gp_sepc = tf->tf_sepc;
326 mcp->mc_gpregs.gp_sstatus = tf->tf_sstatus;
332 set_mcontext(struct thread *td, mcontext_t *mcp)
334 struct trapframe *tf;
338 memcpy(tf->tf_t, mcp->mc_gpregs.gp_t, sizeof(tf->tf_t));
339 memcpy(tf->tf_s, mcp->mc_gpregs.gp_s, sizeof(tf->tf_s));
340 memcpy(tf->tf_a, mcp->mc_gpregs.gp_a, sizeof(tf->tf_a));
342 tf->tf_ra = mcp->mc_gpregs.gp_ra;
343 tf->tf_sp = mcp->mc_gpregs.gp_sp;
344 tf->tf_gp = mcp->mc_gpregs.gp_gp;
345 tf->tf_sepc = mcp->mc_gpregs.gp_sepc;
346 tf->tf_sstatus = mcp->mc_gpregs.gp_sstatus;
352 get_fpcontext(struct thread *td, mcontext_t *mcp)
359 curpcb = curthread->td_pcb;
361 KASSERT(td->td_pcb == curpcb, ("Invalid fpe pcb"));
363 if ((curpcb->pcb_fpflags & PCB_FP_STARTED) != 0) {
365 * If we have just been running FPE instructions we will
366 * need to save the state to memcpy it below.
370 KASSERT((curpcb->pcb_fpflags & ~PCB_FP_USERMASK) == 0,
371 ("Non-userspace FPE flags set in get_fpcontext"));
372 memcpy(mcp->mc_fpregs.fp_x, curpcb->pcb_x,
373 sizeof(mcp->mc_fpregs));
374 mcp->mc_fpregs.fp_fcsr = curpcb->pcb_fcsr;
375 mcp->mc_fpregs.fp_flags = curpcb->pcb_fpflags;
376 mcp->mc_flags |= _MC_FP_VALID;
384 set_fpcontext(struct thread *td, mcontext_t *mcp)
391 if ((mcp->mc_flags & _MC_FP_VALID) != 0) {
392 curpcb = curthread->td_pcb;
393 /* FPE usage is enabled, override registers. */
394 memcpy(curpcb->pcb_x, mcp->mc_fpregs.fp_x,
395 sizeof(mcp->mc_fpregs));
396 curpcb->pcb_fcsr = mcp->mc_fpregs.fp_fcsr;
397 curpcb->pcb_fpflags = mcp->mc_fpregs.fp_flags & PCB_FP_USERMASK;
411 if (!sched_runnable())
428 * Flush the D-cache for non-DMA I/O so that the I-cache can
429 * be made coherent later.
432 cpu_flush_dcache(void *ptr, size_t len)
438 /* Get current clock frequency for the given CPU ID. */
440 cpu_est_clockrate(int cpu_id, uint64_t *rate)
443 panic("cpu_est_clockrate");
447 cpu_pcpu_init(struct pcpu *pcpu, int cpuid, size_t size)
457 if (td->td_md.md_spinlock_count == 0) {
458 td->td_md.md_spinlock_count = 1;
459 td->td_md.md_saved_sstatus_ie = intr_disable();
461 td->td_md.md_spinlock_count++;
469 register_t sstatus_ie;
473 sstatus_ie = td->td_md.md_saved_sstatus_ie;
474 td->td_md.md_spinlock_count--;
475 if (td->td_md.md_spinlock_count == 0)
476 intr_restore(sstatus_ie);
479 #ifndef _SYS_SYSPROTO_H_
480 struct sigreturn_args {
486 sys_sigreturn(struct thread *td, struct sigreturn_args *uap)
494 if (copyin(uap->sigcntxp, &uc, sizeof(uc)))
498 * Make sure the processor mode has not been tampered with and
499 * interrupts have not been disabled.
500 * Supervisor interrupts in user mode are always enabled.
502 sstatus = uc.uc_mcontext.mc_gpregs.gp_sstatus;
503 if ((sstatus & SSTATUS_SPP) != 0)
506 error = set_mcontext(td, &uc.uc_mcontext);
510 set_fpcontext(td, &uc.uc_mcontext);
512 /* Restore signal mask. */
513 kern_sigprocmask(td, SIG_SETMASK, &uc.uc_sigmask, NULL, 0);
515 return (EJUSTRETURN);
519 * Construct a PCB from a trapframe. This is called from kdb_trap() where
520 * we want to start a backtrace from the function that caused us to enter
521 * the debugger. We have the context in the trapframe, but base the trace
522 * on the PCB. The PCB doesn't have to be perfect, as long as it contains
523 * enough for a backtrace.
526 makectx(struct trapframe *tf, struct pcb *pcb)
529 memcpy(pcb->pcb_t, tf->tf_t, sizeof(tf->tf_t));
530 memcpy(pcb->pcb_s, tf->tf_s, sizeof(tf->tf_s));
531 memcpy(pcb->pcb_a, tf->tf_a, sizeof(tf->tf_a));
533 pcb->pcb_ra = tf->tf_ra;
534 pcb->pcb_sp = tf->tf_sp;
535 pcb->pcb_gp = tf->tf_gp;
536 pcb->pcb_tp = tf->tf_tp;
537 pcb->pcb_sepc = tf->tf_sepc;
541 sendsig(sig_t catcher, ksiginfo_t *ksi, sigset_t *mask)
543 struct sigframe *fp, frame;
544 struct sysentvec *sysent;
545 struct trapframe *tf;
554 PROC_LOCK_ASSERT(p, MA_OWNED);
556 sig = ksi->ksi_signo;
558 mtx_assert(&psp->ps_mtx, MA_OWNED);
561 onstack = sigonstack(tf->tf_sp);
563 CTR4(KTR_SIG, "sendsig: td=%p (%s) catcher=%p sig=%d", td, p->p_comm,
566 /* Allocate and validate space for the signal handler context. */
567 if ((td->td_pflags & TDP_ALTSTACK) != 0 && !onstack &&
568 SIGISMEMBER(psp->ps_sigonstack, sig)) {
569 fp = (struct sigframe *)((uintptr_t)td->td_sigstk.ss_sp +
570 td->td_sigstk.ss_size);
572 fp = (struct sigframe *)td->td_frame->tf_sp;
575 /* Make room, keeping the stack aligned */
577 fp = (struct sigframe *)STACKALIGN(fp);
579 /* Fill in the frame to copy out */
580 get_mcontext(td, &frame.sf_uc.uc_mcontext, 0);
581 get_fpcontext(td, &frame.sf_uc.uc_mcontext);
582 frame.sf_si = ksi->ksi_info;
583 frame.sf_uc.uc_sigmask = *mask;
584 frame.sf_uc.uc_stack.ss_flags = (td->td_pflags & TDP_ALTSTACK) ?
585 ((onstack) ? SS_ONSTACK : 0) : SS_DISABLE;
586 frame.sf_uc.uc_stack = td->td_sigstk;
587 mtx_unlock(&psp->ps_mtx);
588 PROC_UNLOCK(td->td_proc);
590 /* Copy the sigframe out to the user's stack. */
591 if (copyout(&frame, fp, sizeof(*fp)) != 0) {
592 /* Process has trashed its stack. Kill it. */
593 CTR2(KTR_SIG, "sendsig: sigexit td=%p fp=%p", td, fp);
599 tf->tf_a[1] = (register_t)&fp->sf_si;
600 tf->tf_a[2] = (register_t)&fp->sf_uc;
602 tf->tf_sepc = (register_t)catcher;
603 tf->tf_sp = (register_t)fp;
605 sysent = p->p_sysent;
606 if (sysent->sv_sigcode_base != 0)
607 tf->tf_ra = (register_t)sysent->sv_sigcode_base;
609 tf->tf_ra = (register_t)(sysent->sv_psstrings -
610 *(sysent->sv_szsigcode));
612 CTR3(KTR_SIG, "sendsig: return td=%p pc=%#x sp=%#x", td, tf->tf_sepc,
616 mtx_lock(&psp->ps_mtx);
620 init_proc0(vm_offset_t kstack)
625 proc_linkup0(&proc0, &thread0);
626 thread0.td_kstack = kstack;
627 thread0.td_pcb = (struct pcb *)(thread0.td_kstack) - 1;
628 thread0.td_pcb->pcb_fpflags = 0;
629 thread0.td_frame = &proc0_tf;
630 pcpup->pc_curpcb = thread0.td_pcb;
634 add_physmap_entry(uint64_t base, uint64_t length, vm_paddr_t *physmap,
637 u_int i, insert_idx, _physmap_idx;
639 _physmap_idx = *physmap_idxp;
645 * Find insertion point while checking for overlap. Start off by
646 * assuming the new entry will be added to the end.
648 insert_idx = _physmap_idx;
649 for (i = 0; i <= _physmap_idx; i += 2) {
650 if (base < physmap[i + 1]) {
651 if (base + length <= physmap[i]) {
655 if (boothowto & RB_VERBOSE)
657 "Overlapping memory regions, ignoring second region\n");
662 /* See if we can prepend to the next entry. */
663 if (insert_idx <= _physmap_idx &&
664 base + length == physmap[insert_idx]) {
665 physmap[insert_idx] = base;
669 /* See if we can append to the previous entry. */
670 if (insert_idx > 0 && base == physmap[insert_idx - 1]) {
671 physmap[insert_idx - 1] += length;
676 *physmap_idxp = _physmap_idx;
677 if (_physmap_idx == PHYSMAP_SIZE) {
679 "Too many segments in the physical address map, giving up\n");
684 * Move the last 'N' entries down to make room for the new
687 for (i = _physmap_idx; i > insert_idx; i -= 2) {
688 physmap[i] = physmap[i - 2];
689 physmap[i + 1] = physmap[i - 1];
692 /* Insert the new entry. */
693 physmap[insert_idx] = base;
694 physmap[insert_idx + 1] = base + length;
696 printf("physmap[%d] = 0x%016lx\n", insert_idx, base);
697 printf("physmap[%d] = 0x%016lx\n", insert_idx + 1, base + length);
703 try_load_dtb(caddr_t kmdp, vm_offset_t dtbp)
706 #if defined(FDT_DTB_STATIC)
707 dtbp = (vm_offset_t)&fdt_static_dtb;
710 if (dtbp == (vm_offset_t)NULL) {
711 printf("ERROR loading DTB\n");
715 if (OF_install(OFW_FDT, 0) == FALSE)
716 panic("Cannot install FDT");
718 if (OF_init((void *)dtbp) != 0)
719 panic("OF_init failed with the found device tree");
731 * Fake up a boot descriptor table.
732 * RISCVTODO: This needs to be done via loader (when it's available).
735 fake_preload_metadata(struct riscv_bootparams *rvbp __unused)
737 static uint32_t fake_preload[35];
739 vm_offset_t zstart = 0, zend = 0;
741 vm_offset_t lastaddr;
746 fake_preload[i++] = MODINFO_NAME;
747 fake_preload[i++] = strlen("kernel") + 1;
748 strcpy((char*)&fake_preload[i++], "kernel");
750 fake_preload[i++] = MODINFO_TYPE;
751 fake_preload[i++] = strlen("elf64 kernel") + 1;
752 strcpy((char*)&fake_preload[i++], "elf64 kernel");
754 fake_preload[i++] = MODINFO_ADDR;
755 fake_preload[i++] = sizeof(vm_offset_t);
756 *(vm_offset_t *)&fake_preload[i++] =
757 (vm_offset_t)(KERNBASE + KERNENTRY);
759 fake_preload[i++] = MODINFO_SIZE;
760 fake_preload[i++] = sizeof(vm_offset_t);
761 fake_preload[i++] = (vm_offset_t)&end -
762 (vm_offset_t)(KERNBASE + KERNENTRY);
767 if (*(uint32_t *)KERNVIRTADDR == MAGIC_TRAMP_NUMBER) {
768 fake_preload[i++] = MODINFO_METADATA|MODINFOMD_SSYM;
769 fake_preload[i++] = sizeof(vm_offset_t);
770 fake_preload[i++] = *(uint32_t *)(KERNVIRTADDR + 4);
771 fake_preload[i++] = MODINFO_METADATA|MODINFOMD_ESYM;
772 fake_preload[i++] = sizeof(vm_offset_t);
773 fake_preload[i++] = *(uint32_t *)(KERNVIRTADDR + 8);
774 lastaddr = *(uint32_t *)(KERNVIRTADDR + 8);
776 zstart = *(uint32_t *)(KERNVIRTADDR + 4);
777 db_fetch_ksymtab(zstart, zend);
781 lastaddr = (vm_offset_t)&end;
782 fake_preload[i++] = 0;
784 preload_metadata = (void *)fake_preload;
790 initriscv(struct riscv_bootparams *rvbp)
792 struct mem_region mem_regions[FDT_MEM_REGIONS];
793 vm_offset_t rstart, rend;
796 vm_offset_t lastaddr;
801 /* Set the module data location */
802 lastaddr = fake_preload_metadata(rvbp);
804 /* Find the kernel address */
805 kmdp = preload_search_by_type("elf kernel");
807 kmdp = preload_search_by_type("elf64 kernel");
809 boothowto = RB_VERBOSE | RB_SINGLE;
810 boothowto = RB_VERBOSE;
815 try_load_dtb(kmdp, rvbp->dtbp_virt);
818 /* Load the physical memory ranges */
822 /* Grab physical memory regions information from device tree. */
823 if (fdt_get_mem_regions(mem_regions, &mem_regions_sz, NULL) != 0)
824 panic("Cannot get physical memory regions");
827 e = s + DTB_SIZE_MAX;
829 for (i = 0; i < mem_regions_sz; i++) {
830 rstart = mem_regions[i].mr_start;
831 rend = (mem_regions[i].mr_start + mem_regions[i].mr_size);
833 if ((rstart < s) && (rend > e)) {
834 /* Exclude DTB region. */
835 add_physmap_entry(rstart, (s - rstart), physmap, &physmap_idx);
836 add_physmap_entry(e, (rend - e), physmap, &physmap_idx);
838 add_physmap_entry(mem_regions[i].mr_start,
839 mem_regions[i].mr_size, physmap, &physmap_idx);
844 /* Set the pcpu data, this is needed by pmap_bootstrap */
846 pcpu_init(pcpup, 0, sizeof(struct pcpu));
848 /* Set the pcpu pointer */
849 __asm __volatile("mv gp, %0" :: "r"(pcpup));
851 PCPU_SET(curthread, &thread0);
853 /* Do basic tuning, hz etc */
858 /* Bootstrap enough of pmap to enter the kernel proper */
859 kernlen = (lastaddr - KERNBASE);
860 pmap_bootstrap(rvbp->kern_l1pt, mem_regions[0].mr_start, kernlen);
864 init_proc0(rvbp->kern_stack);
866 /* set page table base register for thread0 */
867 thread0.td_pcb->pcb_l1addr = \
868 (rvbp->kern_l1pt - KERNBASE + rvbp->kern_phys);
870 msgbufinit(msgbufp, msgbufsize);
872 init_param2(physmem);
880 bzero(void *buf, size_t len)