/*-
 * Copyright (c) 2006 Peter Wemm
 * Copyright (c) 2015 The FreeBSD Foundation
 * Copyright (c) 2019 Mitchell Horne
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */
#include <sys/cdefs.h>
__FBSDID("$FreeBSD$");

#include "opt_watchdog.h"

#include <sys/param.h>
#include <sys/systm.h>
#include <sys/kernel.h>
#include <sys/kerneldump.h>
#include <sys/msgbuf.h>
#include <sys/watchdog.h>
#include <sys/vmmeter.h>

#include <vm/vm_param.h>
#include <vm/vm_page.h>
#include <vm/vm_phys.h>
#include <vm/vm_dumpset.h>

#include <machine/atomic.h>
#include <machine/elf.h>
#include <machine/md_var.h>
#include <machine/minidump.h>
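
/* The kernel dump header must fill exactly one 512-byte disk sector. */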
CTASSERT(sizeof(struct kerneldumpheader) == 512);

static struct kerneldumpheader kdh;

/* Handle chunked writes. */
static size_t fragsz;
static void *dump_va;
static size_t dumpsize;

static uint64_t tmpbuffer[PAGE_SIZE / sizeof(uint64_t)];
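
/*
 * Flush any physically-addressed pages buffered by blk_write() out to
 * the dump device.
 */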
static int
blk_flush(struct dumperinfo *di)
{
	error = dump_append(di, dump_va, 0, fragsz);

/*
 * Write a block of data to the dump file.
 * Caller can provide data through a pointer or by specifying its
 * physical address.
 * XXX writes using pa should be no larger than PAGE_SIZE.
 */
static int
blk_write(struct dumperinfo *di, char *ptr, vm_paddr_t pa, size_t sz)
{
	maxdumpsz = min(di->maxiosize, MAXDUMPPGS * PAGE_SIZE);
	if (maxdumpsz == 0)	/* seatbelt */
		maxdumpsz = PAGE_SIZE;
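
	/* Sanity-check the request before any data is written. */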
	if ((sz % PAGE_SIZE) != 0) {
		printf("size not page aligned\n");
		return (EINVAL);
	}
	if (ptr != NULL && pa != 0) {
		printf("can't have both va and pa!\n");
		return (EINVAL);
	}
	if ((((uintptr_t)pa) % PAGE_SIZE) != 0) {
		printf("address not page aligned %#lx\n", (uintptr_t)pa);
		return (EINVAL);
	}
	/*
	 * If we're doing a virtual dump, flush any
	 * pre-existing pa pages.
	 */
	error = blk_flush(di);

	len = maxdumpsz - fragsz;
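
	/* Report progress and pet the watchdog for each chunk written. */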
	dumpsys_pb_progress(len);
	wdog_kern_pat(WD_LASTVAL);

	error = dump_append(di, ptr, 0, len);
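
	/*
	 * Physically-addressed data is reached through the direct map and
	 * accumulated into a fragment that blk_flush() pushes out.
	 */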
	dump_va = (void *)PHYS_TO_DMAP(pa);
	error = blk_flush(di);

	/* Check for user abort */
	printf(" (CTRL-C to abort) ");

int
cpu_minidumpsys(struct dumperinfo *di, const struct minidumpstate *state)
{
	pd_entry_t *l1, *l2, l2e;
	pt_entry_t *l3, l3e;
	struct minidumphdr mdhdr;
	vm_offset_t va, kva_max;

	/* Snapshot the KVA upper bound in case it grows. */
	kva_max = kernel_vm_end;

	/*
	 * Walk the kernel page table pages, setting the active entries in the
	 * dump bitmap.
	 * NB: for a live dump, we may be racing with updates to the page
	 * tables, so care must be taken to read each entry only once.
	 */
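	/*
	 * Under Sv39, each L2 entry covers a 2MB region: a leaf (RWX) entry
	 * maps a superpage directly, while a non-leaf entry points to a page
	 * of L3 PTEs.
	 */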
	for (va = VM_MIN_KERNEL_ADDRESS; va < kva_max; va += L2_SIZE) {
		pmapsize += PAGE_SIZE;
		if (!pmap_get_tables(pmap_kernel(), va, &l1, &l2, &l3))
			continue;

		/* We should always be using the l2 table for kvm */
		if (l2 == NULL)
			continue;

		/* l2 may be a superpage */
		l2e = atomic_load_64(l2);
		if ((l2e & PTE_RWX) != 0) {
			pa = (l2e >> PTE_PPN1_S) << L2_SHIFT;
			for (i = 0; i < Ln_ENTRIES; i++, pa += PAGE_SIZE) {
				if (vm_phys_is_dumpable(pa))
					vm_page_dump_add(state->dump_bitset,
					    pa);
			}
		} else {
			for (i = 0; i < Ln_ENTRIES; i++) {
				l3e = atomic_load_64(&l3[i]);
				if ((l3e & PTE_V) == 0)
					continue;
				pa = (l3e >> PTE_PPN0_S) * PAGE_SIZE;
				if (PHYS_IN_DMAP(pa) && vm_phys_is_dumpable(pa))
					vm_page_dump_add(state->dump_bitset,
					    pa);
			}
		}
	}

	/* Calculate dump size */
	mbp = state->msgbufp;
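
	/*
	 * The dump is sized as: one page for the minidump header, the dumped
	 * page-table pages (pmapsize), the message buffer, the dump_avail
	 * array, the page bitmap, and every dumpable page marked in the
	 * bitmap.
	 */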
	dumpsize = pmapsize;
	dumpsize += round_page(mbp->msg_size);
	dumpsize += round_page(sizeof(dump_avail));
	dumpsize += round_page(BITSET_SIZE(vm_page_dump_pages));
	VM_PAGE_DUMP_FOREACH(state->dump_bitset, pa) {
		/* Clear out undumpable pages now if needed */
		if (PHYS_IN_DMAP(pa) && vm_phys_is_dumpable(pa))
			dumpsize += PAGE_SIZE;
		else
			vm_page_dump_drop(state->dump_bitset, pa);
	}
	dumpsize += PAGE_SIZE;

	dumpsys_pb_init(dumpsize);

	/* Initialize mdhdr */
	bzero(&mdhdr, sizeof(mdhdr));
	strcpy(mdhdr.magic, MINIDUMP_MAGIC);
	mdhdr.version = MINIDUMP_VERSION;
	mdhdr.msgbufsize = mbp->msg_size;
	mdhdr.bitmapsize = round_page(BITSET_SIZE(vm_page_dump_pages));
	mdhdr.pmapsize = pmapsize;
	mdhdr.kernbase = KERNBASE;
	mdhdr.dmapphys = DMAP_MIN_PHYSADDR;
	mdhdr.dmapbase = DMAP_MIN_ADDRESS;
	mdhdr.dmapend = DMAP_MAX_ADDRESS;
	mdhdr.dumpavailsize = round_page(sizeof(dump_avail));
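
	/*
	 * The minidump is framed by a generic kernel dump header (kdh),
	 * which records the total length and architecture version for
	 * savecore(8).
	 */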
	dump_init_header(di, &kdh, KERNELDUMPMAGIC, KERNELDUMP_RISCV_VERSION,
	    dumpsize);

	error = dump_start(di, &kdh);

	printf("Dumping %llu out of %ju MB:", (unsigned long long)dumpsize >> 20,
	    ptoa((uintmax_t)physmem) / 1048576);

	/* Dump minidump header */
	bzero(&tmpbuffer, sizeof(tmpbuffer));
	bcopy(&mdhdr, &tmpbuffer, sizeof(mdhdr));
	error = blk_write(di, (char *)&tmpbuffer, 0, PAGE_SIZE);

	/* Dump msgbuf up front */
	error = blk_write(di, mbp->msg_ptr, 0, round_page(mbp->msg_size));

	/* Dump dump_avail */
	_Static_assert(sizeof(dump_avail) <= sizeof(tmpbuffer),
	    "Large dump_avail not handled");
	bzero(tmpbuffer, sizeof(tmpbuffer));
	memcpy(tmpbuffer, dump_avail, sizeof(dump_avail));
	error = blk_write(di, (char *)&tmpbuffer, 0, PAGE_SIZE);
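
	/* Dump bitmap */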
	error = blk_write(di, (char *)vm_page_dump, 0,
	    round_page(BITSET_SIZE(vm_page_dump_pages)));

	/* Dump kernel page directory pages */
	bzero(&tmpbuffer, sizeof(tmpbuffer));
	for (va = VM_MIN_KERNEL_ADDRESS; va < kva_max; va += L2_SIZE) {
		if (!pmap_get_tables(pmap_kernel(), va, &l1, &l2, &l3)) {
			/* We always write a page, even if it is zero */
			error = blk_write(di, (char *)&tmpbuffer, 0, PAGE_SIZE);
			/* Flush, in case we reuse tmpbuffer in the same block */
			error = blk_flush(di);
			continue;
		}

		l2e = atomic_load_64(l2);
		if ((l2e & PTE_RWX) != 0) {
			/* Generate fake l3 entries based on the l2 superpage */
			for (i = 0; i < Ln_ENTRIES; i++) {
				tmpbuffer[i] = (l2e | (i << PTE_PPN0_S));
			}
			/* We always write a page, even if it is zero */
			error = blk_write(di, (char *)&tmpbuffer, 0, PAGE_SIZE);
			/* Flush, in case we reuse tmpbuffer in the same block */
			error = blk_flush(di);
			bzero(&tmpbuffer, sizeof(tmpbuffer));
		} else {
			pa = (l2e >> PTE_PPN0_S) * PAGE_SIZE;

			/*
			 * We always write a page, even if it is zero. If pa
			 * is malformed, write the zeroed tmpbuffer.
			 */
			if (PHYS_IN_DMAP(pa) && vm_phys_is_dumpable(pa))
				error = blk_write(di, NULL, pa, PAGE_SIZE);
			else
				error = blk_write(di, (char *)&tmpbuffer, 0,
				    PAGE_SIZE);

	/* Dump memory chunks */
	/* XXX cluster it up and use blk_dump() */
	VM_PAGE_DUMP_FOREACH(state->dump_bitset, pa) {
		error = blk_write(di, NULL, pa, PAGE_SIZE);
	}

	error = blk_flush(di);

	error = dump_finish(di, &kdh);

	printf("\nDump complete\n");

	if (error == ENOSPC) {
		printf("Dump map grown while dumping. ");
		if (retry_count < 5) {
			printf("Retrying...\n");
			goto retry;
		}
		printf("Dump failed.\n");
	} else if (error == ECANCELED)
		printf("Dump aborted\n");
	else if (error == E2BIG) {
		printf("Dump failed. Partition too small (about %lluMB were "
		    "needed this time).\n", (unsigned long long)dumpsize >> 20);
	} else
		printf("** DUMP FAILED (ERROR %d) **\n", error);