]> CyberLeo.Net >> Repos - FreeBSD/FreeBSD.git/blob - sys/compat/linprocfs/linprocfs.c
unbount: Vendor import 1.14.0rc1
[FreeBSD/FreeBSD.git] / sys / compat / linprocfs / linprocfs.c
1 /*-
2  * SPDX-License-Identifier: BSD-4-Clause
3  *
4  * Copyright (c) 2000 Dag-Erling Coïdan Smørgrav
5  * Copyright (c) 1999 Pierre Beyssac
6  * Copyright (c) 1993 Jan-Simon Pendry
7  * Copyright (c) 1993
8  *      The Regents of the University of California.  All rights reserved.
9  *
10  * This code is derived from software contributed to Berkeley by
11  * Jan-Simon Pendry.
12  *
13  * Redistribution and use in source and binary forms, with or without
14  * modification, are permitted provided that the following conditions
15  * are met:
16  * 1. Redistributions of source code must retain the above copyright
17  *    notice, this list of conditions and the following disclaimer.
18  * 2. Redistributions in binary form must reproduce the above copyright
19  *    notice, this list of conditions and the following disclaimer in the
20  *    documentation and/or other materials provided with the distribution.
21  * 3. All advertising materials mentioning features or use of this software
22  *    must display the following acknowledgement:
23  *      This product includes software developed by the University of
24  *      California, Berkeley and its contributors.
25  * 4. Neither the name of the University nor the names of its contributors
26  *    may be used to endorse or promote products derived from this software
27  *    without specific prior written permission.
28  *
29  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
30  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
31  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
32  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
33  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
34  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
35  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
36  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
37  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
38  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
39  * SUCH DAMAGE.
40  *
41  *      @(#)procfs_status.c     8.4 (Berkeley) 6/15/94
42  */
43
44 #include <sys/cdefs.h>
45 __FBSDID("$FreeBSD$");
46
47 #include <sys/param.h>
48 #include <sys/queue.h>
49 #include <sys/blist.h>
50 #include <sys/conf.h>
51 #include <sys/exec.h>
52 #include <sys/fcntl.h>
53 #include <sys/filedesc.h>
54 #include <sys/jail.h>
55 #include <sys/kernel.h>
56 #include <sys/limits.h>
57 #include <sys/linker.h>
58 #include <sys/lock.h>
59 #include <sys/malloc.h>
60 #include <sys/msg.h>
61 #include <sys/mutex.h>
62 #include <sys/namei.h>
63 #include <sys/proc.h>
64 #include <sys/ptrace.h>
65 #include <sys/resourcevar.h>
66 #include <sys/resource.h>
67 #include <sys/sbuf.h>
68 #include <sys/sem.h>
69 #include <sys/shm.h>
70 #include <sys/smp.h>
71 #include <sys/socket.h>
72 #include <sys/syscallsubr.h>
73 #include <sys/sysctl.h>
74 #include <sys/sysent.h>
75 #include <sys/systm.h>
76 #include <sys/time.h>
77 #include <sys/tty.h>
78 #include <sys/user.h>
79 #include <sys/uuid.h>
80 #include <sys/vmmeter.h>
81 #include <sys/vnode.h>
82 #include <sys/bus.h>
83
84 #include <net/if.h>
85 #include <net/if_var.h>
86 #include <net/if_types.h>
87
88 #include <vm/vm.h>
89 #include <vm/vm_extern.h>
90 #include <vm/pmap.h>
91 #include <vm/vm_map.h>
92 #include <vm/vm_param.h>
93 #include <vm/vm_object.h>
94 #include <vm/swap_pager.h>
95
96 #include <machine/clock.h>
97
98 #include <geom/geom.h>
99 #include <geom/geom_int.h>
100
101 #if defined(__i386__) || defined(__amd64__)
102 #include <machine/cputypes.h>
103 #include <machine/md_var.h>
104 #endif /* __i386__ || __amd64__ */
105
106 #include <compat/linux/linux.h>
107 #include <compat/linux/linux_mib.h>
108 #include <compat/linux/linux_misc.h>
109 #include <compat/linux/linux_util.h>
110 #include <fs/pseudofs/pseudofs.h>
111 #include <fs/procfs/procfs.h>
112
/*
 * Various conversion macros
 *
 * Tick counters are scaled by LINPROCFS_TICKRATE, which is stathz when
 * that is non-zero and hz otherwise.
 */
#define	LINPROCFS_TICKRATE	(stathz ? stathz : hz)

/* ticks to jiffies (hundredths of a second), as a signed long */
#define	T2J(x)		((long)(((x) * 100ULL) / LINPROCFS_TICKRATE))
/* ticks to centiseconds, as an unsigned long */
#define	T2CS(x)		((unsigned long)(((x) * 100ULL) / LINPROCFS_TICKRATE))
/* ticks to whole seconds */
#define	T2S(x)		((x) / LINPROCFS_TICKRATE)
/* bytes to kbytes */
#define	B2K(x)		((x) >> 10)
/* bytes to pages */
#define	B2P(x)		((x) >> PAGE_SHIFT)
/* pages to bytes */
#define	P2B(x)		((x) << PAGE_SHIFT)
/* pages to kbytes */
#define	P2K(x)		((x) << (PAGE_SHIFT - 10))
/* struct timeval pointer to hundredths of a second */
#define	TV2J(x)		((x)->tv_sec * 100UL + (x)->tv_usec / 10000)
124
/**
 * @brief Mapping of ki_stat in struct kinfo_proc to the linux state
 *
 * The linux procfs state field displays one of the characters RSDZTW to
 * denote running, sleeping in an interruptible wait, waiting in an
 * uninterruptible disk sleep, a zombie process, process is being traced
 * or stopped, or process is paging respectively.
 *
 * Our struct kinfo_proc contains the variable ki_stat which contains a
 * value out of SIDL, SRUN, SSLEEP, SSTOP, SZOMB, SWAIT and SLOCK.
 *
 * This character array is used with (ki_stat - 1) as an index and tries
 * to map our states to suitable linux states.  Assuming the states are
 * numbered 1..7 in the order listed above (TODO confirm against
 * sys/proc.h), the mapping is:
 *
 *   SIDL -> R, SRUN -> R, SSLEEP -> S, SSTOP -> T, SZOMB -> Z,
 *   SWAIT -> D, SLOCK -> D
 *
 * The table is only ever read, so it is const.
 */
static const char linux_state[] = "RRSTZDD";
140
141 /*
142  * Filler function for proc/meminfo
143  */
144 static int
145 linprocfs_domeminfo(PFS_FILL_ARGS)
146 {
147         unsigned long memtotal;         /* total memory in bytes */
148         unsigned long memfree;          /* free memory in bytes */
149         unsigned long cached;           /* page cache */
150         unsigned long buffers;          /* buffer cache */
151         unsigned long long swaptotal;   /* total swap space in bytes */
152         unsigned long long swapused;    /* used swap space in bytes */
153         unsigned long long swapfree;    /* free swap space in bytes */
154         size_t sz;
155         int error, i, j;
156
157         memtotal = physmem * PAGE_SIZE;
158         memfree = (unsigned long)vm_free_count() * PAGE_SIZE;
159         swap_pager_status(&i, &j);
160         swaptotal = (unsigned long long)i * PAGE_SIZE;
161         swapused = (unsigned long long)j * PAGE_SIZE;
162         swapfree = swaptotal - swapused;
163
164         /*
165          * This value may exclude wired pages, but we have no good way of
166          * accounting for that.
167          */
168         cached =
169             (vm_active_count() + vm_inactive_count() + vm_laundry_count()) *
170             PAGE_SIZE;
171
172         sz = sizeof(buffers);
173         error = kernel_sysctlbyname(curthread, "vfs.bufspace", &buffers, &sz,
174             NULL, 0, 0, 0);
175         if (error != 0)
176                 buffers = 0;
177
178         sbuf_printf(sb,
179             "MemTotal: %9lu kB\n"
180             "MemFree:  %9lu kB\n"
181             "Buffers:  %9lu kB\n"
182             "Cached:   %9lu kB\n"
183             "SwapTotal:%9llu kB\n"
184             "SwapFree: %9llu kB\n",
185             B2K(memtotal), B2K(memfree), B2K(buffers),
186             B2K(cached), B2K(swaptotal), B2K(swapfree));
187
188         return (0);
189 }
190
191 #if defined(__i386__) || defined(__amd64__)
192 /*
193  * Filler function for proc/cpuinfo (i386 & amd64 version)
194  */
195 static int
196 linprocfs_docpuinfo(PFS_FILL_ARGS)
197 {
198         int hw_model[2];
199         char model[128];
200         uint64_t freq;
201         size_t size;
202         u_int cache_size[4];
203         int fqmhz, fqkhz;
204         int i, j;
205
206         /*
207          * We default the flags to include all non-conflicting flags,
208          * and the Intel versions of conflicting flags.
209          */
210         static char *cpu_feature_names[] = {
211                 /*  0 */ "fpu", "vme", "de", "pse",
212                 /*  4 */ "tsc", "msr", "pae", "mce",
213                 /*  8 */ "cx8", "apic", "", "sep",
214                 /* 12 */ "mtrr", "pge", "mca", "cmov",
215                 /* 16 */ "pat", "pse36", "pn", "clflush",
216                 /* 20 */ "", "dts", "acpi", "mmx",
217                 /* 24 */ "fxsr", "sse", "sse2", "ss",
218                 /* 28 */ "ht", "tm", "ia64", "pbe"
219         };
220
221         static char *amd_feature_names[] = {
222                 /*  0 */ "", "", "", "",
223                 /*  4 */ "", "", "", "",
224                 /*  8 */ "", "", "", "syscall",
225                 /* 12 */ "", "", "", "",
226                 /* 16 */ "", "", "", "mp",
227                 /* 20 */ "nx", "", "mmxext", "",
228                 /* 24 */ "", "fxsr_opt", "pdpe1gb", "rdtscp",
229                 /* 28 */ "", "lm", "3dnowext", "3dnow"
230         };
231
232         static char *cpu_feature2_names[] = {
233                 /*  0 */ "pni", "pclmulqdq", "dtes64", "monitor",
234                 /*  4 */ "ds_cpl", "vmx", "smx", "est",
235                 /*  8 */ "tm2", "ssse3", "cid", "sdbg",
236                 /* 12 */ "fma", "cx16", "xtpr", "pdcm",
237                 /* 16 */ "", "pcid", "dca", "sse4_1",
238                 /* 20 */ "sse4_2", "x2apic", "movbe", "popcnt",
239                 /* 24 */ "tsc_deadline_timer", "aes", "xsave", "",
240                 /* 28 */ "avx", "f16c", "rdrand", "hypervisor"
241         };
242
243         static char *amd_feature2_names[] = {
244                 /*  0 */ "lahf_lm", "cmp_legacy", "svm", "extapic",
245                 /*  4 */ "cr8_legacy", "abm", "sse4a", "misalignsse",
246                 /*  8 */ "3dnowprefetch", "osvw", "ibs", "xop",
247                 /* 12 */ "skinit", "wdt", "", "lwp",
248                 /* 16 */ "fma4", "tce", "", "nodeid_msr",
249                 /* 20 */ "", "tbm", "topoext", "perfctr_core",
250                 /* 24 */ "perfctr_nb", "", "bpext", "ptsc",
251                 /* 28 */ "perfctr_llc", "mwaitx", "", ""
252         };
253
254         static char *cpu_stdext_feature_names[] = {
255                 /*  0 */ "fsgsbase", "tsc_adjust", "", "bmi1",
256                 /*  4 */ "hle", "avx2", "", "smep",
257                 /*  8 */ "bmi2", "erms", "invpcid", "rtm",
258                 /* 12 */ "cqm", "", "mpx", "rdt_a",
259                 /* 16 */ "avx512f", "avx512dq", "rdseed", "adx",
260                 /* 20 */ "smap", "avx512ifma", "", "clflushopt",
261                 /* 24 */ "clwb", "intel_pt", "avx512pf", "avx512er",
262                 /* 28 */ "avx512cd", "sha_ni", "avx512bw", "avx512vl"
263         };
264
265         static char *power_flags[] = {
266                 "ts",           "fid",          "vid",
267                 "ttp",          "tm",           "stc",
268                 "100mhzsteps",  "hwpstate",     "",
269                 "cpb",          "eff_freq_ro",  "proc_feedback",
270                 "acc_power",
271         };
272
273         hw_model[0] = CTL_HW;
274         hw_model[1] = HW_MODEL;
275         model[0] = '\0';
276         size = sizeof(model);
277         if (kernel_sysctl(td, hw_model, 2, &model, &size, 0, 0, 0, 0) != 0)
278                 strcpy(model, "unknown");
279 #ifdef __i386__
280         switch (cpu_vendor_id) {
281         case CPU_VENDOR_AMD:
282                 if (cpu_class < CPUCLASS_686)
283                         cpu_feature_names[16] = "fcmov";
284                 break;
285         case CPU_VENDOR_CYRIX:
286                 cpu_feature_names[24] = "cxmmx";
287                 break;
288         }
289 #endif
290         if (cpu_exthigh >= 0x80000006)
291                 do_cpuid(0x80000006, cache_size);
292         else
293                 memset(cache_size, 0, sizeof(cache_size));
294         for (i = 0; i < mp_ncpus; ++i) {
295                 fqmhz = 0;
296                 fqkhz = 0;
297                 freq = atomic_load_acq_64(&tsc_freq);
298                 if (freq != 0) {
299                         fqmhz = (freq + 4999) / 1000000;
300                         fqkhz = ((freq + 4999) / 10000) % 100;
301                 }
302                 sbuf_printf(sb,
303                     "processor\t: %d\n"
304                     "vendor_id\t: %.20s\n"
305                     "cpu family\t: %u\n"
306                     "model\t\t: %u\n"
307                     "model name\t: %s\n"
308                     "stepping\t: %u\n"
309                     "cpu MHz\t\t: %d.%02d\n"
310                     "cache size\t: %d KB\n"
311                     "physical id\t: %d\n"
312                     "siblings\t: %d\n"
313                     "core id\t\t: %d\n"
314                     "cpu cores\t: %d\n"
315                     "apicid\t\t: %d\n"
316                     "initial apicid\t: %d\n"
317                     "fpu\t\t: %s\n"
318                     "fpu_exception\t: %s\n"
319                     "cpuid level\t: %d\n"
320                     "wp\t\t: %s\n",
321                     i, cpu_vendor, CPUID_TO_FAMILY(cpu_id),
322                     CPUID_TO_MODEL(cpu_id), model, cpu_id & CPUID_STEPPING,
323                     fqmhz, fqkhz,
324                     (cache_size[2] >> 16), 0, mp_ncpus, i, mp_ncpus,
325                     i, i, /*cpu_id & CPUID_LOCAL_APIC_ID ??*/
326                     (cpu_feature & CPUID_FPU) ? "yes" : "no", "yes",
327                     CPUID_TO_FAMILY(cpu_id), "yes");
328                 sbuf_cat(sb, "flags\t\t:");
329                 for (j = 0; j < nitems(cpu_feature_names); j++)
330                         if (cpu_feature & (1 << j) &&
331                             cpu_feature_names[j][0] != '\0')
332                                 sbuf_printf(sb, " %s", cpu_feature_names[j]);
333                 for (j = 0; j < nitems(amd_feature_names); j++)
334                         if (amd_feature & (1 << j) &&
335                             amd_feature_names[j][0] != '\0')
336                                 sbuf_printf(sb, " %s", amd_feature_names[j]);
337                 for (j = 0; j < nitems(cpu_feature2_names); j++)
338                         if (cpu_feature2 & (1 << j) &&
339                             cpu_feature2_names[j][0] != '\0')
340                                 sbuf_printf(sb, " %s", cpu_feature2_names[j]);
341                 for (j = 0; j < nitems(amd_feature2_names); j++)
342                         if (amd_feature2 & (1 << j) &&
343                             amd_feature2_names[j][0] != '\0')
344                                 sbuf_printf(sb, " %s", amd_feature2_names[j]);
345                 for (j = 0; j < nitems(cpu_stdext_feature_names); j++)
346                         if (cpu_stdext_feature & (1 << j) &&
347                             cpu_stdext_feature_names[j][0] != '\0')
348                                 sbuf_printf(sb, " %s",
349                                     cpu_stdext_feature_names[j]);
350                 sbuf_cat(sb, "\n");
351                 sbuf_printf(sb,
352                     "bugs\t\t: %s\n"
353                     "bogomips\t: %d.%02d\n"
354                     "clflush size\t: %d\n"
355                     "cache_alignment\t: %d\n"
356                     "address sizes\t: %d bits physical, %d bits virtual\n",
357 #if defined(I586_CPU) && !defined(NO_F00F_HACK)
358                     (has_f00f_bug) ? "Intel F00F" : "",
359 #else
360                     "",
361 #endif
362                     fqmhz * 2, fqkhz,
363                     cpu_clflush_line_size, cpu_clflush_line_size,
364                     cpu_maxphyaddr,
365                     (cpu_maxphyaddr > 32) ? 48 : 0);
366                 sbuf_cat(sb, "power management: ");
367                 for (j = 0; j < nitems(power_flags); j++)
368                         if (amd_pminfo & (1 << j))
369                                 sbuf_printf(sb, " %s", power_flags[j]);
370                 sbuf_cat(sb, "\n\n");
371
372                 /* XXX per-cpu vendor / class / model / id? */
373         }
374         sbuf_cat(sb, "\n");
375
376         return (0);
377 }
378 #else
379 /* ARM64TODO: implement non-stubbed linprocfs_docpuinfo */
380 static int
381 linprocfs_docpuinfo(PFS_FILL_ARGS)
382 {
383         int i;
384
385         for (i = 0; i < mp_ncpus; ++i) {
386                 sbuf_printf(sb,
387                     "processor\t: %d\n"
388                     "BogoMIPS\t: %d.%02d\n",
389                     i, 0, 0);
390                 sbuf_cat(sb, "Features\t: ");
391                 sbuf_cat(sb, "\n");
392                 sbuf_printf(sb,
393                     "CPU implementer\t: \n"
394                     "CPU architecture: \n"
395                     "CPU variant\t: 0x%x\n"
396                     "CPU part\t: 0x%x\n"
397                     "CPU revision\t: %d\n",
398                     0, 0, 0);
399                 sbuf_cat(sb, "\n");
400         }
401
402         return (0);
403 }
404 #endif /* __i386__ || __amd64__ */
405
406 static const char *path_slash_sys = "/sys";
407 static const char *fstype_sysfs = "sysfs";
408
409 static int
410 _mtab_helper(const struct pfs_node *pn, const struct statfs *sp,
411     const char **mntfrom, const char **mntto, const char **fstype)
412 {
413         /* determine device name */
414         *mntfrom = sp->f_mntfromname;
415
416         /* determine mount point */
417         *mntto = sp->f_mntonname;
418
419         /* determine fs type */
420         *fstype = sp->f_fstypename;
421         if (strcmp(*fstype, pn->pn_info->pi_name) == 0)
422                 *mntfrom = *fstype = "proc";
423         else if (strcmp(*fstype, "procfs") == 0)
424                 return (ECANCELED);
425
426         if (strcmp(*fstype, "autofs") == 0) {
427                 /*
428                  * FreeBSD uses eg "map -hosts", whereas Linux
429                  * expects just "-hosts".
430                  */
431                 if (strncmp(*mntfrom, "map ", 4) == 0)
432                         *mntfrom += 4;
433         }
434
435         if (strcmp(*fstype, "linsysfs") == 0) {
436                 *mntfrom = path_slash_sys;
437                 *fstype = fstype_sysfs;
438         } else {
439                 /* For Linux msdosfs is called vfat */
440                 if (strcmp(*fstype, "msdosfs") == 0)
441                         *fstype = "vfat";
442         }
443         return (0);
444 }
445
446 static void
447 _sbuf_mntoptions_helper(struct sbuf *sb, uint64_t f_flags)
448 {
449         sbuf_cat(sb, (f_flags & MNT_RDONLY) ? "ro" : "rw");
450 #define ADD_OPTION(opt, name) \
451         if (f_flags & (opt)) sbuf_cat(sb, "," name);
452         ADD_OPTION(MNT_SYNCHRONOUS,     "sync");
453         ADD_OPTION(MNT_NOEXEC,          "noexec");
454         ADD_OPTION(MNT_NOSUID,          "nosuid");
455         ADD_OPTION(MNT_UNION,           "union");
456         ADD_OPTION(MNT_ASYNC,           "async");
457         ADD_OPTION(MNT_SUIDDIR,         "suiddir");
458         ADD_OPTION(MNT_NOSYMFOLLOW,     "nosymfollow");
459         ADD_OPTION(MNT_NOATIME,         "noatime");
460 #undef ADD_OPTION
461 }
462
463 /*
464  * Filler function for proc/mtab and proc/<pid>/mounts.
465  *
466  * /proc/mtab doesn't exist in Linux' procfs, but is included here so
467  * users can symlink /compat/linux/etc/mtab to /proc/mtab
468  */
469 static int
470 linprocfs_domtab(PFS_FILL_ARGS)
471 {
472         struct nameidata nd;
473         const char *lep, *mntto, *mntfrom, *fstype;
474         char *dlep, *flep;
475         size_t lep_len;
476         int error;
477         struct statfs *buf, *sp;
478         size_t count;
479
480         /* resolve symlinks etc. in the emulation tree prefix */
481         /*
482          * Ideally, this would use the current chroot rather than some
483          * hardcoded path.
484          */
485         NDINIT(&nd, LOOKUP, FOLLOW, UIO_SYSSPACE, linux_emul_path);
486         flep = NULL;
487         error = namei(&nd);
488         lep = linux_emul_path;
489         if (error == 0) {
490                 if (vn_fullpath(nd.ni_vp, &dlep, &flep) == 0)
491                         lep = dlep;
492                 vrele(nd.ni_vp);
493         }
494         lep_len = strlen(lep);
495
496         buf = NULL;
497         error = kern_getfsstat(td, &buf, SIZE_T_MAX, &count,
498             UIO_SYSSPACE, MNT_WAIT);
499         if (error != 0) {
500                 free(buf, M_TEMP);
501                 free(flep, M_TEMP);
502                 return (error);
503         }
504
505         for (sp = buf; count > 0; sp++, count--) {
506                 error = _mtab_helper(pn, sp, &mntfrom, &mntto, &fstype);
507                 if (error != 0) {
508                         MPASS(error == ECANCELED);
509                         continue;
510                 }
511
512                 /* determine mount point */
513                 if (strncmp(mntto, lep, lep_len) == 0 && mntto[lep_len] == '/')
514                         mntto += lep_len;
515
516                 sbuf_printf(sb, "%s %s %s ", mntfrom, mntto, fstype);
517                 _sbuf_mntoptions_helper(sb, sp->f_flags);
518                 /* a real Linux mtab will also show NFS options */
519                 sbuf_printf(sb, " 0 0\n");
520         }
521
522         free(buf, M_TEMP);
523         free(flep, M_TEMP);
524         return (error);
525 }
526
527 static int
528 linprocfs_doprocmountinfo(PFS_FILL_ARGS)
529 {
530         struct nameidata nd;
531         const char *mntfrom, *mntto, *fstype;
532         const char *lep;
533         char *dlep, *flep;
534         struct statfs *buf, *sp;
535         size_t count, lep_len;
536         int error;
537
538         /*
539          * Ideally, this would use the current chroot rather than some
540          * hardcoded path.
541          */
542         NDINIT(&nd, LOOKUP, FOLLOW, UIO_SYSSPACE, linux_emul_path);
543         flep = NULL;
544         error = namei(&nd);
545         lep = linux_emul_path;
546         if (error == 0) {
547                 if (vn_fullpath(nd.ni_vp, &dlep, &flep) == 0)
548                         lep = dlep;
549                 vrele(nd.ni_vp);
550         }
551         lep_len = strlen(lep);
552
553         buf = NULL;
554         error = kern_getfsstat(td, &buf, SIZE_T_MAX, &count,
555             UIO_SYSSPACE, MNT_WAIT);
556         if (error != 0)
557                 goto out;
558
559         for (sp = buf; count > 0; sp++, count--) {
560                 error = _mtab_helper(pn, sp, &mntfrom, &mntto, &fstype);
561                 if (error != 0) {
562                         MPASS(error == ECANCELED);
563                         continue;
564                 }
565
566                 if (strncmp(mntto, lep, lep_len) == 0 && mntto[lep_len] == '/')
567                         mntto += lep_len;
568 #if 0
569                 /*
570                  * If the prefix is a chroot, and this mountpoint is not under
571                  * the prefix, we should skip it.  Leave it for now for
572                  * consistency with procmtab above.
573                  */
574                 else
575                         continue;
576 #endif
577
578                 /*
579                  * (1) mount id
580                  *
581                  * (2) parent mount id -- we don't have this cheaply, so
582                  * provide a dummy value
583                  *
584                  * (3) major:minor -- ditto
585                  *
586                  * (4) root filesystem mount -- probably a namespaces thing
587                  *
588                  * (5) mountto path
589                  */
590                 sbuf_printf(sb, "%u 0 0:0 / %s ",
591                     sp->f_fsid.val[0] ^ sp->f_fsid.val[1], mntto);
592                 /* (6) mount options */
593                 _sbuf_mntoptions_helper(sb, sp->f_flags);
594                 /*
595                  * (7) zero or more optional fields -- again, namespace related
596                  *
597                  * (8) End of variable length fields separator ("-")
598                  *
599                  * (9) fstype
600                  *
601                  * (10) mount from
602                  *
603                  * (11) "superblock" options -- like (6), but different
604                  * semantics in Linux
605                  */
606                 sbuf_printf(sb, " - %s %s %s\n", fstype, mntfrom,
607                     (sp->f_flags & MNT_RDONLY) ? "ro" : "rw");
608         }
609
610         error = 0;
611 out:
612         free(buf, M_TEMP);
613         free(flep, M_TEMP);
614         return (error);
615 }
616
617 /*
618  * Filler function for proc/partitions
619  */
620 static int
621 linprocfs_dopartitions(PFS_FILL_ARGS)
622 {
623         struct g_class *cp;
624         struct g_geom *gp;
625         struct g_provider *pp;
626         int major, minor;
627
628         g_topology_lock();
629         sbuf_printf(sb, "major minor  #blocks  name rio rmerge rsect "
630             "ruse wio wmerge wsect wuse running use aveq\n");
631
632         LIST_FOREACH(cp, &g_classes, class) {
633                 if (strcmp(cp->name, "DISK") == 0 ||
634                     strcmp(cp->name, "PART") == 0)
635                         LIST_FOREACH(gp, &cp->geom, geom) {
636                                 LIST_FOREACH(pp, &gp->provider, provider) {
637                                         if (linux_driver_get_major_minor(
638                                             pp->name, &major, &minor) != 0) {
639                                                 major = 0;
640                                                 minor = 0;
641                                         }
642                                         sbuf_printf(sb, "%d %d %lld %s "
643                                             "%d %d %d %d %d "
644                                              "%d %d %d %d %d %d\n",
645                                              major, minor,
646                                              (long long)pp->mediasize, pp->name,
647                                              0, 0, 0, 0, 0,
648                                              0, 0, 0, 0, 0, 0);
649                                 }
650                         }
651         }
652         g_topology_unlock();
653
654         return (0);
655 }
656
657 /*
658  * Filler function for proc/stat
659  *
660  * Output depends on kernel version:
661  *
662  * v2.5.40 <=
663  *   user nice system idle
664  * v2.5.41
665  *   user nice system idle iowait
666  * v2.6.11
667  *   user nice system idle iowait irq softirq steal
668  * v2.6.24
669  *   user nice system idle iowait irq softirq steal guest
670  * v2.6.33 >=
671  *   user nice system idle iowait irq softirq steal guest guest_nice
672  */
673 static int
674 linprocfs_dostat(PFS_FILL_ARGS)
675 {
676         struct pcpu *pcpu;
677         long cp_time[CPUSTATES];
678         long *cp;
679         struct timeval boottime;
680         int i;
681         char *zero_pad;
682         bool has_intr = true;
683
684         if (linux_kernver(td) >= LINUX_KERNVER(2,6,33)) {
685                 zero_pad = " 0 0 0 0\n";
686         } else if (linux_kernver(td) >= LINUX_KERNVER(2,6,24)) {
687                 zero_pad = " 0 0 0\n";
688         } else if (linux_kernver(td) >= LINUX_KERNVER(2,6,11)) {
689                 zero_pad = " 0 0\n";
690         } else if (linux_kernver(td) >= LINUX_KERNVER(2,5,41)) {
691                 has_intr = false;
692                 zero_pad = " 0\n";
693         } else {
694                 has_intr = false;
695                 zero_pad = "\n";
696         }
697
698         read_cpu_time(cp_time);
699         getboottime(&boottime);
700         /* Parameters common to all versions */
701         sbuf_printf(sb, "cpu %lu %lu %lu %lu",
702             T2J(cp_time[CP_USER]),
703             T2J(cp_time[CP_NICE]),
704             T2J(cp_time[CP_SYS]),
705             T2J(cp_time[CP_IDLE]));
706
707         /* Print interrupt stats if available */
708         if (has_intr) {
709                 sbuf_printf(sb, " 0 %lu", T2J(cp_time[CP_INTR]));
710         }
711
712         /* Pad out remaining fields depending on version */
713         sbuf_printf(sb, "%s", zero_pad);
714
715         CPU_FOREACH(i) {
716                 pcpu = pcpu_find(i);
717                 cp = pcpu->pc_cp_time;
718                 sbuf_printf(sb, "cpu%d %lu %lu %lu %lu", i,
719                     T2J(cp[CP_USER]),
720                     T2J(cp[CP_NICE]),
721                     T2J(cp[CP_SYS]),
722                     T2J(cp[CP_IDLE]));
723
724                 if (has_intr) {
725                         sbuf_printf(sb, " 0 %lu", T2J(cp[CP_INTR]));
726                 }
727
728                 sbuf_printf(sb, "%s", zero_pad);
729         }
730         sbuf_printf(sb,
731             "disk 0 0 0 0\n"
732             "page %ju %ju\n"
733             "swap %ju %ju\n"
734             "intr %ju\n"
735             "ctxt %ju\n"
736             "btime %lld\n",
737             (uintmax_t)VM_CNT_FETCH(v_vnodepgsin),
738             (uintmax_t)VM_CNT_FETCH(v_vnodepgsout),
739             (uintmax_t)VM_CNT_FETCH(v_swappgsin),
740             (uintmax_t)VM_CNT_FETCH(v_swappgsout),
741             (uintmax_t)VM_CNT_FETCH(v_intr),
742             (uintmax_t)VM_CNT_FETCH(v_swtch),
743             (long long)boottime.tv_sec);
744         return (0);
745 }
746
747 static int
748 linprocfs_doswaps(PFS_FILL_ARGS)
749 {
750         struct xswdev xsw;
751         uintmax_t total, used;
752         int n;
753         char devname[SPECNAMELEN + 1];
754
755         sbuf_printf(sb, "Filename\t\t\t\tType\t\tSize\tUsed\tPriority\n");
756         for (n = 0; ; n++) {
757                 if (swap_dev_info(n, &xsw, devname, sizeof(devname)) != 0)
758                         break;
759                 total = (uintmax_t)xsw.xsw_nblks * PAGE_SIZE / 1024;
760                 used  = (uintmax_t)xsw.xsw_used * PAGE_SIZE / 1024;
761
762                 /*
763                  * The space and not tab after the device name is on
764                  * purpose.  Linux does so.
765                  */
766                 sbuf_printf(sb, "/dev/%-34s unknown\t\t%jd\t%jd\t-1\n",
767                     devname, total, used);
768         }
769         return (0);
770 }
771
772 /*
773  * Filler function for proc/uptime
774  */
775 static int
776 linprocfs_douptime(PFS_FILL_ARGS)
777 {
778         long cp_time[CPUSTATES];
779         struct timeval tv;
780
781         getmicrouptime(&tv);
782         read_cpu_time(cp_time);
783         sbuf_printf(sb, "%lld.%02ld %ld.%02lu\n",
784             (long long)tv.tv_sec, tv.tv_usec / 10000,
785             T2S(cp_time[CP_IDLE] / mp_ncpus),
786             T2CS(cp_time[CP_IDLE] / mp_ncpus) % 100);
787         return (0);
788 }
789
/*
 * Get OS build date
 *
 * Appends a fixed placeholder build number and date to sb.  A variant
 * that parsed the build number and date out of the kernel version string
 * used to sit here compiled out; only the placeholder was ever emitted.
 * td is unused.
 */
static void
linprocfs_osbuild(struct thread *td, struct sbuf *sb)
{

	sbuf_cat(sb, "#4 Sun Dec 18 04:30:00 CET 1977");
}
815
/*
 * Get OS builder
 *
 * Appends a fixed placeholder builder address to sb.  A variant that
 * parsed the builder out of the kernel version string used to sit here
 * compiled out; only the placeholder was ever emitted.  td is unused.
 */
static void
linprocfs_osbuilder(struct thread *td, struct sbuf *sb)
{

	sbuf_cat(sb, "des@freebsd.org");
}
840
841 /*
842  * Filler function for proc/version
843  */
844 static int
845 linprocfs_doversion(PFS_FILL_ARGS)
846 {
847         char osname[LINUX_MAX_UTSNAME];
848         char osrelease[LINUX_MAX_UTSNAME];
849
850         linux_get_osname(td, osname);
851         linux_get_osrelease(td, osrelease);
852         sbuf_printf(sb, "%s version %s (", osname, osrelease);
853         linprocfs_osbuilder(td, sb);
854         sbuf_cat(sb, ") (gcc version " __VERSION__ ") ");
855         linprocfs_osbuild(td, sb);
856         sbuf_cat(sb, "\n");
857
858         return (0);
859 }
860
861 /*
862  * Filler function for proc/loadavg
863  */
864 static int
865 linprocfs_doloadavg(PFS_FILL_ARGS)
866 {
867
868         sbuf_printf(sb,
869             "%d.%02d %d.%02d %d.%02d %d/%d %d\n",
870             (int)(averunnable.ldavg[0] / averunnable.fscale),
871             (int)(averunnable.ldavg[0] * 100 / averunnable.fscale % 100),
872             (int)(averunnable.ldavg[1] / averunnable.fscale),
873             (int)(averunnable.ldavg[1] * 100 / averunnable.fscale % 100),
874             (int)(averunnable.ldavg[2] / averunnable.fscale),
875             (int)(averunnable.ldavg[2] * 100 / averunnable.fscale % 100),
876             1,                          /* number of running tasks */
877             nprocs,                     /* number of tasks */
878             lastpid                     /* the last pid */
879         );
880         return (0);
881 }
882
883 static int
884 linprocfs_get_tty_nr(struct proc *p)
885 {
886         struct session *sp;
887         const char *ttyname;
888         int error, major, minor, nr;
889
890         PROC_LOCK_ASSERT(p, MA_OWNED);
891         sx_assert(&proctree_lock, SX_LOCKED);
892
893         if ((p->p_flag & P_CONTROLT) == 0)
894                 return (-1);
895
896         sp = p->p_pgrp->pg_session;
897         if (sp == NULL)
898                 return (-1);
899
900         ttyname = devtoname(sp->s_ttyp->t_dev);
901         error = linux_driver_get_major_minor(ttyname, &major, &minor);
902         if (error != 0)
903                 return (-1);
904
905         nr = makedev(major, minor);
906         return (nr);
907 }
908
909 /*
910  * Filler function for proc/pid/stat
911  */
912 static int
913 linprocfs_doprocstat(PFS_FILL_ARGS)
914 {
915         struct kinfo_proc kp;
916         struct timeval boottime;
917         char state;
918         static int ratelimit = 0;
919         int tty_nr;
920         vm_offset_t startcode, startdata;
921
922         getboottime(&boottime);
923         sx_slock(&proctree_lock);
924         PROC_LOCK(p);
925         fill_kinfo_proc(p, &kp);
926         tty_nr = linprocfs_get_tty_nr(p);
927         sx_sunlock(&proctree_lock);
928         if (p->p_vmspace) {
929            startcode = (vm_offset_t)p->p_vmspace->vm_taddr;
930            startdata = (vm_offset_t)p->p_vmspace->vm_daddr;
931         } else {
932            startcode = 0;
933            startdata = 0;
934         }
935         sbuf_printf(sb, "%d", p->p_pid);
936 #define PS_ADD(name, fmt, arg) sbuf_printf(sb, " " fmt, arg)
937         PS_ADD("comm",          "(%s)", p->p_comm);
938         if (kp.ki_stat > sizeof(linux_state)) {
939                 state = 'R';
940
941                 if (ratelimit == 0) {
942                         printf("linprocfs: don't know how to handle unknown FreeBSD state %d/%zd, mapping to R\n",
943                             kp.ki_stat, sizeof(linux_state));
944                         ++ratelimit;
945                 }
946         } else
947                 state = linux_state[kp.ki_stat - 1];
948         PS_ADD("state",         "%c",   state);
949         PS_ADD("ppid",          "%d",   p->p_pptr ? p->p_pptr->p_pid : 0);
950         PS_ADD("pgrp",          "%d",   p->p_pgid);
951         PS_ADD("session",       "%d",   p->p_session->s_sid);
952         PROC_UNLOCK(p);
953         PS_ADD("tty",           "%d",   tty_nr);
954         PS_ADD("tpgid",         "%d",   kp.ki_tpgid);
955         PS_ADD("flags",         "%u",   0); /* XXX */
956         PS_ADD("minflt",        "%lu",  kp.ki_rusage.ru_minflt);
957         PS_ADD("cminflt",       "%lu",  kp.ki_rusage_ch.ru_minflt);
958         PS_ADD("majflt",        "%lu",  kp.ki_rusage.ru_majflt);
959         PS_ADD("cmajflt",       "%lu",  kp.ki_rusage_ch.ru_majflt);
960         PS_ADD("utime",         "%ld",  TV2J(&kp.ki_rusage.ru_utime));
961         PS_ADD("stime",         "%ld",  TV2J(&kp.ki_rusage.ru_stime));
962         PS_ADD("cutime",        "%ld",  TV2J(&kp.ki_rusage_ch.ru_utime));
963         PS_ADD("cstime",        "%ld",  TV2J(&kp.ki_rusage_ch.ru_stime));
964         PS_ADD("priority",      "%d",   kp.ki_pri.pri_user);
965         PS_ADD("nice",          "%d",   kp.ki_nice); /* 19 (nicest) to -19 */
966         PS_ADD("0",             "%d",   0); /* removed field */
967         PS_ADD("itrealvalue",   "%d",   0); /* XXX */
968         PS_ADD("starttime",     "%lu",  TV2J(&kp.ki_start) - TV2J(&boottime));
969         PS_ADD("vsize",         "%ju",  P2K((uintmax_t)kp.ki_size));
970         PS_ADD("rss",           "%ju",  (uintmax_t)kp.ki_rssize);
971         PS_ADD("rlim",          "%lu",  kp.ki_rusage.ru_maxrss);
972         PS_ADD("startcode",     "%ju",  (uintmax_t)startcode);
973         PS_ADD("endcode",       "%ju",  (uintmax_t)startdata);
974         PS_ADD("startstack",    "%u",   0); /* XXX */
975         PS_ADD("kstkesp",       "%u",   0); /* XXX */
976         PS_ADD("kstkeip",       "%u",   0); /* XXX */
977         PS_ADD("signal",        "%u",   0); /* XXX */
978         PS_ADD("blocked",       "%u",   0); /* XXX */
979         PS_ADD("sigignore",     "%u",   0); /* XXX */
980         PS_ADD("sigcatch",      "%u",   0); /* XXX */
981         PS_ADD("wchan",         "%u",   0); /* XXX */
982         PS_ADD("nswap",         "%lu",  kp.ki_rusage.ru_nswap);
983         PS_ADD("cnswap",        "%lu",  kp.ki_rusage_ch.ru_nswap);
984         PS_ADD("exitsignal",    "%d",   0); /* XXX */
985         PS_ADD("processor",     "%u",   kp.ki_lastcpu);
986         PS_ADD("rt_priority",   "%u",   0); /* XXX */ /* >= 2.5.19 */
987         PS_ADD("policy",        "%u",   kp.ki_pri.pri_class); /* >= 2.5.19 */
988 #undef PS_ADD
989         sbuf_putc(sb, '\n');
990
991         return (0);
992 }
993
994 /*
995  * Filler function for proc/pid/statm
996  */
997 static int
998 linprocfs_doprocstatm(PFS_FILL_ARGS)
999 {
1000         struct kinfo_proc kp;
1001         segsz_t lsize;
1002
1003         sx_slock(&proctree_lock);
1004         PROC_LOCK(p);
1005         fill_kinfo_proc(p, &kp);
1006         PROC_UNLOCK(p);
1007         sx_sunlock(&proctree_lock);
1008
1009         /*
1010          * See comments in linprocfs_doprocstatus() regarding the
1011          * computation of lsize.
1012          */
1013         /* size resident share trs drs lrs dt */
1014         sbuf_printf(sb, "%ju ", B2P((uintmax_t)kp.ki_size));
1015         sbuf_printf(sb, "%ju ", (uintmax_t)kp.ki_rssize);
1016         sbuf_printf(sb, "%ju ", (uintmax_t)0); /* XXX */
1017         sbuf_printf(sb, "%ju ", (uintmax_t)kp.ki_tsize);
1018         sbuf_printf(sb, "%ju ", (uintmax_t)(kp.ki_dsize + kp.ki_ssize));
1019         lsize = B2P(kp.ki_size) - kp.ki_dsize -
1020             kp.ki_ssize - kp.ki_tsize - 1;
1021         sbuf_printf(sb, "%ju ", (uintmax_t)lsize);
1022         sbuf_printf(sb, "%ju\n", (uintmax_t)0); /* XXX */
1023
1024         return (0);
1025 }
1026
1027 /*
1028  * Filler function for proc/pid/status
1029  */
1030 static int
1031 linprocfs_doprocstatus(PFS_FILL_ARGS)
1032 {
1033         struct kinfo_proc kp;
1034         char *state;
1035         segsz_t lsize;
1036         struct thread *td2;
1037         struct sigacts *ps;
1038         l_sigset_t siglist, sigignore, sigcatch;
1039         int i;
1040
1041         sx_slock(&proctree_lock);
1042         PROC_LOCK(p);
1043         td2 = FIRST_THREAD_IN_PROC(p); /* XXXKSE pretend only one thread */
1044
1045         if (P_SHOULDSTOP(p)) {
1046                 state = "T (stopped)";
1047         } else {
1048                 switch(p->p_state) {
1049                 case PRS_NEW:
1050                         state = "I (idle)";
1051                         break;
1052                 case PRS_NORMAL:
1053                         if (p->p_flag & P_WEXIT) {
1054                                 state = "X (exiting)";
1055                                 break;
1056                         }
1057                         switch(TD_GET_STATE(td2)) {
1058                         case TDS_INHIBITED:
1059                                 state = "S (sleeping)";
1060                                 break;
1061                         case TDS_RUNQ:
1062                         case TDS_RUNNING:
1063                                 state = "R (running)";
1064                                 break;
1065                         default:
1066                                 state = "? (unknown)";
1067                                 break;
1068                         }
1069                         break;
1070                 case PRS_ZOMBIE:
1071                         state = "Z (zombie)";
1072                         break;
1073                 default:
1074                         state = "? (unknown)";
1075                         break;
1076                 }
1077         }
1078
1079         fill_kinfo_proc(p, &kp);
1080         sx_sunlock(&proctree_lock);
1081
1082         sbuf_printf(sb, "Name:\t%s\n",          p->p_comm); /* XXX escape */
1083         sbuf_printf(sb, "State:\t%s\n",         state);
1084
1085         /*
1086          * Credentials
1087          */
1088         sbuf_printf(sb, "Tgid:\t%d\n",          p->p_pid);
1089         sbuf_printf(sb, "Pid:\t%d\n",           p->p_pid);
1090         sbuf_printf(sb, "PPid:\t%d\n",          kp.ki_ppid );
1091         sbuf_printf(sb, "TracerPid:\t%d\n",     kp.ki_tracer );
1092         sbuf_printf(sb, "Uid:\t%d\t%d\t%d\t%d\n", p->p_ucred->cr_ruid,
1093                                                 p->p_ucred->cr_uid,
1094                                                 p->p_ucred->cr_svuid,
1095                                                 /* FreeBSD doesn't have fsuid */
1096                                                 p->p_ucred->cr_uid);
1097         sbuf_printf(sb, "Gid:\t%d\t%d\t%d\t%d\n", p->p_ucred->cr_rgid,
1098                                                 p->p_ucred->cr_gid,
1099                                                 p->p_ucred->cr_svgid,
1100                                                 /* FreeBSD doesn't have fsgid */
1101                                                 p->p_ucred->cr_gid);
1102         sbuf_cat(sb, "Groups:\t");
1103         for (i = 0; i < p->p_ucred->cr_ngroups; i++)
1104                 sbuf_printf(sb, "%d ",          p->p_ucred->cr_groups[i]);
1105         PROC_UNLOCK(p);
1106         sbuf_putc(sb, '\n');
1107
1108         /*
1109          * Memory
1110          *
1111          * While our approximation of VmLib may not be accurate (I
1112          * don't know of a simple way to verify it, and I'm not sure
1113          * it has much meaning anyway), I believe it's good enough.
1114          *
1115          * The same code that could (I think) accurately compute VmLib
1116          * could also compute VmLck, but I don't really care enough to
1117          * implement it. Submissions are welcome.
1118          */
1119         sbuf_printf(sb, "VmSize:\t%8ju kB\n",   B2K((uintmax_t)kp.ki_size));
1120         sbuf_printf(sb, "VmLck:\t%8u kB\n",     P2K(0)); /* XXX */
1121         sbuf_printf(sb, "VmRSS:\t%8ju kB\n",    P2K((uintmax_t)kp.ki_rssize));
1122         sbuf_printf(sb, "VmData:\t%8ju kB\n",   P2K((uintmax_t)kp.ki_dsize));
1123         sbuf_printf(sb, "VmStk:\t%8ju kB\n",    P2K((uintmax_t)kp.ki_ssize));
1124         sbuf_printf(sb, "VmExe:\t%8ju kB\n",    P2K((uintmax_t)kp.ki_tsize));
1125         lsize = B2P(kp.ki_size) - kp.ki_dsize -
1126             kp.ki_ssize - kp.ki_tsize - 1;
1127         sbuf_printf(sb, "VmLib:\t%8ju kB\n",    P2K((uintmax_t)lsize));
1128
1129         /*
1130          * Signal masks
1131          */
1132         PROC_LOCK(p);
1133         bsd_to_linux_sigset(&p->p_siglist, &siglist);
1134         ps = p->p_sigacts;
1135         mtx_lock(&ps->ps_mtx);
1136         bsd_to_linux_sigset(&ps->ps_sigignore, &sigignore);
1137         bsd_to_linux_sigset(&ps->ps_sigcatch, &sigcatch);
1138         mtx_unlock(&ps->ps_mtx);
1139         PROC_UNLOCK(p);
1140
1141         sbuf_printf(sb, "SigPnd:\t%016jx\n",    siglist.__mask);
1142         /*
1143          * XXX. SigBlk - target thread's signal mask, td_sigmask.
1144          * To implement SigBlk pseudofs should support proc/tid dir entries.
1145          */
1146         sbuf_printf(sb, "SigBlk:\t%016x\n",     0);
1147         sbuf_printf(sb, "SigIgn:\t%016jx\n",    sigignore.__mask);
1148         sbuf_printf(sb, "SigCgt:\t%016jx\n",    sigcatch.__mask);
1149
1150         /*
1151          * Linux also prints the capability masks, but we don't have
1152          * capabilities yet, and when we do get them they're likely to
1153          * be meaningless to Linux programs, so we lie. XXX
1154          */
1155         sbuf_printf(sb, "CapInh:\t%016x\n",     0);
1156         sbuf_printf(sb, "CapPrm:\t%016x\n",     0);
1157         sbuf_printf(sb, "CapEff:\t%016x\n",     0);
1158
1159         return (0);
1160 }
1161
1162 /*
1163  * Filler function for proc/pid/cwd
1164  */
1165 static int
1166 linprocfs_doproccwd(PFS_FILL_ARGS)
1167 {
1168         struct pwd *pwd;
1169         char *fullpath = "unknown";
1170         char *freepath = NULL;
1171
1172         pwd = pwd_hold_proc(p);
1173         vn_fullpath(pwd->pwd_cdir, &fullpath, &freepath);
1174         sbuf_printf(sb, "%s", fullpath);
1175         if (freepath)
1176                 free(freepath, M_TEMP);
1177         pwd_drop(pwd);
1178         return (0);
1179 }
1180
1181 /*
1182  * Filler function for proc/pid/root
1183  */
1184 static int
1185 linprocfs_doprocroot(PFS_FILL_ARGS)
1186 {
1187         struct pwd *pwd;
1188         struct vnode *vp;
1189         char *fullpath = "unknown";
1190         char *freepath = NULL;
1191
1192         pwd = pwd_hold_proc(p);
1193         vp = jailed(p->p_ucred) ? pwd->pwd_jdir : pwd->pwd_rdir;
1194         vn_fullpath(vp, &fullpath, &freepath);
1195         sbuf_printf(sb, "%s", fullpath);
1196         if (freepath)
1197                 free(freepath, M_TEMP);
1198         pwd_drop(pwd);
1199         return (0);
1200 }
1201
1202 /*
1203  * Filler function for proc/pid/cmdline
1204  */
1205 static int
1206 linprocfs_doproccmdline(PFS_FILL_ARGS)
1207 {
1208         int ret;
1209
1210         PROC_LOCK(p);
1211         if ((ret = p_cansee(td, p)) != 0) {
1212                 PROC_UNLOCK(p);
1213                 return (ret);
1214         }
1215
1216         /*
1217          * Mimic linux behavior and pass only processes with usermode
1218          * address space as valid.  Return zero silently otherwize.
1219          */
1220         if (p->p_vmspace == &vmspace0) {
1221                 PROC_UNLOCK(p);
1222                 return (0);
1223         }
1224         if (p->p_args != NULL) {
1225                 sbuf_bcpy(sb, p->p_args->ar_args, p->p_args->ar_length);
1226                 PROC_UNLOCK(p);
1227                 return (0);
1228         }
1229
1230         if ((p->p_flag & P_SYSTEM) != 0) {
1231                 PROC_UNLOCK(p);
1232                 return (0);
1233         }
1234
1235         PROC_UNLOCK(p);
1236
1237         ret = proc_getargv(td, p, sb);
1238         return (ret);
1239 }
1240
1241 /*
1242  * Filler function for proc/pid/environ
1243  */
1244 static int
1245 linprocfs_doprocenviron(PFS_FILL_ARGS)
1246 {
1247
1248         /*
1249          * Mimic linux behavior and pass only processes with usermode
1250          * address space as valid.  Return zero silently otherwize.
1251          */
1252         if (p->p_vmspace == &vmspace0)
1253                 return (0);
1254
1255         return (proc_getenvv(td, p, sb));
1256 }
1257
1258 static char l32_map_str[] = "%08lx-%08lx %s%s%s%s %08lx %02x:%02x %lu%s%s\n";
1259 static char l64_map_str[] = "%016lx-%016lx %s%s%s%s %08lx %02x:%02x %lu%s%s\n";
1260 static char vdso_str[] = "      [vdso]";
1261 static char stack_str[] = "      [stack]";
1262
1263 /*
1264  * Filler function for proc/pid/maps
1265  */
1266 static int
1267 linprocfs_doprocmaps(PFS_FILL_ARGS)
1268 {
1269         struct vmspace *vm;
1270         vm_map_t map;
1271         vm_map_entry_t entry, tmp_entry;
1272         vm_object_t obj, tobj, lobj;
1273         vm_offset_t e_start, e_end;
1274         vm_ooffset_t off;
1275         vm_prot_t e_prot;
1276         unsigned int last_timestamp;
1277         char *name = "", *freename = NULL;
1278         const char *l_map_str;
1279         ino_t ino;
1280         int error;
1281         struct vnode *vp;
1282         struct vattr vat;
1283         bool private;
1284
1285         PROC_LOCK(p);
1286         error = p_candebug(td, p);
1287         PROC_UNLOCK(p);
1288         if (error)
1289                 return (error);
1290
1291         if (uio->uio_rw != UIO_READ)
1292                 return (EOPNOTSUPP);
1293
1294         error = 0;
1295         vm = vmspace_acquire_ref(p);
1296         if (vm == NULL)
1297                 return (ESRCH);
1298
1299         if (SV_CURPROC_FLAG(SV_LP64))
1300                 l_map_str = l64_map_str;
1301         else
1302                 l_map_str = l32_map_str;
1303         map = &vm->vm_map;
1304         vm_map_lock_read(map);
1305         VM_MAP_ENTRY_FOREACH(entry, map) {
1306                 name = "";
1307                 freename = NULL;
1308                 if (entry->eflags & MAP_ENTRY_IS_SUB_MAP)
1309                         continue;
1310                 e_prot = entry->protection;
1311                 e_start = entry->start;
1312                 e_end = entry->end;
1313                 obj = entry->object.vm_object;
1314                 off = entry->offset;
1315                 for (lobj = tobj = obj; tobj != NULL;
1316                     lobj = tobj, tobj = tobj->backing_object) {
1317                         VM_OBJECT_RLOCK(tobj);
1318                         off += lobj->backing_object_offset;
1319                         if (lobj != obj)
1320                                 VM_OBJECT_RUNLOCK(lobj);
1321                 }
1322                 private = (entry->eflags & MAP_ENTRY_COW) != 0 || obj == NULL ||
1323                     (obj->flags & OBJ_ANON) != 0;
1324                 last_timestamp = map->timestamp;
1325                 vm_map_unlock_read(map);
1326                 ino = 0;
1327                 if (lobj) {
1328                         vp = vm_object_vnode(lobj);
1329                         if (vp != NULL)
1330                                 vref(vp);
1331                         if (lobj != obj)
1332                                 VM_OBJECT_RUNLOCK(lobj);
1333                         VM_OBJECT_RUNLOCK(obj);
1334                         if (vp != NULL) {
1335                                 vn_fullpath(vp, &name, &freename);
1336                                 vn_lock(vp, LK_SHARED | LK_RETRY);
1337                                 VOP_GETATTR(vp, &vat, td->td_ucred);
1338                                 ino = vat.va_fileid;
1339                                 vput(vp);
1340                         } else if (SV_PROC_ABI(p) == SV_ABI_LINUX) {
1341                                 /*
1342                                  * sv_shared_page_base pointed out to the
1343                                  * FreeBSD sharedpage, PAGE_SIZE is a size
1344                                  * of it. The vDSO page is above.
1345                                  */
1346                                 if (e_start == p->p_sysent->sv_shared_page_base +
1347                                     PAGE_SIZE)
1348                                         name = vdso_str;
1349                                 if (e_end == p->p_sysent->sv_usrstack)
1350                                         name = stack_str;
1351                         }
1352                 }
1353
1354                 /*
1355                  * format:
1356                  *  start, end, access, offset, major, minor, inode, name.
1357                  */
1358                 error = sbuf_printf(sb, l_map_str,
1359                     (u_long)e_start, (u_long)e_end,
1360                     (e_prot & VM_PROT_READ)?"r":"-",
1361                     (e_prot & VM_PROT_WRITE)?"w":"-",
1362                     (e_prot & VM_PROT_EXECUTE)?"x":"-",
1363                     private ? "p" : "s",
1364                     (u_long)off,
1365                     0,
1366                     0,
1367                     (u_long)ino,
1368                     *name ? "     " : " ",
1369                     name
1370                     );
1371                 if (freename)
1372                         free(freename, M_TEMP);
1373                 vm_map_lock_read(map);
1374                 if (error == -1) {
1375                         error = 0;
1376                         break;
1377                 }
1378                 if (last_timestamp != map->timestamp) {
1379                         /*
1380                          * Look again for the entry because the map was
1381                          * modified while it was unlocked.  Specifically,
1382                          * the entry may have been clipped, merged, or deleted.
1383                          */
1384                         vm_map_lookup_entry(map, e_end - 1, &tmp_entry);
1385                         entry = tmp_entry;
1386                 }
1387         }
1388         vm_map_unlock_read(map);
1389         vmspace_free(vm);
1390
1391         return (error);
1392 }
1393
1394 /*
1395  * Filler function for proc/pid/mem
1396  */
1397 static int
1398 linprocfs_doprocmem(PFS_FILL_ARGS)
1399 {
1400         ssize_t resid;
1401         int error;
1402
1403         resid = uio->uio_resid;
1404         error = procfs_doprocmem(PFS_FILL_ARGNAMES);
1405
1406         if (uio->uio_rw == UIO_READ && resid != uio->uio_resid)
1407                 return (0);
1408
1409         if (error == EFAULT)
1410                 error = EIO;
1411
1412         return (error);
1413 }
1414
1415 /*
1416  * Criteria for interface name translation
1417  */
1418 #define IFP_IS_ETH(ifp) (ifp->if_type == IFT_ETHER)
1419
1420 static int
1421 linux_ifname(struct ifnet *ifp, char *buffer, size_t buflen)
1422 {
1423         struct ifnet *ifscan;
1424         int ethno;
1425
1426         IFNET_RLOCK_ASSERT();
1427
1428         /* Short-circuit non ethernet interfaces */
1429         if (!IFP_IS_ETH(ifp))
1430                 return (strlcpy(buffer, ifp->if_xname, buflen));
1431
1432         /* Determine the (relative) unit number for ethernet interfaces */
1433         ethno = 0;
1434         CK_STAILQ_FOREACH(ifscan, &V_ifnet, if_link) {
1435                 if (ifscan == ifp)
1436                         return (snprintf(buffer, buflen, "eth%d", ethno));
1437                 if (IFP_IS_ETH(ifscan))
1438                         ethno++;
1439         }
1440
1441         return (0);
1442 }
1443
1444 /*
1445  * Filler function for proc/net/dev
1446  */
1447 static int
1448 linprocfs_donetdev(PFS_FILL_ARGS)
1449 {
1450         char ifname[16]; /* XXX LINUX_IFNAMSIZ */
1451         struct ifnet *ifp;
1452
1453         sbuf_printf(sb, "%6s|%58s|%s\n"
1454             "%6s|%58s|%58s\n",
1455             "Inter-", "   Receive", "  Transmit",
1456             " face",
1457             "bytes    packets errs drop fifo frame compressed multicast",
1458             "bytes    packets errs drop fifo colls carrier compressed");
1459
1460         CURVNET_SET(TD_TO_VNET(curthread));
1461         IFNET_RLOCK();
1462         CK_STAILQ_FOREACH(ifp, &V_ifnet, if_link) {
1463                 linux_ifname(ifp, ifname, sizeof ifname);
1464                 sbuf_printf(sb, "%6.6s: ", ifname);
1465                 sbuf_printf(sb, "%7ju %7ju %4ju %4ju %4lu %5lu %10lu %9ju ",
1466                     (uintmax_t )ifp->if_get_counter(ifp, IFCOUNTER_IBYTES),
1467                     (uintmax_t )ifp->if_get_counter(ifp, IFCOUNTER_IPACKETS),
1468                     (uintmax_t )ifp->if_get_counter(ifp, IFCOUNTER_IERRORS),
1469                     (uintmax_t )ifp->if_get_counter(ifp, IFCOUNTER_IQDROPS),
1470                                                         /* rx_missed_errors */
1471                     0UL,                                /* rx_fifo_errors */
1472                     0UL,                                /* rx_length_errors +
1473                                                          * rx_over_errors +
1474                                                          * rx_crc_errors +
1475                                                          * rx_frame_errors */
1476                     0UL,                                /* rx_compressed */
1477                     (uintmax_t )ifp->if_get_counter(ifp, IFCOUNTER_IMCASTS));
1478                                                         /* XXX-BZ rx only? */
1479                 sbuf_printf(sb, "%8ju %7ju %4ju %4ju %4lu %5ju %7lu %10lu\n",
1480                     (uintmax_t )ifp->if_get_counter(ifp, IFCOUNTER_OBYTES),
1481                     (uintmax_t )ifp->if_get_counter(ifp, IFCOUNTER_OPACKETS),
1482                     (uintmax_t )ifp->if_get_counter(ifp, IFCOUNTER_OERRORS),
1483                     (uintmax_t )ifp->if_get_counter(ifp, IFCOUNTER_OQDROPS),
1484                     0UL,                                /* tx_fifo_errors */
1485                     (uintmax_t )ifp->if_get_counter(ifp, IFCOUNTER_COLLISIONS),
1486                     0UL,                                /* tx_carrier_errors +
1487                                                          * tx_aborted_errors +
1488                                                          * tx_window_errors +
1489                                                          * tx_heartbeat_errors*/
1490                     0UL);                               /* tx_compressed */
1491         }
1492         IFNET_RUNLOCK();
1493         CURVNET_RESTORE();
1494
1495         return (0);
1496 }
1497
1498 /*
1499  * Filler function for proc/sys/kernel/osrelease
1500  */
1501 static int
1502 linprocfs_doosrelease(PFS_FILL_ARGS)
1503 {
1504         char osrelease[LINUX_MAX_UTSNAME];
1505
1506         linux_get_osrelease(td, osrelease);
1507         sbuf_printf(sb, "%s\n", osrelease);
1508
1509         return (0);
1510 }
1511
1512 /*
1513  * Filler function for proc/sys/kernel/ostype
1514  */
1515 static int
1516 linprocfs_doostype(PFS_FILL_ARGS)
1517 {
1518         char osname[LINUX_MAX_UTSNAME];
1519
1520         linux_get_osname(td, osname);
1521         sbuf_printf(sb, "%s\n", osname);
1522
1523         return (0);
1524 }
1525
1526 /*
1527  * Filler function for proc/sys/kernel/version
1528  */
1529 static int
1530 linprocfs_doosbuild(PFS_FILL_ARGS)
1531 {
1532
1533         linprocfs_osbuild(td, sb);
1534         sbuf_cat(sb, "\n");
1535         return (0);
1536 }
1537
1538 /*
1539  * Filler function for proc/sys/kernel/msgmax
1540  */
1541 static int
1542 linprocfs_domsgmax(PFS_FILL_ARGS)
1543 {
1544
1545         sbuf_printf(sb, "%d\n", msginfo.msgmax);
1546         return (0);
1547 }
1548
1549 /*
1550  * Filler function for proc/sys/kernel/msgmni
1551  */
1552 static int
1553 linprocfs_domsgmni(PFS_FILL_ARGS)
1554 {
1555
1556         sbuf_printf(sb, "%d\n", msginfo.msgmni);
1557         return (0);
1558 }
1559
1560 /*
1561  * Filler function for proc/sys/kernel/msgmnb
1562  */
1563 static int
1564 linprocfs_domsgmnb(PFS_FILL_ARGS)
1565 {
1566
1567         sbuf_printf(sb, "%d\n", msginfo.msgmnb);
1568         return (0);
1569 }
1570
1571 /*
1572  * Filler function for proc/sys/kernel/ngroups_max
1573  *
1574  * Note that in Linux it defaults to 65536, not 1023.
1575  */
1576 static int
1577 linprocfs_dongroups_max(PFS_FILL_ARGS)
1578 {
1579
1580         sbuf_printf(sb, "%d\n", ngroups_max);
1581         return (0);
1582 }
1583
1584 /*
1585  * Filler function for proc/sys/kernel/pid_max
1586  */
1587 static int
1588 linprocfs_dopid_max(PFS_FILL_ARGS)
1589 {
1590
1591         sbuf_printf(sb, "%i\n", PID_MAX);
1592         return (0);
1593 }
1594
1595 /*
1596  * Filler function for proc/sys/kernel/sem
1597  */
1598 static int
1599 linprocfs_dosem(PFS_FILL_ARGS)
1600 {
1601
1602         sbuf_printf(sb, "%d %d %d %d\n", seminfo.semmsl, seminfo.semmns,
1603             seminfo.semopm, seminfo.semmni);
1604         return (0);
1605 }
1606
1607 /*
1608  * Filler function for proc/sys/kernel/shmall
1609  */
1610 static int
1611 linprocfs_doshmall(PFS_FILL_ARGS)
1612 {
1613
1614         sbuf_printf(sb, "%lu\n", shminfo.shmall);
1615         return (0);
1616 }
1617
1618 /*
1619  * Filler function for proc/sys/kernel/shmmax
1620  */
1621 static int
1622 linprocfs_doshmmax(PFS_FILL_ARGS)
1623 {
1624
1625         sbuf_printf(sb, "%lu\n", shminfo.shmmax);
1626         return (0);
1627 }
1628
1629 /*
1630  * Filler function for proc/sys/kernel/shmmni
1631  */
1632 static int
1633 linprocfs_doshmmni(PFS_FILL_ARGS)
1634 {
1635
1636         sbuf_printf(sb, "%lu\n", shminfo.shmmni);
1637         return (0);
1638 }
1639
1640 /*
1641  * Filler function for proc/sys/kernel/tainted
1642  */
1643 static int
1644 linprocfs_dotainted(PFS_FILL_ARGS)
1645 {
1646
1647         sbuf_printf(sb, "0\n");
1648         return (0);
1649 }
1650
1651 /*
1652  * Filler function for proc/sys/vm/min_free_kbytes
1653  *
1654  * This mirrors the approach in illumos to return zero for reads. Effectively,
1655  * it says, no memory is kept in reserve for "atomic allocations". This class
1656  * of allocation can be used at times when a thread cannot be suspended.
1657  */
1658 static int
1659 linprocfs_dominfree(PFS_FILL_ARGS)
1660 {
1661
1662         sbuf_printf(sb, "%d\n", 0);
1663         return (0);
1664 }
1665
/*
 * Filler function for proc/scsi/device_info
 *
 * Produces no output; the file reads back empty.
 */
static int
linprocfs_doscsidevinfo(PFS_FILL_ARGS)
{

	/* Nothing to report. */
	return (0);
}
1675
/*
 * Filler function for proc/scsi/scsi
 *
 * Produces no output; the file reads back empty.
 */
static int
linprocfs_doscsiscsi(PFS_FILL_ARGS)
{

	/* Nothing to report. */
	return (0);
}
1685
1686 /*
1687  * Filler function for proc/devices
1688  */
1689 static int
1690 linprocfs_dodevices(PFS_FILL_ARGS)
1691 {
1692         char *char_devices;
1693         sbuf_printf(sb, "Character devices:\n");
1694
1695         char_devices = linux_get_char_devices();
1696         sbuf_printf(sb, "%s", char_devices);
1697         linux_free_get_char_devices(char_devices);
1698
1699         sbuf_printf(sb, "\nBlock devices:\n");
1700
1701         return (0);
1702 }
1703
1704 /*
1705  * Filler function for proc/cmdline
1706  */
1707 static int
1708 linprocfs_docmdline(PFS_FILL_ARGS)
1709 {
1710
1711         sbuf_printf(sb, "BOOT_IMAGE=%s", kernelname);
1712         sbuf_printf(sb, " ro root=302\n");
1713         return (0);
1714 }
1715
1716 /*
1717  * Filler function for proc/filesystems
1718  */
1719 static int
1720 linprocfs_dofilesystems(PFS_FILL_ARGS)
1721 {
1722         struct vfsconf *vfsp;
1723
1724         vfsconf_slock();
1725         TAILQ_FOREACH(vfsp, &vfsconf, vfc_list) {
1726                 if (vfsp->vfc_flags & VFCF_SYNTHETIC)
1727                         sbuf_printf(sb, "nodev");
1728                 sbuf_printf(sb, "\t%s\n", vfsp->vfc_name);
1729         }
1730         vfsconf_sunlock();
1731         return(0);
1732 }
1733
/*
 * Filler function for proc/modules
 *
 * The code that would list the loaded linker files is compiled out, so
 * this currently writes nothing and simply reports success.
 */
static int
linprocfs_domodules(PFS_FILL_ARGS)
{
#if 0
	struct linker_file *lf;

	TAILQ_FOREACH(lf, &linker_files, link) {
		sbuf_printf(sb, "%-20s%8lu%4d\n", lf->filename,
		    (unsigned long)lf->size, lf->refs);
	}
#endif
	return (0);
}
1750
1751 /*
1752  * Filler function for proc/pid/fd
1753  */
1754 static int
1755 linprocfs_dofdescfs(PFS_FILL_ARGS)
1756 {
1757
1758         if (p == curproc)
1759                 sbuf_printf(sb, "/dev/fd");
1760         else
1761                 sbuf_printf(sb, "unknown");
1762         return (0);
1763 }
1764
1765 /*
1766  * Filler function for proc/pid/limits
1767  */
1768 static const struct linux_rlimit_ident {
1769         const char      *desc;
1770         const char      *unit;
1771         unsigned int    rlim_id;
1772 } linux_rlimits_ident[] = {
1773         { "Max cpu time",       "seconds",      RLIMIT_CPU },
1774         { "Max file size",      "bytes",        RLIMIT_FSIZE },
1775         { "Max data size",      "bytes",        RLIMIT_DATA },
1776         { "Max stack size",     "bytes",        RLIMIT_STACK },
1777         { "Max core file size",  "bytes",       RLIMIT_CORE },
1778         { "Max resident set",   "bytes",        RLIMIT_RSS },
1779         { "Max processes",      "processes",    RLIMIT_NPROC },
1780         { "Max open files",     "files",        RLIMIT_NOFILE },
1781         { "Max locked memory",  "bytes",        RLIMIT_MEMLOCK },
1782         { "Max address space",  "bytes",        RLIMIT_AS },
1783         { "Max file locks",     "locks",        LINUX_RLIMIT_LOCKS },
1784         { "Max pending signals", "signals",     LINUX_RLIMIT_SIGPENDING },
1785         { "Max msgqueue size",  "bytes",        LINUX_RLIMIT_MSGQUEUE },
1786         { "Max nice priority",          "",     LINUX_RLIMIT_NICE },
1787         { "Max realtime priority",      "",     LINUX_RLIMIT_RTPRIO },
1788         { "Max realtime timeout",       "us",   LINUX_RLIMIT_RTTIME },
1789         { 0, 0, 0 }
1790 };
1791
1792 static int
1793 linprocfs_doproclimits(PFS_FILL_ARGS)
1794 {
1795         const struct linux_rlimit_ident *li;
1796         struct plimit *limp;
1797         struct rlimit rl;
1798         ssize_t size;
1799         int res, error;
1800
1801         error = 0;
1802
1803         PROC_LOCK(p);
1804         limp = lim_hold(p->p_limit);
1805         PROC_UNLOCK(p);
1806         size = sizeof(res);
1807         sbuf_printf(sb, "%-26s%-21s%-21s%-21s\n", "Limit", "Soft Limit",
1808                         "Hard Limit", "Units");
1809         for (li = linux_rlimits_ident; li->desc != NULL; ++li) {
1810                 switch (li->rlim_id)
1811                 {
1812                 case LINUX_RLIMIT_LOCKS:
1813                         /* FALLTHROUGH */
1814                 case LINUX_RLIMIT_RTTIME:
1815                         rl.rlim_cur = RLIM_INFINITY;
1816                         break;
1817                 case LINUX_RLIMIT_SIGPENDING:
1818                         error = kernel_sysctlbyname(td,
1819                             "kern.sigqueue.max_pending_per_proc",
1820                             &res, &size, 0, 0, 0, 0);
1821                         if (error != 0)
1822                                 goto out;
1823                         rl.rlim_cur = res;
1824                         rl.rlim_max = res;
1825                         break;
1826                 case LINUX_RLIMIT_MSGQUEUE:
1827                         error = kernel_sysctlbyname(td,
1828                             "kern.ipc.msgmnb", &res, &size, 0, 0, 0, 0);
1829                         if (error != 0)
1830                                 goto out;
1831                         rl.rlim_cur = res;
1832                         rl.rlim_max = res;
1833                         break;
1834                 case LINUX_RLIMIT_NICE:
1835                         /* FALLTHROUGH */
1836                 case LINUX_RLIMIT_RTPRIO:
1837                         rl.rlim_cur = 0;
1838                         rl.rlim_max = 0;
1839                         break;
1840                 default:
1841                         rl = limp->pl_rlimit[li->rlim_id];
1842                         break;
1843                 }
1844                 if (rl.rlim_cur == RLIM_INFINITY)
1845                         sbuf_printf(sb, "%-26s%-21s%-21s%-10s\n",
1846                             li->desc, "unlimited", "unlimited", li->unit);
1847                 else
1848                         sbuf_printf(sb, "%-26s%-21llu%-21llu%-10s\n",
1849                             li->desc, (unsigned long long)rl.rlim_cur,
1850                             (unsigned long long)rl.rlim_max, li->unit);
1851         }
1852 out:
1853         lim_free(limp);
1854         return (error);
1855 }
1856
1857 /*
1858  * The point of the following two functions is to work around
1859  * an assertion in Chromium; see kern/240991 for details.
1860  */
1861 static int
1862 linprocfs_dotaskattr(PFS_ATTR_ARGS)
1863 {
1864
1865         vap->va_nlink = 3;
1866         return (0);
1867 }
1868
/*
 * Filler function for proc/<pid>/task/.dummy
 *
 * Writes nothing; the file always reads as empty.
 */
static int
linprocfs_dotaskdummy(PFS_FILL_ARGS)
{

	return (0);
}
1878
1879 /*
1880  * Filler function for proc/sys/kernel/random/uuid
1881  */
1882 static int
1883 linprocfs_douuid(PFS_FILL_ARGS)
1884 {
1885         struct uuid uuid;
1886
1887         kern_uuidgen(&uuid, 1);
1888         sbuf_printf_uuid(sb, &uuid);
1889         sbuf_printf(sb, "\n");
1890         return(0);
1891 }
1892
1893 /*
1894  * Filler function for proc/pid/auxv
1895  */
1896 static int
1897 linprocfs_doauxv(PFS_FILL_ARGS)
1898 {
1899         struct sbuf *asb;
1900         off_t buflen, resid;
1901         int error;
1902
1903         /*
1904          * Mimic linux behavior and pass only processes with usermode
1905          * address space as valid. Return zero silently otherwise.
1906          */
1907         if (p->p_vmspace == &vmspace0)
1908                 return (0);
1909
1910         if (uio->uio_resid == 0)
1911                 return (0);
1912         if (uio->uio_offset < 0 || uio->uio_resid < 0)
1913                 return (EINVAL);
1914
1915         asb = sbuf_new_auto();
1916         if (asb == NULL)
1917                 return (ENOMEM);
1918         error = proc_getauxv(td, p, asb);
1919         if (error == 0)
1920                 error = sbuf_finish(asb);
1921
1922         resid = sbuf_len(asb) - uio->uio_offset;
1923         if (resid > uio->uio_resid)
1924                 buflen = uio->uio_resid;
1925         else
1926                 buflen = resid;
1927         if (buflen > IOSIZE_MAX)
1928                 return (EINVAL);
1929         if (buflen > maxphys)
1930                 buflen = maxphys;
1931         if (resid <= 0)
1932                 return (0);
1933
1934         if (error == 0)
1935                 error = uiomove(sbuf_data(asb) + uio->uio_offset, buflen, uio);
1936         sbuf_delete(asb);
1937         return (error);
1938 }
1939
1940 /*
1941  * Constructor
1942  */
1943 static int
1944 linprocfs_init(PFS_INIT_ARGS)
1945 {
1946         struct pfs_node *root;
1947         struct pfs_node *dir;
1948         struct pfs_node *sys;
1949
1950         root = pi->pi_root;
1951
1952         /* /proc/... */
1953         pfs_create_file(root, "cmdline", &linprocfs_docmdline,
1954             NULL, NULL, NULL, PFS_RD);
1955         pfs_create_file(root, "cpuinfo", &linprocfs_docpuinfo,
1956             NULL, NULL, NULL, PFS_RD);
1957         pfs_create_file(root, "devices", &linprocfs_dodevices,
1958             NULL, NULL, NULL, PFS_RD);
1959         pfs_create_file(root, "filesystems", &linprocfs_dofilesystems,
1960             NULL, NULL, NULL, PFS_RD);
1961         pfs_create_file(root, "loadavg", &linprocfs_doloadavg,
1962             NULL, NULL, NULL, PFS_RD);
1963         pfs_create_file(root, "meminfo", &linprocfs_domeminfo,
1964             NULL, NULL, NULL, PFS_RD);
1965         pfs_create_file(root, "modules", &linprocfs_domodules,
1966             NULL, NULL, NULL, PFS_RD);
1967         pfs_create_file(root, "mounts", &linprocfs_domtab,
1968             NULL, NULL, NULL, PFS_RD);
1969         pfs_create_file(root, "mtab", &linprocfs_domtab,
1970             NULL, NULL, NULL, PFS_RD);
1971         pfs_create_file(root, "partitions", &linprocfs_dopartitions,
1972             NULL, NULL, NULL, PFS_RD);
1973         pfs_create_link(root, "self", &procfs_docurproc,
1974             NULL, NULL, NULL, 0);
1975         pfs_create_file(root, "stat", &linprocfs_dostat,
1976             NULL, NULL, NULL, PFS_RD);
1977         pfs_create_file(root, "swaps", &linprocfs_doswaps,
1978             NULL, NULL, NULL, PFS_RD);
1979         pfs_create_file(root, "uptime", &linprocfs_douptime,
1980             NULL, NULL, NULL, PFS_RD);
1981         pfs_create_file(root, "version", &linprocfs_doversion,
1982             NULL, NULL, NULL, PFS_RD);
1983
1984         /* /proc/bus/... */
1985         dir = pfs_create_dir(root, "bus", NULL, NULL, NULL, 0);
1986         dir = pfs_create_dir(dir, "pci", NULL, NULL, NULL, 0);
1987         dir = pfs_create_dir(dir, "devices", NULL, NULL, NULL, 0);
1988
1989         /* /proc/net/... */
1990         dir = pfs_create_dir(root, "net", NULL, NULL, NULL, 0);
1991         pfs_create_file(dir, "dev", &linprocfs_donetdev,
1992             NULL, NULL, NULL, PFS_RD);
1993
1994         /* /proc/<pid>/... */
1995         dir = pfs_create_dir(root, "pid", NULL, NULL, NULL, PFS_PROCDEP);
1996         pfs_create_file(dir, "cmdline", &linprocfs_doproccmdline,
1997             NULL, NULL, NULL, PFS_RD);
1998         pfs_create_link(dir, "cwd", &linprocfs_doproccwd,
1999             NULL, NULL, NULL, 0);
2000         pfs_create_file(dir, "environ", &linprocfs_doprocenviron,
2001             NULL, &procfs_candebug, NULL, PFS_RD);
2002         pfs_create_link(dir, "exe", &procfs_doprocfile,
2003             NULL, &procfs_notsystem, NULL, 0);
2004         pfs_create_file(dir, "maps", &linprocfs_doprocmaps,
2005             NULL, NULL, NULL, PFS_RD | PFS_AUTODRAIN);
2006         pfs_create_file(dir, "mem", &linprocfs_doprocmem,
2007             procfs_attr_rw, &procfs_candebug, NULL, PFS_RDWR | PFS_RAW);
2008         pfs_create_file(dir, "mountinfo", &linprocfs_doprocmountinfo,
2009             NULL, NULL, NULL, PFS_RD);
2010         pfs_create_file(dir, "mounts", &linprocfs_domtab,
2011             NULL, NULL, NULL, PFS_RD);
2012         pfs_create_link(dir, "root", &linprocfs_doprocroot,
2013             NULL, NULL, NULL, 0);
2014         pfs_create_file(dir, "stat", &linprocfs_doprocstat,
2015             NULL, NULL, NULL, PFS_RD);
2016         pfs_create_file(dir, "statm", &linprocfs_doprocstatm,
2017             NULL, NULL, NULL, PFS_RD);
2018         pfs_create_file(dir, "status", &linprocfs_doprocstatus,
2019             NULL, NULL, NULL, PFS_RD);
2020         pfs_create_link(dir, "fd", &linprocfs_dofdescfs,
2021             NULL, NULL, NULL, 0);
2022         pfs_create_file(dir, "auxv", &linprocfs_doauxv,
2023             NULL, &procfs_candebug, NULL, PFS_RD|PFS_RAWRD);
2024         pfs_create_file(dir, "limits", &linprocfs_doproclimits,
2025             NULL, NULL, NULL, PFS_RD);
2026
2027         /* /proc/<pid>/task/... */
2028         dir = pfs_create_dir(dir, "task", linprocfs_dotaskattr, NULL, NULL, 0);
2029         pfs_create_file(dir, ".dummy", &linprocfs_dotaskdummy,
2030             NULL, NULL, NULL, PFS_RD);
2031
2032         /* /proc/scsi/... */
2033         dir = pfs_create_dir(root, "scsi", NULL, NULL, NULL, 0);
2034         pfs_create_file(dir, "device_info", &linprocfs_doscsidevinfo,
2035             NULL, NULL, NULL, PFS_RD);
2036         pfs_create_file(dir, "scsi", &linprocfs_doscsiscsi,
2037             NULL, NULL, NULL, PFS_RD);
2038
2039         /* /proc/sys/... */
2040         sys = pfs_create_dir(root, "sys", NULL, NULL, NULL, 0);
2041
2042         /* /proc/sys/kernel/... */
2043         dir = pfs_create_dir(sys, "kernel", NULL, NULL, NULL, 0);
2044         pfs_create_file(dir, "osrelease", &linprocfs_doosrelease,
2045             NULL, NULL, NULL, PFS_RD);
2046         pfs_create_file(dir, "ostype", &linprocfs_doostype,
2047             NULL, NULL, NULL, PFS_RD);
2048         pfs_create_file(dir, "version", &linprocfs_doosbuild,
2049             NULL, NULL, NULL, PFS_RD);
2050         pfs_create_file(dir, "msgmax", &linprocfs_domsgmax,
2051             NULL, NULL, NULL, PFS_RD);
2052         pfs_create_file(dir, "msgmni", &linprocfs_domsgmni,
2053             NULL, NULL, NULL, PFS_RD);
2054         pfs_create_file(dir, "msgmnb", &linprocfs_domsgmnb,
2055             NULL, NULL, NULL, PFS_RD);
2056         pfs_create_file(dir, "ngroups_max", &linprocfs_dongroups_max,
2057             NULL, NULL, NULL, PFS_RD);
2058         pfs_create_file(dir, "pid_max", &linprocfs_dopid_max,
2059             NULL, NULL, NULL, PFS_RD);
2060         pfs_create_file(dir, "sem", &linprocfs_dosem,
2061             NULL, NULL, NULL, PFS_RD);
2062         pfs_create_file(dir, "shmall", &linprocfs_doshmall,
2063             NULL, NULL, NULL, PFS_RD);
2064         pfs_create_file(dir, "shmmax", &linprocfs_doshmmax,
2065             NULL, NULL, NULL, PFS_RD);
2066         pfs_create_file(dir, "shmmni", &linprocfs_doshmmni,
2067             NULL, NULL, NULL, PFS_RD);
2068         pfs_create_file(dir, "tainted", &linprocfs_dotainted,
2069             NULL, NULL, NULL, PFS_RD);
2070
2071         /* /proc/sys/kernel/random/... */
2072         dir = pfs_create_dir(dir, "random", NULL, NULL, NULL, 0);
2073         pfs_create_file(dir, "uuid", &linprocfs_douuid,
2074             NULL, NULL, NULL, PFS_RD);
2075
2076         /* /proc/sys/vm/.... */
2077         dir = pfs_create_dir(sys, "vm", NULL, NULL, NULL, 0);
2078         pfs_create_file(dir, "min_free_kbytes", &linprocfs_dominfree,
2079             NULL, NULL, NULL, PFS_RD);
2080
2081         return (0);
2082 }
2083
/*
 * Destructor
 *
 * No explicit teardown is performed here: the nodes created by the
 * constructor are left for pseudofs to garbage-collect.
 */
static int
linprocfs_uninit(PFS_INIT_ARGS)
{

	return (0);
}
2094
2095 PSEUDOFS(linprocfs, 1, VFCF_JAIL);
2096 #if defined(__aarch64__) || defined(__amd64__)
2097 MODULE_DEPEND(linprocfs, linux_common, 1, 1, 1);
2098 #else
2099 MODULE_DEPEND(linprocfs, linux, 1, 1, 1);
2100 #endif
2101 MODULE_DEPEND(linprocfs, procfs, 1, 1, 1);
2102 MODULE_DEPEND(linprocfs, sysvmsg, 1, 1, 1);
2103 MODULE_DEPEND(linprocfs, sysvsem, 1, 1, 1);
2104 MODULE_DEPEND(linprocfs, sysvshm, 1, 1, 1);