xref: /freebsd/sys/compat/linprocfs/linprocfs.c (revision 1171c633fb097a19e1da87128604190bc6d27341)
1 /*-
2  * SPDX-License-Identifier: BSD-4-Clause
3  *
4  * Copyright (c) 2000 Dag-Erling Coïdan Smørgrav
5  * Copyright (c) 1999 Pierre Beyssac
6  * Copyright (c) 1993 Jan-Simon Pendry
7  * Copyright (c) 1993
8  *	The Regents of the University of California.  All rights reserved.
9  *
10  * This code is derived from software contributed to Berkeley by
11  * Jan-Simon Pendry.
12  *
13  * Redistribution and use in source and binary forms, with or without
14  * modification, are permitted provided that the following conditions
15  * are met:
16  * 1. Redistributions of source code must retain the above copyright
17  *    notice, this list of conditions and the following disclaimer.
18  * 2. Redistributions in binary form must reproduce the above copyright
19  *    notice, this list of conditions and the following disclaimer in the
20  *    documentation and/or other materials provided with the distribution.
21  * 3. All advertising materials mentioning features or use of this software
22  *    must display the following acknowledgement:
23  *	This product includes software developed by the University of
24  *	California, Berkeley and its contributors.
25  * 4. Neither the name of the University nor the names of its contributors
26  *    may be used to endorse or promote products derived from this software
27  *    without specific prior written permission.
28  *
29  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
30  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
31  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
32  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
33  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
34  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
35  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
36  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
37  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
38  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
39  * SUCH DAMAGE.
40  *
41  *	@(#)procfs_status.c	8.4 (Berkeley) 6/15/94
42  */
43 
44 #include <sys/cdefs.h>
45 __FBSDID("$FreeBSD$");
46 
47 #include <sys/param.h>
48 #include <sys/queue.h>
49 #include <sys/blist.h>
50 #include <sys/conf.h>
51 #include <sys/exec.h>
52 #include <sys/fcntl.h>
53 #include <sys/filedesc.h>
54 #include <sys/jail.h>
55 #include <sys/kernel.h>
56 #include <sys/limits.h>
57 #include <sys/linker.h>
58 #include <sys/lock.h>
59 #include <sys/malloc.h>
60 #include <sys/msg.h>
61 #include <sys/mutex.h>
62 #include <sys/namei.h>
63 #include <sys/proc.h>
64 #include <sys/ptrace.h>
65 #include <sys/resourcevar.h>
66 #include <sys/resource.h>
67 #include <sys/sbuf.h>
68 #include <sys/sem.h>
69 #include <sys/smp.h>
70 #include <sys/socket.h>
71 #include <sys/syscallsubr.h>
72 #include <sys/sysctl.h>
73 #include <sys/sysent.h>
74 #include <sys/systm.h>
75 #include <sys/time.h>
76 #include <sys/tty.h>
77 #include <sys/user.h>
78 #include <sys/uuid.h>
79 #include <sys/vmmeter.h>
80 #include <sys/vnode.h>
81 #include <sys/bus.h>
82 
83 #include <net/if.h>
84 #include <net/if_var.h>
85 #include <net/if_types.h>
86 
87 #include <vm/vm.h>
88 #include <vm/vm_extern.h>
89 #include <vm/pmap.h>
90 #include <vm/vm_map.h>
91 #include <vm/vm_param.h>
92 #include <vm/vm_object.h>
93 #include <vm/swap_pager.h>
94 
95 #include <machine/clock.h>
96 
97 #include <geom/geom.h>
98 #include <geom/geom_int.h>
99 
100 #if defined(__i386__) || defined(__amd64__)
101 #include <machine/cputypes.h>
102 #include <machine/md_var.h>
103 #endif /* __i386__ || __amd64__ */
104 
105 #include <compat/linux/linux.h>
106 #include <compat/linux/linux_mib.h>
107 #include <compat/linux/linux_misc.h>
108 #include <compat/linux/linux_util.h>
109 #include <fs/pseudofs/pseudofs.h>
110 #include <fs/procfs/procfs.h>
111 
/*
 * Unit conversion helpers.
 *
 * Tick-based conversions divide by LINPROCFS_TICKRATE, which is stathz
 * when that is non-zero and hz otherwise.  The byte/page helpers are plain
 * shifts by 10 (1024) or PAGE_SHIFT.
 */
#define LINPROCFS_TICKRATE	(stathz != 0 ? stathz : hz)

/* ticks to jiffies (1/100 s), as a signed long */
#define T2J(x)	((long)((100ULL * (x)) / LINPROCFS_TICKRATE))
/* ticks to centiseconds, as an unsigned long */
#define T2CS(x)	((unsigned long)((100ULL * (x)) / LINPROCFS_TICKRATE))
/* ticks to whole seconds */
#define T2S(x)	((x) / LINPROCFS_TICKRATE)
/* bytes to kbytes */
#define B2K(x)	((x) >> 10)
/* bytes to pages */
#define B2P(x)	((x) >> PAGE_SHIFT)
/* pages to bytes */
#define P2B(x)	((x) << PAGE_SHIFT)
/* pages to kbytes */
#define P2K(x)	((x) << (PAGE_SHIFT - 10))
/* pointer to a timeval to 1/100ths of a second */
#define TV2J(x)	((x)->tv_sec * 100UL + (x)->tv_usec / 10000)
123 
/**
 * @brief Mapping of ki_stat in struct kinfo_proc to the linux state
 *
 * The linux procfs state field displays one of the characters RSDZTW to
 * denote running, sleeping in an interruptible wait, waiting in an
 * uninterruptible disk sleep, a zombie process, process is being traced
 * or stopped, or process is paging respectively.
 *
 * Our struct kinfo_proc contains the variable ki_stat which contains a
 * value out of SIDL, SRUN, SSLEEP, SSTOP, SZOMB, SWAIT and SLOCK.
 *
 * This character array is indexed with (ki_stat - 1) and tries to map our
 * states to suitable linux states.  Note that sizeof(linux_state) also
 * counts the terminating NUL, so the number of mapped states is
 * sizeof(linux_state) - 1.
 *
 * The table is never written to, hence const.
 */
static const char linux_state[] = "RRSTZDD";
139 
140 /*
141  * Filler function for proc/meminfo
142  */
143 static int
144 linprocfs_domeminfo(PFS_FILL_ARGS)
145 {
146 	unsigned long memtotal;		/* total memory in bytes */
147 	unsigned long memused;		/* used memory in bytes */
148 	unsigned long memfree;		/* free memory in bytes */
149 	unsigned long buffers, cached;	/* buffer / cache memory ??? */
150 	unsigned long long swaptotal;	/* total swap space in bytes */
151 	unsigned long long swapused;	/* used swap space in bytes */
152 	unsigned long long swapfree;	/* free swap space in bytes */
153 	int i, j;
154 
155 	memtotal = physmem * PAGE_SIZE;
156 	/*
157 	 * The correct thing here would be:
158 	 *
159 	memfree = vm_free_count() * PAGE_SIZE;
160 	memused = memtotal - memfree;
161 	 *
162 	 * but it might mislead linux binaries into thinking there
163 	 * is very little memory left, so we cheat and tell them that
164 	 * all memory that isn't wired down is free.
165 	 */
166 	memused = vm_wire_count() * PAGE_SIZE;
167 	memfree = memtotal - memused;
168 	swap_pager_status(&i, &j);
169 	swaptotal = (unsigned long long)i * PAGE_SIZE;
170 	swapused = (unsigned long long)j * PAGE_SIZE;
171 	swapfree = swaptotal - swapused;
172 	/*
173 	 * We'd love to be able to write:
174 	 *
175 	buffers = bufspace;
176 	 *
177 	 * but bufspace is internal to vfs_bio.c and we don't feel
178 	 * like unstaticizing it just for linprocfs's sake.
179 	 */
180 	buffers = 0;
181 	cached = vm_inactive_count() * PAGE_SIZE;
182 
183 	sbuf_printf(sb,
184 	    "MemTotal: %9lu kB\n"
185 	    "MemFree:  %9lu kB\n"
186 	    "Buffers:  %9lu kB\n"
187 	    "Cached:   %9lu kB\n"
188 	    "SwapTotal:%9llu kB\n"
189 	    "SwapFree: %9llu kB\n",
190 	    B2K(memtotal), B2K(memfree), B2K(buffers),
191 	    B2K(cached), B2K(swaptotal), B2K(swapfree));
192 
193 	return (0);
194 }
195 
196 #if defined(__i386__) || defined(__amd64__)
197 /*
198  * Filler function for proc/cpuinfo (i386 & amd64 version)
199  */
200 static int
201 linprocfs_docpuinfo(PFS_FILL_ARGS)
202 {
203 	int hw_model[2];
204 	char model[128];
205 	uint64_t freq;
206 	size_t size;
207 	u_int cache_size[4];
208 	int fqmhz, fqkhz;
209 	int i, j;
210 
211 	/*
212 	 * We default the flags to include all non-conflicting flags,
213 	 * and the Intel versions of conflicting flags.
214 	 */
215 	static char *cpu_feature_names[] = {
216 		/*  0 */ "fpu", "vme", "de", "pse",
217 		/*  4 */ "tsc", "msr", "pae", "mce",
218 		/*  8 */ "cx8", "apic", "", "sep",
219 		/* 12 */ "mtrr", "pge", "mca", "cmov",
220 		/* 16 */ "pat", "pse36", "pn", "clflush",
221 		/* 20 */ "", "dts", "acpi", "mmx",
222 		/* 24 */ "fxsr", "sse", "sse2", "ss",
223 		/* 28 */ "ht", "tm", "ia64", "pbe"
224 	};
225 
226 	static char *amd_feature_names[] = {
227 		/*  0 */ "", "", "", "",
228 		/*  4 */ "", "", "", "",
229 		/*  8 */ "", "", "", "syscall",
230 		/* 12 */ "", "", "", "",
231 		/* 16 */ "", "", "", "mp",
232 		/* 20 */ "nx", "", "mmxext", "",
233 		/* 24 */ "", "fxsr_opt", "pdpe1gb", "rdtscp",
234 		/* 28 */ "", "lm", "3dnowext", "3dnow"
235 	};
236 
237 	static char *cpu_feature2_names[] = {
238 		/*  0 */ "pni", "pclmulqdq", "dtes3", "monitor",
239 		/*  4 */ "ds_cpl", "vmx", "smx", "est",
240 		/*  8 */ "tm2", "ssse3", "cid", "sdbg",
241 		/* 12 */ "fma", "cx16", "xptr", "pdcm",
242 		/* 16 */ "", "pcid", "dca", "sse4_1",
243 		/* 20 */ "sse4_2", "x2apic", "movbe", "popcnt",
244 		/* 24 */ "tsc_deadline_timer", "aes", "xsave", "",
245 		/* 28 */ "avx", "f16c", "rdrand", "hypervisor"
246 	};
247 
248 	static char *amd_feature2_names[] = {
249 		/*  0 */ "lahf_lm", "cmp_legacy", "svm", "extapic",
250 		/*  4 */ "cr8_legacy", "abm", "sse4a", "misalignsse",
251 		/*  8 */ "3dnowprefetch", "osvw", "ibs", "xop",
252 		/* 12 */ "skinit", "wdt", "", "lwp",
253 		/* 16 */ "fma4", "tce", "", "nodeid_msr",
254 		/* 20 */ "", "tbm", "topoext", "perfctr_core",
255 		/* 24 */ "perfctr_nb", "", "bpext", "ptsc",
256 		/* 28 */ "perfctr_llc", "mwaitx", "", ""
257 	};
258 
259 	static char *cpu_stdext_feature_names[] = {
260 		/*  0 */ "fsgsbase", "tsc_adjust", "", "bmi1",
261 		/*  4 */ "hle", "avx2", "", "smep",
262 		/*  8 */ "bmi2", "erms", "invpcid", "rtm",
263 		/* 12 */ "cqm", "", "mpx", "rdt_a",
264 		/* 16 */ "avx512f", "avx512dq", "rdseed", "adx",
265 		/* 20 */ "smap", "avx512ifma", "", "clflushopt",
266 		/* 24 */ "clwb", "intel_pt", "avx512pf", "avx512er",
267 		/* 28 */ "avx512cd", "sha_ni", "avx512bw", "avx512vl"
268 	};
269 
270 	static char *power_flags[] = {
271 		"ts",           "fid",          "vid",
272 		"ttp",          "tm",           "stc",
273 		"100mhzsteps",  "hwpstate",     "",
274 		"cpb",          "eff_freq_ro",  "proc_feedback",
275 		"acc_power",
276 	};
277 
278 	hw_model[0] = CTL_HW;
279 	hw_model[1] = HW_MODEL;
280 	model[0] = '\0';
281 	size = sizeof(model);
282 	if (kernel_sysctl(td, hw_model, 2, &model, &size, 0, 0, 0, 0) != 0)
283 		strcpy(model, "unknown");
284 #ifdef __i386__
285 	switch (cpu_vendor_id) {
286 	case CPU_VENDOR_AMD:
287 		if (cpu_class < CPUCLASS_686)
288 			cpu_feature_names[16] = "fcmov";
289 		break;
290 	case CPU_VENDOR_CYRIX:
291 		cpu_feature_names[24] = "cxmmx";
292 		break;
293 	}
294 #endif
295 	if (cpu_exthigh >= 0x80000006)
296 		do_cpuid(0x80000006, cache_size);
297 	else
298 		memset(cache_size, 0, sizeof(cache_size));
299 	for (i = 0; i < mp_ncpus; ++i) {
300 		fqmhz = 0;
301 		fqkhz = 0;
302 		freq = atomic_load_acq_64(&tsc_freq);
303 		if (freq != 0) {
304 			fqmhz = (freq + 4999) / 1000000;
305 			fqkhz = ((freq + 4999) / 10000) % 100;
306 		}
307 		sbuf_printf(sb,
308 		    "processor\t: %d\n"
309 		    "vendor_id\t: %.20s\n"
310 		    "cpu family\t: %u\n"
311 		    "model\t\t: %u\n"
312 		    "model name\t: %s\n"
313 		    "stepping\t: %u\n"
314 		    "cpu MHz\t\t: %d.%02d\n"
315 		    "cache size\t: %d KB\n"
316 		    "physical id\t: %d\n"
317 		    "siblings\t: %d\n"
318 		    "core id\t\t: %d\n"
319 		    "cpu cores\t: %d\n"
320 		    "apicid\t\t: %d\n"
321 		    "initial apicid\t: %d\n"
322 		    "fpu\t\t: %s\n"
323 		    "fpu_exception\t: %s\n"
324 		    "cpuid level\t: %d\n"
325 		    "wp\t\t: %s\n",
326 		    i, cpu_vendor, CPUID_TO_FAMILY(cpu_id),
327 		    CPUID_TO_MODEL(cpu_id), model, cpu_id & CPUID_STEPPING,
328 		    fqmhz, fqkhz,
329 		    (cache_size[2] >> 16), 0, mp_ncpus, i, mp_ncpus,
330 		    i, i, /*cpu_id & CPUID_LOCAL_APIC_ID ??*/
331 		    (cpu_feature & CPUID_FPU) ? "yes" : "no", "yes",
332 		    CPUID_TO_FAMILY(cpu_id), "yes");
333 		sbuf_cat(sb, "flags\t\t:");
334 		for (j = 0; j < nitems(cpu_feature_names); j++)
335 			if (cpu_feature & (1 << j) &&
336 			    cpu_feature_names[j][0] != '\0')
337 				sbuf_printf(sb, " %s", cpu_feature_names[j]);
338 		for (j = 0; j < nitems(amd_feature_names); j++)
339 			if (amd_feature & (1 << j) &&
340 			    amd_feature_names[j][0] != '\0')
341 				sbuf_printf(sb, " %s", amd_feature_names[j]);
342 		for (j = 0; j < nitems(cpu_feature2_names); j++)
343 			if (cpu_feature2 & (1 << j) &&
344 			    cpu_feature2_names[j][0] != '\0')
345 				sbuf_printf(sb, " %s", cpu_feature2_names[j]);
346 		for (j = 0; j < nitems(amd_feature2_names); j++)
347 			if (amd_feature2 & (1 << j) &&
348 			    amd_feature2_names[j][0] != '\0')
349 				sbuf_printf(sb, " %s", amd_feature2_names[j]);
350 		for (j = 0; j < nitems(cpu_stdext_feature_names); j++)
351 			if (cpu_stdext_feature & (1 << j) &&
352 			    cpu_stdext_feature_names[j][0] != '\0')
353 				sbuf_printf(sb, " %s",
354 				    cpu_stdext_feature_names[j]);
355 		sbuf_cat(sb, "\n");
356 		sbuf_printf(sb,
357 		    "bugs\t\t: %s\n"
358 		    "bogomips\t: %d.%02d\n"
359 		    "clflush size\t: %d\n"
360 		    "cache_alignment\t: %d\n"
361 		    "address sizes\t: %d bits physical, %d bits virtual\n",
362 #if defined(I586_CPU) && !defined(NO_F00F_HACK)
363 		    (has_f00f_bug) ? "Intel F00F" : "",
364 #else
365 		    "",
366 #endif
367 		    fqmhz, fqkhz,
368 		    cpu_clflush_line_size, cpu_clflush_line_size,
369 		    cpu_maxphyaddr,
370 		    (cpu_maxphyaddr > 32) ? 48 : 0);
371 		sbuf_cat(sb, "power management: ");
372 		for (j = 0; j < nitems(power_flags); j++)
373 			if (amd_pminfo & (1 << j))
374 				sbuf_printf(sb, " %s", power_flags[j]);
375 		sbuf_cat(sb, "\n\n");
376 
377 		/* XXX per-cpu vendor / class / model / id? */
378 	}
379 	sbuf_cat(sb, "\n");
380 
381 	return (0);
382 }
383 #else
384 /* ARM64TODO: implement non-stubbed linprocfs_docpuinfo */
385 static int
386 linprocfs_docpuinfo(PFS_FILL_ARGS)
387 {
388 	int i;
389 
390 	for (i = 0; i < mp_ncpus; ++i) {
391 		sbuf_printf(sb,
392 		    "processor\t: %d\n"
393 		    "BogoMIPS\t: %d.%02d\n",
394 		    i, 0, 0);
395 		sbuf_cat(sb, "Features\t: ");
396 		sbuf_cat(sb, "\n");
397 		sbuf_printf(sb,
398 		    "CPU implementer\t: \n"
399 		    "CPU architecture: \n"
400 		    "CPU variant\t: 0x%x\n"
401 		    "CPU part\t: 0x%x\n"
402 		    "CPU revision\t: %d\n",
403 		    0, 0, 0);
404 		sbuf_cat(sb, "\n");
405 	}
406 
407 	return (0);
408 }
409 #endif /* __i386__ || __amd64__ */
410 
411 /*
412  * Filler function for proc/mtab
413  *
414  * This file doesn't exist in Linux' procfs, but is included here so
415  * users can symlink /compat/linux/etc/mtab to /proc/mtab
416  */
417 static int
418 linprocfs_domtab(PFS_FILL_ARGS)
419 {
420 	struct nameidata nd;
421 	const char *lep;
422 	char *dlep, *flep, *mntto, *mntfrom, *fstype;
423 	size_t lep_len;
424 	int error;
425 	struct statfs *buf, *sp;
426 	size_t count;
427 
428 	/* resolve symlinks etc. in the emulation tree prefix */
429 	NDINIT(&nd, LOOKUP, FOLLOW, UIO_SYSSPACE, linux_emul_path, td);
430 	flep = NULL;
431 	error = namei(&nd);
432 	lep = linux_emul_path;
433 	if (error == 0) {
434 		if (vn_fullpath(td, nd.ni_vp, &dlep, &flep) == 0)
435 			lep = dlep;
436 		vrele(nd.ni_vp);
437 	}
438 	lep_len = strlen(lep);
439 
440 	buf = NULL;
441 	error = kern_getfsstat(td, &buf, SIZE_T_MAX, &count,
442 	    UIO_SYSSPACE, MNT_WAIT);
443 	if (error != 0) {
444 		free(buf, M_TEMP);
445 		free(flep, M_TEMP);
446 		return (error);
447 	}
448 
449 	for (sp = buf; count > 0; sp++, count--) {
450 		/* determine device name */
451 		mntfrom = sp->f_mntfromname;
452 
453 		/* determine mount point */
454 		mntto = sp->f_mntonname;
455 		if (strncmp(mntto, lep, lep_len) == 0 && mntto[lep_len] == '/')
456 			mntto += lep_len;
457 
458 		/* determine fs type */
459 		fstype = sp->f_fstypename;
460 		if (strcmp(fstype, pn->pn_info->pi_name) == 0)
461 			mntfrom = fstype = "proc";
462 		else if (strcmp(fstype, "procfs") == 0)
463 			continue;
464 
465 		if (strcmp(fstype, "autofs") == 0) {
466 			/*
467 			 * FreeBSD uses eg "map -hosts", whereas Linux
468 			 * expects just "-hosts".
469 			 */
470 			if (strncmp(mntfrom, "map ", 4) == 0)
471 				mntfrom += 4;
472 		}
473 
474 		if (strcmp(fstype, "linsysfs") == 0) {
475 			sbuf_printf(sb, "/sys %s sysfs %s", mntto,
476 			    sp->f_flags & MNT_RDONLY ? "ro" : "rw");
477 		} else {
478 			/* For Linux msdosfs is called vfat */
479 			if (strcmp(fstype, "msdosfs") == 0)
480 				fstype = "vfat";
481 			sbuf_printf(sb, "%s %s %s %s", mntfrom, mntto, fstype,
482 			    sp->f_flags & MNT_RDONLY ? "ro" : "rw");
483 		}
484 #define ADD_OPTION(opt, name) \
485 	if (sp->f_flags & (opt)) sbuf_printf(sb, "," name);
486 		ADD_OPTION(MNT_SYNCHRONOUS,	"sync");
487 		ADD_OPTION(MNT_NOEXEC,		"noexec");
488 		ADD_OPTION(MNT_NOSUID,		"nosuid");
489 		ADD_OPTION(MNT_UNION,		"union");
490 		ADD_OPTION(MNT_ASYNC,		"async");
491 		ADD_OPTION(MNT_SUIDDIR,		"suiddir");
492 		ADD_OPTION(MNT_NOSYMFOLLOW,	"nosymfollow");
493 		ADD_OPTION(MNT_NOATIME,		"noatime");
494 #undef ADD_OPTION
495 		/* a real Linux mtab will also show NFS options */
496 		sbuf_printf(sb, " 0 0\n");
497 	}
498 
499 	free(buf, M_TEMP);
500 	free(flep, M_TEMP);
501 	return (error);
502 }
503 
504 /*
505  * Filler function for proc/partitions
506  */
507 static int
508 linprocfs_dopartitions(PFS_FILL_ARGS)
509 {
510 	struct g_class *cp;
511 	struct g_geom *gp;
512 	struct g_provider *pp;
513 	int major, minor;
514 
515 	g_topology_lock();
516 	sbuf_printf(sb, "major minor  #blocks  name rio rmerge rsect "
517 	    "ruse wio wmerge wsect wuse running use aveq\n");
518 
519 	LIST_FOREACH(cp, &g_classes, class) {
520 		if (strcmp(cp->name, "DISK") == 0 ||
521 		    strcmp(cp->name, "PART") == 0)
522 			LIST_FOREACH(gp, &cp->geom, geom) {
523 				LIST_FOREACH(pp, &gp->provider, provider) {
524 					if (linux_driver_get_major_minor(
525 					    pp->name, &major, &minor) != 0) {
526 						major = 0;
527 						minor = 0;
528 					}
529 					sbuf_printf(sb, "%d %d %lld %s "
530 					    "%d %d %d %d %d "
531 					     "%d %d %d %d %d %d\n",
532 					     major, minor,
533 					     (long long)pp->mediasize, pp->name,
534 					     0, 0, 0, 0, 0,
535 					     0, 0, 0, 0, 0, 0);
536 				}
537 			}
538 	}
539 	g_topology_unlock();
540 
541 	return (0);
542 }
543 
544 /*
545  * Filler function for proc/stat
546  *
547  * Output depends on kernel version:
548  *
549  * v2.5.40 <=
550  *   user nice system idle
551  * v2.5.41
552  *   user nice system idle iowait
553  * v2.6.11
554  *   user nice system idle iowait irq softirq steal
555  * v2.6.24
556  *   user nice system idle iowait irq softirq steal guest
557  * v2.6.33 >=
558  *   user nice system idle iowait irq softirq steal guest guest_nice
559  */
560 static int
561 linprocfs_dostat(PFS_FILL_ARGS)
562 {
563 	struct pcpu *pcpu;
564 	long cp_time[CPUSTATES];
565 	long *cp;
566 	struct timeval boottime;
567 	int i;
568 	char *zero_pad;
569 	bool has_intr = true;
570 
571 	if (linux_kernver(td) >= LINUX_KERNVER(2,6,33)) {
572 		zero_pad = " 0 0 0 0\n";
573 	} else if (linux_kernver(td) >= LINUX_KERNVER(2,6,24)) {
574 		zero_pad = " 0 0 0\n";
575 	} else if (linux_kernver(td) >= LINUX_KERNVER(2,6,11)) {
576 		zero_pad = " 0 0\n";
577 	} else if (linux_kernver(td) >= LINUX_KERNVER(2,5,41)) {
578 		has_intr = false;
579 		zero_pad = " 0\n";
580 	} else {
581 		has_intr = false;
582 		zero_pad = "\n";
583 	}
584 
585 	read_cpu_time(cp_time);
586 	getboottime(&boottime);
587 	/* Parameters common to all versions */
588 	sbuf_printf(sb, "cpu %lu %lu %lu %lu",
589 	    T2J(cp_time[CP_USER]),
590 	    T2J(cp_time[CP_NICE]),
591 	    T2J(cp_time[CP_SYS]),
592 	    T2J(cp_time[CP_IDLE]));
593 
594 	/* Print interrupt stats if available */
595 	if (has_intr) {
596 		sbuf_printf(sb, " 0 %lu", T2J(cp_time[CP_INTR]));
597 	}
598 
599 	/* Pad out remaining fields depending on version */
600 	sbuf_printf(sb, "%s", zero_pad);
601 
602 	CPU_FOREACH(i) {
603 		pcpu = pcpu_find(i);
604 		cp = pcpu->pc_cp_time;
605 		sbuf_printf(sb, "cpu%d %lu %lu %lu %lu", i,
606 		    T2J(cp[CP_USER]),
607 		    T2J(cp[CP_NICE]),
608 		    T2J(cp[CP_SYS]),
609 		    T2J(cp[CP_IDLE]));
610 
611 		if (has_intr) {
612 			sbuf_printf(sb, " 0 %lu", T2J(cp[CP_INTR]));
613 		}
614 
615 		sbuf_printf(sb, "%s", zero_pad);
616 	}
617 	sbuf_printf(sb,
618 	    "disk 0 0 0 0\n"
619 	    "page %ju %ju\n"
620 	    "swap %ju %ju\n"
621 	    "intr %ju\n"
622 	    "ctxt %ju\n"
623 	    "btime %lld\n",
624 	    (uintmax_t)VM_CNT_FETCH(v_vnodepgsin),
625 	    (uintmax_t)VM_CNT_FETCH(v_vnodepgsout),
626 	    (uintmax_t)VM_CNT_FETCH(v_swappgsin),
627 	    (uintmax_t)VM_CNT_FETCH(v_swappgsout),
628 	    (uintmax_t)VM_CNT_FETCH(v_intr),
629 	    (uintmax_t)VM_CNT_FETCH(v_swtch),
630 	    (long long)boottime.tv_sec);
631 	return (0);
632 }
633 
634 static int
635 linprocfs_doswaps(PFS_FILL_ARGS)
636 {
637 	struct xswdev xsw;
638 	uintmax_t total, used;
639 	int n;
640 	char devname[SPECNAMELEN + 1];
641 
642 	sbuf_printf(sb, "Filename\t\t\t\tType\t\tSize\tUsed\tPriority\n");
643 	for (n = 0; ; n++) {
644 		if (swap_dev_info(n, &xsw, devname, sizeof(devname)) != 0)
645 			break;
646 		total = (uintmax_t)xsw.xsw_nblks * PAGE_SIZE / 1024;
647 		used  = (uintmax_t)xsw.xsw_used * PAGE_SIZE / 1024;
648 
649 		/*
650 		 * The space and not tab after the device name is on
651 		 * purpose.  Linux does so.
652 		 */
653 		sbuf_printf(sb, "/dev/%-34s unknown\t\t%jd\t%jd\t-1\n",
654 		    devname, total, used);
655 	}
656 	return (0);
657 }
658 
659 /*
660  * Filler function for proc/uptime
661  */
662 static int
663 linprocfs_douptime(PFS_FILL_ARGS)
664 {
665 	long cp_time[CPUSTATES];
666 	struct timeval tv;
667 
668 	getmicrouptime(&tv);
669 	read_cpu_time(cp_time);
670 	sbuf_printf(sb, "%lld.%02ld %ld.%02lu\n",
671 	    (long long)tv.tv_sec, tv.tv_usec / 10000,
672 	    T2S(cp_time[CP_IDLE] / mp_ncpus),
673 	    T2CS(cp_time[CP_IDLE] / mp_ncpus) % 100);
674 	return (0);
675 }
676 
/*
 * Get OS build date
 *
 * Appends the build identification to sb.  The code that would derive it
 * from the kernel `version' string is compiled out, so a fixed string is
 * always emitted.
 */
static void
linprocfs_osbuild(struct thread *td, struct sbuf *sb)
{
#if 0
	char osbuild[256];
	char *newline, *colon, *hash;

	strncpy(osbuild, version, 256);
	osbuild[255] = '\0';
	newline = strstr(osbuild, "\n");
	colon = strstr(osbuild, ":");
	hash = NULL;
	if (newline != NULL && colon != NULL) {
		*newline = *colon = '\0';
		hash = strstr(osbuild, "#");
	}
	if (hash != NULL) {
		sbuf_printf(sb, "%s%s", hash, colon + 1);
		return;
	}
#endif
	sbuf_cat(sb, "#4 Sun Dec 18 04:30:00 CET 1977");
}
702 
/*
 * Get OS builder
 *
 * Appends the builder identification to sb.  The code that would extract
 * it from the kernel `version' string is compiled out, so a fixed address
 * is always emitted.
 */
static void
linprocfs_osbuilder(struct thread *td, struct sbuf *sb)
{
#if 0
	char builder[256];
	char *cp;

	cp = strstr(version, "\n    ");
	if (cp != NULL) {
		strncpy(builder, cp + 5, 256);
		builder[255] = '\0';
		cp = strstr(builder, ":");
		if (cp != NULL) {
			*cp = '\0';
			sbuf_cat(sb, builder);
			return;
		}
	}
#endif
	sbuf_cat(sb, "des@freebsd.org");
}
727 
728 /*
729  * Filler function for proc/version
730  */
731 static int
732 linprocfs_doversion(PFS_FILL_ARGS)
733 {
734 	char osname[LINUX_MAX_UTSNAME];
735 	char osrelease[LINUX_MAX_UTSNAME];
736 
737 	linux_get_osname(td, osname);
738 	linux_get_osrelease(td, osrelease);
739 	sbuf_printf(sb, "%s version %s (", osname, osrelease);
740 	linprocfs_osbuilder(td, sb);
741 	sbuf_cat(sb, ") (gcc version " __VERSION__ ") ");
742 	linprocfs_osbuild(td, sb);
743 	sbuf_cat(sb, "\n");
744 
745 	return (0);
746 }
747 
748 /*
749  * Filler function for proc/loadavg
750  */
751 static int
752 linprocfs_doloadavg(PFS_FILL_ARGS)
753 {
754 
755 	sbuf_printf(sb,
756 	    "%d.%02d %d.%02d %d.%02d %d/%d %d\n",
757 	    (int)(averunnable.ldavg[0] / averunnable.fscale),
758 	    (int)(averunnable.ldavg[0] * 100 / averunnable.fscale % 100),
759 	    (int)(averunnable.ldavg[1] / averunnable.fscale),
760 	    (int)(averunnable.ldavg[1] * 100 / averunnable.fscale % 100),
761 	    (int)(averunnable.ldavg[2] / averunnable.fscale),
762 	    (int)(averunnable.ldavg[2] * 100 / averunnable.fscale % 100),
763 	    1,				/* number of running tasks */
764 	    nprocs,			/* number of tasks */
765 	    lastpid			/* the last pid */
766 	);
767 	return (0);
768 }
769 
770 /*
771  * Filler function for proc/pid/stat
772  */
773 static int
774 linprocfs_doprocstat(PFS_FILL_ARGS)
775 {
776 	struct kinfo_proc kp;
777 	struct timeval boottime;
778 	char state;
779 	static int ratelimit = 0;
780 	vm_offset_t startcode, startdata;
781 
782 	getboottime(&boottime);
783 	sx_slock(&proctree_lock);
784 	PROC_LOCK(p);
785 	fill_kinfo_proc(p, &kp);
786 	sx_sunlock(&proctree_lock);
787 	if (p->p_vmspace) {
788 	   startcode = (vm_offset_t)p->p_vmspace->vm_taddr;
789 	   startdata = (vm_offset_t)p->p_vmspace->vm_daddr;
790 	} else {
791 	   startcode = 0;
792 	   startdata = 0;
793 	}
794 	sbuf_printf(sb, "%d", p->p_pid);
795 #define PS_ADD(name, fmt, arg) sbuf_printf(sb, " " fmt, arg)
796 	PS_ADD("comm",		"(%s)",	p->p_comm);
797 	if (kp.ki_stat > sizeof(linux_state)) {
798 		state = 'R';
799 
800 		if (ratelimit == 0) {
801 			printf("linprocfs: don't know how to handle unknown FreeBSD state %d/%zd, mapping to R\n",
802 			    kp.ki_stat, sizeof(linux_state));
803 			++ratelimit;
804 		}
805 	} else
806 		state = linux_state[kp.ki_stat - 1];
807 	PS_ADD("state",		"%c",	state);
808 	PS_ADD("ppid",		"%d",	p->p_pptr ? p->p_pptr->p_pid : 0);
809 	PS_ADD("pgrp",		"%d",	p->p_pgid);
810 	PS_ADD("session",	"%d",	p->p_session->s_sid);
811 	PROC_UNLOCK(p);
812 	if (kp.ki_tdev == NODEV)
813 		PS_ADD("tty",	"%s",	"-1");
814 	else
815 		PS_ADD("tty",		"%ju",	(uintmax_t)kp.ki_tdev);
816 	PS_ADD("tpgid",		"%d",	kp.ki_tpgid);
817 	PS_ADD("flags",		"%u",	0); /* XXX */
818 	PS_ADD("minflt",	"%lu",	kp.ki_rusage.ru_minflt);
819 	PS_ADD("cminflt",	"%lu",	kp.ki_rusage_ch.ru_minflt);
820 	PS_ADD("majflt",	"%lu",	kp.ki_rusage.ru_majflt);
821 	PS_ADD("cmajflt",	"%lu",	kp.ki_rusage_ch.ru_majflt);
822 	PS_ADD("utime",		"%ld",	TV2J(&kp.ki_rusage.ru_utime));
823 	PS_ADD("stime",		"%ld",	TV2J(&kp.ki_rusage.ru_stime));
824 	PS_ADD("cutime",	"%ld",	TV2J(&kp.ki_rusage_ch.ru_utime));
825 	PS_ADD("cstime",	"%ld",	TV2J(&kp.ki_rusage_ch.ru_stime));
826 	PS_ADD("priority",	"%d",	kp.ki_pri.pri_user);
827 	PS_ADD("nice",		"%d",	kp.ki_nice); /* 19 (nicest) to -19 */
828 	PS_ADD("0",		"%d",	0); /* removed field */
829 	PS_ADD("itrealvalue",	"%d",	0); /* XXX */
830 	PS_ADD("starttime",	"%lu",	TV2J(&kp.ki_start) - TV2J(&boottime));
831 	PS_ADD("vsize",		"%ju",	P2K((uintmax_t)kp.ki_size));
832 	PS_ADD("rss",		"%ju",	(uintmax_t)kp.ki_rssize);
833 	PS_ADD("rlim",		"%lu",	kp.ki_rusage.ru_maxrss);
834 	PS_ADD("startcode",	"%ju",	(uintmax_t)startcode);
835 	PS_ADD("endcode",	"%ju",	(uintmax_t)startdata);
836 	PS_ADD("startstack",	"%u",	0); /* XXX */
837 	PS_ADD("kstkesp",	"%u",	0); /* XXX */
838 	PS_ADD("kstkeip",	"%u",	0); /* XXX */
839 	PS_ADD("signal",	"%u",	0); /* XXX */
840 	PS_ADD("blocked",	"%u",	0); /* XXX */
841 	PS_ADD("sigignore",	"%u",	0); /* XXX */
842 	PS_ADD("sigcatch",	"%u",	0); /* XXX */
843 	PS_ADD("wchan",		"%u",	0); /* XXX */
844 	PS_ADD("nswap",		"%lu",	kp.ki_rusage.ru_nswap);
845 	PS_ADD("cnswap",	"%lu",	kp.ki_rusage_ch.ru_nswap);
846 	PS_ADD("exitsignal",	"%d",	0); /* XXX */
847 	PS_ADD("processor",	"%u",	kp.ki_lastcpu);
848 	PS_ADD("rt_priority",	"%u",	0); /* XXX */ /* >= 2.5.19 */
849 	PS_ADD("policy",	"%u",	kp.ki_pri.pri_class); /* >= 2.5.19 */
850 #undef PS_ADD
851 	sbuf_putc(sb, '\n');
852 
853 	return (0);
854 }
855 
856 /*
857  * Filler function for proc/pid/statm
858  */
859 static int
860 linprocfs_doprocstatm(PFS_FILL_ARGS)
861 {
862 	struct kinfo_proc kp;
863 	segsz_t lsize;
864 
865 	sx_slock(&proctree_lock);
866 	PROC_LOCK(p);
867 	fill_kinfo_proc(p, &kp);
868 	PROC_UNLOCK(p);
869 	sx_sunlock(&proctree_lock);
870 
871 	/*
872 	 * See comments in linprocfs_doprocstatus() regarding the
873 	 * computation of lsize.
874 	 */
875 	/* size resident share trs drs lrs dt */
876 	sbuf_printf(sb, "%ju ", B2P((uintmax_t)kp.ki_size));
877 	sbuf_printf(sb, "%ju ", (uintmax_t)kp.ki_rssize);
878 	sbuf_printf(sb, "%ju ", (uintmax_t)0); /* XXX */
879 	sbuf_printf(sb, "%ju ",	(uintmax_t)kp.ki_tsize);
880 	sbuf_printf(sb, "%ju ", (uintmax_t)(kp.ki_dsize + kp.ki_ssize));
881 	lsize = B2P(kp.ki_size) - kp.ki_dsize -
882 	    kp.ki_ssize - kp.ki_tsize - 1;
883 	sbuf_printf(sb, "%ju ", (uintmax_t)lsize);
884 	sbuf_printf(sb, "%ju\n", (uintmax_t)0); /* XXX */
885 
886 	return (0);
887 }
888 
889 /*
890  * Filler function for proc/pid/status
891  */
892 static int
893 linprocfs_doprocstatus(PFS_FILL_ARGS)
894 {
895 	struct kinfo_proc kp;
896 	char *state;
897 	segsz_t lsize;
898 	struct thread *td2;
899 	struct sigacts *ps;
900 	l_sigset_t siglist, sigignore, sigcatch;
901 	int i;
902 
903 	sx_slock(&proctree_lock);
904 	PROC_LOCK(p);
905 	td2 = FIRST_THREAD_IN_PROC(p); /* XXXKSE pretend only one thread */
906 
907 	if (P_SHOULDSTOP(p)) {
908 		state = "T (stopped)";
909 	} else {
910 		switch(p->p_state) {
911 		case PRS_NEW:
912 			state = "I (idle)";
913 			break;
914 		case PRS_NORMAL:
915 			if (p->p_flag & P_WEXIT) {
916 				state = "X (exiting)";
917 				break;
918 			}
919 			switch(td2->td_state) {
920 			case TDS_INHIBITED:
921 				state = "S (sleeping)";
922 				break;
923 			case TDS_RUNQ:
924 			case TDS_RUNNING:
925 				state = "R (running)";
926 				break;
927 			default:
928 				state = "? (unknown)";
929 				break;
930 			}
931 			break;
932 		case PRS_ZOMBIE:
933 			state = "Z (zombie)";
934 			break;
935 		default:
936 			state = "? (unknown)";
937 			break;
938 		}
939 	}
940 
941 	fill_kinfo_proc(p, &kp);
942 	sx_sunlock(&proctree_lock);
943 
944 	sbuf_printf(sb, "Name:\t%s\n",		p->p_comm); /* XXX escape */
945 	sbuf_printf(sb, "State:\t%s\n",		state);
946 
947 	/*
948 	 * Credentials
949 	 */
950 	sbuf_printf(sb, "Tgid:\t%d\n",		p->p_pid);
951 	sbuf_printf(sb, "Pid:\t%d\n",		p->p_pid);
952 	sbuf_printf(sb, "PPid:\t%d\n",		kp.ki_ppid );
953 	sbuf_printf(sb, "TracerPid:\t%d\n",	kp.ki_tracer );
954 	sbuf_printf(sb, "Uid:\t%d %d %d %d\n",	p->p_ucred->cr_ruid,
955 						p->p_ucred->cr_uid,
956 						p->p_ucred->cr_svuid,
957 						/* FreeBSD doesn't have fsuid */
958 						p->p_ucred->cr_uid);
959 	sbuf_printf(sb, "Gid:\t%d %d %d %d\n",	p->p_ucred->cr_rgid,
960 						p->p_ucred->cr_gid,
961 						p->p_ucred->cr_svgid,
962 						/* FreeBSD doesn't have fsgid */
963 						p->p_ucred->cr_gid);
964 	sbuf_cat(sb, "Groups:\t");
965 	for (i = 0; i < p->p_ucred->cr_ngroups; i++)
966 		sbuf_printf(sb, "%d ",		p->p_ucred->cr_groups[i]);
967 	PROC_UNLOCK(p);
968 	sbuf_putc(sb, '\n');
969 
970 	/*
971 	 * Memory
972 	 *
973 	 * While our approximation of VmLib may not be accurate (I
974 	 * don't know of a simple way to verify it, and I'm not sure
975 	 * it has much meaning anyway), I believe it's good enough.
976 	 *
977 	 * The same code that could (I think) accurately compute VmLib
978 	 * could also compute VmLck, but I don't really care enough to
979 	 * implement it. Submissions are welcome.
980 	 */
981 	sbuf_printf(sb, "VmSize:\t%8ju kB\n",	B2K((uintmax_t)kp.ki_size));
982 	sbuf_printf(sb, "VmLck:\t%8u kB\n",	P2K(0)); /* XXX */
983 	sbuf_printf(sb, "VmRSS:\t%8ju kB\n",	P2K((uintmax_t)kp.ki_rssize));
984 	sbuf_printf(sb, "VmData:\t%8ju kB\n",	P2K((uintmax_t)kp.ki_dsize));
985 	sbuf_printf(sb, "VmStk:\t%8ju kB\n",	P2K((uintmax_t)kp.ki_ssize));
986 	sbuf_printf(sb, "VmExe:\t%8ju kB\n",	P2K((uintmax_t)kp.ki_tsize));
987 	lsize = B2P(kp.ki_size) - kp.ki_dsize -
988 	    kp.ki_ssize - kp.ki_tsize - 1;
989 	sbuf_printf(sb, "VmLib:\t%8ju kB\n",	P2K((uintmax_t)lsize));
990 
991 	/*
992 	 * Signal masks
993 	 */
994 	PROC_LOCK(p);
995 	bsd_to_linux_sigset(&p->p_siglist, &siglist);
996 	ps = p->p_sigacts;
997 	mtx_lock(&ps->ps_mtx);
998 	bsd_to_linux_sigset(&ps->ps_sigignore, &sigignore);
999 	bsd_to_linux_sigset(&ps->ps_sigcatch, &sigcatch);
1000 	mtx_unlock(&ps->ps_mtx);
1001 	PROC_UNLOCK(p);
1002 
1003 	sbuf_printf(sb, "SigPnd:\t%016jx\n",	siglist.__mask);
1004 	/*
1005 	 * XXX. SigBlk - target thread's signal mask, td_sigmask.
1006 	 * To implement SigBlk pseudofs should support proc/tid dir entries.
1007 	 */
1008 	sbuf_printf(sb, "SigBlk:\t%016x\n",	0);
1009 	sbuf_printf(sb, "SigIgn:\t%016jx\n",	sigignore.__mask);
1010 	sbuf_printf(sb, "SigCgt:\t%016jx\n",	sigcatch.__mask);
1011 
1012 	/*
1013 	 * Linux also prints the capability masks, but we don't have
1014 	 * capabilities yet, and when we do get them they're likely to
1015 	 * be meaningless to Linux programs, so we lie. XXX
1016 	 */
1017 	sbuf_printf(sb, "CapInh:\t%016x\n",	0);
1018 	sbuf_printf(sb, "CapPrm:\t%016x\n",	0);
1019 	sbuf_printf(sb, "CapEff:\t%016x\n",	0);
1020 
1021 	return (0);
1022 }
1023 
1024 
1025 /*
1026  * Filler function for proc/pid/cwd
1027  */
1028 static int
1029 linprocfs_doproccwd(PFS_FILL_ARGS)
1030 {
1031 	struct filedesc *fdp;
1032 	struct vnode *vp;
1033 	char *fullpath = "unknown";
1034 	char *freepath = NULL;
1035 
1036 	fdp = p->p_fd;
1037 	FILEDESC_SLOCK(fdp);
1038 	vp = fdp->fd_cdir;
1039 	if (vp != NULL)
1040 		VREF(vp);
1041 	FILEDESC_SUNLOCK(fdp);
1042 	vn_fullpath(td, vp, &fullpath, &freepath);
1043 	if (vp != NULL)
1044 		vrele(vp);
1045 	sbuf_printf(sb, "%s", fullpath);
1046 	if (freepath)
1047 		free(freepath, M_TEMP);
1048 	return (0);
1049 }
1050 
1051 /*
1052  * Filler function for proc/pid/root
1053  */
1054 static int
1055 linprocfs_doprocroot(PFS_FILL_ARGS)
1056 {
1057 	struct filedesc *fdp;
1058 	struct vnode *vp;
1059 	char *fullpath = "unknown";
1060 	char *freepath = NULL;
1061 
1062 	fdp = p->p_fd;
1063 	FILEDESC_SLOCK(fdp);
1064 	vp = jailed(p->p_ucred) ? fdp->fd_jdir : fdp->fd_rdir;
1065 	if (vp != NULL)
1066 		VREF(vp);
1067 	FILEDESC_SUNLOCK(fdp);
1068 	vn_fullpath(td, vp, &fullpath, &freepath);
1069 	if (vp != NULL)
1070 		vrele(vp);
1071 	sbuf_printf(sb, "%s", fullpath);
1072 	if (freepath)
1073 		free(freepath, M_TEMP);
1074 	return (0);
1075 }
1076 
1077 /*
1078  * Filler function for proc/pid/cmdline
1079  */
1080 static int
1081 linprocfs_doproccmdline(PFS_FILL_ARGS)
1082 {
1083 	int ret;
1084 
1085 	PROC_LOCK(p);
1086 	if ((ret = p_cansee(td, p)) != 0) {
1087 		PROC_UNLOCK(p);
1088 		return (ret);
1089 	}
1090 
1091 	/*
1092 	 * Mimic linux behavior and pass only processes with usermode
1093 	 * address space as valid.  Return zero silently otherwize.
1094 	 */
1095 	if (p->p_vmspace == &vmspace0) {
1096 		PROC_UNLOCK(p);
1097 		return (0);
1098 	}
1099 	if (p->p_args != NULL) {
1100 		sbuf_bcpy(sb, p->p_args->ar_args, p->p_args->ar_length);
1101 		PROC_UNLOCK(p);
1102 		return (0);
1103 	}
1104 
1105 	if ((p->p_flag & P_SYSTEM) != 0) {
1106 		PROC_UNLOCK(p);
1107 		return (0);
1108 	}
1109 
1110 	PROC_UNLOCK(p);
1111 
1112 	ret = proc_getargv(td, p, sb);
1113 	return (ret);
1114 }
1115 
1116 /*
1117  * Filler function for proc/pid/environ
1118  */
1119 static int
1120 linprocfs_doprocenviron(PFS_FILL_ARGS)
1121 {
1122 
1123 	/*
1124 	 * Mimic linux behavior and pass only processes with usermode
1125 	 * address space as valid.  Return zero silently otherwize.
1126 	 */
1127 	if (p->p_vmspace == &vmspace0)
1128 		return (0);
1129 
1130 	return (proc_getenvv(td, p, sb));
1131 }
1132 
/*
 * Format strings for one line of proc/pid/maps.  The two variants differ
 * only in the zero-padded width of the start and end addresses (8 hex
 * digits vs. 16).
 */
static char l32_map_str[] = "%08lx-%08lx %s%s%s%s %08lx %02x:%02x %lu%s%s\n";
static char l64_map_str[] = "%016lx-%016lx %s%s%s%s %08lx %02x:%02x %lu%s%s\n";
/* Pre-padded pseudo-names printed in place of a file path. */
static char vdso_str[] = "      [vdso]";
static char stack_str[] = "      [stack]";
1137 
1138 /*
1139  * Filler function for proc/pid/maps
1140  */
1141 static int
1142 linprocfs_doprocmaps(PFS_FILL_ARGS)
1143 {
1144 	struct vmspace *vm;
1145 	vm_map_t map;
1146 	vm_map_entry_t entry, tmp_entry;
1147 	vm_object_t obj, tobj, lobj;
1148 	vm_offset_t e_start, e_end;
1149 	vm_ooffset_t off;
1150 	vm_prot_t e_prot;
1151 	unsigned int last_timestamp;
1152 	char *name = "", *freename = NULL;
1153 	const char *l_map_str;
1154 	ino_t ino;
1155 	int ref_count, shadow_count, flags;
1156 	int error;
1157 	struct vnode *vp;
1158 	struct vattr vat;
1159 	bool private;
1160 
1161 	PROC_LOCK(p);
1162 	error = p_candebug(td, p);
1163 	PROC_UNLOCK(p);
1164 	if (error)
1165 		return (error);
1166 
1167 	if (uio->uio_rw != UIO_READ)
1168 		return (EOPNOTSUPP);
1169 
1170 	error = 0;
1171 	vm = vmspace_acquire_ref(p);
1172 	if (vm == NULL)
1173 		return (ESRCH);
1174 
1175 	if (SV_CURPROC_FLAG(SV_LP64))
1176 		l_map_str = l64_map_str;
1177 	else
1178 		l_map_str = l32_map_str;
1179 	map = &vm->vm_map;
1180 	vm_map_lock_read(map);
1181 	VM_MAP_ENTRY_FOREACH(entry, map) {
1182 		name = "";
1183 		freename = NULL;
1184 		if (entry->eflags & MAP_ENTRY_IS_SUB_MAP)
1185 			continue;
1186 		e_prot = entry->protection;
1187 		e_start = entry->start;
1188 		e_end = entry->end;
1189 		obj = entry->object.vm_object;
1190 		off = entry->offset;
1191 		for (lobj = tobj = obj; tobj != NULL;
1192 		    lobj = tobj, tobj = tobj->backing_object) {
1193 			VM_OBJECT_RLOCK(tobj);
1194 			off += lobj->backing_object_offset;
1195 			if (lobj != obj)
1196 				VM_OBJECT_RUNLOCK(lobj);
1197 		}
1198 		private = (entry->eflags & MAP_ENTRY_COW) != 0 || obj == NULL ||
1199 		    (obj->flags & OBJ_ANON) != 0;
1200 		last_timestamp = map->timestamp;
1201 		vm_map_unlock_read(map);
1202 		ino = 0;
1203 		if (lobj) {
1204 			vp = vm_object_vnode(lobj);
1205 			if (vp != NULL)
1206 				vref(vp);
1207 			if (lobj != obj)
1208 				VM_OBJECT_RUNLOCK(lobj);
1209 			flags = obj->flags;
1210 			ref_count = obj->ref_count;
1211 			shadow_count = obj->shadow_count;
1212 			VM_OBJECT_RUNLOCK(obj);
1213 			if (vp != NULL) {
1214 				vn_fullpath(td, vp, &name, &freename);
1215 				vn_lock(vp, LK_SHARED | LK_RETRY);
1216 				VOP_GETATTR(vp, &vat, td->td_ucred);
1217 				ino = vat.va_fileid;
1218 				vput(vp);
1219 			} else if (SV_PROC_ABI(p) == SV_ABI_LINUX) {
1220 				if (e_start == p->p_sysent->sv_shared_page_base)
1221 					name = vdso_str;
1222 				if (e_end == p->p_sysent->sv_usrstack)
1223 					name = stack_str;
1224 			}
1225 		} else {
1226 			flags = 0;
1227 			ref_count = 0;
1228 			shadow_count = 0;
1229 		}
1230 
1231 		/*
1232 		 * format:
1233 		 *  start, end, access, offset, major, minor, inode, name.
1234 		 */
1235 		error = sbuf_printf(sb, l_map_str,
1236 		    (u_long)e_start, (u_long)e_end,
1237 		    (e_prot & VM_PROT_READ)?"r":"-",
1238 		    (e_prot & VM_PROT_WRITE)?"w":"-",
1239 		    (e_prot & VM_PROT_EXECUTE)?"x":"-",
1240 		    private ? "p" : "s",
1241 		    (u_long)off,
1242 		    0,
1243 		    0,
1244 		    (u_long)ino,
1245 		    *name ? "     " : "",
1246 		    name
1247 		    );
1248 		if (freename)
1249 			free(freename, M_TEMP);
1250 		vm_map_lock_read(map);
1251 		if (error == -1) {
1252 			error = 0;
1253 			break;
1254 		}
1255 		if (last_timestamp != map->timestamp) {
1256 			/*
1257 			 * Look again for the entry because the map was
1258 			 * modified while it was unlocked.  Specifically,
1259 			 * the entry may have been clipped, merged, or deleted.
1260 			 */
1261 			vm_map_lookup_entry(map, e_end - 1, &tmp_entry);
1262 			entry = tmp_entry;
1263 		}
1264 	}
1265 	vm_map_unlock_read(map);
1266 	vmspace_free(vm);
1267 
1268 	return (error);
1269 }
1270 
/*
 * Criteria for interface name translation
 *
 * Evaluates to true when the interface's if_type is IFT_ETHER.  The
 * argument is parenthesized so that any pointer-valued expression
 * (e.g. "&ifnet" or "list + 1") can be passed safely.
 */
#define IFP_IS_ETH(ifp) ((ifp)->if_type == IFT_ETHER)
1275 
1276 static int
1277 linux_ifname(struct ifnet *ifp, char *buffer, size_t buflen)
1278 {
1279 	struct ifnet *ifscan;
1280 	int ethno;
1281 
1282 	IFNET_RLOCK_ASSERT();
1283 
1284 	/* Short-circuit non ethernet interfaces */
1285 	if (!IFP_IS_ETH(ifp))
1286 		return (strlcpy(buffer, ifp->if_xname, buflen));
1287 
1288 	/* Determine the (relative) unit number for ethernet interfaces */
1289 	ethno = 0;
1290 	CK_STAILQ_FOREACH(ifscan, &V_ifnet, if_link) {
1291 		if (ifscan == ifp)
1292 			return (snprintf(buffer, buflen, "eth%d", ethno));
1293 		if (IFP_IS_ETH(ifscan))
1294 			ethno++;
1295 	}
1296 
1297 	return (0);
1298 }
1299 
1300 /*
1301  * Filler function for proc/net/dev
1302  */
1303 static int
1304 linprocfs_donetdev(PFS_FILL_ARGS)
1305 {
1306 	char ifname[16]; /* XXX LINUX_IFNAMSIZ */
1307 	struct ifnet *ifp;
1308 
1309 	sbuf_printf(sb, "%6s|%58s|%s\n"
1310 	    "%6s|%58s|%58s\n",
1311 	    "Inter-", "   Receive", "  Transmit",
1312 	    " face",
1313 	    "bytes    packets errs drop fifo frame compressed multicast",
1314 	    "bytes    packets errs drop fifo colls carrier compressed");
1315 
1316 	CURVNET_SET(TD_TO_VNET(curthread));
1317 	IFNET_RLOCK();
1318 	CK_STAILQ_FOREACH(ifp, &V_ifnet, if_link) {
1319 		linux_ifname(ifp, ifname, sizeof ifname);
1320 		sbuf_printf(sb, "%6.6s: ", ifname);
1321 		sbuf_printf(sb, "%7ju %7ju %4ju %4ju %4lu %5lu %10lu %9ju ",
1322 		    (uintmax_t )ifp->if_get_counter(ifp, IFCOUNTER_IBYTES),
1323 		    (uintmax_t )ifp->if_get_counter(ifp, IFCOUNTER_IPACKETS),
1324 		    (uintmax_t )ifp->if_get_counter(ifp, IFCOUNTER_IERRORS),
1325 		    (uintmax_t )ifp->if_get_counter(ifp, IFCOUNTER_IQDROPS),
1326 							/* rx_missed_errors */
1327 		    0UL,				/* rx_fifo_errors */
1328 		    0UL,				/* rx_length_errors +
1329 							 * rx_over_errors +
1330 							 * rx_crc_errors +
1331 							 * rx_frame_errors */
1332 		    0UL,				/* rx_compressed */
1333 		    (uintmax_t )ifp->if_get_counter(ifp, IFCOUNTER_IMCASTS));
1334 							/* XXX-BZ rx only? */
1335 		sbuf_printf(sb, "%8ju %7ju %4ju %4ju %4lu %5ju %7lu %10lu\n",
1336 		    (uintmax_t )ifp->if_get_counter(ifp, IFCOUNTER_OBYTES),
1337 		    (uintmax_t )ifp->if_get_counter(ifp, IFCOUNTER_OPACKETS),
1338 		    (uintmax_t )ifp->if_get_counter(ifp, IFCOUNTER_OERRORS),
1339 		    (uintmax_t )ifp->if_get_counter(ifp, IFCOUNTER_OQDROPS),
1340 		    0UL,				/* tx_fifo_errors */
1341 		    (uintmax_t )ifp->if_get_counter(ifp, IFCOUNTER_COLLISIONS),
1342 		    0UL,				/* tx_carrier_errors +
1343 							 * tx_aborted_errors +
1344 							 * tx_window_errors +
1345 							 * tx_heartbeat_errors*/
1346 		    0UL);				/* tx_compressed */
1347 	}
1348 	IFNET_RUNLOCK();
1349 	CURVNET_RESTORE();
1350 
1351 	return (0);
1352 }
1353 
1354 /*
1355  * Filler function for proc/sys/kernel/osrelease
1356  */
1357 static int
1358 linprocfs_doosrelease(PFS_FILL_ARGS)
1359 {
1360 	char osrelease[LINUX_MAX_UTSNAME];
1361 
1362 	linux_get_osrelease(td, osrelease);
1363 	sbuf_printf(sb, "%s\n", osrelease);
1364 
1365 	return (0);
1366 }
1367 
1368 /*
1369  * Filler function for proc/sys/kernel/ostype
1370  */
1371 static int
1372 linprocfs_doostype(PFS_FILL_ARGS)
1373 {
1374 	char osname[LINUX_MAX_UTSNAME];
1375 
1376 	linux_get_osname(td, osname);
1377 	sbuf_printf(sb, "%s\n", osname);
1378 
1379 	return (0);
1380 }
1381 
1382 /*
1383  * Filler function for proc/sys/kernel/version
1384  */
1385 static int
1386 linprocfs_doosbuild(PFS_FILL_ARGS)
1387 {
1388 
1389 	linprocfs_osbuild(td, sb);
1390 	sbuf_cat(sb, "\n");
1391 	return (0);
1392 }
1393 
1394 /*
1395  * Filler function for proc/sys/kernel/msgmni
1396  */
1397 static int
1398 linprocfs_domsgmni(PFS_FILL_ARGS)
1399 {
1400 
1401 	sbuf_printf(sb, "%d\n", msginfo.msgmni);
1402 	return (0);
1403 }
1404 
1405 /*
1406  * Filler function for proc/sys/kernel/pid_max
1407  */
1408 static int
1409 linprocfs_dopid_max(PFS_FILL_ARGS)
1410 {
1411 
1412 	sbuf_printf(sb, "%i\n", PID_MAX);
1413 	return (0);
1414 }
1415 
1416 /*
1417  * Filler function for proc/sys/kernel/sem
1418  */
1419 static int
1420 linprocfs_dosem(PFS_FILL_ARGS)
1421 {
1422 
1423 	sbuf_printf(sb, "%d %d %d %d\n", seminfo.semmsl, seminfo.semmns,
1424 	    seminfo.semopm, seminfo.semmni);
1425 	return (0);
1426 }
1427 
1428 /*
1429  * Filler function for proc/sys/vm/min_free_kbytes
1430  *
1431  * This mirrors the approach in illumos to return zero for reads. Effectively,
1432  * it says, no memory is kept in reserve for "atomic allocations". This class
1433  * of allocation can be used at times when a thread cannot be suspended.
1434  */
1435 static int
1436 linprocfs_dominfree(PFS_FILL_ARGS)
1437 {
1438 
1439 	sbuf_printf(sb, "%d\n", 0);
1440 	return (0);
1441 }
1442 
/*
 * Filler function for proc/scsi/device_info
 *
 * Stub: writes nothing to the buffer and reports success, so the file
 * reads as empty.
 */
static int
linprocfs_doscsidevinfo(PFS_FILL_ARGS)
{

	/* Nothing to report. */
	return (0);
}
1452 
/*
 * Filler function for proc/scsi/scsi
 *
 * Stub: writes nothing to the buffer and reports success, so the file
 * reads as empty.
 */
static int
linprocfs_doscsiscsi(PFS_FILL_ARGS)
{

	/* Nothing to report. */
	return (0);
}
1462 
1463 /*
1464  * Filler function for proc/devices
1465  */
1466 static int
1467 linprocfs_dodevices(PFS_FILL_ARGS)
1468 {
1469 	char *char_devices;
1470 	sbuf_printf(sb, "Character devices:\n");
1471 
1472 	char_devices = linux_get_char_devices();
1473 	sbuf_printf(sb, "%s", char_devices);
1474 	linux_free_get_char_devices(char_devices);
1475 
1476 	sbuf_printf(sb, "\nBlock devices:\n");
1477 
1478 	return (0);
1479 }
1480 
1481 /*
1482  * Filler function for proc/cmdline
1483  */
1484 static int
1485 linprocfs_docmdline(PFS_FILL_ARGS)
1486 {
1487 
1488 	sbuf_printf(sb, "BOOT_IMAGE=%s", kernelname);
1489 	sbuf_printf(sb, " ro root=302\n");
1490 	return (0);
1491 }
1492 
1493 /*
1494  * Filler function for proc/filesystems
1495  */
1496 static int
1497 linprocfs_dofilesystems(PFS_FILL_ARGS)
1498 {
1499 	struct vfsconf *vfsp;
1500 
1501 	vfsconf_slock();
1502 	TAILQ_FOREACH(vfsp, &vfsconf, vfc_list) {
1503 		if (vfsp->vfc_flags & VFCF_SYNTHETIC)
1504 			sbuf_printf(sb, "nodev");
1505 		sbuf_printf(sb, "\t%s\n", vfsp->vfc_name);
1506 	}
1507 	vfsconf_sunlock();
1508 	return(0);
1509 }
1510 
/*
 * Filler function for proc/modules
 *
 * The listing code below is compiled out, so the file currently reads
 * as empty.
 */
static int
linprocfs_domodules(PFS_FILL_ARGS)
{
#if 0
	/* Disabled: one line per linker file (name, size, refcount). */
	struct linker_file *lf;

	TAILQ_FOREACH(lf, &linker_files, link) {
		sbuf_printf(sb, "%-20s%8lu%4d\n", lf->filename,
		    (unsigned long)lf->size, lf->refs);
	}
#endif

	return (0);
}
1527 
1528 /*
1529  * Filler function for proc/pid/fd
1530  */
1531 static int
1532 linprocfs_dofdescfs(PFS_FILL_ARGS)
1533 {
1534 
1535 	if (p == curproc)
1536 		sbuf_printf(sb, "/dev/fd");
1537 	else
1538 		sbuf_printf(sb, "unknown");
1539 	return (0);
1540 }
1541 
1542 /*
1543  * Filler function for proc/pid/limits
1544  */
1545 static const struct linux_rlimit_ident {
1546 	const char	*desc;
1547 	const char	*unit;
1548 	unsigned int	rlim_id;
1549 } linux_rlimits_ident[] = {
1550 	{ "Max cpu time",	"seconds",	RLIMIT_CPU },
1551 	{ "Max file size", 	"bytes",	RLIMIT_FSIZE },
1552 	{ "Max data size",	"bytes", 	RLIMIT_DATA },
1553 	{ "Max stack size",	"bytes", 	RLIMIT_STACK },
1554 	{ "Max core file size",  "bytes",	RLIMIT_CORE },
1555 	{ "Max resident set",	"bytes",	RLIMIT_RSS },
1556 	{ "Max processes",	"processes",	RLIMIT_NPROC },
1557 	{ "Max open files",	"files",	RLIMIT_NOFILE },
1558 	{ "Max locked memory",	"bytes",	RLIMIT_MEMLOCK },
1559 	{ "Max address space",	"bytes",	RLIMIT_AS },
1560 	{ "Max file locks",	"locks",	LINUX_RLIMIT_LOCKS },
1561 	{ "Max pending signals", "signals",	LINUX_RLIMIT_SIGPENDING },
1562 	{ "Max msgqueue size",	"bytes",	LINUX_RLIMIT_MSGQUEUE },
1563 	{ "Max nice priority", 		"",	LINUX_RLIMIT_NICE },
1564 	{ "Max realtime priority",	"",	LINUX_RLIMIT_RTPRIO },
1565 	{ "Max realtime timeout",	"us",	LINUX_RLIMIT_RTTIME },
1566 	{ 0, 0, 0 }
1567 };
1568 
1569 static int
1570 linprocfs_doproclimits(PFS_FILL_ARGS)
1571 {
1572 	const struct linux_rlimit_ident *li;
1573 	struct plimit *limp;
1574 	struct rlimit rl;
1575 	ssize_t size;
1576 	int res, error;
1577 
1578 	error = 0;
1579 
1580 	PROC_LOCK(p);
1581 	limp = lim_hold(p->p_limit);
1582 	PROC_UNLOCK(p);
1583 	size = sizeof(res);
1584 	sbuf_printf(sb, "%-26s%-21s%-21s%-21s\n", "Limit", "Soft Limit",
1585 			"Hard Limit", "Units");
1586 	for (li = linux_rlimits_ident; li->desc != NULL; ++li) {
1587 		switch (li->rlim_id)
1588 		{
1589 		case LINUX_RLIMIT_LOCKS:
1590 			/* FALLTHROUGH */
1591 		case LINUX_RLIMIT_RTTIME:
1592 			rl.rlim_cur = RLIM_INFINITY;
1593 			break;
1594 		case LINUX_RLIMIT_SIGPENDING:
1595 			error = kernel_sysctlbyname(td,
1596 			    "kern.sigqueue.max_pending_per_proc",
1597 			    &res, &size, 0, 0, 0, 0);
1598 			if (error != 0)
1599 				goto out;
1600 			rl.rlim_cur = res;
1601 			rl.rlim_max = res;
1602 			break;
1603 		case LINUX_RLIMIT_MSGQUEUE:
1604 			error = kernel_sysctlbyname(td,
1605 			    "kern.ipc.msgmnb", &res, &size, 0, 0, 0, 0);
1606 			if (error != 0)
1607 				goto out;
1608 			rl.rlim_cur = res;
1609 			rl.rlim_max = res;
1610 			break;
1611 		case LINUX_RLIMIT_NICE:
1612 			/* FALLTHROUGH */
1613 		case LINUX_RLIMIT_RTPRIO:
1614 			rl.rlim_cur = 0;
1615 			rl.rlim_max = 0;
1616 			break;
1617 		default:
1618 			rl = limp->pl_rlimit[li->rlim_id];
1619 			break;
1620 		}
1621 		if (rl.rlim_cur == RLIM_INFINITY)
1622 			sbuf_printf(sb, "%-26s%-21s%-21s%-10s\n",
1623 			    li->desc, "unlimited", "unlimited", li->unit);
1624 		else
1625 			sbuf_printf(sb, "%-26s%-21llu%-21llu%-10s\n",
1626 			    li->desc, (unsigned long long)rl.rlim_cur,
1627 			    (unsigned long long)rl.rlim_max, li->unit);
1628 	}
1629 out:
1630 	lim_free(limp);
1631 	return (error);
1632 }
1633 
1634 /*
1635  * Filler function for proc/sys/kernel/random/uuid
1636  */
1637 static int
1638 linprocfs_douuid(PFS_FILL_ARGS)
1639 {
1640 	struct uuid uuid;
1641 
1642 	kern_uuidgen(&uuid, 1);
1643 	sbuf_printf_uuid(sb, &uuid);
1644 	sbuf_printf(sb, "\n");
1645 	return(0);
1646 }
1647 
1648 /*
1649  * Filler function for proc/pid/auxv
1650  */
1651 static int
1652 linprocfs_doauxv(PFS_FILL_ARGS)
1653 {
1654 	struct sbuf *asb;
1655 	off_t buflen, resid;
1656 	int error;
1657 
1658 	/*
1659 	 * Mimic linux behavior and pass only processes with usermode
1660 	 * address space as valid. Return zero silently otherwise.
1661 	 */
1662 	if (p->p_vmspace == &vmspace0)
1663 		return (0);
1664 
1665 	if (uio->uio_resid == 0)
1666 		return (0);
1667 	if (uio->uio_offset < 0 || uio->uio_resid < 0)
1668 		return (EINVAL);
1669 
1670 	asb = sbuf_new_auto();
1671 	if (asb == NULL)
1672 		return (ENOMEM);
1673 	error = proc_getauxv(td, p, asb);
1674 	if (error == 0)
1675 		error = sbuf_finish(asb);
1676 
1677 	resid = sbuf_len(asb) - uio->uio_offset;
1678 	if (resid > uio->uio_resid)
1679 		buflen = uio->uio_resid;
1680 	else
1681 		buflen = resid;
1682 	if (buflen > IOSIZE_MAX)
1683 		return (EINVAL);
1684 	if (buflen > MAXPHYS)
1685 		buflen = MAXPHYS;
1686 	if (resid <= 0)
1687 		return (0);
1688 
1689 	if (error == 0)
1690 		error = uiomove(sbuf_data(asb) + uio->uio_offset, buflen, uio);
1691 	sbuf_delete(asb);
1692 	return (error);
1693 }
1694 
1695 /*
1696  * Constructor
1697  */
1698 static int
1699 linprocfs_init(PFS_INIT_ARGS)
1700 {
1701 	struct pfs_node *root;
1702 	struct pfs_node *dir;
1703 	struct pfs_node *sys;
1704 
1705 	root = pi->pi_root;
1706 
1707 	/* /proc/... */
1708 	pfs_create_file(root, "cmdline", &linprocfs_docmdline,
1709 	    NULL, NULL, NULL, PFS_RD);
1710 	pfs_create_file(root, "cpuinfo", &linprocfs_docpuinfo,
1711 	    NULL, NULL, NULL, PFS_RD);
1712 	pfs_create_file(root, "devices", &linprocfs_dodevices,
1713 	    NULL, NULL, NULL, PFS_RD);
1714 	pfs_create_file(root, "filesystems", &linprocfs_dofilesystems,
1715 	    NULL, NULL, NULL, PFS_RD);
1716 	pfs_create_file(root, "loadavg", &linprocfs_doloadavg,
1717 	    NULL, NULL, NULL, PFS_RD);
1718 	pfs_create_file(root, "meminfo", &linprocfs_domeminfo,
1719 	    NULL, NULL, NULL, PFS_RD);
1720 	pfs_create_file(root, "modules", &linprocfs_domodules,
1721 	    NULL, NULL, NULL, PFS_RD);
1722 	pfs_create_file(root, "mounts", &linprocfs_domtab,
1723 	    NULL, NULL, NULL, PFS_RD);
1724 	pfs_create_file(root, "mtab", &linprocfs_domtab,
1725 	    NULL, NULL, NULL, PFS_RD);
1726 	pfs_create_file(root, "partitions", &linprocfs_dopartitions,
1727 	    NULL, NULL, NULL, PFS_RD);
1728 	pfs_create_link(root, "self", &procfs_docurproc,
1729 	    NULL, NULL, NULL, 0);
1730 	pfs_create_file(root, "stat", &linprocfs_dostat,
1731 	    NULL, NULL, NULL, PFS_RD);
1732 	pfs_create_file(root, "swaps", &linprocfs_doswaps,
1733 	    NULL, NULL, NULL, PFS_RD);
1734 	pfs_create_file(root, "uptime", &linprocfs_douptime,
1735 	    NULL, NULL, NULL, PFS_RD);
1736 	pfs_create_file(root, "version", &linprocfs_doversion,
1737 	    NULL, NULL, NULL, PFS_RD);
1738 
1739 	/* /proc/net/... */
1740 	dir = pfs_create_dir(root, "net", NULL, NULL, NULL, 0);
1741 	pfs_create_file(dir, "dev", &linprocfs_donetdev,
1742 	    NULL, NULL, NULL, PFS_RD);
1743 
1744 	/* /proc/<pid>/... */
1745 	dir = pfs_create_dir(root, "pid", NULL, NULL, NULL, PFS_PROCDEP);
1746 	pfs_create_file(dir, "cmdline", &linprocfs_doproccmdline,
1747 	    NULL, NULL, NULL, PFS_RD);
1748 	pfs_create_link(dir, "cwd", &linprocfs_doproccwd,
1749 	    NULL, NULL, NULL, 0);
1750 	pfs_create_file(dir, "environ", &linprocfs_doprocenviron,
1751 	    NULL, &procfs_candebug, NULL, PFS_RD);
1752 	pfs_create_link(dir, "exe", &procfs_doprocfile,
1753 	    NULL, &procfs_notsystem, NULL, 0);
1754 	pfs_create_file(dir, "maps", &linprocfs_doprocmaps,
1755 	    NULL, NULL, NULL, PFS_RD);
1756 	pfs_create_file(dir, "mem", &procfs_doprocmem,
1757 	    procfs_attr_rw, &procfs_candebug, NULL, PFS_RDWR | PFS_RAW);
1758 	pfs_create_file(dir, "mounts", &linprocfs_domtab,
1759 	    NULL, NULL, NULL, PFS_RD);
1760 	pfs_create_link(dir, "root", &linprocfs_doprocroot,
1761 	    NULL, NULL, NULL, 0);
1762 	pfs_create_file(dir, "stat", &linprocfs_doprocstat,
1763 	    NULL, NULL, NULL, PFS_RD);
1764 	pfs_create_file(dir, "statm", &linprocfs_doprocstatm,
1765 	    NULL, NULL, NULL, PFS_RD);
1766 	pfs_create_file(dir, "status", &linprocfs_doprocstatus,
1767 	    NULL, NULL, NULL, PFS_RD);
1768 	pfs_create_link(dir, "fd", &linprocfs_dofdescfs,
1769 	    NULL, NULL, NULL, 0);
1770 	pfs_create_file(dir, "auxv", &linprocfs_doauxv,
1771 	    NULL, &procfs_candebug, NULL, PFS_RD|PFS_RAWRD);
1772 	pfs_create_file(dir, "limits", &linprocfs_doproclimits,
1773 	    NULL, NULL, NULL, PFS_RD);
1774 
1775 	/* /proc/scsi/... */
1776 	dir = pfs_create_dir(root, "scsi", NULL, NULL, NULL, 0);
1777 	pfs_create_file(dir, "device_info", &linprocfs_doscsidevinfo,
1778 	    NULL, NULL, NULL, PFS_RD);
1779 	pfs_create_file(dir, "scsi", &linprocfs_doscsiscsi,
1780 	    NULL, NULL, NULL, PFS_RD);
1781 
1782 	/* /proc/sys/... */
1783 	sys = pfs_create_dir(root, "sys", NULL, NULL, NULL, 0);
1784 	/* /proc/sys/kernel/... */
1785 	dir = pfs_create_dir(sys, "kernel", NULL, NULL, NULL, 0);
1786 	pfs_create_file(dir, "osrelease", &linprocfs_doosrelease,
1787 	    NULL, NULL, NULL, PFS_RD);
1788 	pfs_create_file(dir, "ostype", &linprocfs_doostype,
1789 	    NULL, NULL, NULL, PFS_RD);
1790 	pfs_create_file(dir, "version", &linprocfs_doosbuild,
1791 	    NULL, NULL, NULL, PFS_RD);
1792 	pfs_create_file(dir, "msgmni", &linprocfs_domsgmni,
1793 	    NULL, NULL, NULL, PFS_RD);
1794 	pfs_create_file(dir, "pid_max", &linprocfs_dopid_max,
1795 	    NULL, NULL, NULL, PFS_RD);
1796 	pfs_create_file(dir, "sem", &linprocfs_dosem,
1797 	    NULL, NULL, NULL, PFS_RD);
1798 
1799 	/* /proc/sys/kernel/random/... */
1800 	dir = pfs_create_dir(dir, "random", NULL, NULL, NULL, 0);
1801 	pfs_create_file(dir, "uuid", &linprocfs_douuid,
1802 	    NULL, NULL, NULL, PFS_RD);
1803 
1804 	/* /proc/sys/vm/.... */
1805 	dir = pfs_create_dir(sys, "vm", NULL, NULL, NULL, 0);
1806 	pfs_create_file(dir, "min_free_kbytes", &linprocfs_dominfree,
1807 	    NULL, NULL, NULL, PFS_RD);
1808 
1809 	return (0);
1810 }
1811 
/*
 * Destructor
 *
 * Has no work of its own: the nodes are left for pseudofs to garbage
 * collect.  Always returns 0.
 */
static int
linprocfs_uninit(PFS_INIT_ARGS)
{

	/* nothing to do, pseudofs will GC */
	return (0);
}
1822 
/*
 * Declare the linprocfs pseudofs filesystem with the VFCF_JAIL flag.
 * NOTE(review): the second argument is presumably the module version --
 * confirm against the PSEUDOFS() definition.
 */
PSEUDOFS(linprocfs, 1, VFCF_JAIL);
/*
 * Module dependencies.  On aarch64 and amd64 the dependency is on
 * linux_common; on every other architecture it is on linux.
 */
#if defined(__aarch64__) || defined(__amd64__)
MODULE_DEPEND(linprocfs, linux_common, 1, 1, 1);
#else
MODULE_DEPEND(linprocfs, linux, 1, 1, 1);
#endif
MODULE_DEPEND(linprocfs, procfs, 1, 1, 1);
MODULE_DEPEND(linprocfs, sysvmsg, 1, 1, 1);
MODULE_DEPEND(linprocfs, sysvsem, 1, 1, 1);
1832