xref: /freebsd/usr.bin/vmstat/vmstat.c (revision 4133f23624058951a3b66e3ad735de980a485f36)
1 /*-
2  * SPDX-License-Identifier: BSD-3-Clause
3  *
4  * Copyright (c) 1980, 1986, 1991, 1993
5  *	The Regents of the University of California.  All rights reserved.
6  *
7  * Redistribution and use in source and binary forms, with or without
8  * modification, are permitted provided that the following conditions
9  * are met:
10  * 1. Redistributions of source code must retain the above copyright
11  *    notice, this list of conditions and the following disclaimer.
12  * 2. Redistributions in binary form must reproduce the above copyright
13  *    notice, this list of conditions and the following disclaimer in the
14  *    documentation and/or other materials provided with the distribution.
15  * 3. Neither the name of the University nor the names of its contributors
16  *    may be used to endorse or promote products derived from this software
17  *    without specific prior written permission.
18  *
19  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
20  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
21  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
22  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
23  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
24  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
25  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
26  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
27  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29  * SUCH DAMAGE.
30  */
31 
32 #ifndef lint
33 static const char copyright[] =
34 "@(#) Copyright (c) 1980, 1986, 1991, 1993\n\
35 	The Regents of the University of California.  All rights reserved.\n";
36 #endif /* not lint */
37 
38 #if 0
39 #ifndef lint
40 static char sccsid[] = "@(#)vmstat.c	8.1 (Berkeley) 6/6/93";
41 #endif /* not lint */
42 #endif
43 
44 #include <sys/cdefs.h>
45 __FBSDID("$FreeBSD$");
46 
47 #include <sys/param.h>
48 #include <sys/proc.h>
49 #include <sys/uio.h>
50 #include <sys/namei.h>
51 #include <sys/malloc.h>
52 #include <sys/signal.h>
53 #include <sys/fcntl.h>
54 #include <sys/ioctl.h>
55 #include <sys/resource.h>
56 #include <sys/sysctl.h>
57 #include <sys/time.h>
58 #include <sys/user.h>
59 #define	_WANT_VMMETER
60 #include <sys/vmmeter.h>
61 #include <sys/pcpu.h>
62 
63 #include <vm/vm_param.h>
64 
65 #include <ctype.h>
66 #include <devstat.h>
67 #include <err.h>
68 #include <errno.h>
69 #include <inttypes.h>
70 #include <kvm.h>
71 #include <limits.h>
72 #include <memstat.h>
73 #include <nlist.h>
74 #include <paths.h>
75 #include <stdio.h>
76 #include <stdlib.h>
77 #include <string.h>
78 #include <sysexits.h>
79 #include <time.h>
80 #include <unistd.h>
81 #include <libutil.h>
82 #include <libxo/xo.h>
83 
84 #define VMSTAT_XO_VERSION "1"
85 
/*
 * Default match expression handed to devstat_buildmatch() by getdrivedata()
 * when the user named no devices and gave no -p patterns.
 */
static char da[] = "da";

/* Indexes into namelist[] below; one per kernel symbol that is looked up. */
enum x_stats { X_SUM, X_HZ, X_STATHZ, X_NCHSTATS, X_INTRNAMES, X_SINTRNAMES,
    X_INTRCNT, X_SINTRCNT, X_NINTRCNT };

/*
 * Kernel symbols resolved with kvm_nlist() when a kvm descriptor is open.
 * The final entry (n_name == NULL) terminates the list.  main() may rewrite
 * the X_SUM name to "_cnt" if "_vm_cnt" cannot be resolved.
 */
static struct nlist namelist[] = {
	[X_SUM] = { .n_name = "_vm_cnt", },
	[X_HZ] = { .n_name = "_hz", },
	[X_STATHZ] = { .n_name = "_stathz", },
	[X_NCHSTATS] = { .n_name = "_nchstats", },
	[X_INTRNAMES] = { .n_name = "_intrnames", },
	[X_SINTRNAMES] = { .n_name = "_sintrnames", },
	[X_INTRCNT] = { .n_name = "_intrcnt", },
	[X_SINTRCNT] = { .n_name = "_sintrcnt", },
	[X_NINTRCNT] = { .n_name = "_nintrcnt", },
	{ .n_name = NULL, },
};
103 
104 static struct devstat_match *matches;
105 static struct device_selection *dev_select;
106 static struct statinfo cur, last;
107 static devstat_select_mode select_mode;
108 static size_t size_cp_times;
109 static long *cur_cp_times, *last_cp_times;
110 static long generation, select_generation;
111 static int hz, hdrcnt, maxshowdevs;
112 static int num_devices, num_devices_specified;
113 static int num_matches, num_selected, num_selections;
114 static char **specified_devices;
115 
/*
 * Userland snapshot of the VM statistics, filled in by fill_vmmeter().
 * `sum' holds the latest sample and `osum' the previous one; dovmstat()
 * prints rates computed from the difference between the two.
 *
 * The uint64_t members are event counters; the u_int/u_long members are
 * page counts and thresholds.  v_free_severe is never filled in by
 * fill_vmmeter() (its sysctl fetch is commented out there).
 */
static struct __vmmeter {
	uint64_t v_swtch;
	uint64_t v_trap;
	uint64_t v_syscall;
	uint64_t v_intr;
	uint64_t v_soft;
	uint64_t v_vm_faults;
	uint64_t v_io_faults;
	uint64_t v_cow_faults;
	uint64_t v_cow_optim;
	uint64_t v_zfod;
	uint64_t v_ozfod;
	uint64_t v_swapin;
	uint64_t v_swapout;
	uint64_t v_swappgsin;
	uint64_t v_swappgsout;
	uint64_t v_vnodein;
	uint64_t v_vnodeout;
	uint64_t v_vnodepgsin;
	uint64_t v_vnodepgsout;
	uint64_t v_intrans;
	uint64_t v_reactivated;
	uint64_t v_pdwakeups;
	uint64_t v_pdpages;
	uint64_t v_pdshortfalls;
	uint64_t v_dfree;
	uint64_t v_pfree;
	uint64_t v_tfree;
	uint64_t v_forks;
	uint64_t v_vforks;
	uint64_t v_rforks;
	uint64_t v_kthreads;
	uint64_t v_forkpages;
	uint64_t v_vforkpages;
	uint64_t v_rforkpages;
	uint64_t v_kthreadpages;
	u_int v_page_size;
	u_int v_page_count;
	u_int v_free_reserved;
	u_int v_free_target;
	u_int v_free_min;
	u_int v_free_count;
	u_int v_wire_count;
	u_long v_user_wire_count;
	u_int v_active_count;
	u_int v_inactive_target;
	u_int v_inactive_count;
	u_int v_laundry_count;
	u_int v_pageout_free_min;
	u_int v_interrupt_free_min;
	u_int v_free_severe;
} sum, osum;
168 
#define	VMSTAT_DEFAULT_LINES	20	/* Default number of `winlines'. */
static volatile sig_atomic_t wresized;		/* Tty resized when non-zero. */
static int winlines = VMSTAT_DEFAULT_LINES; /* Current number of tty rows. */

/* Option state recorded by main() while parsing the command line. */
static int	aflag;		/* Incremented for each -a. */
static int	nflag;		/* Set when -n supplied maxshowdevs. */
static int	Pflag;		/* Incremented for each -P. */
static int	hflag;		/* isatty(1) by default; -h sets, -H clears. */

/* kvm descriptor; remains NULL unless main() opens one because -M was given. */
static kvm_t	*kd;

/* Bits of main()'s `todo' mask; each selects one report. */
#define	FORKSTAT	0x01	/* -f */
#define	INTRSTAT	0x02	/* -i */
#define	MEMSTAT		0x04	/* -m */
#define	SUMSTAT		0x08	/* -s */
#define	TIMESTAT	0x10
#define	VMSTAT		0x20	/* Default when no report option is given. */
#define	ZMEMSTAT	0x40	/* -z */
#define	OBJSTAT		0x80	/* -o */
188 
/* Forward declarations of this file's static functions. */
static void	cpustats(void);
static void	pcpustats(u_long, int);
static void	devstats(void);
static void	doforkst(void);
static void	dointr(unsigned int, int);
static void	doobjstat(void);
static void	dosum(void);
static void	dovmstat(unsigned int, int);
static void	domemstat_malloc(void);
static void	domemstat_zone(void);
static void	kread(int, void *, size_t);
static void	kreado(int, void *, size_t, size_t);
static void	kreadptr(uintptr_t, void *, size_t);
/* Signal handlers (installed by dovmstat()) and the resize helper. */
static void	needhdr(int);
static void	needresize(int);
static void	doresize(void);
static void	printhdr(int, u_long);
static void	usage(void);

static long	pct(long, long);
static long long	getuptime(void);

static char	**getdrivedata(char **);
212 
213 int
214 main(int argc, char *argv[])
215 {
216 	char *bp, *buf, *memf, *nlistf;
217 	float f;
218 	int bufsize, c, reps, todo;
219 	size_t len;
220 	unsigned int interval;
221 	char errbuf[_POSIX2_LINE_MAX];
222 
223 	memf = nlistf = NULL;
224 	interval = reps = todo = 0;
225 	maxshowdevs = 2;
226 	hflag = isatty(1);
227 
228 	argc = xo_parse_args(argc, argv);
229 	if (argc < 0)
230 		return (argc);
231 
232 	while ((c = getopt(argc, argv, "ac:fhHiM:mN:n:oPp:sw:z")) != -1) {
233 		switch (c) {
234 		case 'a':
235 			aflag++;
236 			break;
237 		case 'c':
238 			reps = atoi(optarg);
239 			break;
240 		case 'P':
241 			Pflag++;
242 			break;
243 		case 'f':
244 			todo |= FORKSTAT;
245 			break;
246 		case 'h':
247 			hflag = 1;
248 			break;
249 		case 'H':
250 			hflag = 0;
251 			break;
252 		case 'i':
253 			todo |= INTRSTAT;
254 			break;
255 		case 'M':
256 			memf = optarg;
257 			break;
258 		case 'm':
259 			todo |= MEMSTAT;
260 			break;
261 		case 'N':
262 			nlistf = optarg;
263 			break;
264 		case 'n':
265 			nflag = 1;
266 			maxshowdevs = atoi(optarg);
267 			if (maxshowdevs < 0)
268 				xo_errx(1, "number of devices %d is < 0",
269 				    maxshowdevs);
270 			break;
271 		case 'o':
272 			todo |= OBJSTAT;
273 			break;
274 		case 'p':
275 			if (devstat_buildmatch(optarg, &matches, &num_matches)
276 			    != 0)
277 				xo_errx(1, "%s", devstat_errbuf);
278 			break;
279 		case 's':
280 			todo |= SUMSTAT;
281 			break;
282 		case 'w':
283 			/* Convert to milliseconds. */
284 			f = atof(optarg);
285 			interval = f * 1000;
286 			break;
287 		case 'z':
288 			todo |= ZMEMSTAT;
289 			break;
290 		case '?':
291 		default:
292 			usage();
293 		}
294 	}
295 	argc -= optind;
296 	argv += optind;
297 
298 	xo_set_version(VMSTAT_XO_VERSION);
299 	if (todo == 0)
300 		todo = VMSTAT;
301 
302 	if (memf != NULL) {
303 		kd = kvm_openfiles(nlistf, memf, NULL, O_RDONLY, errbuf);
304 		if (kd == NULL)
305 			xo_errx(1, "kvm_openfiles: %s", errbuf);
306 	}
307 
308 retry_nlist:
309 	if (kd != NULL && (c = kvm_nlist(kd, namelist)) != 0) {
310 		if (c > 0) {
311 			bufsize = 0;
312 			len = 0;
313 
314 			/*
315 			 * 'cnt' was renamed to 'vm_cnt'.  If 'vm_cnt' is not
316 			 * found try looking up older 'cnt' symbol.
317 			 * */
318 			if (namelist[X_SUM].n_type == 0 &&
319 			    strcmp(namelist[X_SUM].n_name, "_vm_cnt") == 0) {
320 				namelist[X_SUM].n_name = "_cnt";
321 				goto retry_nlist;
322 			}
323 
324 			/*
325 			 * 'nintrcnt' doesn't exist in older kernels, but
326 			 * that isn't fatal.
327 			 */
328 			if (namelist[X_NINTRCNT].n_type == 0 && c == 1)
329 				goto nlist_ok;
330 
331 			for (c = 0; c < (int)(nitems(namelist)); c++)
332 				if (namelist[c].n_type == 0)
333 					bufsize += strlen(namelist[c].n_name)
334 					    + 1;
335 			bufsize += len + 1;
336 			buf = bp = alloca(bufsize);
337 
338 			for (c = 0; c < (int)(nitems(namelist)); c++)
339 				if (namelist[c].n_type == 0) {
340 					xo_error(" %s",
341 					    namelist[c].n_name);
342 					len = strlen(namelist[c].n_name);
343 					*bp++ = ' ';
344 					memcpy(bp, namelist[c].n_name, len);
345 					bp += len;
346 				}
347 			*bp = '\0';
348 			xo_error("undefined symbols:\n", buf);
349 		} else
350 			xo_warnx("kvm_nlist: %s", kvm_geterr(kd));
351 		xo_finish();
352 		exit(1);
353 	}
354 nlist_ok:
355 	if (kd && Pflag)
356 		xo_errx(1, "Cannot use -P with crash dumps");
357 
358 	if (todo & VMSTAT) {
359 		/*
360 		 * Make sure that the userland devstat version matches the
361 		 * kernel devstat version.  If not, exit and print a
362 		 * message informing the user of his mistake.
363 		 */
364 		if (devstat_checkversion(NULL) < 0)
365 			xo_errx(1, "%s", devstat_errbuf);
366 
367 
368 		argv = getdrivedata(argv);
369 	}
370 
371 	if (*argv) {
372 		f = atof(*argv);
373 		interval = f * 1000;
374 		if (*++argv)
375 			reps = atoi(*argv);
376 	}
377 
378 	if (interval) {
379 		if (!reps)
380 			reps = -1;
381 	} else if (reps)
382 		interval = 1 * 1000;
383 
384 	if (todo & FORKSTAT)
385 		doforkst();
386 	if (todo & MEMSTAT)
387 		domemstat_malloc();
388 	if (todo & ZMEMSTAT)
389 		domemstat_zone();
390 	if (todo & SUMSTAT)
391 		dosum();
392 	if (todo & OBJSTAT)
393 		doobjstat();
394 	if (todo & INTRSTAT)
395 		dointr(interval, reps);
396 	if (todo & VMSTAT)
397 		dovmstat(interval, reps);
398 	xo_finish();
399 	exit(0);
400 }
401 
/*
 * Read-only sysctlbyname() wrapper.  Any failure other than ENOMEM is
 * reported through xo_err(); the sysctlbyname() result is handed back to
 * the caller otherwise.
 */
static int
mysysctl(const char *name, void *oldp, size_t *oldlenp)
{
	int rv = sysctlbyname(name, oldp, oldlenp, NULL, 0);

	if (rv == 0 || errno == ENOMEM)
		return (rv);
	xo_err(1, "sysctl(%s)", name);
	return (rv);
}
412 
413 static char **
414 getdrivedata(char **argv)
415 {
416 
417 	if ((num_devices = devstat_getnumdevs(NULL)) < 0)
418 		xo_errx(1, "%s", devstat_errbuf);
419 
420 	cur.dinfo = (struct devinfo *)calloc(1, sizeof(struct devinfo));
421 	last.dinfo = (struct devinfo *)calloc(1, sizeof(struct devinfo));
422 
423 	if (devstat_getdevs(NULL, &cur) == -1)
424 		xo_errx(1, "%s", devstat_errbuf);
425 
426 	num_devices = cur.dinfo->numdevs;
427 	generation = cur.dinfo->generation;
428 
429 	specified_devices = malloc(sizeof(char *));
430 	for (num_devices_specified = 0; *argv; ++argv) {
431 		if (isdigit(**argv))
432 			break;
433 		num_devices_specified++;
434 		specified_devices = reallocf(specified_devices,
435 		    sizeof(char *) * num_devices_specified);
436 		if (specified_devices == NULL) {
437 			xo_errx(1, "%s", "reallocf (specified_devices)");
438 		}
439 		specified_devices[num_devices_specified - 1] = *argv;
440 	}
441 	dev_select = NULL;
442 
443 	if (nflag == 0 && maxshowdevs < num_devices_specified)
444 		maxshowdevs = num_devices_specified;
445 
446 	/*
447 	 * People are generally only interested in disk statistics when
448 	 * they're running vmstat.  So, that's what we're going to give
449 	 * them if they don't specify anything by default.  We'll also give
450 	 * them any other random devices in the system so that we get to
451 	 * maxshowdevs devices, if that many devices exist.  If the user
452 	 * specifies devices on the command line, either through a pattern
453 	 * match or by naming them explicitly, we will give the user only
454 	 * those devices.
455 	 */
456 	if ((num_devices_specified == 0) && (num_matches == 0)) {
457 		if (devstat_buildmatch(da, &matches, &num_matches) != 0)
458 			xo_errx(1, "%s", devstat_errbuf);
459 		select_mode = DS_SELECT_ADD;
460 	} else
461 		select_mode = DS_SELECT_ONLY;
462 
463 	/*
464 	 * At this point, selectdevs will almost surely indicate that the
465 	 * device list has changed, so we don't look for return values of 0
466 	 * or 1.  If we get back -1, though, there is an error.
467 	 */
468 	if (devstat_selectdevs(&dev_select, &num_selected, &num_selections,
469 	    &select_generation, generation, cur.dinfo->devices,
470 	    num_devices, matches, num_matches, specified_devices,
471 	    num_devices_specified, select_mode,
472 	    maxshowdevs, 0) == -1)
473 		xo_errx(1, "%s", devstat_errbuf);
474 
475 	return(argv);
476 }
477 
478 /* Return system uptime in nanoseconds */
479 static long long
480 getuptime(void)
481 {
482 	struct timespec sp;
483 
484 	(void)clock_gettime(CLOCK_UPTIME, &sp);
485 	return((long long)sp.tv_sec * 1000000000LL + sp.tv_nsec);
486 }
487 
488 static void
489 fill_vmmeter(struct __vmmeter *vmmp)
490 {
491 	struct vmmeter vm_cnt;
492 	size_t size;
493 
494 	if (kd != NULL) {
495 		kread(X_SUM, &vm_cnt, sizeof(vm_cnt));
496 #define	GET_COUNTER(name) \
497 		vmmp->name = kvm_counter_u64_fetch(kd, (u_long)vm_cnt.name)
498 		GET_COUNTER(v_swtch);
499 		GET_COUNTER(v_trap);
500 		GET_COUNTER(v_syscall);
501 		GET_COUNTER(v_intr);
502 		GET_COUNTER(v_soft);
503 		GET_COUNTER(v_vm_faults);
504 		GET_COUNTER(v_io_faults);
505 		GET_COUNTER(v_cow_faults);
506 		GET_COUNTER(v_cow_optim);
507 		GET_COUNTER(v_zfod);
508 		GET_COUNTER(v_ozfod);
509 		GET_COUNTER(v_swapin);
510 		GET_COUNTER(v_swapout);
511 		GET_COUNTER(v_swappgsin);
512 		GET_COUNTER(v_swappgsout);
513 		GET_COUNTER(v_vnodein);
514 		GET_COUNTER(v_vnodeout);
515 		GET_COUNTER(v_vnodepgsin);
516 		GET_COUNTER(v_vnodepgsout);
517 		GET_COUNTER(v_intrans);
518 		GET_COUNTER(v_tfree);
519 		GET_COUNTER(v_forks);
520 		GET_COUNTER(v_vforks);
521 		GET_COUNTER(v_rforks);
522 		GET_COUNTER(v_kthreads);
523 		GET_COUNTER(v_forkpages);
524 		GET_COUNTER(v_vforkpages);
525 		GET_COUNTER(v_rforkpages);
526 		GET_COUNTER(v_kthreadpages);
527 #undef GET_COUNTER
528 	} else {
529 #define GET_VM_STATS(cat, name)	do {					\
530 	size = sizeof(vmmp->name);					\
531 	mysysctl("vm.stats." #cat "." #name, &vmmp->name, &size);	\
532 } while (0)
533 		/* sys */
534 		GET_VM_STATS(sys, v_swtch);
535 		GET_VM_STATS(sys, v_trap);
536 		GET_VM_STATS(sys, v_syscall);
537 		GET_VM_STATS(sys, v_intr);
538 		GET_VM_STATS(sys, v_soft);
539 
540 		/* vm */
541 		GET_VM_STATS(vm, v_vm_faults);
542 		GET_VM_STATS(vm, v_io_faults);
543 		GET_VM_STATS(vm, v_cow_faults);
544 		GET_VM_STATS(vm, v_cow_optim);
545 		GET_VM_STATS(vm, v_zfod);
546 		GET_VM_STATS(vm, v_ozfod);
547 		GET_VM_STATS(vm, v_swapin);
548 		GET_VM_STATS(vm, v_swapout);
549 		GET_VM_STATS(vm, v_swappgsin);
550 		GET_VM_STATS(vm, v_swappgsout);
551 		GET_VM_STATS(vm, v_vnodein);
552 		GET_VM_STATS(vm, v_vnodeout);
553 		GET_VM_STATS(vm, v_vnodepgsin);
554 		GET_VM_STATS(vm, v_vnodepgsout);
555 		GET_VM_STATS(vm, v_intrans);
556 		GET_VM_STATS(vm, v_reactivated);
557 		GET_VM_STATS(vm, v_pdwakeups);
558 		GET_VM_STATS(vm, v_pdpages);
559 		GET_VM_STATS(vm, v_pdshortfalls);
560 		GET_VM_STATS(vm, v_dfree);
561 		GET_VM_STATS(vm, v_pfree);
562 		GET_VM_STATS(vm, v_tfree);
563 		GET_VM_STATS(vm, v_page_size);
564 		GET_VM_STATS(vm, v_page_count);
565 		GET_VM_STATS(vm, v_free_reserved);
566 		GET_VM_STATS(vm, v_free_target);
567 		GET_VM_STATS(vm, v_free_min);
568 		GET_VM_STATS(vm, v_free_count);
569 		GET_VM_STATS(vm, v_wire_count);
570 		GET_VM_STATS(vm, v_user_wire_count);
571 		GET_VM_STATS(vm, v_active_count);
572 		GET_VM_STATS(vm, v_inactive_target);
573 		GET_VM_STATS(vm, v_inactive_count);
574 		GET_VM_STATS(vm, v_laundry_count);
575 		GET_VM_STATS(vm, v_pageout_free_min);
576 		GET_VM_STATS(vm, v_interrupt_free_min);
577 		/*GET_VM_STATS(vm, v_free_severe);*/
578 		GET_VM_STATS(vm, v_forks);
579 		GET_VM_STATS(vm, v_vforks);
580 		GET_VM_STATS(vm, v_rforks);
581 		GET_VM_STATS(vm, v_kthreads);
582 		GET_VM_STATS(vm, v_forkpages);
583 		GET_VM_STATS(vm, v_vforkpages);
584 		GET_VM_STATS(vm, v_rforkpages);
585 		GET_VM_STATS(vm, v_kthreadpages);
586 #undef GET_VM_STATS
587 	}
588 }
589 
590 static void
591 fill_vmtotal(struct vmtotal *vmtp)
592 {
593 	size_t size;
594 
595 	if (kd != NULL) {
596 		/* XXX fill vmtp */
597 		xo_errx(1, "not implemented");
598 	} else {
599 		size = sizeof(*vmtp);
600 		mysysctl("vm.vmtotal", vmtp, &size);
601 		if (size != sizeof(*vmtp))
602 			xo_errx(1, "vm.total size mismatch");
603 	}
604 }
605 
606 /* Determine how many cpu columns, and what index they are in kern.cp_times */
607 static int
608 getcpuinfo(u_long *maskp, int *maxidp)
609 {
610 	long *times;
611 	u_long mask;
612 	size_t size;
613 	int empty, i, j, maxcpu, maxid, ncpus;
614 
615 	if (kd != NULL)
616 		xo_errx(1, "not implemented");
617 	mask = 0;
618 	ncpus = 0;
619 	size = sizeof(maxcpu);
620 	mysysctl("kern.smp.maxcpus", &maxcpu, &size);
621 	if (size != sizeof(maxcpu))
622 		xo_errx(1, "sysctl kern.smp.maxcpus");
623 	size = sizeof(long) * maxcpu * CPUSTATES;
624 	times = malloc(size);
625 	if (times == NULL)
626 		xo_err(1, "malloc %zd bytes", size);
627 	mysysctl("kern.cp_times", times, &size);
628 	maxid = (size / CPUSTATES / sizeof(long)) - 1;
629 	for (i = 0; i <= maxid; i++) {
630 		empty = 1;
631 		for (j = 0; empty && j < CPUSTATES; j++) {
632 			if (times[i * CPUSTATES + j] != 0)
633 				empty = 0;
634 		}
635 		if (!empty) {
636 			mask |= (1ul << i);
637 			ncpus++;
638 		}
639 	}
640 	if (maskp)
641 		*maskp = mask;
642 	if (maxidp)
643 		*maxidp = maxid;
644 	return (ncpus);
645 }
646 
647 
648 static void
649 prthuman(const char *name, uint64_t val, int size, int flags)
650 {
651 	char buf[10];
652 	char fmt[128];
653 
654 	snprintf(fmt, sizeof(fmt), "{:%s/%%*s}", name);
655 
656 	if (size < 5 || size > 9)
657 		xo_errx(1, "doofus");
658 	flags |= HN_NOSPACE | HN_DECIMAL;
659 	humanize_number(buf, size, val, "", HN_AUTOSCALE, flags);
660 	xo_attr("value", "%ju", (uintmax_t) val);
661 	xo_emit(fmt, size, buf);
662 }
663 
664 static void
665 dovmstat(unsigned int interval, int reps)
666 {
667 	struct clockinfo clockrate;
668 	struct vmtotal total;
669 	struct devinfo *tmp_dinfo;
670 	u_long cpumask;
671 	size_t size;
672 	time_t uptime, halfuptime;
673 	int ncpus, maxid, rate_adj, retval;
674 
675 	uptime = getuptime() / 1000000000LL;
676 	halfuptime = uptime / 2;
677 	rate_adj = 1;
678 	ncpus = 1;
679 	maxid = 0;
680 	cpumask = 0;
681 
682 	/*
683 	 * If the user stops the program (control-Z) and then resumes it,
684 	 * print out the header again.
685 	 */
686 	(void)signal(SIGCONT, needhdr);
687 
688 	/*
689 	 * If our standard output is a tty, then install a SIGWINCH handler
690 	 * and set wresized so that our first iteration through the main
691 	 * vmstat loop will peek at the terminal's current rows to find out
692 	 * how many lines can fit in a screenful of output.
693 	 */
694 	if (isatty(fileno(stdout)) != 0) {
695 		wresized = 1;
696 		(void)signal(SIGWINCH, needresize);
697 	} else {
698 		wresized = 0;
699 		winlines = VMSTAT_DEFAULT_LINES;
700 	}
701 
702 	if (kd != NULL) {
703 		if (namelist[X_STATHZ].n_type != 0 &&
704 		    namelist[X_STATHZ].n_value != 0)
705 			kread(X_STATHZ, &hz, sizeof(hz));
706 		if (!hz)
707 			kread(X_HZ, &hz, sizeof(hz));
708 	} else {
709 		size = sizeof(clockrate);
710 		mysysctl("kern.clockrate", &clockrate, &size);
711 		if (size != sizeof(clockrate))
712 			xo_errx(1, "clockrate size mismatch");
713 		hz = clockrate.hz;
714 	}
715 
716 	if (Pflag) {
717 		ncpus = getcpuinfo(&cpumask, &maxid);
718 		size_cp_times = sizeof(long) * (maxid + 1) * CPUSTATES;
719 		cur_cp_times = calloc(1, size_cp_times);
720 		last_cp_times = calloc(1, size_cp_times);
721 	}
722 	for (hdrcnt = 1;;) {
723 		if (!--hdrcnt)
724 			printhdr(maxid, cpumask);
725 		if (kd != NULL) {
726 			if (kvm_getcptime(kd, cur.cp_time) < 0)
727 				xo_errx(1, "kvm_getcptime: %s", kvm_geterr(kd));
728 		} else {
729 			size = sizeof(cur.cp_time);
730 			mysysctl("kern.cp_time", &cur.cp_time, &size);
731 			if (size != sizeof(cur.cp_time))
732 				xo_errx(1, "cp_time size mismatch");
733 		}
734 		if (Pflag) {
735 			size = size_cp_times;
736 			mysysctl("kern.cp_times", cur_cp_times, &size);
737 			if (size != size_cp_times)
738 				xo_errx(1, "cp_times mismatch");
739 		}
740 
741 		tmp_dinfo = last.dinfo;
742 		last.dinfo = cur.dinfo;
743 		cur.dinfo = tmp_dinfo;
744 		last.snap_time = cur.snap_time;
745 
746 		/*
747 		 * Here what we want to do is refresh our device stats.
748 		 * getdevs() returns 1 when the device list has changed.
749 		 * If the device list has changed, we want to go through
750 		 * the selection process again, in case a device that we
751 		 * were previously displaying has gone away.
752 		 */
753 		switch (devstat_getdevs(NULL, &cur)) {
754 		case -1:
755 			xo_errx(1, "%s", devstat_errbuf);
756 			break;
757 		case 1:
758 			num_devices = cur.dinfo->numdevs;
759 			generation = cur.dinfo->generation;
760 
761 			retval = devstat_selectdevs(&dev_select, &num_selected,
762 			    &num_selections, &select_generation,
763 			    generation, cur.dinfo->devices,
764 			    num_devices, matches, num_matches,
765 			    specified_devices,
766 			    num_devices_specified, select_mode,
767 			    maxshowdevs, 0);
768 			switch (retval) {
769 			case -1:
770 				xo_errx(1, "%s", devstat_errbuf);
771 				break;
772 			case 1:
773 				printhdr(maxid, cpumask);
774 				break;
775 			default:
776 				break;
777 			}
778 			break;
779 		default:
780 			break;
781 		}
782 
783 		fill_vmmeter(&sum);
784 		fill_vmtotal(&total);
785 		xo_open_container("processes");
786 		xo_emit("{:runnable/%2d} {:waiting/%2ld} "
787 		    "{:swapped-out/%2ld}", total.t_rq - 1, total.t_dw +
788 		    total.t_pw, total.t_sw);
789 		xo_close_container("processes");
790 		xo_open_container("memory");
791 #define vmstat_pgtok(a) ((uintmax_t)(a) * (sum.v_page_size >> 10))
792 #define	rate(x)	(((x) * rate_adj + halfuptime) / uptime)	/* round */
793 		if (hflag) {
794 			prthuman("available-memory",
795 			    total.t_avm * (uint64_t)sum.v_page_size, 5, HN_B);
796 			prthuman("free-memory",
797 			    total.t_free * (uint64_t)sum.v_page_size, 5, HN_B);
798 			prthuman("total-page-faults",
799 			    (unsigned long)rate(sum.v_vm_faults -
800 			    osum.v_vm_faults), 5, 0);
801 			xo_emit(" ");
802 		} else {
803 			xo_emit(" ");
804 			xo_emit("{:available-memory/%7ju}",
805 			    vmstat_pgtok(total.t_avm));
806 			xo_emit(" ");
807 			xo_emit("{:free-memory/%7ju}",
808 			    vmstat_pgtok(total.t_free));
809 			xo_emit(" ");
810 			xo_emit("{:total-page-faults/%5lu} ",
811 			    (unsigned long)rate(sum.v_vm_faults -
812 			    osum.v_vm_faults));
813 		}
814 		xo_close_container("memory");
815 
816 		xo_open_container("paging-rates");
817 		xo_emit("{:page-reactivated/%3lu} ",
818 		    (unsigned long)rate(sum.v_reactivated -
819 		    osum.v_reactivated));
820 		xo_emit("{:paged-in/%3lu} ",
821 		    (unsigned long)rate(sum.v_swapin + sum.v_vnodein -
822 		    (osum.v_swapin + osum.v_vnodein)));
823 		xo_emit("{:paged-out/%3lu}",
824 		    (unsigned long)rate(sum.v_swapout + sum.v_vnodeout -
825 		    (osum.v_swapout + osum.v_vnodeout)));
826 		if (hflag) {
827 			prthuman("freed",
828 			    (unsigned long)rate(sum.v_tfree - osum.v_tfree),
829 			    5, 0);
830 			prthuman("scanned",
831 			    (unsigned long)rate(sum.v_pdpages - osum.v_pdpages),
832 			    5, 0);
833 			xo_emit(" ");
834 		} else {
835 			xo_emit(" ");
836 			xo_emit("{:freed/%5lu} ",
837 			    (unsigned long)rate(sum.v_tfree - osum.v_tfree));
838 			xo_emit("{:scanned/%4lu} ",
839 			    (unsigned long)rate(sum.v_pdpages - osum.v_pdpages));
840 		}
841 		xo_close_container("paging-rates");
842 
843 		devstats();
844 		xo_open_container("fault-rates");
845 		xo_emit("{:interrupts/%4lu}",
846 		    (unsigned long)rate(sum.v_intr - osum.v_intr));
847 		if (hflag) {
848 			prthuman("system-calls",
849 			    (unsigned long)rate(sum.v_syscall - osum.v_syscall),
850 			    5, 0);
851 			prthuman("context-switches",
852 			    (unsigned long)rate(sum.v_swtch - osum.v_swtch),
853 			    5, 0);
854 		} else {
855 			xo_emit(" ");
856 			xo_emit("{:system-calls/%5lu} "
857 			    "{:context-switches/%5lu}",
858 			    (unsigned long)rate(sum.v_syscall - osum.v_syscall),
859 			    (unsigned long)rate(sum.v_swtch - osum.v_swtch));
860 		}
861 		xo_close_container("fault-rates");
862 		if (Pflag)
863 			pcpustats(cpumask, maxid);
864 		else
865 			cpustats();
866 		xo_emit("\n");
867 		xo_flush();
868 		if (reps >= 0 && --reps <= 0)
869 			break;
870 		osum = sum;
871 		uptime = interval;
872 		rate_adj = 1000;
873 		/*
874 		 * We round upward to avoid losing low-frequency events
875 		 * (i.e., >= 1 per interval but < 1 per millisecond).
876 		 */
877 		if (interval != 1)
878 			halfuptime = (uptime + 1) / 2;
879 		else
880 			halfuptime = 0;
881 		(void)usleep(interval * 1000);
882 	}
883 }
884 
885 static void
886 printhdr(int maxid, u_long cpumask)
887 {
888 	int i, num_shown;
889 
890 	num_shown = MIN(num_selected, maxshowdevs);
891 	if (hflag)
892 		xo_emit(" {T:procs}    {T:memory}    {T:/page%*s}", 19, "");
893 	else
894 		xo_emit("{T:procs}     {T:memory}       {T:/page%*s}", 19, "");
895 	if (num_shown > 1)
896 		xo_emit("   {T:/disks %*s}  ", num_shown * 4 - 7, "");
897 	else if (num_shown == 1)
898 		xo_emit("   {T:disks}");
899 	xo_emit(" {T:faults}      ");
900 	if (Pflag) {
901 		for (i = 0; i <= maxid; i++) {
902 			if (cpumask & (1ul << i))
903 				xo_emit("  {T:/cpu%d}   ", i);
904 		}
905 		xo_emit("\n");
906 	} else
907 		xo_emit(" {T:cpu}\n");
908 	if (hflag) {
909 		xo_emit(" {T:r}  {T:b}  {T:w}  {T:avm}  {T:fre}  {T:flt}  {T:re}"
910 		    "  {T:pi}  {T:po}   {T:fr}   {T:sr} ");
911 	} else {
912 		xo_emit("{T:r} {T:b} {T:w}     {T:avm}     {T:fre}  {T:flt}  "
913 		    "{T:re}  {T:pi}  {T:po}    {T:fr}   {T:sr} ");
914 	}
915 	for (i = 0; i < num_devices; i++)
916 		if ((dev_select[i].selected) &&
917 		    (dev_select[i].selected <= maxshowdevs))
918 			xo_emit("{T:/%c%c%d} ", dev_select[i].device_name[0],
919 			    dev_select[i].device_name[1],
920 			    dev_select[i].unit_number);
921 	xo_emit("  {T:in}   {T:sy}   {T:cs}");
922 	if (Pflag) {
923 		for (i = 0; i <= maxid; i++) {
924 			if (cpumask & (1ul << i))
925 				xo_emit(" {T:us} {T:sy} {T:id}");
926 		}
927 		xo_emit("\n");
928 	} else
929 		xo_emit(" {T:us} {T:sy} {T:id}\n");
930 	if (wresized != 0)
931 		doresize();
932 	hdrcnt = winlines;
933 }
934 
935 /*
936  * Force a header to be prepended to the next output.
937  */
938 static void
939 needhdr(int dummy __unused)
940 {
941 
942 	hdrcnt = 1;
943 }
944 
945 /*
946  * When the terminal is resized, force an update of the maximum number of rows
947  * printed between each header repetition.  Then force a new header to be
948  * prepended to the next output.
949  */
950 void
951 needresize(int signo __unused)
952 {
953 
954 	wresized = 1;
955 	hdrcnt = 1;
956 }
957 
958 /*
959  * Update the global `winlines' count of terminal rows.
960  */
961 void
962 doresize(void)
963 {
964 	struct winsize w;
965 	int status;
966 
967 	for (;;) {
968 		status = ioctl(fileno(stdout), TIOCGWINSZ, &w);
969 		if (status == -1 && errno == EINTR)
970 			continue;
971 		else if (status == -1)
972 			xo_err(1, "ioctl");
973 		if (w.ws_row > 3)
974 			winlines = w.ws_row - 3;
975 		else
976 			winlines = VMSTAT_DEFAULT_LINES;
977 		break;
978 	}
979 
980 	/*
981 	 * Inhibit doresize() calls until we are rescheduled by SIGWINCH.
982 	 */
983 	wresized = 0;
984 }
985 
/*
 * Integer percentage of `top' relative to `bot', truncated toward zero.
 * A zero denominator yields 0.
 */
static long
pct(long top, long bot)
{
	if (bot != 0)
		return ((long)((long long)top * 100 / bot));
	return (0);
}

/* Convenience wrapper that converts both operands to long first. */
#define	PCT(top, bot) pct((long)(top), (long)(bot))
998 
999 static void
1000 dosum(void)
1001 {
1002 	struct nchstats lnchstats;
1003 	size_t size;
1004 	long nchtotal;
1005 
1006 	fill_vmmeter(&sum);
1007 	xo_open_container("summary-statistics");
1008 	xo_emit("{:context-switches/%9u} {N:cpu context switches}\n",
1009 	    sum.v_swtch);
1010 	xo_emit("{:interrupts/%9u} {N:device interrupts}\n",
1011 	    sum.v_intr);
1012 	xo_emit("{:software-interrupts/%9u} {N:software interrupts}\n",
1013 	    sum.v_soft);
1014 	xo_emit("{:traps/%9u} {N:traps}\n", sum.v_trap);
1015 	xo_emit("{:system-calls/%9u} {N:system calls}\n",
1016 	    sum.v_syscall);
1017 	xo_emit("{:kernel-threads/%9u} {N:kernel threads created}\n",
1018 	    sum.v_kthreads);
1019 	xo_emit("{:forks/%9u} {N: fork() calls}\n", sum.v_forks);
1020 	xo_emit("{:vforks/%9u} {N:vfork() calls}\n",
1021 	    sum.v_vforks);
1022 	xo_emit("{:rforks/%9u} {N:rfork() calls}\n",
1023 	    sum.v_rforks);
1024 	xo_emit("{:swap-ins/%9u} {N:swap pager pageins}\n",
1025 	    sum.v_swapin);
1026 	xo_emit("{:swap-in-pages/%9u} {N:swap pager pages paged in}\n",
1027 	    sum.v_swappgsin);
1028 	xo_emit("{:swap-outs/%9u} {N:swap pager pageouts}\n",
1029 	    sum.v_swapout);
1030 	xo_emit("{:swap-out-pages/%9u} {N:swap pager pages paged out}\n",
1031 	    sum.v_swappgsout);
1032 	xo_emit("{:vnode-page-ins/%9u} {N:vnode pager pageins}\n",
1033 	    sum.v_vnodein);
1034 	xo_emit("{:vnode-page-in-pages/%9u} {N:vnode pager pages paged in}\n",
1035 	    sum.v_vnodepgsin);
1036 	xo_emit("{:vnode-page-outs/%9u} {N:vnode pager pageouts}\n",
1037 	    sum.v_vnodeout);
1038 	xo_emit("{:vnode-page-out-pages/%9u} {N:vnode pager pages paged out}\n",
1039 	    sum.v_vnodepgsout);
1040 	xo_emit("{:page-daemon-wakeups/%9u} {N:page daemon wakeups}\n",
1041 	    sum.v_pdwakeups);
1042 	xo_emit("{:page-daemon-pages/%9u} {N:pages examined by the page "
1043 	    "daemon}\n", sum.v_pdpages);
1044 	xo_emit("{:page-reclamation-shortfalls/%9u} {N:clean page reclamation "
1045 	    "shortfalls}\n", sum.v_pdshortfalls);
1046 	xo_emit("{:reactivated/%9u} {N:pages reactivated by the page daemon}\n",
1047 	    sum.v_reactivated);
1048 	xo_emit("{:copy-on-write-faults/%9u} {N:copy-on-write faults}\n",
1049 	    sum.v_cow_faults);
1050 	xo_emit("{:copy-on-write-optimized-faults/%9u} {N:copy-on-write "
1051 	    "optimized faults}\n", sum.v_cow_optim);
1052 	xo_emit("{:zero-fill-pages/%9u} {N:zero fill pages zeroed}\n",
1053 	    sum.v_zfod);
1054 	xo_emit("{:zero-fill-prezeroed/%9u} {N:zero fill pages prezeroed}\n",
1055 	    sum.v_ozfod);
1056 	xo_emit("{:intransit-blocking/%9u} {N:intransit blocking page faults}\n",
1057 	    sum.v_intrans);
1058 	xo_emit("{:total-faults/%9u} {N:total VM faults taken}\n",
1059 	    sum.v_vm_faults);
1060 	xo_emit("{:faults-requiring-io/%9u} {N:page faults requiring I\\/O}\n",
1061 	    sum.v_io_faults);
1062 	xo_emit("{:faults-from-thread-creation/%9u} {N:pages affected by "
1063 	    "kernel thread creation}\n", sum.v_kthreadpages);
1064 	xo_emit("{:faults-from-fork/%9u} {N:pages affected by  fork}()\n",
1065 	    sum.v_forkpages);
1066 	xo_emit("{:faults-from-vfork/%9u} {N:pages affected by vfork}()\n",
1067 	    sum.v_vforkpages);
1068 	xo_emit("{:pages-rfork/%9u} {N:pages affected by rfork}()\n",
1069 	    sum.v_rforkpages);
1070 	xo_emit("{:pages-freed/%9u} {N:pages freed}\n",
1071 	    sum.v_tfree);
1072 	xo_emit("{:pages-freed-by-daemon/%9u} {N:pages freed by daemon}\n",
1073 	    sum.v_dfree);
1074 	xo_emit("{:pages-freed-on-exit/%9u} {N:pages freed by exiting processes}\n",
1075 	    sum.v_pfree);
1076 	xo_emit("{:active-pages/%9u} {N:pages active}\n",
1077 	    sum.v_active_count);
1078 	xo_emit("{:inactive-pages/%9u} {N:pages inactive}\n",
1079 	    sum.v_inactive_count);
1080 	xo_emit("{:laundry-pages/%9u} {N:pages in the laundry queue}\n",
1081 	    sum.v_laundry_count);
1082 	xo_emit("{:wired-pages/%9u} {N:pages wired down}\n",
1083 	    sum.v_wire_count);
1084 	xo_emit("{:virtual-user-wired-pages/%9lu} {N:virtual user pages wired "
1085 	    "down}\n", sum.v_user_wire_count);
1086 	xo_emit("{:free-pages/%9u} {N:pages free}\n",
1087 	    sum.v_free_count);
1088 	xo_emit("{:bytes-per-page/%9u} {N:bytes per page}\n", sum.v_page_size);
1089 	if (kd != NULL) {
1090 		kread(X_NCHSTATS, &lnchstats, sizeof(lnchstats));
1091 	} else {
1092 		size = sizeof(lnchstats);
1093 		mysysctl("vfs.cache.nchstats", &lnchstats, &size);
1094 		if (size != sizeof(lnchstats))
1095 			xo_errx(1, "vfs.cache.nchstats size mismatch");
1096 	}
1097 	nchtotal = lnchstats.ncs_goodhits + lnchstats.ncs_neghits +
1098 	    lnchstats.ncs_badhits + lnchstats.ncs_falsehits +
1099 	    lnchstats.ncs_miss + lnchstats.ncs_long;
1100 	xo_emit("{:total-name-lookups/%9ld} {N:total name lookups}\n",
1101 	    nchtotal);
1102 	xo_emit("{P:/%9s} {N:cache hits} "
1103 	    "({:positive-cache-hits/%ld}% pos + "
1104 	    "{:negative-cache-hits/%ld}% {N:neg}) "
1105 	    "system {:cache-hit-percent/%ld}% per-directory\n",
1106 	    "", PCT(lnchstats.ncs_goodhits, nchtotal),
1107 	    PCT(lnchstats.ncs_neghits, nchtotal),
1108 	    PCT(lnchstats.ncs_pass2, nchtotal));
1109 	xo_emit("{P:/%9s} {L:deletions} {:deletions/%ld}%, "
1110 	    "{L:falsehits} {:false-hits/%ld}%, "
1111 	    "{L:toolong} {:too-long/%ld}%\n", "",
1112 	    PCT(lnchstats.ncs_badhits, nchtotal),
1113 	    PCT(lnchstats.ncs_falsehits, nchtotal),
1114 	    PCT(lnchstats.ncs_long, nchtotal));
1115 	xo_close_container("summary-statistics");
1116 }
1117 
1118 static void
1119 doforkst(void)
1120 {
1121 
1122 	fill_vmmeter(&sum);
1123 	xo_open_container("fork-statistics");
1124 	xo_emit("{:fork/%u} {N:forks}, {:fork-pages/%u} {N:pages}, "
1125 	    "{L:average} {:fork-average/%.2f}\n",
1126 	    sum.v_forks, sum.v_forkpages,
1127 	    sum.v_forks == 0 ? 0.0 :
1128 	    (double)sum.v_forkpages / sum.v_forks);
1129 	xo_emit("{:vfork/%u} {N:vforks}, {:vfork-pages/%u} {N:pages}, "
1130 	    "{L:average} {:vfork-average/%.2f}\n",
1131 	    sum.v_vforks, sum.v_vforkpages,
1132 	    sum.v_vforks == 0 ? 0.0 :
1133 	    (double)sum.v_vforkpages / sum.v_vforks);
1134 	xo_emit("{:rfork/%u} {N:rforks}, {:rfork-pages/%u} {N:pages}, "
1135 	    "{L:average} {:rfork-average/%.2f}\n",
1136 	    sum.v_rforks, sum.v_rforkpages,
1137 	    sum.v_rforks == 0 ? 0.0 :
1138 	    (double)sum.v_rforkpages / sum.v_rforks);
1139 	xo_close_container("fork-statistics");
1140 }
1141 
1142 static void
1143 devstats(void)
1144 {
1145 	long double busy_seconds, transfers_per_second;
1146 	long tmp;
1147 	int di, dn, state;
1148 
1149 	for (state = 0; state < CPUSTATES; ++state) {
1150 		tmp = cur.cp_time[state];
1151 		cur.cp_time[state] -= last.cp_time[state];
1152 		last.cp_time[state] = tmp;
1153 	}
1154 
1155 	busy_seconds = cur.snap_time - last.snap_time;
1156 
1157 	xo_open_list("device");
1158 	for (dn = 0; dn < num_devices; dn++) {
1159 		if (dev_select[dn].selected == 0 ||
1160 		    dev_select[dn].selected > maxshowdevs)
1161 			continue;
1162 
1163 		di = dev_select[dn].position;
1164 
1165 		if (devstat_compute_statistics(&cur.dinfo->devices[di],
1166 		    &last.dinfo->devices[di], busy_seconds,
1167 		    DSM_TRANSFERS_PER_SECOND, &transfers_per_second,
1168 		    DSM_NONE) != 0)
1169 			xo_errx(1, "%s", devstat_errbuf);
1170 
1171 		xo_open_instance("device");
1172 		xo_emit("{ekq:name/%c%c%d}{:transfers/%3.0Lf} ",
1173 		    dev_select[dn].device_name[0],
1174 		    dev_select[dn].device_name[1],
1175 		    dev_select[dn].unit_number,
1176 		    transfers_per_second);
1177 		xo_close_instance("device");
1178 	}
1179 	xo_close_list("device");
1180 }
1181 
/*
 * Emit one percentage column named `name'.
 *
 * The value is rounded to an integer and normally printed in a field two
 * characters wide.  `*over' counts the columns by which earlier values
 * overflowed that width: a value needing more than two characters bumps
 * it, and a later single-character value is printed in a one-character
 * field to win a column back.
 */
static void
percent(const char *name, double pctv, int *over)
{
	char digits[10];
	char field[128];
	int ndigits, width;

	snprintf(field, sizeof(field), " {:%s/%%*s}", name);
	ndigits = snprintf(digits, sizeof(digits), "%.0f", pctv);

	width = 2;
	if (ndigits == 1 && *over) {
		/* Repay one column of accumulated overflow. */
		width = 1;
		(*over)--;
	}
	xo_emit(field, width, digits);

	if (ndigits > 2)
		(*over)++;
}
1199 
1200 static void
1201 cpustats(void)
1202 {
1203 	double lpct, total;
1204 	int state, over;
1205 
1206 	total = 0;
1207 	for (state = 0; state < CPUSTATES; ++state)
1208 		total += cur.cp_time[state];
1209 	if (total > 0)
1210 		lpct = 100.0 / total;
1211 	else
1212 		lpct = 0.0;
1213 	over = 0;
1214 	xo_open_container("cpu-statistics");
1215 	percent("user", (cur.cp_time[CP_USER] + cur.cp_time[CP_NICE]) * lpct,
1216 	    &over);
1217 	percent("system", (cur.cp_time[CP_SYS] + cur.cp_time[CP_INTR]) * lpct,
1218 	    &over);
1219 	percent("idle", cur.cp_time[CP_IDLE] * lpct, &over);
1220 	xo_close_container("cpu-statistics");
1221 }
1222 
1223 static void
1224 pcpustats(u_long cpumask, int maxid)
1225 {
1226 	double lpct, total;
1227 	long tmp;
1228 	int i, over, state;
1229 
1230 	/* devstats does this for cp_time */
1231 	for (i = 0; i <= maxid; i++) {
1232 		if ((cpumask & (1ul << i)) == 0)
1233 			continue;
1234 		for (state = 0; state < CPUSTATES; ++state) {
1235 			tmp = cur_cp_times[i * CPUSTATES + state];
1236 			cur_cp_times[i * CPUSTATES + state] -= last_cp_times[i *
1237 			    CPUSTATES + state];
1238 			last_cp_times[i * CPUSTATES + state] = tmp;
1239 		}
1240 	}
1241 
1242 	over = 0;
1243 	xo_open_list("cpu");
1244 	for (i = 0; i <= maxid; i++) {
1245 		if ((cpumask & (1ul << i)) == 0)
1246 			continue;
1247 		xo_open_instance("cpu");
1248 		xo_emit("{ke:name/%d}", i);
1249 		total = 0;
1250 		for (state = 0; state < CPUSTATES; ++state)
1251 			total += cur_cp_times[i * CPUSTATES + state];
1252 		if (total)
1253 			lpct = 100.0 / total;
1254 		else
1255 			lpct = 0.0;
1256 		percent("user", (cur_cp_times[i * CPUSTATES + CP_USER] +
1257 		    cur_cp_times[i * CPUSTATES + CP_NICE]) * lpct, &over);
1258 		percent("system", (cur_cp_times[i * CPUSTATES + CP_SYS] +
1259 		    cur_cp_times[i * CPUSTATES + CP_INTR]) * lpct, &over);
1260 		percent("idle", cur_cp_times[i * CPUSTATES + CP_IDLE] * lpct,
1261 		    &over);
1262 		xo_close_instance("cpu");
1263 	}
1264 	xo_close_list("cpu");
1265 }
1266 
1267 static unsigned int
1268 read_intrcnts(unsigned long **intrcnts)
1269 {
1270 	size_t intrcntlen;
1271 	uintptr_t kaddr;
1272 
1273 	if (kd != NULL) {
1274 		kread(X_SINTRCNT, &intrcntlen, sizeof(intrcntlen));
1275 		if ((*intrcnts = malloc(intrcntlen)) == NULL)
1276 			err(1, "malloc()");
1277 		if (namelist[X_NINTRCNT].n_type == 0)
1278 			kread(X_INTRCNT, *intrcnts, intrcntlen);
1279 		else {
1280 			kread(X_INTRCNT, &kaddr, sizeof(kaddr));
1281 			kreadptr(kaddr, *intrcnts, intrcntlen);
1282 		}
1283 	} else {
1284 		for (*intrcnts = NULL, intrcntlen = 1024; ; intrcntlen *= 2) {
1285 			*intrcnts = reallocf(*intrcnts, intrcntlen);
1286 			if (*intrcnts == NULL)
1287 				err(1, "reallocf()");
1288 			if (mysysctl("hw.intrcnt", *intrcnts, &intrcntlen) == 0)
1289 				break;
1290 		}
1291 	}
1292 
1293 	return (intrcntlen / sizeof(unsigned long));
1294 }
1295 
1296 static void
1297 print_intrcnts(unsigned long *intrcnts, unsigned long *old_intrcnts,
1298     char *intrnames, unsigned int nintr, size_t istrnamlen, long long period_ms)
1299 {
1300 	unsigned long *intrcnt, *old_intrcnt;
1301 	char *intrname;
1302 	uint64_t inttotal, old_inttotal, total_count, total_rate;
1303 	unsigned long count, rate;
1304 	unsigned int i;
1305 
1306 	inttotal = 0;
1307 	old_inttotal = 0;
1308 	intrname = intrnames;
1309 	xo_open_list("interrupt");
1310 	for (i = 0, intrcnt=intrcnts, old_intrcnt=old_intrcnts; i < nintr; i++) {
1311 		if (intrname[0] != '\0' && (*intrcnt != 0 || aflag)) {
1312 			count = *intrcnt - *old_intrcnt;
1313 			rate = ((uint64_t)count * 1000 + period_ms / 2) / period_ms;
1314 			xo_open_instance("interrupt");
1315 			xo_emit("{d:name/%-*s}{ket:name/%s} "
1316 			    "{:total/%20lu} {:rate/%10lu}\n",
1317 			    (int)istrnamlen, intrname, intrname, count, rate);
1318 			xo_close_instance("interrupt");
1319 		}
1320 		intrname += strlen(intrname) + 1;
1321 		inttotal += *intrcnt++;
1322 		old_inttotal += *old_intrcnt++;
1323 	}
1324 	total_count = inttotal - old_inttotal;
1325 	total_rate = (total_count * 1000 + period_ms / 2) / period_ms;
1326 	xo_close_list("interrupt");
1327 	xo_emit("{L:/%-*s} {:total-interrupts/%20ju} "
1328 	    "{:total-rate/%10ju}\n", (int)istrnamlen,
1329 	    "Total", (uintmax_t)total_count, (uintmax_t)total_rate);
1330 }
1331 
1332 static void
1333 dointr(unsigned int interval, int reps)
1334 {
1335 	unsigned long *intrcnts, *old_intrcnts;
1336 	char *intrname, *intrnames;
1337 	long long period_ms, old_uptime, uptime;
1338 	size_t clen, inamlen, istrnamlen;
1339 	uintptr_t kaddr;
1340 	unsigned int nintr;
1341 
1342 	old_intrcnts = NULL;
1343 	uptime = getuptime();
1344 
1345 	/* Get the names of each interrupt source */
1346 	if (kd != NULL) {
1347 		kread(X_SINTRNAMES, &inamlen, sizeof(inamlen));
1348 		if ((intrnames = malloc(inamlen)) == NULL)
1349 			xo_err(1, "malloc()");
1350 		if (namelist[X_NINTRCNT].n_type == 0)
1351 			kread(X_INTRNAMES, intrnames, inamlen);
1352 		else {
1353 			kread(X_INTRNAMES, &kaddr, sizeof(kaddr));
1354 			kreadptr(kaddr, intrnames, inamlen);
1355 		}
1356 	} else {
1357 		for (intrnames = NULL, inamlen = 1024; ; inamlen *= 2) {
1358 			if ((intrnames = reallocf(intrnames, inamlen)) == NULL)
1359 				xo_err(1, "reallocf()");
1360 			if (mysysctl("hw.intrnames", intrnames, &inamlen) == 0)
1361 				break;
1362 		}
1363 	}
1364 
1365 	/* Determine the length of the longest interrupt name */
1366 	intrname = intrnames;
1367 	istrnamlen = strlen("interrupt");
1368 	while(*intrname != '\0') {
1369 		clen = strlen(intrname);
1370 		if (clen > istrnamlen)
1371 			istrnamlen = clen;
1372 		intrname += strlen(intrname) + 1;
1373 	}
1374 	xo_emit("{T:/%-*s} {T:/%20s} {T:/%10s}\n",
1375 	    (int)istrnamlen, "interrupt", "total", "rate");
1376 
1377 	/*
1378 	 * Loop reps times printing differential interrupt counts.  If reps is
1379 	 * zero, then run just once, printing total counts
1380 	 */
1381 	xo_open_container("interrupt-statistics");
1382 
1383 	period_ms = uptime / 1000000;
1384 	while(1) {
1385 		nintr = read_intrcnts(&intrcnts);
1386 		/*
1387 		 * Initialize old_intrcnts to 0 for the first pass, so
1388 		 * print_intrcnts will print total interrupts since boot
1389 		 */
1390 		if (old_intrcnts == NULL) {
1391 			old_intrcnts = calloc(nintr, sizeof(unsigned long));
1392 			if (old_intrcnts == NULL)
1393 				xo_err(1, "calloc()");
1394 		}
1395 
1396 		print_intrcnts(intrcnts, old_intrcnts, intrnames, nintr,
1397 		    istrnamlen, period_ms);
1398 		xo_flush();
1399 
1400 		free(old_intrcnts);
1401 		old_intrcnts = intrcnts;
1402 		if (reps >= 0 && --reps <= 0)
1403 			break;
1404 		usleep(interval * 1000);
1405 		old_uptime = uptime;
1406 		uptime = getuptime();
1407 		period_ms = (uptime - old_uptime) / 1000000;
1408 	}
1409 
1410 	xo_close_container("interrupt-statistics");
1411 }
1412 
1413 static void
1414 domemstat_malloc(void)
1415 {
1416 	struct memory_type_list *mtlp;
1417 	struct memory_type *mtp;
1418 	int error, first, i;
1419 
1420 	mtlp = memstat_mtl_alloc();
1421 	if (mtlp == NULL) {
1422 		xo_warn("memstat_mtl_alloc");
1423 		return;
1424 	}
1425 	if (kd == NULL) {
1426 		if (memstat_sysctl_malloc(mtlp, 0) < 0) {
1427 			xo_warnx("memstat_sysctl_malloc: %s",
1428 			    memstat_strerror(memstat_mtl_geterror(mtlp)));
1429 			return;
1430 		}
1431 	} else {
1432 		if (memstat_kvm_malloc(mtlp, kd) < 0) {
1433 			error = memstat_mtl_geterror(mtlp);
1434 			if (error == MEMSTAT_ERROR_KVM)
1435 				xo_warnx("memstat_kvm_malloc: %s",
1436 				    kvm_geterr(kd));
1437 			else
1438 				xo_warnx("memstat_kvm_malloc: %s",
1439 				    memstat_strerror(error));
1440 		}
1441 	}
1442 	xo_open_container("malloc-statistics");
1443 	xo_emit("{T:/%13s} {T:/%5s} {T:/%6s} {T:/%7s} {T:/%8s}  {T:Size(s)}\n",
1444 	    "Type", "InUse", "MemUse", "HighUse", "Requests");
1445 	xo_open_list("memory");
1446 	for (mtp = memstat_mtl_first(mtlp); mtp != NULL;
1447 	    mtp = memstat_mtl_next(mtp)) {
1448 		if (memstat_get_numallocs(mtp) == 0 &&
1449 		    memstat_get_count(mtp) == 0)
1450 			continue;
1451 		xo_open_instance("memory");
1452 		xo_emit("{k:type/%13s/%s} {:in-use/%5ju} "
1453 		    "{:memory-use/%5ju}{U:K} {:high-use/%7s} "
1454 		    "{:requests/%8ju}  ",
1455 		    memstat_get_name(mtp), (uintmax_t)memstat_get_count(mtp),
1456 		    ((uintmax_t)memstat_get_bytes(mtp) + 1023) / 1024, "-",
1457 		    (uintmax_t)memstat_get_numallocs(mtp));
1458 		first = 1;
1459 		xo_open_list("size");
1460 		for (i = 0; i < 32; i++) {
1461 			if (memstat_get_sizemask(mtp) & (1 << i)) {
1462 				if (!first)
1463 					xo_emit(",");
1464 				xo_emit("{l:size/%d}", 1 << (i + 4));
1465 				first = 0;
1466 			}
1467 		}
1468 		xo_close_list("size");
1469 		xo_close_instance("memory");
1470 		xo_emit("\n");
1471 	}
1472 	xo_close_list("memory");
1473 	xo_close_container("malloc-statistics");
1474 	memstat_mtl_free(mtlp);
1475 }
1476 
1477 static void
1478 domemstat_zone(void)
1479 {
1480 	struct memory_type_list *mtlp;
1481 	struct memory_type *mtp;
1482 	int error;
1483 	char name[MEMTYPE_MAXNAME + 1];
1484 
1485 	mtlp = memstat_mtl_alloc();
1486 	if (mtlp == NULL) {
1487 		xo_warn("memstat_mtl_alloc");
1488 		return;
1489 	}
1490 	if (kd == NULL) {
1491 		if (memstat_sysctl_uma(mtlp, 0) < 0) {
1492 			xo_warnx("memstat_sysctl_uma: %s",
1493 			    memstat_strerror(memstat_mtl_geterror(mtlp)));
1494 			return;
1495 		}
1496 	} else {
1497 		if (memstat_kvm_uma(mtlp, kd) < 0) {
1498 			error = memstat_mtl_geterror(mtlp);
1499 			if (error == MEMSTAT_ERROR_KVM)
1500 				xo_warnx("memstat_kvm_uma: %s",
1501 				    kvm_geterr(kd));
1502 			else
1503 				xo_warnx("memstat_kvm_uma: %s",
1504 				    memstat_strerror(error));
1505 		}
1506 	}
1507 	xo_open_container("memory-zone-statistics");
1508 	xo_emit("{T:/%-20s} {T:/%6s} {T:/%6s} {T:/%8s} {T:/%8s} {T:/%8s} {T:/%8s}"
1509 	    "{T:/%4s} {T:/%4s}\n\n", "ITEM", "SIZE",
1510 	    "LIMIT", "USED", "FREE", "REQ", "FAIL", "SLEEP", "XDOMAIN");
1511 	xo_open_list("zone");
1512 	for (mtp = memstat_mtl_first(mtlp); mtp != NULL;
1513 	    mtp = memstat_mtl_next(mtp)) {
1514 		strlcpy(name, memstat_get_name(mtp), MEMTYPE_MAXNAME);
1515 		strcat(name, ":");
1516 		xo_open_instance("zone");
1517 		xo_emit("{d:name/%-20s}{ke:name/%s} {:size/%6ju}, "
1518 		    "{:limit/%6ju},{:used/%8ju},"
1519 		    "{:free/%8ju},{:requests/%8ju},"
1520 		    "{:fail/%4ju},{:sleep/%4ju},{:xdomain/%4ju}\n", name,
1521 		    memstat_get_name(mtp),
1522 		    (uintmax_t)memstat_get_size(mtp),
1523 		    (uintmax_t)memstat_get_countlimit(mtp),
1524 		    (uintmax_t)memstat_get_count(mtp),
1525 		    (uintmax_t)memstat_get_free(mtp),
1526 		    (uintmax_t)memstat_get_numallocs(mtp),
1527 		    (uintmax_t)memstat_get_failures(mtp),
1528 		    (uintmax_t)memstat_get_sleeps(mtp),
1529 		    (uintmax_t)memstat_get_xdomain(mtp));
1530 		xo_close_instance("zone");
1531 	}
1532 	memstat_mtl_free(mtlp);
1533 	xo_close_list("zone");
1534 	xo_close_container("memory-zone-statistics");
1535 	xo_emit("\n");
1536 }
1537 
1538 static void
1539 display_object(struct kinfo_vmobject *kvo)
1540 {
1541 	const char *str;
1542 
1543 	xo_open_instance("object");
1544 	xo_emit("{:resident/%5ju} ", (uintmax_t)kvo->kvo_resident);
1545 	xo_emit("{:active/%5ju} ", (uintmax_t)kvo->kvo_active);
1546 	xo_emit("{:inactive/%5ju} ", (uintmax_t)kvo->kvo_inactive);
1547 	xo_emit("{:refcount/%3d} ", kvo->kvo_ref_count);
1548 	xo_emit("{:shadowcount/%3d} ", kvo->kvo_shadow_count);
1549 	switch (kvo->kvo_memattr) {
1550 #ifdef VM_MEMATTR_UNCACHEABLE
1551 	case VM_MEMATTR_UNCACHEABLE:
1552 		str = "UC";
1553 		break;
1554 #endif
1555 #ifdef VM_MEMATTR_WRITE_COMBINING
1556 	case VM_MEMATTR_WRITE_COMBINING:
1557 		str = "WC";
1558 		break;
1559 #endif
1560 #ifdef VM_MEMATTR_WRITE_THROUGH
1561 	case VM_MEMATTR_WRITE_THROUGH:
1562 		str = "WT";
1563 		break;
1564 #endif
1565 #ifdef VM_MEMATTR_WRITE_PROTECTED
1566 	case VM_MEMATTR_WRITE_PROTECTED:
1567 		str = "WP";
1568 		break;
1569 #endif
1570 #ifdef VM_MEMATTR_WRITE_BACK
1571 	case VM_MEMATTR_WRITE_BACK:
1572 		str = "WB";
1573 		break;
1574 #endif
1575 #ifdef VM_MEMATTR_WEAK_UNCACHEABLE
1576 	case VM_MEMATTR_WEAK_UNCACHEABLE:
1577 		str = "UC-";
1578 		break;
1579 #endif
1580 #ifdef VM_MEMATTR_WB_WA
1581 	case VM_MEMATTR_WB_WA:
1582 		str = "WB";
1583 		break;
1584 #endif
1585 #ifdef VM_MEMATTR_NOCACHE
1586 	case VM_MEMATTR_NOCACHE:
1587 		str = "NC";
1588 		break;
1589 #endif
1590 #ifdef VM_MEMATTR_DEVICE
1591 	case VM_MEMATTR_DEVICE:
1592 		str = "DEV";
1593 		break;
1594 #endif
1595 #ifdef VM_MEMATTR_CACHEABLE
1596 	case VM_MEMATTR_CACHEABLE:
1597 		str = "C";
1598 		break;
1599 #endif
1600 #ifdef VM_MEMATTR_PREFETCHABLE
1601 	case VM_MEMATTR_PREFETCHABLE:
1602 		str = "PRE";
1603 		break;
1604 #endif
1605 	default:
1606 		str = "??";
1607 		break;
1608 	}
1609 	xo_emit("{:attribute/%-3s} ", str);
1610 	switch (kvo->kvo_type) {
1611 	case KVME_TYPE_NONE:
1612 		str = "--";
1613 		break;
1614 	case KVME_TYPE_DEFAULT:
1615 		str = "df";
1616 		break;
1617 	case KVME_TYPE_VNODE:
1618 		str = "vn";
1619 		break;
1620 	case KVME_TYPE_SWAP:
1621 		str = "sw";
1622 		break;
1623 	case KVME_TYPE_DEVICE:
1624 		str = "dv";
1625 		break;
1626 	case KVME_TYPE_PHYS:
1627 		str = "ph";
1628 		break;
1629 	case KVME_TYPE_DEAD:
1630 		str = "dd";
1631 		break;
1632 	case KVME_TYPE_SG:
1633 		str = "sg";
1634 		break;
1635 	case KVME_TYPE_MGTDEVICE:
1636 		str = "md";
1637 		break;
1638 	case KVME_TYPE_UNKNOWN:
1639 	default:
1640 		str = "??";
1641 		break;
1642 	}
1643 	xo_emit("{:type/%-2s} ", str);
1644 	xo_emit("{:path/%-s}\n", kvo->kvo_path);
1645 	xo_close_instance("object");
1646 }
1647 
1648 static void
1649 doobjstat(void)
1650 {
1651 	struct kinfo_vmobject *kvo;
1652 	int cnt, i;
1653 
1654 	kvo = kinfo_getvmobject(&cnt);
1655 	if (kvo == NULL) {
1656 		xo_warn("Failed to fetch VM object list");
1657 		return;
1658 	}
1659 	xo_emit("{T:RES/%5s} {T:ACT/%5s} {T:INACT/%5s} {T:REF/%3s} {T:SHD/%3s} "
1660 	    "{T:CM/%3s} {T:TP/%2s} {T:PATH/%s}\n");
1661 	xo_open_list("object");
1662 	for (i = 0; i < cnt; i++)
1663 		display_object(&kvo[i]);
1664 	free(kvo);
1665 	xo_close_list("object");
1666 }
1667 
1668 /*
1669  * kread reads something from the kernel, given its nlist index.
1670  */
1671 static void
1672 kreado(int nlx, void *addr, size_t size, size_t offset)
1673 {
1674 	const char *sym;
1675 
1676 	if (namelist[nlx].n_type == 0 || namelist[nlx].n_value == 0) {
1677 		sym = namelist[nlx].n_name;
1678 		if (*sym == '_')
1679 			++sym;
1680 		xo_errx(1, "symbol %s not defined", sym);
1681 	}
1682 	if ((size_t)kvm_read(kd, namelist[nlx].n_value + offset, addr,
1683 	    size) != size) {
1684 		sym = namelist[nlx].n_name;
1685 		if (*sym == '_')
1686 			++sym;
1687 		xo_errx(1, "%s: %s", sym, kvm_geterr(kd));
1688 	}
1689 }
1690 
/*
 * kread reads size bytes from the kernel into addr, starting at the
 * address of the symbol with nlist index nlx.  See kreado() for the
 * error handling.
 */
static void
kread(int nlx, void *addr, size_t size)
{
	const size_t symbol_start = 0;

	kreado(nlx, addr, size, symbol_start);
}
1697 
1698 static void
1699 kreadptr(uintptr_t addr, void *buf, size_t size)
1700 {
1701 
1702 	if ((size_t)kvm_read(kd, addr, buf, size) != size)
1703 		xo_errx(1, "%s", kvm_geterr(kd));
1704 }
1705 
1706 static void __dead2
1707 usage(void)
1708 {
1709 	xo_error("%s%s",
1710 	    "usage: vmstat [-afHhimoPsz] [-M core [-N system]] [-c count] [-n devs]\n",
1711 	    "              [-p type,if,pass] [-w wait] [disks] [wait [count]]\n");
1712 	xo_finish();
1713 	exit(1);
1714 }
1715