xref: /illumos-gate/usr/src/cmd/mandoc/main.c (revision 338d6fc1b322c01b220f204edde962e843478a78)
1 /*	$Id: main.c,v 1.322 2019/03/06 10:18:58 schwarze Exp $ */
2 /*
3  * Copyright (c) 2008-2012 Kristaps Dzonsons <kristaps@bsd.lv>
4  * Copyright (c) 2010-2012, 2014-2019 Ingo Schwarze <schwarze@openbsd.org>
5  * Copyright (c) 2010 Joerg Sonnenberger <joerg@netbsd.org>
6  *
7  * Permission to use, copy, modify, and distribute this software for any
8  * purpose with or without fee is hereby granted, provided that the above
9  * copyright notice and this permission notice appear in all copies.
10  *
11  * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHORS DISCLAIM ALL WARRANTIES
12  * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
13  * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR
14  * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
15  * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
16  * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
17  * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
18  */
19 #include "config.h"
20 
21 #include <sys/types.h>
22 #include <sys/ioctl.h>
23 #include <sys/param.h>	/* MACHINE */
24 #include <sys/wait.h>
25 
26 #include <assert.h>
27 #include <ctype.h>
28 #if HAVE_ERR
29 #include <err.h>
30 #endif
31 #include <errno.h>
32 #include <fcntl.h>
33 #include <glob.h>
34 #if HAVE_SANDBOX_INIT
35 #include <sandbox.h>
36 #endif
37 #include <signal.h>
38 #include <stdio.h>
39 #include <stdint.h>
40 #include <stdlib.h>
41 #include <string.h>
42 #include <termios.h>
43 #include <time.h>
44 #include <unistd.h>
45 
46 #include "mandoc_aux.h"
47 #include "mandoc.h"
48 #include "mandoc_xr.h"
49 #include "roff.h"
50 #include "mdoc.h"
51 #include "man.h"
52 #include "mandoc_parse.h"
53 #include "tag.h"
54 #include "main.h"
55 #include "manconf.h"
56 #include "mansearch.h"
57 
/*
 * What main() does with the manual pages it has found.
 */
58 enum	outmode {
59 	OUTMODE_DEF = 0,	/* not chosen yet; main() picks one from argmode */
60 	OUTMODE_FLN,	/* -w: print the file name of each match */
61 	OUTMODE_LST,	/* print one "names - output" line per match */
62 	OUTMODE_ALL,	/* -a, -h, -l and file mode: process every entry */
63 	OUTMODE_ONE	/* name mode default: process the best match only */
64 };
65 
/*
 * Output formats selectable with -T.
 * main() tests "outtype <= OUTT_UTF8" when deciding whether to print
 * a separator line between files, so the first three constants
 * have to remain the first three.
 */
66 enum	outt {
67 	OUTT_ASCII = 0,	/* -Tascii */
68 	OUTT_LOCALE,	/* -Tlocale */
69 	OUTT_UTF8,	/* -Tutf8 */
70 	OUTT_TREE,	/* -Ttree */
71 	OUTT_MAN,	/* -Tman */
72 	OUTT_HTML,	/* -Thtml */
73 	OUTT_MARKDOWN,	/* -Tmarkdown */
74 	OUTT_LINT,	/* -Tlint */
75 	OUTT_PS,	/* -Tps */
76 	OUTT_PDF	/* -Tpdf */
77 };
78 
/*
 * Parser and formatter state shared by main(), parse()
 * and the option handlers in this file.
 */
79 struct	curparse {
80 	struct mparse	 *mp;		/* parser handle from mparse_alloc() */
81 	struct manoutput *outopts;	/* output options */
82 	void		 *outdata;	/* data for output */
83 	char		 *os_s;		/* operating system for display */
84 	int		  wstop;	/* stop after a file with a warning */
85 	enum mandoc_os	  os_e;		/* check base system conventions */
86 	enum outt	  outtype;	/* which output to use */
87 };
88 
89 
/*
 * Not defined in this part of the file; main() hands control to it
 * when the program is invoked under a mandocdb or makewhatis name.
 */
90 int			  mandocdb(int, char *[]);
91 
92 static	void		  check_xr(void);
93 static	int		  fs_lookup(const struct manpaths *,
94 				size_t ipath, const char *,
95 				const char *, const char *,
96 				struct manpage **, size_t *);
97 static	int		  fs_search(const struct mansearch *,
98 				const struct manpaths *, int, char**,
99 				struct manpage **, size_t *);
100 static	int		  koptions(int *, char *);
101 static	void		  moptions(int *, char *);
102 static	void		  outdata_alloc(struct curparse *);
103 static	void		  parse(struct curparse *, int, const char *);
104 static	void		  passthrough(const char *, int, int);
105 static	pid_t		  spawn_pager(struct tag_files *);
106 static	int		  toptions(struct curparse *, char *);
107 static	void		  usage(enum argmode) __attribute__((__noreturn__));
108 static	int		  woptions(struct curparse *, char *);
109 
/*
 * Priority of manual sections 1 to 9, indexed by section digit
 * minus one.  main() prefers the match with the smallest value.
 */
110 static	const int sec_prios[] = {1, 4, 5, 8, 6, 3, 7, 2, 9};
/*
 * Replacement argument vector used by main() when the program
 * is invoked as help without any arguments.
 */
111 static	char		  help_arg[] = "help";
112 static	char		 *help_argv[] = {help_arg, NULL};
113 
114 
/*
 * Common entry point for the mandoc, man, apropos, whatis and help
 * front ends; the program name and the command line options select
 * the argument mode (file names, page names, words or expressions).
 *
 * Invalid option arguments make the function return
 * MANDOCLEVEL_BADARG right away.  Otherwise, the return value is
 * the level reported by mandoc_msg_getrc() once all work is done.
 */
115 int
116 main(int argc, char *argv[])
117 {
118 	struct manconf	 conf;
119 	struct mansearch search;
120 	struct curparse	 curp;
121 	struct winsize	 ws;
122 	struct tag_files *tag_files;
123 	struct manpage	*res, *resp;
124 	const char	*progname, *sec, *thisarg;
125 	char		*conf_file, *defpaths, *auxpaths;
126 	char		*oarg, *tagarg;
127 	unsigned char	*uc;
128 	size_t		 i, sz;
129 	int		 prio, best_prio;
130 	enum outmode	 outmode;
131 	int		 fd, startdir;
132 	int		 show_usage;
133 	int		 options;
134 	int		 use_pager;
135 	int		 status, signum;
136 	int		 c;
137 	pid_t		 pager_pid, tc_pgid, man_pgid, pid;
138 
139 #if HAVE_PROGNAME
140 	progname = getprogname();
141 #else
142 	if (argc < 1)
143 		progname = mandoc_strdup("mandoc");
144 	else if ((progname = strrchr(argv[0], '/')) == NULL)
145 		progname = argv[0];
146 	else
147 		++progname;
148 	setprogname(progname);
149 #endif
150 
151 	mandoc_msg_setoutfile(stderr);
	/* Invoked under a database builder name: delegate completely. */
152 	if (strncmp(progname, "mandocdb", 8) == 0 ||
153 	    strcmp(progname, BINM_MAKEWHATIS) == 0)
154 		return mandocdb(argc, argv);
155 
156 #if HAVE_PLEDGE
157 	if (pledge("stdio rpath tmppath tty proc exec", NULL) == -1)
158 		err((int)MANDOCLEVEL_SYSERR, "pledge");
159 #endif
160 
161 #if HAVE_SANDBOX_INIT
162 	if (sandbox_init(kSBXProfileNoInternet, SANDBOX_NAMED, NULL) == -1)
163 		errx((int)MANDOCLEVEL_SYSERR, "sandbox_init");
164 #endif
165 
166 	/* Search options. */
167 
168 	memset(&conf, 0, sizeof(conf));
169 	conf_file = defpaths = NULL;
170 	auxpaths = NULL;
171 
172 	memset(&search, 0, sizeof(struct mansearch));
173 	search.outkey = "Nd";
174 	oarg = NULL;
175 
	/* The program name selects the default argument mode. */
176 	if (strcmp(progname, BINM_MAN) == 0)
177 		search.argmode = ARG_NAME;
178 	else if (strcmp(progname, BINM_APROPOS) == 0)
179 		search.argmode = ARG_EXPR;
180 	else if (strcmp(progname, BINM_WHATIS) == 0)
181 		search.argmode = ARG_WORD;
182 	else if (strncmp(progname, "help", 4) == 0)
183 		search.argmode = ARG_NAME;
184 	else
185 		search.argmode = ARG_FILE;
186 
187 	/* Parser and formatter options. */
188 
189 	memset(&curp, 0, sizeof(struct curparse));
190 	curp.outtype = OUTT_LOCALE;
191 	curp.outopts = &conf.output;
192 	options = MPARSE_SO | MPARSE_UTF8 | MPARSE_LATIN1;
193 
194 	use_pager = 1;
195 	tag_files = NULL;
196 	show_usage = 0;
197 	outmode = OUTMODE_DEF;
198 
199 	while ((c = getopt(argc, argv,
200 	    "aC:cfhI:iK:klM:m:O:S:s:T:VW:w")) != -1) {
		/*
		 * In expression mode, -i is not consumed as an option:
		 * step back so that it is handed on with the remaining
		 * arguments, and stop option processing.
		 */
201 		if (c == 'i' && search.argmode == ARG_EXPR) {
202 			optind--;
203 			break;
204 		}
205 		switch (c) {
206 		case 'a':
207 			outmode = OUTMODE_ALL;
208 			break;
209 		case 'C':
210 			conf_file = optarg;
211 			break;
212 		case 'c':
213 			use_pager = 0;
214 			break;
215 		case 'f':
216 			search.argmode = ARG_WORD;
217 			break;
218 		case 'h':
219 			conf.output.synopsisonly = 1;
220 			use_pager = 0;
221 			outmode = OUTMODE_ALL;
222 			break;
223 		case 'I':
224 			if (strncmp(optarg, "os=", 3)) {
225 				warnx("-I %s: Bad argument", optarg);
226 				return (int)MANDOCLEVEL_BADARG;
227 			}
228 			if (curp.os_s != NULL) {
229 				warnx("-I %s: Duplicate argument", optarg);
230 				return (int)MANDOCLEVEL_BADARG;
231 			}
232 			curp.os_s = mandoc_strdup(optarg + 3);
233 			break;
234 		case 'K':
235 			if ( ! koptions(&options, optarg))
236 				return (int)MANDOCLEVEL_BADARG;
237 			break;
238 		case 'k':
239 			search.argmode = ARG_EXPR;
240 			break;
241 		case 'l':
242 			search.argmode = ARG_FILE;
243 			outmode = OUTMODE_ALL;
244 			break;
245 		case 'M':
246 			defpaths = optarg;
247 			break;
248 		case 'm':
249 			auxpaths = optarg;
250 			break;
251 		case 'O':
252 			oarg = optarg;
253 			break;
254 		case 'S':
255 			search.arch = optarg;
256 			break;
257 		case 's':
258 			search.sec = optarg;
259 			break;
260 		case 'T':
261 			if ( ! toptions(&curp, optarg))
262 				return (int)MANDOCLEVEL_BADARG;
263 			break;
264 		case 'W':
265 			if ( ! woptions(&curp, optarg))
266 				return (int)MANDOCLEVEL_BADARG;
267 			break;
268 		case 'w':
269 			outmode = OUTMODE_FLN;
270 			break;
271 		default:
272 			show_usage = 1;
273 			break;
274 		}
275 	}
276 
	/* Deferred until here so that the final argmode picks the text. */
277 	if (show_usage)
278 		usage(search.argmode);
279 
280 	/* Postprocess options. */
281 
282 	if (outmode == OUTMODE_DEF) {
283 		switch (search.argmode) {
284 		case ARG_FILE:
285 			outmode = OUTMODE_ALL;
286 			use_pager = 0;
287 			break;
288 		case ARG_NAME:
289 			outmode = OUTMODE_ONE;
290 			break;
291 		default:
292 			outmode = OUTMODE_LST;
293 			break;
294 		}
295 	}
296 
	/*
	 * In list mode, -O names the output key; in all other modes,
	 * it is a comma-separated list of formatter options.
	 */
297 	if (oarg != NULL) {
298 		if (outmode == OUTMODE_LST)
299 			search.outkey = oarg;
300 		else {
301 			while (oarg != NULL) {
302 				thisarg = oarg;
303 				if (manconf_output(&conf.output,
304 				    strsep(&oarg, ","), 0) == 0)
305 					continue;
306 				warnx("-O %s: Bad argument", thisarg);
307 				return (int)MANDOCLEVEL_BADARG;
308 			}
309 		}
310 	}
311 
	/* Validation is only skipped for tree output with noval set. */
312 	if (curp.outtype != OUTT_TREE || !curp.outopts->noval)
313 		options |= MPARSE_VALIDATE;
314 
315 	if (outmode == OUTMODE_FLN ||
316 	    outmode == OUTMODE_LST ||
317 	    !isatty(STDOUT_FILENO))
318 		use_pager = 0;
319 
	/*
	 * When paging, reduce width and indentation on terminals
	 * narrower than 79 or 66 columns, respectively, unless the
	 * corresponding value has been set to something non-zero.
	 */
320 	if (use_pager &&
321 	    (conf.output.width == 0 || conf.output.indent == 0) &&
322 	    ioctl(STDOUT_FILENO, TIOCGWINSZ, &ws) != -1 &&
323 	    ws.ws_col > 1) {
324 		if (conf.output.width == 0 && ws.ws_col < 79)
325 			conf.output.width = ws.ws_col - 1;
326 		if (conf.output.indent == 0 && ws.ws_col < 66)
327 			conf.output.indent = 3;
328 	}
329 
330 #if HAVE_PLEDGE
331 	if (!use_pager)
332 		if (pledge("stdio rpath", NULL) == -1)
333 			err((int)MANDOCLEVEL_SYSERR, "pledge");
334 #endif
335 
336 	/* Parse arguments. */
337 
338 	if (argc > 0) {
339 		argc -= optind;
340 		argv += optind;
341 	}
342 	resp = NULL;
343 
344 	/*
345 	 * Quirks for help(1)
346 	 * and for a man(1) section argument without -s.
347 	 */
348 
349 	if (search.argmode == ARG_NAME) {
350 		if (*progname == 'h') {
351 			if (argc == 0) {
352 				argv = help_argv;
353 				argc = 1;
354 			}
		/*
		 * A leading argument consisting of a digit, of a digit
		 * followed by one letter, or of "n" is taken as the
		 * section, provided that more arguments follow.
		 */
355 		} else if (argc > 1 &&
356 		    ((uc = (unsigned char *)argv[0]) != NULL) &&
357 		    ((isdigit(uc[0]) && (uc[1] == '\0' ||
358 		      (isalpha(uc[1]) && uc[2] == '\0'))) ||
359 		     (uc[0] == 'n' && uc[1] == '\0'))) {
360 			search.sec = (char *)uc;
361 			argv++;
362 			argc--;
363 		}
364 		if (search.arch == NULL)
365 			search.arch = getenv("MACHINE");
366 #ifdef MACHINE
367 		if (search.arch == NULL)
368 			search.arch = MACHINE;
369 #endif
370 	}
371 
372 	/*
373 	 * Use the first argument for -O tag in addition to
374 	 * using it as a search term for man(1) or apropos(1).
375 	 */
376 
377 	if (conf.output.tag != NULL && *conf.output.tag == '\0') {
378 		tagarg = argc > 0 && search.argmode == ARG_EXPR ?
379 		    strchr(*argv, '=') : NULL;
380 		conf.output.tag = tagarg == NULL ? *argv : tagarg + 1;
381 	}
382 
383 	/* man(1), whatis(1), apropos(1) */
384 
385 	if (search.argmode != ARG_FILE) {
386 		if (search.argmode == ARG_NAME &&
387 		    outmode == OUTMODE_ONE)
388 			search.firstmatch = 1;
389 
390 		/* Access the mandoc database. */
391 
392 		manconf_parse(&conf, conf_file, defpaths, auxpaths);
393 		if ( ! mansearch(&search, &conf.manpath,
394 		    argc, argv, &res, &sz))
395 			usage(search.argmode);
396 
		/* Nothing in the database: look at the file system. */
397 		if (sz == 0 && search.argmode == ARG_NAME)
398 			fs_search(&search, &conf.manpath,
399 			    argc, argv, &res, &sz);
400 
		/*
		 * In name mode, arguments containing a slash are
		 * appended to the results as readable source files.
		 */
401 		if (search.argmode == ARG_NAME) {
402 			for (c = 0; c < argc; c++) {
403 				if (strchr(argv[c], '/') == NULL)
404 					continue;
405 				if (access(argv[c], R_OK) == -1) {
406 					warn("%s", argv[c]);
407 					continue;
408 				}
409 				res = mandoc_reallocarray(res,
410 				    sz + 1, sizeof(*res));
411 				res[sz].file = mandoc_strdup(argv[c]);
412 				res[sz].names = NULL;
413 				res[sz].output = NULL;
414 				res[sz].ipath = SIZE_MAX;
415 				res[sz].sec = 10;
416 				res[sz].form = FORM_SRC;
417 				sz++;
418 			}
419 		}
420 
421 		if (sz == 0) {
422 			if (search.argmode != ARG_NAME)
423 				warnx("nothing appropriate");
424 			mandoc_msg_setrc(MANDOCLEVEL_BADARG);
425 			goto out;
426 		}
427 
428 		/*
429 		 * For standard man(1) and -a output mode,
430 		 * prepare for copying filename pointers
431 		 * into the program parameter array.
432 		 */
433 
434 		if (outmode == OUTMODE_ONE) {
435 			argc = 1;
436 			best_prio = 20;
437 		} else if (outmode == OUTMODE_ALL)
438 			argc = (int)sz;
439 
440 		/* Iterate all matching manuals. */
441 
442 		resp = res;
443 		for (i = 0; i < sz; i++) {
444 			if (outmode == OUTMODE_FLN)
445 				puts(res[i].file);
446 			else if (outmode == OUTMODE_LST)
447 				printf("%s - %s\n", res[i].names,
448 				    res[i].output == NULL ? "" :
449 				    res[i].output);
450 			else if (outmode == OUTMODE_ONE) {
451 				/* Search for the best section. */
				/*
				 * The first digit 1-9 in the file name
				 * is looked up in sec_prios; a digit
				 * not directly followed by a slash
				 * is penalized by 10.
				 */
452 				sec = res[i].file;
453 				sec += strcspn(sec, "123456789");
454 				if (sec[0] == '\0')
455 					continue;
456 				prio = sec_prios[sec[0] - '1'];
457 				if (sec[1] != '/')
458 					prio += 10;
459 				if (prio >= best_prio)
460 					continue;
461 				best_prio = prio;
462 				resp = res + i;
463 			}
464 		}
465 
466 		/*
467 		 * For man(1), -a and -i output mode, fall through
468 		 * to the main mandoc(1) code iterating files
469 		 * and running the parsers on each of them.
470 		 */
471 
472 		if (outmode == OUTMODE_FLN || outmode == OUTMODE_LST)
473 			goto out;
474 	}
475 
476 	/* mandoc(1) */
477 
478 #if HAVE_PLEDGE
479 	if (use_pager) {
480 		if (pledge("stdio rpath tmppath tty proc exec", NULL) == -1)
481 			err((int)MANDOCLEVEL_SYSERR, "pledge");
482 	} else {
483 		if (pledge("stdio rpath", NULL) == -1)
484 			err((int)MANDOCLEVEL_SYSERR, "pledge");
485 	}
486 #endif
487 
	/* In file mode, the -m argument selects the macro language. */
488 	if (search.argmode == ARG_FILE)
489 		moptions(&options, auxpaths);
490 
491 	mchars_alloc();
492 	curp.mp = mparse_alloc(options, curp.os_e, curp.os_s);
493 
	/* Without any file arguments, read standard input. */
494 	if (argc < 1) {
495 		if (use_pager) {
496 			tag_files = tag_init();
497 			tag_files->tagname = conf.output.tag;
498 		}
499 		thisarg = "<stdin>";
500 		mandoc_msg_setinfilename(thisarg);
501 		parse(&curp, STDIN_FILENO, thisarg);
502 		mandoc_msg_setinfilename(NULL);
503 	}
504 
505 	/*
506 	 * Remember the original working directory, if possible.
507 	 * This will be needed if some names on the command line
508 	 * are page names and some are relative file names.
509 	 * Do not error out if the current directory is not
510 	 * readable: Maybe it won't be needed after all.
511 	 */
512 	startdir = open(".", O_RDONLY | O_DIRECTORY);
513 
514 	while (argc > 0) {
515 
516 		/*
517 		 * Changing directories is not needed in ARG_FILE mode.
518 		 * Do it on a best-effort basis.  Even in case of
519 		 * failure, some functionality may still work.
520 		 */
521 		if (resp != NULL) {
522 			if (resp->ipath != SIZE_MAX)
523 				(void)chdir(conf.manpath.paths[resp->ipath]);
524 			else if (startdir != -1)
525 				(void)fchdir(startdir);
526 			thisarg = resp->file;
527 		} else
528 			thisarg = *argv;
529 
530 		fd = mparse_open(curp.mp, thisarg);
531 		if (fd != -1) {
			/*
			 * Set up the pager files once only, for the
			 * first file that can be opened; clearing
			 * use_pager prevents doing it again.
			 */
532 			if (use_pager) {
533 				use_pager = 0;
534 				tag_files = tag_init();
535 				tag_files->tagname = conf.output.tag;
536 			}
537 
			/* Results that are not FORM_SRC are copied as they are. */
538 			mandoc_msg_setinfilename(thisarg);
539 			if (resp == NULL || resp->form == FORM_SRC)
540 				parse(&curp, fd, thisarg);
541 			else
542 				passthrough(resp->file, fd,
543 				    conf.output.synopsisonly);
544 			mandoc_msg_setinfilename(NULL);
545 
546 			if (ferror(stdout)) {
547 				if (tag_files != NULL) {
548 					warn("%s", tag_files->ofn);
549 					tag_unlink();
550 					tag_files = NULL;
551 				} else
552 					warn("stdout");
553 				mandoc_msg_setrc(MANDOCLEVEL_SYSERR);
554 				break;
555 			}
556 
			/* Separate consecutive pages in terminal output. */
557 			if (argc > 1 && curp.outtype <= OUTT_UTF8) {
558 				if (curp.outdata == NULL)
559 					outdata_alloc(&curp);
560 				terminal_sepline(curp.outdata);
561 			}
562 		} else
563 			mandoc_msg(MANDOCERR_FILE, 0, 0,
564 			    "%s: %s", thisarg, strerror(errno));
565 
566 		if (curp.wstop && mandoc_msg_getrc() != MANDOCLEVEL_OK)
567 			break;
568 
569 		if (resp != NULL)
570 			resp++;
571 		else
572 			argv++;
		/* Reset the parser only if another file follows. */
573 		if (--argc)
574 			mparse_reset(curp.mp);
575 	}
576 	if (startdir != -1) {
577 		(void)fchdir(startdir);
578 		close(startdir);
579 	}
580 
	/* Release the formatter state with the matching function. */
581 	if (curp.outdata != NULL) {
582 		switch (curp.outtype) {
583 		case OUTT_HTML:
584 			html_free(curp.outdata);
585 			break;
586 		case OUTT_UTF8:
587 		case OUTT_LOCALE:
588 		case OUTT_ASCII:
589 			ascii_free(curp.outdata);
590 			break;
591 		case OUTT_PDF:
592 		case OUTT_PS:
593 			pspdf_free(curp.outdata);
594 			break;
595 		default:
596 			break;
597 		}
598 	}
599 	mandoc_xr_free();
600 	mparse_free(curp.mp);
601 	mchars_free();
602 
603 out:
	/* The search results only exist outside file mode. */
604 	if (search.argmode != ARG_FILE) {
605 		manconf_free(&conf);
606 		mansearch_free(res, sz);
607 	}
608 
609 	free(curp.os_s);
610 
611 	/*
612 	 * When using a pager, finish writing both temporary files,
613 	 * fork it, wait for the user to close it, and clean up.
614 	 */
615 
616 	if (tag_files != NULL) {
617 		fclose(stdout);
618 		tag_write();
619 		man_pgid = getpgid(0);
620 		tag_files->tcpgid = man_pgid == getpid() ?
621 		    getpgid(getppid()) : man_pgid;
622 		pager_pid = 0;
623 		signum = SIGSTOP;
624 		for (;;) {
625 
626 			/* Stop here until moved to the foreground. */
627 
628 			tc_pgid = tcgetpgrp(tag_files->ofd);
629 			if (tc_pgid != man_pgid) {
630 				if (tc_pgid == pager_pid) {
631 					(void)tcsetpgrp(tag_files->ofd,
632 					    man_pgid);
633 					if (signum == SIGTTIN)
634 						continue;
635 				} else
636 					tag_files->tcpgid = tc_pgid;
637 				kill(0, signum);
638 				continue;
639 			}
640 
641 			/* Once in the foreground, activate the pager. */
642 
643 			if (pager_pid) {
644 				(void)tcsetpgrp(tag_files->ofd, pager_pid);
645 				kill(pager_pid, SIGCONT);
646 			} else
647 				pager_pid = spawn_pager(tag_files);
648 
649 			/* Wait for the pager to stop or exit. */
650 
651 			while ((pid = waitpid(pager_pid, &status,
652 			    WUNTRACED)) == -1 && errno == EINTR)
653 				continue;
654 
655 			if (pid == -1) {
656 				warn("wait");
657 				mandoc_msg_setrc(MANDOCLEVEL_SYSERR);
658 				break;
659 			}
660 			if (!WIFSTOPPED(status))
661 				break;
662 
			/* The pager was stopped: pass that signal on next round. */
663 			signum = WSTOPSIG(status);
664 		}
665 		tag_unlink();
666 	}
667 	return (int)mandoc_msg_getrc();
668 }
669 
670 static void
671 usage(enum argmode argmode)
672 {
673 
674 	switch (argmode) {
675 	case ARG_FILE:
676 		fputs("usage: mandoc [-ac] [-I os=name] "
677 		    "[-K encoding] [-mdoc | -man] [-O options]\n"
678 		    "\t      [-T output] [-W level] [file ...]\n", stderr);
679 		break;
680 	case ARG_NAME:
681 		fputs("usage: man [-acfhklw] [-C file] [-M path] "
682 		    "[-m path] [-S subsection]\n"
683 		    "\t   [[-s] section] name ...\n", stderr);
684 		break;
685 	case ARG_WORD:
686 		fputs("usage: whatis [-afk] [-C file] "
687 		    "[-M path] [-m path] [-O outkey] [-S arch]\n"
688 		    "\t      [-s section] name ...\n", stderr);
689 		break;
690 	case ARG_EXPR:
691 		fputs("usage: apropos [-afk] [-C file] "
692 		    "[-M path] [-m path] [-O outkey] [-S arch]\n"
693 		    "\t       [-s section] expression ...\n", stderr);
694 		break;
695 	}
696 	exit((int)MANDOCLEVEL_BADARG);
697 }
698 
699 static int
700 fs_lookup(const struct manpaths *paths, size_t ipath,
701 	const char *sec, const char *arch, const char *name,
702 	struct manpage **res, size_t *ressz)
703 {
704 	glob_t		 globinfo;
705 	struct manpage	*page;
706 	char		*file;
707 	int		 globres;
708 	enum form	 form;
709 
710 	form = FORM_SRC;
711 	mandoc_asprintf(&file, "%s/man%s/%s.%s",
712 	    paths->paths[ipath], sec, name, sec);
713 	if (access(file, R_OK) != -1)
714 		goto found;
715 	free(file);
716 
717 	mandoc_asprintf(&file, "%s/cat%s/%s.0",
718 	    paths->paths[ipath], sec, name);
719 	if (access(file, R_OK) != -1) {
720 		form = FORM_CAT;
721 		goto found;
722 	}
723 	free(file);
724 
725 	if (arch != NULL) {
726 		mandoc_asprintf(&file, "%s/man%s/%s/%s.%s",
727 		    paths->paths[ipath], sec, arch, name, sec);
728 		if (access(file, R_OK) != -1)
729 			goto found;
730 		free(file);
731 	}
732 
733 	mandoc_asprintf(&file, "%s/man%s/%s.[01-9]*",
734 	    paths->paths[ipath], sec, name);
735 	globres = glob(file, 0, NULL, &globinfo);
736 	if (globres != 0 && globres != GLOB_NOMATCH)
737 		warn("%s: glob", file);
738 	free(file);
739 	if (globres == 0)
740 		file = mandoc_strdup(*globinfo.gl_pathv);
741 	globfree(&globinfo);
742 	if (globres == 0)
743 		goto found;
744 	if (res != NULL || ipath + 1 != paths->sz)
745 		return 0;
746 
747 	mandoc_asprintf(&file, "%s.%s", name, sec);
748 	globres = access(file, R_OK);
749 	free(file);
750 	return globres != -1;
751 
752 found:
753 	warnx("outdated mandoc.db lacks %s(%s) entry, run %s %s",
754 	    name, sec, BINM_MAKEWHATIS, paths->paths[ipath]);
755 	if (res == NULL) {
756 		free(file);
757 		return 1;
758 	}
759 	*res = mandoc_reallocarray(*res, ++*ressz, sizeof(struct manpage));
760 	page = *res + (*ressz - 1);
761 	page->file = file;
762 	page->names = NULL;
763 	page->output = NULL;
764 	page->ipath = ipath;
765 	page->sec = (*sec >= '1' && *sec <= '9') ? *sec - '1' + 1 : 10;
766 	page->form = form;
767 	return 1;
768 }
769 
770 static int
771 fs_search(const struct mansearch *cfg, const struct manpaths *paths,
772 	int argc, char **argv, struct manpage **res, size_t *ressz)
773 {
774 	const char *const sections[] =
775 	    {"1", "8", "6", "2", "3", "5", "7", "4", "9", "3p"};
776 	const size_t nsec = sizeof(sections)/sizeof(sections[0]);
777 
778 	size_t		 ipath, isec, lastsz;
779 
780 	assert(cfg->argmode == ARG_NAME);
781 
782 	if (res != NULL)
783 		*res = NULL;
784 	*ressz = lastsz = 0;
785 	while (argc) {
786 		for (ipath = 0; ipath < paths->sz; ipath++) {
787 			if (cfg->sec != NULL) {
788 				if (fs_lookup(paths, ipath, cfg->sec,
789 				    cfg->arch, *argv, res, ressz) &&
790 				    cfg->firstmatch)
791 					return 1;
792 			} else for (isec = 0; isec < nsec; isec++)
793 				if (fs_lookup(paths, ipath, sections[isec],
794 				    cfg->arch, *argv, res, ressz) &&
795 				    cfg->firstmatch)
796 					return 1;
797 		}
798 		if (res != NULL && *ressz == lastsz &&
799 		    strchr(*argv, '/') == NULL) {
800 			if (cfg->arch != NULL &&
801 			    arch_valid(cfg->arch, OSENUM) == 0)
802 				warnx("Unknown architecture \"%s\".",
803 				    cfg->arch);
804 			else if (cfg->sec == NULL)
805 				warnx("No entry for %s in the manual.",
806 				    *argv);
807 			else
808 				warnx("No entry for %s in section %s "
809 				    "of the manual.", *argv, cfg->sec);
810 		}
811 		lastsz = *ressz;
812 		argv++;
813 		argc--;
814 	}
815 	return 0;
816 }
817 
818 static void
819 parse(struct curparse *curp, int fd, const char *file)
820 {
821 	struct roff_meta *meta;
822 
823 	/* Begin by parsing the file itself. */
824 
825 	assert(file);
826 	assert(fd >= 0);
827 
828 	mparse_readfd(curp->mp, fd, file);
829 	if (fd != STDIN_FILENO)
830 		close(fd);
831 
832 	/*
833 	 * With -Wstop and warnings or errors of at least the requested
834 	 * level, do not produce output.
835 	 */
836 
837 	if (curp->wstop && mandoc_msg_getrc() != MANDOCLEVEL_OK)
838 		return;
839 
840 	if (curp->outdata == NULL)
841 		outdata_alloc(curp);
842 	else if (curp->outtype == OUTT_HTML)
843 		html_reset(curp);
844 
845 	mandoc_xr_reset();
846 	meta = mparse_result(curp->mp);
847 
848 	/* Execute the out device, if it exists. */
849 
850 	if (meta->macroset == MACROSET_MDOC) {
851 		switch (curp->outtype) {
852 		case OUTT_HTML:
853 			html_mdoc(curp->outdata, meta);
854 			break;
855 		case OUTT_TREE:
856 			tree_mdoc(curp->outdata, meta);
857 			break;
858 		case OUTT_MAN:
859 			man_mdoc(curp->outdata, meta);
860 			break;
861 		case OUTT_PDF:
862 		case OUTT_ASCII:
863 		case OUTT_UTF8:
864 		case OUTT_LOCALE:
865 		case OUTT_PS:
866 			terminal_mdoc(curp->outdata, meta);
867 			break;
868 		case OUTT_MARKDOWN:
869 			markdown_mdoc(curp->outdata, meta);
870 			break;
871 		default:
872 			break;
873 		}
874 	}
875 	if (meta->macroset == MACROSET_MAN) {
876 		switch (curp->outtype) {
877 		case OUTT_HTML:
878 			html_man(curp->outdata, meta);
879 			break;
880 		case OUTT_TREE:
881 			tree_man(curp->outdata, meta);
882 			break;
883 		case OUTT_MAN:
884 			mparse_copy(curp->mp);
885 			break;
886 		case OUTT_PDF:
887 		case OUTT_ASCII:
888 		case OUTT_UTF8:
889 		case OUTT_LOCALE:
890 		case OUTT_PS:
891 			terminal_man(curp->outdata, meta);
892 			break;
893 		default:
894 			break;
895 		}
896 	}
897 	if (mandoc_msg_getmin() < MANDOCERR_STYLE)
898 		check_xr();
899 }
900 
901 static void
902 check_xr(void)
903 {
904 	static struct manpaths	 paths;
905 	struct mansearch	 search;
906 	struct mandoc_xr	*xr;
907 	size_t			 sz;
908 
909 	if (paths.sz == 0)
910 		manpath_base(&paths);
911 
912 	for (xr = mandoc_xr_get(); xr != NULL; xr = xr->next) {
913 		if (xr->line == -1)
914 			continue;
915 		search.arch = NULL;
916 		search.sec = xr->sec;
917 		search.outkey = NULL;
918 		search.argmode = ARG_NAME;
919 		search.firstmatch = 1;
920 		if (mansearch(&search, &paths, 1, &xr->name, NULL, &sz))
921 			continue;
922 		if (fs_search(&search, &paths, 1, &xr->name, NULL, &sz))
923 			continue;
924 		if (xr->count == 1)
925 			mandoc_msg(MANDOCERR_XR_BAD, xr->line,
926 			    xr->pos + 1, "Xr %s %s", xr->name, xr->sec);
927 		else
928 			mandoc_msg(MANDOCERR_XR_BAD, xr->line,
929 			    xr->pos + 1, "Xr %s %s (%d times)",
930 			    xr->name, xr->sec, xr->count);
931 	}
932 }
933 
934 static void
935 outdata_alloc(struct curparse *curp)
936 {
937 	switch (curp->outtype) {
938 	case OUTT_HTML:
939 		curp->outdata = html_alloc(curp->outopts);
940 		break;
941 	case OUTT_UTF8:
942 		curp->outdata = utf8_alloc(curp->outopts);
943 		break;
944 	case OUTT_LOCALE:
945 		curp->outdata = locale_alloc(curp->outopts);
946 		break;
947 	case OUTT_ASCII:
948 		curp->outdata = ascii_alloc(curp->outopts);
949 		break;
950 	case OUTT_PDF:
951 		curp->outdata = pdf_alloc(curp->outopts);
952 		break;
953 	case OUTT_PS:
954 		curp->outdata = ps_alloc(curp->outopts);
955 		break;
956 	default:
957 		break;
958 	}
959 }
960 
961 static void
962 passthrough(const char *file, int fd, int synopsis_only)
963 {
964 	const char	 synb[] = "S\bSY\bYN\bNO\bOP\bPS\bSI\bIS\bS";
965 	const char	 synr[] = "SYNOPSIS";
966 
967 	FILE		*stream;
968 	const char	*syscall;
969 	char		*line, *cp;
970 	size_t		 linesz;
971 	ssize_t		 len, written;
972 	int		 print;
973 
974 	line = NULL;
975 	linesz = 0;
976 
977 	if (fflush(stdout) == EOF) {
978 		syscall = "fflush";
979 		goto fail;
980 	}
981 
982 	if ((stream = fdopen(fd, "r")) == NULL) {
983 		close(fd);
984 		syscall = "fdopen";
985 		goto fail;
986 	}
987 
988 	print = 0;
989 	while ((len = getline(&line, &linesz, stream)) != -1) {
990 		cp = line;
991 		if (synopsis_only) {
992 			if (print) {
993 				if ( ! isspace((unsigned char)*cp))
994 					goto done;
995 				while (isspace((unsigned char)*cp)) {
996 					cp++;
997 					len--;
998 				}
999 			} else {
1000 				if (strcmp(cp, synb) == 0 ||
1001 				    strcmp(cp, synr) == 0)
1002 					print = 1;
1003 				continue;
1004 			}
1005 		}
1006 		for (; len > 0; len -= written) {
1007 			if ((written = write(STDOUT_FILENO, cp, len)) != -1)
1008 				continue;
1009 			fclose(stream);
1010 			syscall = "write";
1011 			goto fail;
1012 		}
1013 	}
1014 
1015 	if (ferror(stream)) {
1016 		fclose(stream);
1017 		syscall = "getline";
1018 		goto fail;
1019 	}
1020 
1021 done:
1022 	free(line);
1023 	fclose(stream);
1024 	return;
1025 
1026 fail:
1027 	free(line);
1028 	warn("%s: SYSERR: %s", file, syscall);
1029 	mandoc_msg_setrc(MANDOCLEVEL_SYSERR);
1030 }
1031 
1032 static int
1033 koptions(int *options, char *arg)
1034 {
1035 
1036 	if ( ! strcmp(arg, "utf-8")) {
1037 		*options |=  MPARSE_UTF8;
1038 		*options &= ~MPARSE_LATIN1;
1039 	} else if ( ! strcmp(arg, "iso-8859-1")) {
1040 		*options |=  MPARSE_LATIN1;
1041 		*options &= ~MPARSE_UTF8;
1042 	} else if ( ! strcmp(arg, "us-ascii")) {
1043 		*options &= ~(MPARSE_UTF8 | MPARSE_LATIN1);
1044 	} else {
1045 		warnx("-K %s: Bad argument", arg);
1046 		return 0;
1047 	}
1048 	return 1;
1049 }
1050 
1051 static void
1052 moptions(int *options, char *arg)
1053 {
1054 
1055 	if (arg == NULL)
1056 		return;
1057 	if (strcmp(arg, "doc") == 0)
1058 		*options |= MPARSE_MDOC;
1059 	else if (strcmp(arg, "an") == 0)
1060 		*options |= MPARSE_MAN;
1061 }
1062 
1063 static int
1064 toptions(struct curparse *curp, char *arg)
1065 {
1066 
1067 	if (0 == strcmp(arg, "ascii"))
1068 		curp->outtype = OUTT_ASCII;
1069 	else if (0 == strcmp(arg, "lint")) {
1070 		curp->outtype = OUTT_LINT;
1071 		mandoc_msg_setoutfile(stdout);
1072 		mandoc_msg_setmin(MANDOCERR_BASE);
1073 	} else if (0 == strcmp(arg, "tree"))
1074 		curp->outtype = OUTT_TREE;
1075 	else if (0 == strcmp(arg, "man"))
1076 		curp->outtype = OUTT_MAN;
1077 	else if (0 == strcmp(arg, "html"))
1078 		curp->outtype = OUTT_HTML;
1079 	else if (0 == strcmp(arg, "markdown"))
1080 		curp->outtype = OUTT_MARKDOWN;
1081 	else if (0 == strcmp(arg, "utf8"))
1082 		curp->outtype = OUTT_UTF8;
1083 	else if (0 == strcmp(arg, "locale"))
1084 		curp->outtype = OUTT_LOCALE;
1085 	else if (0 == strcmp(arg, "ps"))
1086 		curp->outtype = OUTT_PS;
1087 	else if (0 == strcmp(arg, "pdf"))
1088 		curp->outtype = OUTT_PDF;
1089 	else {
1090 		warnx("-T %s: Bad argument", arg);
1091 		return 0;
1092 	}
1093 
1094 	return 1;
1095 }
1096 
1097 static int
1098 woptions(struct curparse *curp, char *arg)
1099 {
1100 	char		*v, *o;
1101 	const char	*toks[11];
1102 
1103 	toks[0] = "stop";
1104 	toks[1] = "all";
1105 	toks[2] = "base";
1106 	toks[3] = "style";
1107 	toks[4] = "warning";
1108 	toks[5] = "error";
1109 	toks[6] = "unsupp";
1110 	toks[7] = "fatal";
1111 	toks[8] = "openbsd";
1112 	toks[9] = "netbsd";
1113 	toks[10] = NULL;
1114 
1115 	while (*arg) {
1116 		o = arg;
1117 		switch (getsubopt(&arg, (char * const *)toks, &v)) {
1118 		case 0:
1119 			curp->wstop = 1;
1120 			break;
1121 		case 1:
1122 		case 2:
1123 			mandoc_msg_setmin(MANDOCERR_BASE);
1124 			break;
1125 		case 3:
1126 			mandoc_msg_setmin(MANDOCERR_STYLE);
1127 			break;
1128 		case 4:
1129 			mandoc_msg_setmin(MANDOCERR_WARNING);
1130 			break;
1131 		case 5:
1132 			mandoc_msg_setmin(MANDOCERR_ERROR);
1133 			break;
1134 		case 6:
1135 			mandoc_msg_setmin(MANDOCERR_UNSUPP);
1136 			break;
1137 		case 7:
1138 			mandoc_msg_setmin(MANDOCERR_MAX);
1139 			break;
1140 		case 8:
1141 			mandoc_msg_setmin(MANDOCERR_BASE);
1142 			curp->os_e = MANDOC_OS_OPENBSD;
1143 			break;
1144 		case 9:
1145 			mandoc_msg_setmin(MANDOCERR_BASE);
1146 			curp->os_e = MANDOC_OS_NETBSD;
1147 			break;
1148 		default:
1149 			warnx("-W %s: Bad argument", o);
1150 			return 0;
1151 		}
1152 	}
1153 	return 1;
1154 }
1155 
/*
 * Start the pager on the files described by tag_files.
 *
 * The pager command is taken from MANPAGER, then from PAGER,
 * then defaults to "more -s".  It is split into words at space
 * characters without any support for quoting.
 *
 * In the parent, returns the process ID of the child after putting
 * it into its own process group and handing the terminal to it.
 * The child never returns from here: it executes the pager.
 * Failure of fork(2), pledge(2), dup2(2) or execvp(3) terminates
 * the calling process with MANDOCLEVEL_SYSERR.
 */
1156 static pid_t
1157 spawn_pager(struct tag_files *tag_files)
1158 {
1159 	const struct timespec timeout = { 0, 100000000 };  /* 0.1s */
1160 #define MAX_PAGER_ARGS 16
1161 	char		*argv[MAX_PAGER_ARGS];
1162 	const char	*pager;
1163 	char		*cp;
1164 #if HAVE_LESS_T
1165 	size_t		 cmdlen;
1166 #endif
1167 	int		 argc, use_ofn;
1168 	pid_t		 pager_pid;
1169 
1170 	pager = getenv("MANPAGER");
1171 	if (pager == NULL || *pager == '\0')
1172 		pager = getenv("PAGER");
1173 	if (pager == NULL || *pager == '\0')
1174 		pager = "more -s";
	/* Work on a private copy because it is cut into words in place. */
1175 	cp = mandoc_strdup(pager);
1176 
1177 	/*
1178 	 * Parse the pager command into words.
1179 	 * Intentionally do not do anything fancy here.
1180 	 */
1181 
	/*
	 * The bound leaves room for the arguments appended below
	 * (at most four) and for the terminating NULL pointer.
	 */
1182 	argc = 0;
1183 	while (argc + 5 < MAX_PAGER_ARGS) {
1184 		argv[argc++] = cp;
1185 		cp = strchr(cp, ' ');
1186 		if (cp == NULL)
1187 			break;
1188 		*cp++ = '\0';
1189 		while (*cp == ' ')
1190 			cp++;
1191 		if (*cp == '\0')
1192 			break;
1193 	}
1194 
1195 	/* For less(1), use the tag file. */
1196 
	/*
	 * The output file name is appended as the last argument
	 * unless "-t tagname" has been passed to less(1).
	 */
1197 	use_ofn = 1;
1198 #if HAVE_LESS_T
1199 	if ((cmdlen = strlen(argv[0])) >= 4) {
1200 		cp = argv[0] + cmdlen - 4;
1201 		if (strcmp(cp, "less") == 0) {
1202 			argv[argc++] = mandoc_strdup("-T");
1203 			argv[argc++] = tag_files->tfn;
1204 			if (tag_files->tagname != NULL) {
1205 				argv[argc++] = mandoc_strdup("-t");
1206 				argv[argc++] = tag_files->tagname;
1207 				use_ofn = 0;
1208 			}
1209 		}
1210 	}
1211 #endif
1212 	if (use_ofn)
1213 		argv[argc++] = tag_files->ofn;
1214 	argv[argc] = NULL;
1215 
1216 	switch (pager_pid = fork()) {
1217 	case -1:
1218 		err((int)MANDOCLEVEL_SYSERR, "fork");
1219 	case 0:
		/* Child: continue below the switch statement. */
1220 		break;
1221 	default:
		/*
		 * Parent: give the child a process group of its own
		 * and make that group the foreground process group.
		 */
1222 		(void)setpgid(pager_pid, 0);
1223 		(void)tcsetpgrp(tag_files->ofd, pager_pid);
1224 #if HAVE_PLEDGE
1225 		if (pledge("stdio rpath tmppath tty proc", NULL) == -1)
1226 			err((int)MANDOCLEVEL_SYSERR, "pledge");
1227 #endif
1228 		tag_files->pager_pid = pager_pid;
1229 		return pager_pid;
1230 	}
1231 
1232 	/* The child process becomes the pager. */
1233 
1234 	if (dup2(tag_files->ofd, STDOUT_FILENO) == -1)
1235 		err((int)MANDOCLEVEL_SYSERR, "pager stdout");
1236 	close(tag_files->ofd);
1237 	assert(tag_files->tfd == -1);
1238 
1239 	/* Do not start the pager before controlling the terminal. */
1240 
	/* Poll every 0.1 seconds until the parent has handed it over. */
1241 	while (tcgetpgrp(STDOUT_FILENO) != getpid())
1242 		nanosleep(&timeout, NULL);
1243 
1244 	execvp(argv[0], argv);
1245 	err((int)MANDOCLEVEL_SYSERR, "exec %s", argv[0]);
1246 }
1247