xref: /freebsd/contrib/openpam/lib/libpam/openpam_readword.c (revision ce77a8d6923d67accfee464f031330c83f551f9e)
1f7e6344dSDag-Erling Smørgrav /*-
2f7e6344dSDag-Erling Smørgrav  * Copyright (c) 2012 Dag-Erling Smørgrav
3f7e6344dSDag-Erling Smørgrav  * All rights reserved.
4f7e6344dSDag-Erling Smørgrav  *
5f7e6344dSDag-Erling Smørgrav  * Redistribution and use in source and binary forms, with or without
6f7e6344dSDag-Erling Smørgrav  * modification, are permitted provided that the following conditions
7f7e6344dSDag-Erling Smørgrav  * are met:
8f7e6344dSDag-Erling Smørgrav  * 1. Redistributions of source code must retain the above copyright
9*ce77a8d6SDag-Erling Smørgrav  *    notice, this list of conditions and the following disclaimer.
10f7e6344dSDag-Erling Smørgrav  * 2. Redistributions in binary form must reproduce the above copyright
11f7e6344dSDag-Erling Smørgrav  *    notice, this list of conditions and the following disclaimer in the
12f7e6344dSDag-Erling Smørgrav  *    documentation and/or other materials provided with the distribution.
13f7e6344dSDag-Erling Smørgrav  * 3. The name of the author may not be used to endorse or promote
14f7e6344dSDag-Erling Smørgrav  *    products derived from this software without specific prior written
15f7e6344dSDag-Erling Smørgrav  *    permission.
16f7e6344dSDag-Erling Smørgrav  *
17f7e6344dSDag-Erling Smørgrav  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
18f7e6344dSDag-Erling Smørgrav  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19f7e6344dSDag-Erling Smørgrav  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20f7e6344dSDag-Erling Smørgrav  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
21f7e6344dSDag-Erling Smørgrav  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22f7e6344dSDag-Erling Smørgrav  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23f7e6344dSDag-Erling Smørgrav  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24f7e6344dSDag-Erling Smørgrav  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25f7e6344dSDag-Erling Smørgrav  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26f7e6344dSDag-Erling Smørgrav  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
27f7e6344dSDag-Erling Smørgrav  * SUCH DAMAGE.
28f7e6344dSDag-Erling Smørgrav  *
29*ce77a8d6SDag-Erling Smørgrav  * $Id: openpam_readword.c 648 2013-03-05 17:54:27Z des $
30f7e6344dSDag-Erling Smørgrav  */
31f7e6344dSDag-Erling Smørgrav 
32f7e6344dSDag-Erling Smørgrav #ifdef HAVE_CONFIG_H
33f7e6344dSDag-Erling Smørgrav # include "config.h"
34f7e6344dSDag-Erling Smørgrav #endif
35f7e6344dSDag-Erling Smørgrav 
36f7e6344dSDag-Erling Smørgrav #include <errno.h>
37f7e6344dSDag-Erling Smørgrav #include <stdio.h>
38f7e6344dSDag-Erling Smørgrav #include <stdlib.h>
39f7e6344dSDag-Erling Smørgrav 
40f7e6344dSDag-Erling Smørgrav #include <security/pam_appl.h>
41f7e6344dSDag-Erling Smørgrav 
42f7e6344dSDag-Erling Smørgrav #include "openpam_impl.h"
43f7e6344dSDag-Erling Smørgrav #include "openpam_ctype.h"
44f7e6344dSDag-Erling Smørgrav 
45f7e6344dSDag-Erling Smørgrav #define MIN_WORD_SIZE	32
46f7e6344dSDag-Erling Smørgrav 
47f7e6344dSDag-Erling Smørgrav /*
48f7e6344dSDag-Erling Smørgrav  * OpenPAM extension
49f7e6344dSDag-Erling Smørgrav  *
50f7e6344dSDag-Erling Smørgrav  * Read a word from a file, respecting shell quoting rules.
51f7e6344dSDag-Erling Smørgrav  */
52f7e6344dSDag-Erling Smørgrav 
53f7e6344dSDag-Erling Smørgrav char *
54f7e6344dSDag-Erling Smørgrav openpam_readword(FILE *f, int *lineno, size_t *lenp)
55f7e6344dSDag-Erling Smørgrav {
56f7e6344dSDag-Erling Smørgrav 	char *word;
57f7e6344dSDag-Erling Smørgrav 	size_t size, len;
58f7e6344dSDag-Erling Smørgrav 	int ch, comment, escape, quote;
59f7e6344dSDag-Erling Smørgrav 	int serrno;
60f7e6344dSDag-Erling Smørgrav 
61f7e6344dSDag-Erling Smørgrav 	errno = 0;
62f7e6344dSDag-Erling Smørgrav 
63f7e6344dSDag-Erling Smørgrav 	/* skip initial whitespace */
64f7e6344dSDag-Erling Smørgrav 	comment = 0;
65f7e6344dSDag-Erling Smørgrav 	while ((ch = getc(f)) != EOF && ch != '\n') {
66f7e6344dSDag-Erling Smørgrav 		if (ch == '#')
67f7e6344dSDag-Erling Smørgrav 			comment = 1;
68f7e6344dSDag-Erling Smørgrav 		if (!is_lws(ch) && !comment)
69f7e6344dSDag-Erling Smørgrav 			break;
70f7e6344dSDag-Erling Smørgrav 	}
71f7e6344dSDag-Erling Smørgrav 	if (ch == EOF)
72f7e6344dSDag-Erling Smørgrav 		return (NULL);
73f7e6344dSDag-Erling Smørgrav 	ungetc(ch, f);
74f7e6344dSDag-Erling Smørgrav 	if (ch == '\n')
75f7e6344dSDag-Erling Smørgrav 		return (NULL);
76f7e6344dSDag-Erling Smørgrav 
77f7e6344dSDag-Erling Smørgrav 	word = NULL;
78f7e6344dSDag-Erling Smørgrav 	size = len = 0;
79f7e6344dSDag-Erling Smørgrav 	escape = quote = 0;
80f7e6344dSDag-Erling Smørgrav 	while ((ch = fgetc(f)) != EOF && (!is_ws(ch) || quote || escape)) {
81f7e6344dSDag-Erling Smørgrav 		if (ch == '\\' && !escape && quote != '\'') {
82f7e6344dSDag-Erling Smørgrav 			/* escape next character */
83f7e6344dSDag-Erling Smørgrav 			escape = ch;
84f7e6344dSDag-Erling Smørgrav 		} else if ((ch == '\'' || ch == '"') && !quote && !escape) {
85f7e6344dSDag-Erling Smørgrav 			/* begin quote */
86f7e6344dSDag-Erling Smørgrav 			quote = ch;
87f7e6344dSDag-Erling Smørgrav 			/* edge case: empty quoted string */
88f7e6344dSDag-Erling Smørgrav 			if (openpam_straddch(&word, &size, &len, 0) != 0)
89f7e6344dSDag-Erling Smørgrav 				return (NULL);
90f7e6344dSDag-Erling Smørgrav 		} else if (ch == quote && !escape) {
91f7e6344dSDag-Erling Smørgrav 			/* end quote */
92f7e6344dSDag-Erling Smørgrav 			quote = 0;
93f7e6344dSDag-Erling Smørgrav 		} else if (ch == '\n' && escape && quote != '\'') {
94f7e6344dSDag-Erling Smørgrav 			/* line continuation */
95f7e6344dSDag-Erling Smørgrav 			escape = 0;
96f7e6344dSDag-Erling Smørgrav 		} else {
97f7e6344dSDag-Erling Smørgrav 			if (escape && quote && ch != '\\' && ch != quote &&
98f7e6344dSDag-Erling Smørgrav 			    openpam_straddch(&word, &size, &len, '\\') != 0) {
99f7e6344dSDag-Erling Smørgrav 				free(word);
100f7e6344dSDag-Erling Smørgrav 				errno = ENOMEM;
101f7e6344dSDag-Erling Smørgrav 				return (NULL);
102f7e6344dSDag-Erling Smørgrav 			}
103f7e6344dSDag-Erling Smørgrav 			if (openpam_straddch(&word, &size, &len, ch) != 0) {
104f7e6344dSDag-Erling Smørgrav 				free(word);
105f7e6344dSDag-Erling Smørgrav 				errno = ENOMEM;
106f7e6344dSDag-Erling Smørgrav 				return (NULL);
107f7e6344dSDag-Erling Smørgrav 			}
108f7e6344dSDag-Erling Smørgrav 			escape = 0;
109f7e6344dSDag-Erling Smørgrav 		}
110f7e6344dSDag-Erling Smørgrav 		if (lineno != NULL && ch == '\n')
111f7e6344dSDag-Erling Smørgrav 			++*lineno;
112f7e6344dSDag-Erling Smørgrav 	}
113f7e6344dSDag-Erling Smørgrav 	if (ch == EOF && ferror(f)) {
114f7e6344dSDag-Erling Smørgrav 		serrno = errno;
115f7e6344dSDag-Erling Smørgrav 		free(word);
116f7e6344dSDag-Erling Smørgrav 		errno = serrno;
117f7e6344dSDag-Erling Smørgrav 		return (NULL);
118f7e6344dSDag-Erling Smørgrav 	}
119f7e6344dSDag-Erling Smørgrav 	if (ch == EOF && (escape || quote)) {
120f7e6344dSDag-Erling Smørgrav 		/* Missing escaped character or closing quote. */
121f7e6344dSDag-Erling Smørgrav 		openpam_log(PAM_LOG_ERROR, "unexpected end of file");
122f7e6344dSDag-Erling Smørgrav 		free(word);
123f7e6344dSDag-Erling Smørgrav 		errno = EINVAL;
124f7e6344dSDag-Erling Smørgrav 		return (NULL);
125f7e6344dSDag-Erling Smørgrav 	}
126f7e6344dSDag-Erling Smørgrav 	ungetc(ch, f);
127f7e6344dSDag-Erling Smørgrav 	if (lenp != NULL)
128f7e6344dSDag-Erling Smørgrav 		*lenp = len;
129f7e6344dSDag-Erling Smørgrav 	return (word);
130f7e6344dSDag-Erling Smørgrav }
131f7e6344dSDag-Erling Smørgrav 
132f7e6344dSDag-Erling Smørgrav /**
133f7e6344dSDag-Erling Smørgrav  * The =openpam_readword function reads the next word from a file, and
134f7e6344dSDag-Erling Smørgrav  * returns it in a NUL-terminated buffer allocated with =!malloc.
135f7e6344dSDag-Erling Smørgrav  *
136f7e6344dSDag-Erling Smørgrav  * A word is a sequence of non-whitespace characters.
137f7e6344dSDag-Erling Smørgrav  * However, whitespace characters can be included in a word if quoted or
138f7e6344dSDag-Erling Smørgrav  * escaped according to the following rules:
139f7e6344dSDag-Erling Smørgrav  *
140f7e6344dSDag-Erling Smørgrav  *  - An unescaped single or double quote introduces a quoted string,
141f7e6344dSDag-Erling Smørgrav  *    which ends when the same quote character is encountered a second
142f7e6344dSDag-Erling Smørgrav  *    time.
143f7e6344dSDag-Erling Smørgrav  *    The quotes themselves are stripped.
144f7e6344dSDag-Erling Smørgrav  *
145f7e6344dSDag-Erling Smørgrav  *  - Within a single- or double-quoted string, all whitespace characters,
146f7e6344dSDag-Erling Smørgrav  *    including the newline character, are preserved as-is.
147f7e6344dSDag-Erling Smørgrav  *
148f7e6344dSDag-Erling Smørgrav  *  - Outside a quoted string, a backslash escapes the next character,
149f7e6344dSDag-Erling Smørgrav  *    which is preserved as-is, unless that character is a newline, in
150f7e6344dSDag-Erling Smørgrav  *    which case it is discarded and reading continues at the beginning of
151f7e6344dSDag-Erling Smørgrav  *    the next line as if the backslash and newline had not been there.
152f7e6344dSDag-Erling Smørgrav  *    In all cases, the backslash itself is discarded.
153f7e6344dSDag-Erling Smørgrav  *
154f7e6344dSDag-Erling Smørgrav  *  - Within a single-quoted string, double quotes and backslashes are
155f7e6344dSDag-Erling Smørgrav  *    preserved as-is.
156f7e6344dSDag-Erling Smørgrav  *
157f7e6344dSDag-Erling Smørgrav  *  - Within a double-quoted string, a single quote is preserved as-is,
158f7e6344dSDag-Erling Smørgrav  *    and a backslash is preserved as-is unless used to escape a double
159f7e6344dSDag-Erling Smørgrav  *    quote.
160f7e6344dSDag-Erling Smørgrav  *
161f7e6344dSDag-Erling Smørgrav  * In addition, if the first non-whitespace character on the line is a
162f7e6344dSDag-Erling Smørgrav  * hash character (#), the rest of the line is discarded.
163f7e6344dSDag-Erling Smørgrav  * If a hash character occurs within a word, however, it is preserved
164f7e6344dSDag-Erling Smørgrav  * as-is.
165f7e6344dSDag-Erling Smørgrav  * A backslash at the end of a comment does not cause line continuation.
166f7e6344dSDag-Erling Smørgrav  *
167f7e6344dSDag-Erling Smørgrav  * If =lineno is not =NULL, the integer variable it points to is
168f7e6344dSDag-Erling Smørgrav  * incremented every time a quoted or escaped newline character is read.
169f7e6344dSDag-Erling Smørgrav  *
170f7e6344dSDag-Erling Smørgrav  * If =lenp is not =NULL, the length of the word (after quotes and
171f7e6344dSDag-Erling Smørgrav  * backslashes have been removed) is stored in the variable it points to.
172f7e6344dSDag-Erling Smørgrav  *
173f7e6344dSDag-Erling Smørgrav  * RETURN VALUES
174f7e6344dSDag-Erling Smørgrav  *
175f7e6344dSDag-Erling Smørgrav  * If successful, the =openpam_readword function returns a pointer to a
176f7e6344dSDag-Erling Smørgrav  * dynamically allocated NUL-terminated string containing the first word
177f7e6344dSDag-Erling Smørgrav  * encountered on the line.
178f7e6344dSDag-Erling Smørgrav  *
179f7e6344dSDag-Erling Smørgrav  * The caller is responsible for releasing the returned buffer by passing
180f7e6344dSDag-Erling Smørgrav  * it to =!free.
181f7e6344dSDag-Erling Smørgrav  *
182f7e6344dSDag-Erling Smørgrav  * If =openpam_readword reaches the end of the line or file before any
183f7e6344dSDag-Erling Smørgrav  * characters are copied to the word, it returns =NULL.  In the former
184f7e6344dSDag-Erling Smørgrav  * case, the newline is pushed back to the file.
185f7e6344dSDag-Erling Smørgrav  *
186f7e6344dSDag-Erling Smørgrav  * If =openpam_readword reaches the end of the file while a quote or
187f7e6344dSDag-Erling Smørgrav  * backslash escape is in effect, it sets :errno to =EINVAL and returns
188f7e6344dSDag-Erling Smørgrav  * =NULL.
189f7e6344dSDag-Erling Smørgrav  *
190f7e6344dSDag-Erling Smørgrav  * IMPLEMENTATION NOTES
191f7e6344dSDag-Erling Smørgrav  *
192f7e6344dSDag-Erling Smørgrav  * The parsing rules are intended to be equivalent to the normal POSIX
193f7e6344dSDag-Erling Smørgrav  * shell quoting rules.
194f7e6344dSDag-Erling Smørgrav  * Any discrepancy is a bug and should be reported to the author along
195f7e6344dSDag-Erling Smørgrav  * with sample input that can be used to reproduce the error.
196f7e6344dSDag-Erling Smørgrav  *
197f7e6344dSDag-Erling Smørgrav  * >openpam_readline
198f7e6344dSDag-Erling Smørgrav  * >openpam_readlinev
199f7e6344dSDag-Erling Smørgrav  *
200f7e6344dSDag-Erling Smørgrav  * AUTHOR DES
201f7e6344dSDag-Erling Smørgrav  */
202