xref: /freebsd/lib/libc/gen/wordexp.c (revision 842ad8ac0b5cb0989b9580d6af84bb97571aa701)
/*-
 * Copyright (c) 2002 Tim J. Robbins.
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */
26faea1495STim J. Robbins 
27faea1495STim J. Robbins #include "namespace.h"
28faea1495STim J. Robbins #include <sys/cdefs.h>
29faea1495STim J. Robbins #include <sys/types.h>
30faea1495STim J. Robbins #include <sys/wait.h>
31364e9ccbSJilles Tjoelker #include <errno.h>
32faea1495STim J. Robbins #include <fcntl.h>
33faea1495STim J. Robbins #include <paths.h>
34364e9ccbSJilles Tjoelker #include <signal.h>
35faea1495STim J. Robbins #include <stdio.h>
36faea1495STim J. Robbins #include <stdlib.h>
37faea1495STim J. Robbins #include <string.h>
38faea1495STim J. Robbins #include <unistd.h>
39faea1495STim J. Robbins #include <wordexp.h>
40faea1495STim J. Robbins #include "un-namespace.h"
41faea1495STim J. Robbins 
42faea1495STim J. Robbins __FBSDID("$FreeBSD$");
43faea1495STim J. Robbins 
/* Helpers private to this file; both return 0 or a WRDE_* error code. */
static int	we_check(const char *, int);
static int	we_askshell(const char *, wordexp_t *, int);
46faea1495STim J. Robbins 
47faea1495STim J. Robbins /*
48faea1495STim J. Robbins  * wordexp --
49faea1495STim J. Robbins  *	Perform shell word expansion on `words' and place the resulting list
50faea1495STim J. Robbins  *	of words in `we'. See wordexp(3).
51faea1495STim J. Robbins  *
52faea1495STim J. Robbins  *	Specified by IEEE Std. 1003.1-2001.
53faea1495STim J. Robbins  */
54faea1495STim J. Robbins int
55faea1495STim J. Robbins wordexp(const char * __restrict words, wordexp_t * __restrict we, int flags)
56faea1495STim J. Robbins {
57faea1495STim J. Robbins 	int error;
58faea1495STim J. Robbins 
59faea1495STim J. Robbins 	if (flags & WRDE_REUSE)
60faea1495STim J. Robbins 		wordfree(we);
61faea1495STim J. Robbins 	if ((flags & WRDE_APPEND) == 0) {
62faea1495STim J. Robbins 		we->we_wordc = 0;
63faea1495STim J. Robbins 		we->we_wordv = NULL;
64faea1495STim J. Robbins 		we->we_strings = NULL;
65faea1495STim J. Robbins 		we->we_nbytes = 0;
66faea1495STim J. Robbins 	}
67faea1495STim J. Robbins 	if ((error = we_check(words, flags)) != 0) {
68faea1495STim J. Robbins 		wordfree(we);
69faea1495STim J. Robbins 		return (error);
70faea1495STim J. Robbins 	}
71faea1495STim J. Robbins 	if ((error = we_askshell(words, we, flags)) != 0) {
72faea1495STim J. Robbins 		wordfree(we);
73faea1495STim J. Robbins 		return (error);
74faea1495STim J. Robbins 	}
75faea1495STim J. Robbins 	return (0);
76faea1495STim J. Robbins }
77faea1495STim J. Robbins 
/*
 * we_read_fully --
 *	Read from `fd' into `buffer' until `len' bytes have been stored,
 *	a read returns 0, or a read fails with an error other than EINTR
 *	(interrupted reads are retried).  Returns the number of bytes
 *	stored, which is smaller than `len' when the loop stopped early.
 */
static size_t
we_read_fully(int fd, char *buffer, size_t len)
{
	size_t total;
	ssize_t n;

	total = 0;
	for (;;) {
		n = _read(fd, buffer + total, len - total);
		if (n > 0) {
			total += n;
		} else if (n != -1 || errno != EINTR) {
			/* End of input or a genuine read error. */
			break;
		}
		if (total == len)
			break;
	}
	return (total);
}
95364e9ccbSJilles Tjoelker 
96faea1495STim J. Robbins /*
97faea1495STim J. Robbins  * we_askshell --
98faea1495STim J. Robbins  *	Use the `wordexp' /bin/sh builtin function to do most of the work
99faea1495STim J. Robbins  *	in expanding the word string. This function is complicated by
100faea1495STim J. Robbins  *	memory management.
101faea1495STim J. Robbins  */
102faea1495STim J. Robbins static int
103faea1495STim J. Robbins we_askshell(const char *words, wordexp_t *we, int flags)
104faea1495STim J. Robbins {
105faea1495STim J. Robbins 	int pdes[2];			/* Pipe to child */
106faea1495STim J. Robbins 	char bbuf[9];			/* Buffer for byte count */
107faea1495STim J. Robbins 	char wbuf[9];			/* Buffer for word count */
108faea1495STim J. Robbins 	long nwords, nbytes;		/* Number of words, bytes from child */
109faea1495STim J. Robbins 	long i;				/* Handy integer */
110faea1495STim J. Robbins 	size_t sofs;			/* Offset into we->we_strings */
111faea1495STim J. Robbins 	size_t vofs;			/* Offset into we->we_wordv */
112faea1495STim J. Robbins 	pid_t pid;			/* Process ID of child */
113364e9ccbSJilles Tjoelker 	pid_t wpid;			/* waitpid return value */
114faea1495STim J. Robbins 	int status;			/* Child exit status */
115364e9ccbSJilles Tjoelker 	int error;			/* Our return value */
116364e9ccbSJilles Tjoelker 	int serrno;			/* errno to return */
117faea1495STim J. Robbins 	char *np, *p;			/* Handy pointers */
118faea1495STim J. Robbins 	char *nstrings;			/* Temporary for realloc() */
119faea1495STim J. Robbins 	char **nwv;			/* Temporary for realloc() */
120364e9ccbSJilles Tjoelker 	sigset_t newsigblock, oldsigblock;
1212f61288cSJilles Tjoelker 	const char *ifs;
122faea1495STim J. Robbins 
123364e9ccbSJilles Tjoelker 	serrno = errno;
1242f61288cSJilles Tjoelker 	ifs = getenv("IFS");
125faea1495STim J. Robbins 
126f6d7148dSJilles Tjoelker 	if (pipe2(pdes, O_CLOEXEC) < 0)
127faea1495STim J. Robbins 		return (WRDE_NOSPACE);	/* XXX */
128364e9ccbSJilles Tjoelker 	(void)sigemptyset(&newsigblock);
129364e9ccbSJilles Tjoelker 	(void)sigaddset(&newsigblock, SIGCHLD);
130364e9ccbSJilles Tjoelker 	(void)_sigprocmask(SIG_BLOCK, &newsigblock, &oldsigblock);
131faea1495STim J. Robbins 	if ((pid = fork()) < 0) {
132364e9ccbSJilles Tjoelker 		serrno = errno;
1332005f192STim J. Robbins 		_close(pdes[0]);
1342005f192STim J. Robbins 		_close(pdes[1]);
135364e9ccbSJilles Tjoelker 		(void)_sigprocmask(SIG_SETMASK, &oldsigblock, NULL);
136364e9ccbSJilles Tjoelker 		errno = serrno;
137faea1495STim J. Robbins 		return (WRDE_NOSPACE);	/* XXX */
138faea1495STim J. Robbins 	}
139faea1495STim J. Robbins 	else if (pid == 0) {
140faea1495STim J. Robbins 		/*
141*842ad8acSJilles Tjoelker 		 * We are the child; make /bin/sh expand `words'.
142faea1495STim J. Robbins 		 */
143364e9ccbSJilles Tjoelker 		(void)_sigprocmask(SIG_SETMASK, &oldsigblock, NULL);
144f6d7148dSJilles Tjoelker 		if ((pdes[1] != STDOUT_FILENO ?
145f6d7148dSJilles Tjoelker 		    _dup2(pdes[1], STDOUT_FILENO) :
146f6d7148dSJilles Tjoelker 		    _fcntl(pdes[1], F_SETFD, 0)) < 0)
147faea1495STim J. Robbins 			_exit(1);
148faea1495STim J. Robbins 		execl(_PATH_BSHELL, "sh", flags & WRDE_UNDEF ? "-u" : "+u",
149*842ad8acSJilles Tjoelker 		    "-c", "IFS=$1;eval \"$2\";eval \"set -- $3\";IFS=;a=\"$*\";"
150*842ad8acSJilles Tjoelker 		    "printf '%08x' \"$#\" \"${#a}\";printf '%s\\0' \"$@\"",
151*842ad8acSJilles Tjoelker 		    "",
1522f61288cSJilles Tjoelker 		    ifs != NULL ? ifs : " \t\n",
153ae4c676cSJilles Tjoelker 		    flags & WRDE_SHOWERR ? "" : "exec 2>/dev/null", words,
154ae4c676cSJilles Tjoelker 		    (char *)NULL);
155faea1495STim J. Robbins 		_exit(1);
156faea1495STim J. Robbins 	}
157faea1495STim J. Robbins 
158faea1495STim J. Robbins 	/*
159faea1495STim J. Robbins 	 * We are the parent; read the output of the shell wordexp function,
160faea1495STim J. Robbins 	 * which is a 32-bit hexadecimal word count, a 32-bit hexadecimal
161faea1495STim J. Robbins 	 * byte count (not including terminating null bytes), followed by
162faea1495STim J. Robbins 	 * the expanded words separated by nulls.
163faea1495STim J. Robbins 	 */
1642005f192STim J. Robbins 	_close(pdes[1]);
165364e9ccbSJilles Tjoelker 	if (we_read_fully(pdes[0], wbuf, 8) != 8 ||
166364e9ccbSJilles Tjoelker 			we_read_fully(pdes[0], bbuf, 8) != 8) {
167364e9ccbSJilles Tjoelker 		error = flags & WRDE_UNDEF ? WRDE_BADVAL : WRDE_SYNTAX;
168364e9ccbSJilles Tjoelker 		serrno = errno;
169364e9ccbSJilles Tjoelker 		goto cleanup;
170faea1495STim J. Robbins 	}
171faea1495STim J. Robbins 	wbuf[8] = bbuf[8] = '\0';
172faea1495STim J. Robbins 	nwords = strtol(wbuf, NULL, 16);
173faea1495STim J. Robbins 	nbytes = strtol(bbuf, NULL, 16) + nwords;
174faea1495STim J. Robbins 
175faea1495STim J. Robbins 	/*
176faea1495STim J. Robbins 	 * Allocate or reallocate (when flags & WRDE_APPEND) the word vector
177faea1495STim J. Robbins 	 * and string storage buffers for the expanded words we're about to
178faea1495STim J. Robbins 	 * read from the child.
179faea1495STim J. Robbins 	 */
180faea1495STim J. Robbins 	sofs = we->we_nbytes;
181faea1495STim J. Robbins 	vofs = we->we_wordc;
182b7114d4aSTim J. Robbins 	if ((flags & (WRDE_DOOFFS|WRDE_APPEND)) == (WRDE_DOOFFS|WRDE_APPEND))
183fe634ca7STim J. Robbins 		vofs += we->we_offs;
184faea1495STim J. Robbins 	we->we_wordc += nwords;
185faea1495STim J. Robbins 	we->we_nbytes += nbytes;
186faea1495STim J. Robbins 	if ((nwv = realloc(we->we_wordv, (we->we_wordc + 1 +
187b7114d4aSTim J. Robbins 	    (flags & WRDE_DOOFFS ?  we->we_offs : 0)) *
188faea1495STim J. Robbins 	    sizeof(char *))) == NULL) {
189364e9ccbSJilles Tjoelker 		error = WRDE_NOSPACE;
190364e9ccbSJilles Tjoelker 		goto cleanup;
191faea1495STim J. Robbins 	}
192faea1495STim J. Robbins 	we->we_wordv = nwv;
193faea1495STim J. Robbins 	if ((nstrings = realloc(we->we_strings, we->we_nbytes)) == NULL) {
194364e9ccbSJilles Tjoelker 		error = WRDE_NOSPACE;
195364e9ccbSJilles Tjoelker 		goto cleanup;
196faea1495STim J. Robbins 	}
197faea1495STim J. Robbins 	for (i = 0; i < vofs; i++)
198faea1495STim J. Robbins 		if (we->we_wordv[i] != NULL)
199faea1495STim J. Robbins 			we->we_wordv[i] += nstrings - we->we_strings;
200faea1495STim J. Robbins 	we->we_strings = nstrings;
201faea1495STim J. Robbins 
202364e9ccbSJilles Tjoelker 	if (we_read_fully(pdes[0], we->we_strings + sofs, nbytes) != nbytes) {
203364e9ccbSJilles Tjoelker 		error = flags & WRDE_UNDEF ? WRDE_BADVAL : WRDE_SYNTAX;
204364e9ccbSJilles Tjoelker 		serrno = errno;
205364e9ccbSJilles Tjoelker 		goto cleanup;
206faea1495STim J. Robbins 	}
207faea1495STim J. Robbins 
208364e9ccbSJilles Tjoelker 	error = 0;
209364e9ccbSJilles Tjoelker cleanup:
2102005f192STim J. Robbins 	_close(pdes[0]);
211364e9ccbSJilles Tjoelker 	do
212364e9ccbSJilles Tjoelker 		wpid = _waitpid(pid, &status, 0);
213364e9ccbSJilles Tjoelker 	while (wpid < 0 && errno == EINTR);
214364e9ccbSJilles Tjoelker 	(void)_sigprocmask(SIG_SETMASK, &oldsigblock, NULL);
215364e9ccbSJilles Tjoelker 	if (error != 0) {
216364e9ccbSJilles Tjoelker 		errno = serrno;
217364e9ccbSJilles Tjoelker 		return (error);
218faea1495STim J. Robbins 	}
219364e9ccbSJilles Tjoelker 	if (wpid < 0 || !WIFEXITED(status) || WEXITSTATUS(status) != 0)
220364e9ccbSJilles Tjoelker 		return (flags & WRDE_UNDEF ? WRDE_BADVAL : WRDE_SYNTAX);
221faea1495STim J. Robbins 
222faea1495STim J. Robbins 	/*
223faea1495STim J. Robbins 	 * Break the null-terminated expanded word strings out into
224faea1495STim J. Robbins 	 * the vector.
225faea1495STim J. Robbins 	 */
226b7114d4aSTim J. Robbins 	if (vofs == 0 && flags & WRDE_DOOFFS)
227faea1495STim J. Robbins 		while (vofs < we->we_offs)
228faea1495STim J. Robbins 			we->we_wordv[vofs++] = NULL;
229faea1495STim J. Robbins 	p = we->we_strings + sofs;
230faea1495STim J. Robbins 	while (nwords-- != 0) {
231faea1495STim J. Robbins 		we->we_wordv[vofs++] = p;
232faea1495STim J. Robbins 		if ((np = memchr(p, '\0', nbytes)) == NULL)
233faea1495STim J. Robbins 			return (WRDE_NOSPACE);	/* XXX */
234faea1495STim J. Robbins 		nbytes -= np - p + 1;
235faea1495STim J. Robbins 		p = np + 1;
236faea1495STim J. Robbins 	}
237faea1495STim J. Robbins 	we->we_wordv[vofs] = NULL;
238faea1495STim J. Robbins 
239faea1495STim J. Robbins 	return (0);
240faea1495STim J. Robbins }
241faea1495STim J. Robbins 
/*
 * we_check --
 *	Screen `words' before it is handed to the shell.  Returns
 *	WRDE_BADCHAR if the string contains one of the following unquoted
 *	special characters: <newline> |&;<>(){}
 *	WRDE_CMDSUB if it contains a command substitution while WRDE_NOCMD
 *	is set in flags, WRDE_SYNTAX if quoting is left open or a `...`,
 *	$(...) or ${...} construct is not terminated, and 0 otherwise.
 *
 *	This is a simple scanner, not the shell's parser.  Inside ${...}
 *	and $((...)) quoting other than backslash is not tracked, so with
 *	WRDE_NOCMD any unescaped backquote or `$(' found there is rejected,
 *	even if the shell would have treated it as quoted text.
 */
static int
we_check(const char *words, int flags)
{
	char c, closech, opench;
	int dquote, level, nocmd, quote, squote;

	nocmd = (flags & WRDE_NOCMD) != 0;
	quote = squote = dquote = 0;
	while ((c = *words++) != '\0') {
		switch (c) {
		case '\\':
			/* Quotes the next character, except inside '...'. */
			if (squote == 0)
				quote ^= 1;
			continue;
		case '\'':
			if (quote + dquote == 0)
				squote ^= 1;
			break;
		case '"':
			if (quote + squote == 0)
				dquote ^= 1;
			break;
		case '`':
			/*
			 * A backquote quoted by a backslash or by single
			 * quotes is an ordinary character; do not go looking
			 * for its partner.
			 */
			if (quote + squote != 0)
				break;
			if (nocmd)
				return (WRDE_CMDSUB);
			/* Skip to the closing backquote, honouring \x. */
			while ((c = *words++) != '\0' && c != '`')
				if (c == '\\' && (c = *words++) == '\0')
					break;
			if (c == '\0')
				return (WRDE_SYNTAX);
			break;
		case '|': case '&': case ';': case '<': case '>':
		case '{': case '}': case '(': case ')': case '\n':
			if (quote + squote + dquote == 0)
				return (WRDE_BADCHAR);
			break;
		case '$':
			/*
			 * Only an unquoted `$(' or `${' needs special care.
			 * Peek at the next character instead of consuming
			 * it, so that a `$' at the very end of the string
			 * never steps over the terminating NUL.
			 */
			if (quote + squote != 0 ||
			    (*words != '(' && *words != '{'))
				break;
			opench = *words++;
			closech = opench == '(' ? ')' : '}';
			/* `$((' is arithmetic; a lone `$(' runs a command. */
			if (nocmd && opench == '(' && *words != '(')
				return (WRDE_CMDSUB);
			/*
			 * Skip to the matching close character.  The shell
			 * still expands what is in between, so with
			 * WRDE_NOCMD a nested command substitution has to be
			 * rejected here as well.
			 */
			level = 1;
			while ((c = *words++) != '\0') {
				if (c == '\\') {
					if ((c = *words++) == '\0')
						break;
				} else if (nocmd && (c == '`' || (c == '$' &&
				    words[0] == '(' && words[1] != '('))) {
					return (WRDE_CMDSUB);
				} else if (c == opench)
					level++;
				else if (c == closech && --level == 0)
					break;
			}
			if (c == '\0' || level != 0)
				return (WRDE_SYNTAX);
			break;
		default:
			break;
		}
		/* A backslash only quotes the one character after it. */
		quote = 0;
	}
	if (quote + squote + dquote != 0)
		return (WRDE_SYNTAX);

	return (0);
}
327faea1495STim J. Robbins 
328faea1495STim J. Robbins /*
329faea1495STim J. Robbins  * wordfree --
330faea1495STim J. Robbins  *	Free the result of wordexp(). See wordexp(3).
331faea1495STim J. Robbins  *
332faea1495STim J. Robbins  *	Specified by IEEE Std. 1003.1-2001.
333faea1495STim J. Robbins  */
334faea1495STim J. Robbins void
335faea1495STim J. Robbins wordfree(wordexp_t *we)
336faea1495STim J. Robbins {
337faea1495STim J. Robbins 
338faea1495STim J. Robbins 	if (we == NULL)
339faea1495STim J. Robbins 		return;
340faea1495STim J. Robbins 	free(we->we_wordv);
341faea1495STim J. Robbins 	free(we->we_strings);
342faea1495STim J. Robbins 	we->we_wordv = NULL;
343faea1495STim J. Robbins 	we->we_strings = NULL;
344faea1495STim J. Robbins 	we->we_nbytes = 0;
345faea1495STim J. Robbins 	we->we_wordc = 0;
346faea1495STim J. Robbins }
347