xref: /freebsd/contrib/file/src/compress.c (revision 40427cca7a9ae77b095936fb1954417c290cfb17)
1b6cee71dSXin LI /*
2b6cee71dSXin LI  * Copyright (c) Ian F. Darwin 1986-1995.
3b6cee71dSXin LI  * Software written by Ian F. Darwin and others;
4b6cee71dSXin LI  * maintained 1995-present by Christos Zoulas and others.
5b6cee71dSXin LI  *
6b6cee71dSXin LI  * Redistribution and use in source and binary forms, with or without
7b6cee71dSXin LI  * modification, are permitted provided that the following conditions
8b6cee71dSXin LI  * are met:
9b6cee71dSXin LI  * 1. Redistributions of source code must retain the above copyright
10b6cee71dSXin LI  *    notice immediately at the beginning of the file, without modification,
11b6cee71dSXin LI  *    this list of conditions, and the following disclaimer.
12b6cee71dSXin LI  * 2. Redistributions in binary form must reproduce the above copyright
13b6cee71dSXin LI  *    notice, this list of conditions and the following disclaimer in the
14b6cee71dSXin LI  *    documentation and/or other materials provided with the distribution.
15b6cee71dSXin LI  *
16b6cee71dSXin LI  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
17b6cee71dSXin LI  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18b6cee71dSXin LI  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19b6cee71dSXin LI  * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE FOR
20b6cee71dSXin LI  * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
21b6cee71dSXin LI  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
22b6cee71dSXin LI  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
23b6cee71dSXin LI  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
24b6cee71dSXin LI  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
25b6cee71dSXin LI  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26b6cee71dSXin LI  * SUCH DAMAGE.
27b6cee71dSXin LI  */
/*
 * compress routines:
 *	file_zmagic() - returns 0 if not recognized, uncompresses and prints
 *			information if recognized (1), or -1 on error
 *	uncompressbuf(fd, bytes_max, method, old, newch, n) - uncompress old
 *			into *newch using method, store the size of the
 *			result in *n and return OKDATA, NODATA or ERRDATA
 */
35b6cee71dSXin LI #include "file.h"
36b6cee71dSXin LI 
37b6cee71dSXin LI #ifndef lint
38*40427ccaSGordon Tetlow FILE_RCSID("@(#)$File: compress.c,v 1.105 2017/05/25 00:13:03 christos Exp $")
39b6cee71dSXin LI #endif
40b6cee71dSXin LI 
41b6cee71dSXin LI #include "magic.h"
42b6cee71dSXin LI #include <stdlib.h>
43b6cee71dSXin LI #ifdef HAVE_UNISTD_H
44b6cee71dSXin LI #include <unistd.h>
45b6cee71dSXin LI #endif
46b6cee71dSXin LI #include <string.h>
47b6cee71dSXin LI #include <errno.h>
483e41d09dSXin LI #include <ctype.h>
493e41d09dSXin LI #include <stdarg.h>
505f0216bdSXin LI #ifdef HAVE_SIGNAL_H
514460e5b0SXin LI #include <signal.h>
525f0216bdSXin LI # ifndef HAVE_SIG_T
535f0216bdSXin LI typedef void (*sig_t)(int);
545f0216bdSXin LI # endif /* HAVE_SIG_T */
555f0216bdSXin LI #endif
56c2931133SXin LI #if !defined(__MINGW32__) && !defined(WIN32)
57b6cee71dSXin LI #include <sys/ioctl.h>
58b6cee71dSXin LI #endif
59b6cee71dSXin LI #ifdef HAVE_SYS_WAIT_H
60b6cee71dSXin LI #include <sys/wait.h>
61b6cee71dSXin LI #endif
62b6cee71dSXin LI #if defined(HAVE_SYS_TIME_H)
63b6cee71dSXin LI #include <sys/time.h>
64b6cee71dSXin LI #endif
65*40427ccaSGordon Tetlow #if defined(HAVE_ZLIB_H) && defined(ZLIBSUPPORT)
66b6cee71dSXin LI #define BUILTIN_DECOMPRESS
67b6cee71dSXin LI #include <zlib.h>
683e41d09dSXin LI #endif
#ifdef DEBUG
/*
 * Debug tracing.  With DEBUG defined, DPRINTF() formats its arguments
 * printf-style and writes them to /dev/tty, which is opened on first use
 * and cached in `tty'; the process aborts if the terminal cannot be
 * opened.  Without DEBUG, DPRINTF() expands to nothing, so its arguments
 * are never evaluated.
 */
int tty = -1;
#define DPRINTF(...)	do { \
	if (tty == -1) \
		tty = open("/dev/tty", O_RDWR); \
	if (tty == -1) \
		abort(); \
	dprintf(tty, __VA_ARGS__); \
} while (/*CONSTCOND*/0)
#else
#define DPRINTF(...)
#endif
81b6cee71dSXin LI 
823e41d09dSXin LI #ifdef ZLIBSUPPORT
833e41d09dSXin LI /*
843e41d09dSXin LI  * The following python code is not really used because ZLIBSUPPORT is only
853e41d09dSXin LI  * defined if we have a built-in zlib, and the built-in zlib handles that.
86*40427ccaSGordon Tetlow  * That is not true for android where we have zlib.h and not -lz.
873e41d09dSXin LI  */
/* Python one-liner that inflates a zlib stream from stdin to stdout. */
static const char zlibcode[] =
    "import sys, zlib; sys.stdout.write(zlib.decompress(sys.stdin.read()))";

/* argv used to run the one-liner above as an external decompressor. */
static const char *zlib_args[] = {
	"python",
	"-c",
	zlibcode,
	NULL
};
923e41d09dSXin LI 
/*
 * Check whether buf starts with a plausible zlib (RFC 1950) stream header.
 *
 * buf must point to at least two readable bytes: CMF followed by FLG.
 * Returns 1 when the compression method is deflate (8), the top bit of
 * the window-size field is clear (CINFO <= 7) and the header check value
 * is valid; returns 0 otherwise.
 */
static int
zlibcmp(const unsigned char *buf)
{
	unsigned int header;

	/* CM (low nibble of CMF) must be 8 and CINFO must not exceed 7. */
	if ((buf[0] & 0xf) != 8 || (buf[0] & 0x80) != 0)
		return 0;

	/*
	 * RFC 1950: CMF * 256 + FLG must be a multiple of 31.  The value is
	 * assembled arithmetically, so it is the same on every host; no
	 * byte-order test is needed (swapping the bytes on big-endian hosts
	 * made valid headers fail the check).
	 */
	header = ((unsigned int)buf[0] << 8) | buf[1];
	if (header % 31 != 0)
		return 0;
	return 1;
}
1093e41d09dSXin LI #endif
1103e41d09dSXin LI 
/* Command-line flags shared between the decompressor argv tables below. */
#define gzip_flags "-cd"
#define lrzip_flags "-do"
#define lzip_flags gzip_flags

/*
 * NULL-terminated argv vectors, one per external decompressor.  They are
 * referenced from the compr[] table and passed to execvp().
 */
static const char *gzip_args[] = { "gzip", gzip_flags, NULL };
static const char *uncompress_args[] = { "uncompress", "-c", NULL };
static const char *bzip2_args[] = { "bzip2", "-cd", NULL };
static const char *lzip_args[] = { "lzip", lzip_flags, NULL };
static const char *xz_args[] = { "xz", "-cd", NULL };
static const char *lrzip_args[] = { "lrzip", lrzip_flags, NULL };
static const char *lz4_args[] = { "lz4", "-cd", NULL };
static const char *zstd_args[] = { "zstd", "-cd", NULL };
139b6cee71dSXin LI 
1403e41d09dSXin LI private const struct {
1413e41d09dSXin LI 	const void *magic;
1423e41d09dSXin LI 	size_t maglen;
1433e41d09dSXin LI 	const char **argv;
1443e41d09dSXin LI } compr[] = {
1453e41d09dSXin LI 	{ "\037\235",	2, gzip_args },		/* compressed */
1463e41d09dSXin LI 	/* Uncompress can get stuck; so use gzip first if we have it
1473e41d09dSXin LI 	 * Idea from Damien Clark, thanks! */
1483e41d09dSXin LI 	{ "\037\235",	2, uncompress_args },	/* compressed */
1493e41d09dSXin LI 	{ "\037\213",	2, gzip_args },		/* gzipped */
1503e41d09dSXin LI 	{ "\037\236",	2, gzip_args },		/* frozen */
1513e41d09dSXin LI 	{ "\037\240",	2, gzip_args },		/* SCO LZH */
1523e41d09dSXin LI 	/* the standard pack utilities do not accept standard input */
1533e41d09dSXin LI 	{ "\037\036",	2, gzip_args },		/* packed */
1543e41d09dSXin LI 	{ "PK\3\4",	4, gzip_args },		/* pkzipped, */
1553e41d09dSXin LI 	/* ...only first file examined */
1563e41d09dSXin LI 	{ "BZh",	3, bzip2_args },	/* bzip2-ed */
1573e41d09dSXin LI 	{ "LZIP",	4, lzip_args },		/* lzip-ed */
1583e41d09dSXin LI  	{ "\3757zXZ\0",	6, xz_args },		/* XZ Utils */
1593e41d09dSXin LI  	{ "LRZI",	4, lrzip_args },	/* LRZIP */
1603e41d09dSXin LI  	{ "\004\"M\030",4, lz4_args },		/* LZ4 */
161a5d223e6SXin LI  	{ "\x28\xB5\x2F\xFD", 4, zstd_args },	/* zstd */
1623e41d09dSXin LI #ifdef ZLIBSUPPORT
163a5d223e6SXin LI 	{ RCAST(const void *, zlibcmp),	0, zlib_args },		/* zlib */
1643e41d09dSXin LI #endif
1653e41d09dSXin LI };
1663e41d09dSXin LI 
/* Result codes produced by uncompressbuf() and the helpers it calls. */
enum {
	OKDATA	= 0,	/* the output buffer holds decompressed data */
	NODATA	= 1,	/* nothing was produced for this method */
	ERRDATA	= 2	/* the output buffer holds an error message */
};
170b6cee71dSXin LI 
171b6cee71dSXin LI private ssize_t swrite(int, const void *, size_t);
172b6cee71dSXin LI #if HAVE_FORK
173b6cee71dSXin LI private size_t ncompr = sizeof(compr) / sizeof(compr[0]);
1743e41d09dSXin LI private int uncompressbuf(int, size_t, size_t, const unsigned char *,
1753e41d09dSXin LI     unsigned char **, size_t *);
176b6cee71dSXin LI #ifdef BUILTIN_DECOMPRESS
1773e41d09dSXin LI private int uncompresszlib(const unsigned char *, unsigned char **, size_t,
1783e41d09dSXin LI     size_t *, int);
1793e41d09dSXin LI private int uncompressgzipped(const unsigned char *, unsigned char **, size_t,
1803e41d09dSXin LI     size_t *);
181b6cee71dSXin LI #endif
1823e41d09dSXin LI static int makeerror(unsigned char **, size_t *, const char *, ...)
1833e41d09dSXin LI     __attribute__((__format__(__printf__, 3, 4)));
1843e41d09dSXin LI private const char *methodname(size_t);
185b6cee71dSXin LI 
186b6cee71dSXin LI protected int
187b6cee71dSXin LI file_zmagic(struct magic_set *ms, int fd, const char *name,
188b6cee71dSXin LI     const unsigned char *buf, size_t nbytes)
189b6cee71dSXin LI {
190b6cee71dSXin LI 	unsigned char *newbuf = NULL;
191b6cee71dSXin LI 	size_t i, nsz;
1923e41d09dSXin LI 	char *rbuf;
1933e41d09dSXin LI 	file_pushbuf_t *pb;
19420f8619dSXin LI 	int urv, prv, rv = 0;
195b6cee71dSXin LI 	int mime = ms->flags & MAGIC_MIME;
1965f0216bdSXin LI #ifdef HAVE_SIGNAL_H
1974460e5b0SXin LI 	sig_t osigpipe;
1985f0216bdSXin LI #endif
199b6cee71dSXin LI 
200b6cee71dSXin LI 	if ((ms->flags & MAGIC_COMPRESS) == 0)
201b6cee71dSXin LI 		return 0;
202b6cee71dSXin LI 
2035f0216bdSXin LI #ifdef HAVE_SIGNAL_H
2044460e5b0SXin LI 	osigpipe = signal(SIGPIPE, SIG_IGN);
2055f0216bdSXin LI #endif
206b6cee71dSXin LI 	for (i = 0; i < ncompr; i++) {
2073e41d09dSXin LI 		int zm;
208b6cee71dSXin LI 		if (nbytes < compr[i].maglen)
209b6cee71dSXin LI 			continue;
2103e41d09dSXin LI #ifdef ZLIBSUPPORT
2113e41d09dSXin LI 		if (compr[i].maglen == 0)
212a5d223e6SXin LI 			zm = (RCAST(int (*)(const unsigned char *),
2133e41d09dSXin LI 			    CCAST(void *, compr[i].magic)))(buf);
2143e41d09dSXin LI 		else
2153e41d09dSXin LI #endif
2163e41d09dSXin LI 			zm = memcmp(buf, compr[i].magic, compr[i].maglen) == 0;
217b6cee71dSXin LI 
2183e41d09dSXin LI 		if (!zm)
2193e41d09dSXin LI 			continue;
2203e41d09dSXin LI 		nsz = nbytes;
22120f8619dSXin LI 		urv = uncompressbuf(fd, ms->bytes_max, i, buf, &newbuf, &nsz);
22220f8619dSXin LI 		DPRINTF("uncompressbuf = %d, %s, %zu\n", urv, (char *)newbuf,
2233e41d09dSXin LI 		    nsz);
22420f8619dSXin LI 		switch (urv) {
2253e41d09dSXin LI 		case OKDATA:
2263e41d09dSXin LI 		case ERRDATA:
2273e41d09dSXin LI 
2283e41d09dSXin LI 			ms->flags &= ~MAGIC_COMPRESS;
22920f8619dSXin LI 			if (urv == ERRDATA)
23020f8619dSXin LI 				prv = file_printf(ms, "%s ERROR: %s",
2313e41d09dSXin LI 				    methodname(i), newbuf);
2323e41d09dSXin LI 			else
23320f8619dSXin LI 				prv = file_buffer(ms, -1, name, newbuf, nsz);
23420f8619dSXin LI 			if (prv == -1)
2353e41d09dSXin LI 				goto error;
23620f8619dSXin LI 			rv = 1;
2373e41d09dSXin LI 			if ((ms->flags & MAGIC_COMPRESS_TRANSP) != 0)
2383e41d09dSXin LI 				goto out;
2393e41d09dSXin LI 			if (mime != MAGIC_MIME && mime != 0)
2403e41d09dSXin LI 				goto out;
2413e41d09dSXin LI 			if ((file_printf(ms,
2423e41d09dSXin LI 			    mime ? " compressed-encoding=" : " (")) == -1)
2433e41d09dSXin LI 				goto error;
2443e41d09dSXin LI 			if ((pb = file_push_buffer(ms)) == NULL)
245b6cee71dSXin LI 				goto error;
24620f8619dSXin LI 			/*
24720f8619dSXin LI 			 * XXX: If file_buffer fails here, we overwrite
24820f8619dSXin LI 			 * the compressed text. FIXME.
24920f8619dSXin LI 			 */
250b6cee71dSXin LI 			if (file_buffer(ms, -1, NULL, buf, nbytes) == -1)
251b6cee71dSXin LI 				goto error;
2523e41d09dSXin LI 			if ((rbuf = file_pop_buffer(ms, pb)) != NULL) {
2533e41d09dSXin LI 				if (file_printf(ms, "%s", rbuf) == -1) {
2543e41d09dSXin LI 					free(rbuf);
255b6cee71dSXin LI 					goto error;
256b6cee71dSXin LI 				}
2573e41d09dSXin LI 				free(rbuf);
2583e41d09dSXin LI 			}
2593e41d09dSXin LI 			if (!mime && file_printf(ms, ")") == -1)
2603e41d09dSXin LI 				goto error;
26120f8619dSXin LI 			/*FALLTHROUGH*/
2623e41d09dSXin LI 		case NODATA:
26320f8619dSXin LI 			break;
2643e41d09dSXin LI 		default:
2653e41d09dSXin LI 			abort();
26620f8619dSXin LI 			/*NOTREACHED*/
26720f8619dSXin LI 		error:
26820f8619dSXin LI 			rv = -1;
26920f8619dSXin LI 			break;
2703e41d09dSXin LI 		}
2713e41d09dSXin LI 	}
2723e41d09dSXin LI out:
27320f8619dSXin LI 	DPRINTF("rv = %d\n", rv);
27420f8619dSXin LI 
2755f0216bdSXin LI #ifdef HAVE_SIGNAL_H
2764460e5b0SXin LI 	(void)signal(SIGPIPE, osigpipe);
2775f0216bdSXin LI #endif
278b6cee71dSXin LI 	free(newbuf);
279b6cee71dSXin LI 	ms->flags |= MAGIC_COMPRESS;
2803e41d09dSXin LI 	DPRINTF("Zmagic returns %d\n", rv);
281b6cee71dSXin LI 	return rv;
282b6cee71dSXin LI }
283b6cee71dSXin LI #endif
284b6cee71dSXin LI /*
285b6cee71dSXin LI  * `safe' write for sockets and pipes.
286b6cee71dSXin LI  */
287b6cee71dSXin LI private ssize_t
288b6cee71dSXin LI swrite(int fd, const void *buf, size_t n)
289b6cee71dSXin LI {
290b6cee71dSXin LI 	ssize_t rv;
291b6cee71dSXin LI 	size_t rn = n;
292b6cee71dSXin LI 
293b6cee71dSXin LI 	do
294b6cee71dSXin LI 		switch (rv = write(fd, buf, n)) {
295b6cee71dSXin LI 		case -1:
296b6cee71dSXin LI 			if (errno == EINTR)
297b6cee71dSXin LI 				continue;
298b6cee71dSXin LI 			return -1;
299b6cee71dSXin LI 		default:
300b6cee71dSXin LI 			n -= rv;
301b6cee71dSXin LI 			buf = CAST(const char *, buf) + rv;
302b6cee71dSXin LI 			break;
303b6cee71dSXin LI 		}
304b6cee71dSXin LI 	while (n > 0);
305b6cee71dSXin LI 	return rn;
306b6cee71dSXin LI }
307b6cee71dSXin LI 
308b6cee71dSXin LI 
309b6cee71dSXin LI /*
310b6cee71dSXin LI  * `safe' read for sockets and pipes.
311b6cee71dSXin LI  */
312b6cee71dSXin LI protected ssize_t
313b6cee71dSXin LI sread(int fd, void *buf, size_t n, int canbepipe __attribute__((__unused__)))
314b6cee71dSXin LI {
315b6cee71dSXin LI 	ssize_t rv;
316b6cee71dSXin LI #ifdef FIONREAD
317b6cee71dSXin LI 	int t = 0;
318b6cee71dSXin LI #endif
319b6cee71dSXin LI 	size_t rn = n;
320b6cee71dSXin LI 
321b6cee71dSXin LI 	if (fd == STDIN_FILENO)
322b6cee71dSXin LI 		goto nocheck;
323b6cee71dSXin LI 
324b6cee71dSXin LI #ifdef FIONREAD
325b6cee71dSXin LI 	if (canbepipe && (ioctl(fd, FIONREAD, &t) == -1 || t == 0)) {
326b6cee71dSXin LI #ifdef FD_ZERO
327b6cee71dSXin LI 		ssize_t cnt;
328b6cee71dSXin LI 		for (cnt = 0;; cnt++) {
329b6cee71dSXin LI 			fd_set check;
330b6cee71dSXin LI 			struct timeval tout = {0, 100 * 1000};
331b6cee71dSXin LI 			int selrv;
332b6cee71dSXin LI 
333b6cee71dSXin LI 			FD_ZERO(&check);
334b6cee71dSXin LI 			FD_SET(fd, &check);
335b6cee71dSXin LI 
336b6cee71dSXin LI 			/*
337b6cee71dSXin LI 			 * Avoid soft deadlock: do not read if there
338b6cee71dSXin LI 			 * is nothing to read from sockets and pipes.
339b6cee71dSXin LI 			 */
340b6cee71dSXin LI 			selrv = select(fd + 1, &check, NULL, NULL, &tout);
341b6cee71dSXin LI 			if (selrv == -1) {
342b6cee71dSXin LI 				if (errno == EINTR || errno == EAGAIN)
343b6cee71dSXin LI 					continue;
344b6cee71dSXin LI 			} else if (selrv == 0 && cnt >= 5) {
345b6cee71dSXin LI 				return 0;
346b6cee71dSXin LI 			} else
347b6cee71dSXin LI 				break;
348b6cee71dSXin LI 		}
349b6cee71dSXin LI #endif
350b6cee71dSXin LI 		(void)ioctl(fd, FIONREAD, &t);
351b6cee71dSXin LI 	}
352b6cee71dSXin LI 
353b6cee71dSXin LI 	if (t > 0 && (size_t)t < n) {
354b6cee71dSXin LI 		n = t;
355b6cee71dSXin LI 		rn = n;
356b6cee71dSXin LI 	}
357b6cee71dSXin LI #endif
358b6cee71dSXin LI 
359b6cee71dSXin LI nocheck:
360b6cee71dSXin LI 	do
361b6cee71dSXin LI 		switch ((rv = read(fd, buf, n))) {
362b6cee71dSXin LI 		case -1:
363b6cee71dSXin LI 			if (errno == EINTR)
364b6cee71dSXin LI 				continue;
365b6cee71dSXin LI 			return -1;
366b6cee71dSXin LI 		case 0:
367b6cee71dSXin LI 			return rn - n;
368b6cee71dSXin LI 		default:
369b6cee71dSXin LI 			n -= rv;
370a5d223e6SXin LI 			buf = CAST(char *, CCAST(void *, buf)) + rv;
371b6cee71dSXin LI 			break;
372b6cee71dSXin LI 		}
373b6cee71dSXin LI 	while (n > 0);
374b6cee71dSXin LI 	return rn;
375b6cee71dSXin LI }
376b6cee71dSXin LI 
377b6cee71dSXin LI protected int
378b6cee71dSXin LI file_pipe2file(struct magic_set *ms, int fd, const void *startbuf,
379b6cee71dSXin LI     size_t nbytes)
380b6cee71dSXin LI {
381b6cee71dSXin LI 	char buf[4096];
382b6cee71dSXin LI 	ssize_t r;
383b6cee71dSXin LI 	int tfd;
384b6cee71dSXin LI 
385b6cee71dSXin LI 	(void)strlcpy(buf, "/tmp/file.XXXXXX", sizeof buf);
386b6cee71dSXin LI #ifndef HAVE_MKSTEMP
387b6cee71dSXin LI 	{
388b6cee71dSXin LI 		char *ptr = mktemp(buf);
389b6cee71dSXin LI 		tfd = open(ptr, O_RDWR|O_TRUNC|O_EXCL|O_CREAT, 0600);
390b6cee71dSXin LI 		r = errno;
391b6cee71dSXin LI 		(void)unlink(ptr);
392b6cee71dSXin LI 		errno = r;
393b6cee71dSXin LI 	}
394b6cee71dSXin LI #else
395b6cee71dSXin LI 	{
396b6cee71dSXin LI 		int te;
397b6cee71dSXin LI 		tfd = mkstemp(buf);
398b6cee71dSXin LI 		te = errno;
399b6cee71dSXin LI 		(void)unlink(buf);
400b6cee71dSXin LI 		errno = te;
401b6cee71dSXin LI 	}
402b6cee71dSXin LI #endif
403b6cee71dSXin LI 	if (tfd == -1) {
404b6cee71dSXin LI 		file_error(ms, errno,
405b6cee71dSXin LI 		    "cannot create temporary file for pipe copy");
406b6cee71dSXin LI 		return -1;
407b6cee71dSXin LI 	}
408b6cee71dSXin LI 
409b6cee71dSXin LI 	if (swrite(tfd, startbuf, nbytes) != (ssize_t)nbytes)
410b6cee71dSXin LI 		r = 1;
411b6cee71dSXin LI 	else {
412b6cee71dSXin LI 		while ((r = sread(fd, buf, sizeof(buf), 1)) > 0)
413b6cee71dSXin LI 			if (swrite(tfd, buf, (size_t)r) != r)
414b6cee71dSXin LI 				break;
415b6cee71dSXin LI 	}
416b6cee71dSXin LI 
417b6cee71dSXin LI 	switch (r) {
418b6cee71dSXin LI 	case -1:
419b6cee71dSXin LI 		file_error(ms, errno, "error copying from pipe to temp file");
420b6cee71dSXin LI 		return -1;
421b6cee71dSXin LI 	case 0:
422b6cee71dSXin LI 		break;
423b6cee71dSXin LI 	default:
424b6cee71dSXin LI 		file_error(ms, errno, "error while writing to temp file");
425b6cee71dSXin LI 		return -1;
426b6cee71dSXin LI 	}
427b6cee71dSXin LI 
428b6cee71dSXin LI 	/*
429b6cee71dSXin LI 	 * We duplicate the file descriptor, because fclose on a
430b6cee71dSXin LI 	 * tmpfile will delete the file, but any open descriptors
431b6cee71dSXin LI 	 * can still access the phantom inode.
432b6cee71dSXin LI 	 */
433b6cee71dSXin LI 	if ((fd = dup2(tfd, fd)) == -1) {
434b6cee71dSXin LI 		file_error(ms, errno, "could not dup descriptor for temp file");
435b6cee71dSXin LI 		return -1;
436b6cee71dSXin LI 	}
437b6cee71dSXin LI 	(void)close(tfd);
438b6cee71dSXin LI 	if (lseek(fd, (off_t)0, SEEK_SET) == (off_t)-1) {
439b6cee71dSXin LI 		file_badseek(ms);
440b6cee71dSXin LI 		return -1;
441b6cee71dSXin LI 	}
442b6cee71dSXin LI 	return fd;
443b6cee71dSXin LI }
444b6cee71dSXin LI #if HAVE_FORK
445b6cee71dSXin LI #ifdef BUILTIN_DECOMPRESS
446b6cee71dSXin LI 
/* Bits of the gzip header flag byte examined by uncompressgzipped(). */
#define FHCRC		0x02	/* a 2-byte header CRC follows the header */
#define FEXTRA		0x04	/* a length-prefixed extra field is present */
#define FNAME		0x08	/* a NUL-terminated file name is present */
#define FCOMMENT	0x10	/* a NUL-terminated comment is present */
451b6cee71dSXin LI 
4523e41d09dSXin LI 
4533e41d09dSXin LI private int
4543e41d09dSXin LI uncompressgzipped(const unsigned char *old, unsigned char **newch,
4553e41d09dSXin LI     size_t bytes_max, size_t *n)
456b6cee71dSXin LI {
457b6cee71dSXin LI 	unsigned char flg = old[3];
458b6cee71dSXin LI 	size_t data_start = 10;
459b6cee71dSXin LI 
460b6cee71dSXin LI 	if (flg & FEXTRA) {
4613e41d09dSXin LI 		if (data_start + 1 >= *n)
4623e41d09dSXin LI 			goto err;
463b6cee71dSXin LI 		data_start += 2 + old[data_start] + old[data_start + 1] * 256;
464b6cee71dSXin LI 	}
465b6cee71dSXin LI 	if (flg & FNAME) {
4663e41d09dSXin LI 		while(data_start < *n && old[data_start])
467b6cee71dSXin LI 			data_start++;
468b6cee71dSXin LI 		data_start++;
469b6cee71dSXin LI 	}
470b6cee71dSXin LI 	if (flg & FCOMMENT) {
4713e41d09dSXin LI 		while(data_start < *n && old[data_start])
472b6cee71dSXin LI 			data_start++;
473b6cee71dSXin LI 		data_start++;
474b6cee71dSXin LI 	}
475b6cee71dSXin LI 	if (flg & FHCRC)
476b6cee71dSXin LI 		data_start += 2;
477b6cee71dSXin LI 
4783e41d09dSXin LI 	if (data_start >= *n)
4793e41d09dSXin LI 		goto err;
4803e41d09dSXin LI 
4813e41d09dSXin LI 	*n -= data_start;
4823e41d09dSXin LI 	old += data_start;
4833e41d09dSXin LI 	return uncompresszlib(old, newch, bytes_max, n, 0);
4843e41d09dSXin LI err:
4853e41d09dSXin LI 	return makeerror(newch, n, "File too short");
486b6cee71dSXin LI }
487b6cee71dSXin LI 
4883e41d09dSXin LI private int
4893e41d09dSXin LI uncompresszlib(const unsigned char *old, unsigned char **newch,
4903e41d09dSXin LI     size_t bytes_max, size_t *n, int zlib)
4913e41d09dSXin LI {
4923e41d09dSXin LI 	int rc;
4933e41d09dSXin LI 	z_stream z;
4943e41d09dSXin LI 
4953e41d09dSXin LI 	if ((*newch = CAST(unsigned char *, malloc(bytes_max + 1))) == NULL)
4963e41d09dSXin LI 		return makeerror(newch, n, "No buffer, %s", strerror(errno));
4973e41d09dSXin LI 
4983e41d09dSXin LI 	z.next_in = CCAST(Bytef *, old);
4993e41d09dSXin LI 	z.avail_in = CAST(uint32_t, *n);
500b6cee71dSXin LI 	z.next_out = *newch;
501*40427ccaSGordon Tetlow 	z.avail_out = CAST(unsigned int, bytes_max);
502b6cee71dSXin LI 	z.zalloc = Z_NULL;
503b6cee71dSXin LI 	z.zfree = Z_NULL;
504b6cee71dSXin LI 	z.opaque = Z_NULL;
505b6cee71dSXin LI 
506b6cee71dSXin LI 	/* LINTED bug in header macro */
5073e41d09dSXin LI 	rc = zlib ? inflateInit(&z) : inflateInit2(&z, -15);
5083e41d09dSXin LI 	if (rc != Z_OK)
5093e41d09dSXin LI 		goto err;
510b6cee71dSXin LI 
511b6cee71dSXin LI 	rc = inflate(&z, Z_SYNC_FLUSH);
5123e41d09dSXin LI 	if (rc != Z_OK && rc != Z_STREAM_END)
5133e41d09dSXin LI 		goto err;
514b6cee71dSXin LI 
5153e41d09dSXin LI 	*n = (size_t)z.total_out;
5163e41d09dSXin LI 	rc = inflateEnd(&z);
5173e41d09dSXin LI 	if (rc != Z_OK)
5183e41d09dSXin LI 		goto err;
519b6cee71dSXin LI 
520b6cee71dSXin LI 	/* let's keep the nul-terminate tradition */
5213e41d09dSXin LI 	(*newch)[*n] = '\0';
522b6cee71dSXin LI 
5233e41d09dSXin LI 	return OKDATA;
5243e41d09dSXin LI err:
525a5d223e6SXin LI 	strlcpy((char *)*newch, z.msg ? z.msg : zError(rc), bytes_max);
5263e41d09dSXin LI 	*n = strlen((char *)*newch);
5273e41d09dSXin LI 	return ERRDATA;
528b6cee71dSXin LI }
529b6cee71dSXin LI #endif
530b6cee71dSXin LI 
5313e41d09dSXin LI static int
5323e41d09dSXin LI makeerror(unsigned char **buf, size_t *len, const char *fmt, ...)
533b6cee71dSXin LI {
5343e41d09dSXin LI 	char *msg;
5353e41d09dSXin LI 	va_list ap;
5363e41d09dSXin LI 	int rv;
537b6cee71dSXin LI 
5383e41d09dSXin LI 	va_start(ap, fmt);
5393e41d09dSXin LI 	rv = vasprintf(&msg, fmt, ap);
5403e41d09dSXin LI 	va_end(ap);
5413e41d09dSXin LI 	if (rv < 0) {
5423e41d09dSXin LI 		*buf = NULL;
5433e41d09dSXin LI 		*len = 0;
544b6cee71dSXin LI 		return NODATA;
545b6cee71dSXin LI 	}
5463e41d09dSXin LI 	*buf = (unsigned char *)msg;
5473e41d09dSXin LI 	*len = strlen(msg);
5483e41d09dSXin LI 	return ERRDATA;
549b6cee71dSXin LI }
550b6cee71dSXin LI 
/*
 * Close descriptor slot i of the array fd and mark the slot as closed
 * (-1).  Slots that already hold -1 are left alone.
 */
static void
closefd(int *fd, size_t i)
{
	if (fd[i] != -1) {
		(void) close(fd[i]);
		fd[i] = -1;
	}
}
559b6cee71dSXin LI 
/* Close both ends of the pipe whose descriptors are stored in fd[0..1]. */
static void
closep(int *fd)
{
	closefd(fd, 0);
	closefd(fd, 1);
}
5673e41d09dSXin LI 
/*
 * Make standard descriptor i refer to the matching end of the pipe fd:
 * the read end (fd[0]) for standard input, the write end (fd[1]) for
 * anything else.  Both pipe ends are closed once the duplicate exists.
 * Nothing happens if the pipe end already is descriptor i; the process
 * exits with status 1 if dup2() fails.
 */
static void
copydesc(int i, int *fd)
{
	int src = (i == STDIN_FILENO) ? fd[0] : fd[1];

	if (src == i)
		return;
	if (dup2(src, i) != -1) {
		closep(fd);
		return;
	}
	DPRINTF("dup(%d, %d) failed (%s)\n", src, i, strerror(errno));
	exit(1);
}
580b6cee71dSXin LI 
/*
 * Feed n bytes of old into the write end of the stdin pipe in fdp.
 *
 * The write is done by a forked helper process, which is then waited
 * for; afterwards the write end of the stdin pipe is closed.  The
 * calling process exits with status 1 if fork() or wait() fails.
 */
static void
writechild(int fdp[3][2], const void *old, size_t n)
{
	int status;
	pid_t pid;

	/* this side never reads from the stdin pipe */
	closefd(fdp[STDIN_FILENO], 0);

	/*
	 * fork again, to avoid blocking because both
	 * pipes filled
	 */
	pid = fork();
	if (pid == 0) {
		/* child: push the data down the pipe and exit */
		closefd(fdp[STDOUT_FILENO], 0);
		if (swrite(fdp[STDIN_FILENO][1], old, n) != (ssize_t)n) {
			DPRINTF("Write failed (%s)\n", strerror(errno));
			exit(1);
		}
		exit(0);
		/*NOTREACHED*/
	}
	if (pid == -1) {
		DPRINTF("Fork failed (%s)\n", strerror(errno));
		exit(1);
		/*NOTREACHED*/
	}

	/* parent */
	if (wait(&status) == -1) {
		DPRINTF("Wait failed (%s)\n", strerror(errno));
		exit(1);
	}
	DPRINTF("Grandchild wait return %#x\n", status);
	closefd(fdp[STDIN_FILENO], 1);
}
615b6cee71dSXin LI 
6163e41d09dSXin LI static ssize_t
6173e41d09dSXin LI filter_error(unsigned char *ubuf, ssize_t n)
6183e41d09dSXin LI {
6193e41d09dSXin LI 	char *p;
6203e41d09dSXin LI 	char *buf;
621c2931133SXin LI 
6223e41d09dSXin LI 	ubuf[n] = '\0';
6233e41d09dSXin LI 	buf = (char *)ubuf;
6243e41d09dSXin LI 	while (isspace((unsigned char)*buf))
6253e41d09dSXin LI 		buf++;
6263e41d09dSXin LI 	DPRINTF("Filter error[[[%s]]]\n", buf);
6273e41d09dSXin LI 	if ((p = strchr((char *)buf, '\n')) != NULL)
6283e41d09dSXin LI 		*p = '\0';
6293e41d09dSXin LI 	if ((p = strchr((char *)buf, ';')) != NULL)
6303e41d09dSXin LI 		*p = '\0';
6313e41d09dSXin LI 	if ((p = strrchr((char *)buf, ':')) != NULL) {
6323e41d09dSXin LI 		++p;
6333e41d09dSXin LI 		while (isspace((unsigned char)*p))
6343e41d09dSXin LI 			p++;
6353e41d09dSXin LI 		n = strlen(p);
636*40427ccaSGordon Tetlow 		memmove(ubuf, p, CAST(size_t, n + 1));
6373e41d09dSXin LI 	}
6383e41d09dSXin LI 	DPRINTF("Filter error after[[[%s]]]\n", (char *)ubuf);
6393e41d09dSXin LI 	if (islower(*ubuf))
6403e41d09dSXin LI 		*ubuf = toupper(*ubuf);
641b6cee71dSXin LI 	return n;
642b6cee71dSXin LI }
6433e41d09dSXin LI 
6443e41d09dSXin LI private const char *
6453e41d09dSXin LI methodname(size_t method)
6463e41d09dSXin LI {
6473e41d09dSXin LI #ifdef BUILTIN_DECOMPRESS
6483e41d09dSXin LI         /* FIXME: This doesn't cope with bzip2 */
6493e41d09dSXin LI 	if (method == 2 || compr[method].maglen == 0)
6503e41d09dSXin LI 	    return "zlib";
6513e41d09dSXin LI #endif
6523e41d09dSXin LI 	return compr[method].argv[0];
6533e41d09dSXin LI }
6543e41d09dSXin LI 
6553e41d09dSXin LI private int
6563e41d09dSXin LI uncompressbuf(int fd, size_t bytes_max, size_t method, const unsigned char *old,
6573e41d09dSXin LI     unsigned char **newch, size_t* n)
6583e41d09dSXin LI {
6593e41d09dSXin LI 	int fdp[3][2];
6603e41d09dSXin LI 	int status, rv;
6613e41d09dSXin LI 	size_t i;
6623e41d09dSXin LI 	ssize_t r;
6633e41d09dSXin LI 
6643e41d09dSXin LI #ifdef BUILTIN_DECOMPRESS
6653e41d09dSXin LI         /* FIXME: This doesn't cope with bzip2 */
6663e41d09dSXin LI 	if (method == 2)
6673e41d09dSXin LI 		return uncompressgzipped(old, newch, bytes_max, n);
6683e41d09dSXin LI 	if (compr[method].maglen == 0)
6693e41d09dSXin LI 		return uncompresszlib(old, newch, bytes_max, n, 1);
6703e41d09dSXin LI #endif
6713e41d09dSXin LI 	(void)fflush(stdout);
6723e41d09dSXin LI 	(void)fflush(stderr);
6733e41d09dSXin LI 
6743e41d09dSXin LI 	for (i = 0; i < __arraycount(fdp); i++)
6753e41d09dSXin LI 		fdp[i][0] = fdp[i][1] = -1;
6763e41d09dSXin LI 
6773e41d09dSXin LI 	if ((fd == -1 && pipe(fdp[STDIN_FILENO]) == -1) ||
6783e41d09dSXin LI 	    pipe(fdp[STDOUT_FILENO]) == -1 || pipe(fdp[STDERR_FILENO]) == -1) {
6793e41d09dSXin LI 		closep(fdp[STDIN_FILENO]);
6803e41d09dSXin LI 		closep(fdp[STDOUT_FILENO]);
6813e41d09dSXin LI 		return makeerror(newch, n, "Cannot create pipe, %s",
6823e41d09dSXin LI 		    strerror(errno));
6833e41d09dSXin LI 	}
6843e41d09dSXin LI 	switch (fork()) {
6853e41d09dSXin LI 	case 0:	/* child */
6863e41d09dSXin LI 		if (fd != -1) {
6873e41d09dSXin LI 			fdp[STDIN_FILENO][0] = fd;
6883e41d09dSXin LI 			(void) lseek(fd, (off_t)0, SEEK_SET);
6893e41d09dSXin LI 		}
6903e41d09dSXin LI 
6913e41d09dSXin LI 		for (i = 0; i < __arraycount(fdp); i++)
692*40427ccaSGordon Tetlow 			copydesc(CAST(int, i), fdp[i]);
6933e41d09dSXin LI 
6943e41d09dSXin LI 		(void)execvp(compr[method].argv[0],
6953e41d09dSXin LI 		    (char *const *)(intptr_t)compr[method].argv);
6963e41d09dSXin LI 		dprintf(STDERR_FILENO, "exec `%s' failed, %s",
6973e41d09dSXin LI 		    compr[method].argv[0], strerror(errno));
6983e41d09dSXin LI 		exit(1);
6993e41d09dSXin LI 		/*NOTREACHED*/
7003e41d09dSXin LI 	case -1:
7013e41d09dSXin LI 		return makeerror(newch, n, "Cannot fork, %s",
7023e41d09dSXin LI 		    strerror(errno));
7033e41d09dSXin LI 
7043e41d09dSXin LI 	default: /* parent */
7053e41d09dSXin LI 		for (i = 1; i < __arraycount(fdp); i++)
7063e41d09dSXin LI 			closefd(fdp[i], 1);
7073e41d09dSXin LI 
7083e41d09dSXin LI 		/* Write the buffer data to the child, if we don't have fd */
7093e41d09dSXin LI 		if (fd == -1)
7103e41d09dSXin LI 			writechild(fdp, old, *n);
7113e41d09dSXin LI 
7123e41d09dSXin LI 		*newch = CAST(unsigned char *, malloc(bytes_max + 1));
7133e41d09dSXin LI 		if (*newch == NULL) {
7143e41d09dSXin LI 			rv = makeerror(newch, n, "No buffer, %s",
7153e41d09dSXin LI 			    strerror(errno));
7163e41d09dSXin LI 			goto err;
7173e41d09dSXin LI 		}
7183e41d09dSXin LI 		rv = OKDATA;
7193e41d09dSXin LI 		if ((r = sread(fdp[STDOUT_FILENO][0], *newch, bytes_max, 0)) > 0)
7203e41d09dSXin LI 			break;
7213e41d09dSXin LI 		DPRINTF("Read stdout failed %d (%s)\n", fdp[STDOUT_FILENO][0],
7223e41d09dSXin LI 		    r != -1 ? strerror(errno) : "no data");
7233e41d09dSXin LI 
7243e41d09dSXin LI 		rv = ERRDATA;
7253e41d09dSXin LI 		if (r == 0 &&
7263e41d09dSXin LI 		    (r = sread(fdp[STDERR_FILENO][0], *newch, bytes_max, 0)) > 0)
7273e41d09dSXin LI 		{
7283e41d09dSXin LI 			r = filter_error(*newch, r);
7293e41d09dSXin LI 			break;
7303e41d09dSXin LI 		}
7313e41d09dSXin LI 		free(*newch);
7323e41d09dSXin LI 		if  (r == 0)
7333e41d09dSXin LI 			rv = makeerror(newch, n, "Read failed, %s",
7343e41d09dSXin LI 			    strerror(errno));
7353e41d09dSXin LI 		else
7363e41d09dSXin LI 			rv = makeerror(newch, n, "No data");
7373e41d09dSXin LI 		goto err;
7383e41d09dSXin LI 	}
7393e41d09dSXin LI 
7403e41d09dSXin LI 	*n = r;
7413e41d09dSXin LI 	/* NUL terminate, as every buffer is handled here. */
7423e41d09dSXin LI 	(*newch)[*n] = '\0';
7433e41d09dSXin LI err:
7443e41d09dSXin LI 	closefd(fdp[STDIN_FILENO], 1);
7453e41d09dSXin LI 	closefd(fdp[STDOUT_FILENO], 0);
7463e41d09dSXin LI 	closefd(fdp[STDERR_FILENO], 0);
7473e41d09dSXin LI 	if (wait(&status) == -1) {
7483e41d09dSXin LI 		free(*newch);
7493e41d09dSXin LI 		rv = makeerror(newch, n, "Wait failed, %s", strerror(errno));
7503e41d09dSXin LI 		DPRINTF("Child wait return %#x\n", status);
7513e41d09dSXin LI 	} else if (!WIFEXITED(status)) {
752*40427ccaSGordon Tetlow 		DPRINTF("Child not exited (%#x)\n", status);
7533e41d09dSXin LI 	} else if (WEXITSTATUS(status) != 0) {
754*40427ccaSGordon Tetlow 		DPRINTF("Child exited (%#x)\n", WEXITSTATUS(status));
7553e41d09dSXin LI 	}
7563e41d09dSXin LI 
7573e41d09dSXin LI 	closefd(fdp[STDIN_FILENO], 0);
7583e41d09dSXin LI 	DPRINTF("Returning %p n=%zu rv=%d\n", *newch, *n, rv);
7593e41d09dSXin LI 
7603e41d09dSXin LI 	return rv;
761b6cee71dSXin LI }
762b6cee71dSXin LI #endif
763