1 /*-
2  * Copyright (c) 2003-2009 Tim Kientzle
3  * Copyright (c) 2010-2012 Michihiro NAKAJIMA
4  * Copyright (c) 2016 Martin Matuska
5  * All rights reserved.
6  *
7  * Redistribution and use in source and binary forms, with or without
8  * modification, are permitted provided that the following conditions
9  * are met:
10  * 1. Redistributions of source code must retain the above copyright
11  *    notice, this list of conditions and the following disclaimer.
12  * 2. Redistributions in binary form must reproduce the above copyright
13  *    notice, this list of conditions and the following disclaimer in the
14  *    documentation and/or other materials provided with the distribution.
15  *
16  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR(S) ``AS IS'' AND ANY EXPRESS OR
17  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
18  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
19  * IN NO EVENT SHALL THE AUTHOR(S) BE LIABLE FOR ANY DIRECT, INDIRECT,
20  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
21  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
22  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
23  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
24  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
25  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26  */
27 
28 #include "archive_platform.h"
29 
30 /* This is the tree-walking code for POSIX systems. */
31 #if !defined(_WIN32) || defined(__CYGWIN__)
32 
33 #ifdef HAVE_SYS_TYPES_H
34 #include <sys/types.h>
35 #endif
36 #ifdef HAVE_SYS_EXTATTR_H
37 #include <sys/extattr.h>
38 #endif
39 #ifdef HAVE_SYS_IOCTL_H
40 #include <sys/ioctl.h>
41 #endif
42 #ifdef HAVE_SYS_PARAM_H
43 #include <sys/param.h>
44 #endif
45 #ifdef HAVE_SYS_STAT_H
46 #include <sys/stat.h>
47 #endif
48 #if defined(HAVE_SYS_XATTR_H)
49 #include <sys/xattr.h>
50 #elif defined(HAVE_ATTR_XATTR_H)
51 #include <attr/xattr.h>
52 #endif
53 #ifdef HAVE_SYS_EA_H
54 #include <sys/ea.h>
55 #endif
56 #ifdef HAVE_COPYFILE_H
57 #include <copyfile.h>
58 #endif
59 #ifdef HAVE_ERRNO_H
60 #include <errno.h>
61 #endif
62 #ifdef HAVE_FCNTL_H
63 #include <fcntl.h>
64 #endif
65 #ifdef HAVE_LIMITS_H
66 #include <limits.h>
67 #endif
68 #ifdef HAVE_LINUX_TYPES_H
69 #include <linux/types.h>
70 #endif
71 #ifdef HAVE_LINUX_FIEMAP_H
72 #include <linux/fiemap.h>
73 #endif
74 #ifdef HAVE_LINUX_FS_H
75 #include <linux/fs.h>
76 #endif
77 /*
78  * Some Linux distributions have both linux/ext2_fs.h and ext2fs/ext2_fs.h.
79  * As the include guards don't agree, the order of include is important.
80  */
81 #ifdef HAVE_LINUX_EXT2_FS_H
82 #include <linux/ext2_fs.h>      /* for Linux file flags */
83 #endif
84 #if defined(HAVE_EXT2FS_EXT2_FS_H) && !defined(__CYGWIN__)
85 #include <ext2fs/ext2_fs.h>     /* Linux file flags, broken on Cygwin */
86 #endif
87 #ifdef HAVE_PATHS_H
88 #include <paths.h>
89 #endif
90 #ifdef HAVE_UNISTD_H
91 #include <unistd.h>
92 #endif
93 
94 #include "archive.h"
95 #include "archive_entry.h"
96 #include "archive_private.h"
97 #include "archive_read_disk_private.h"
98 
99 #ifndef O_CLOEXEC
100 #define O_CLOEXEC	0
101 #endif
102 
103 static int setup_mac_metadata(struct archive_read_disk *,
104     struct archive_entry *, int *fd);
105 #ifdef ARCHIVE_XATTR_FREEBSD
106 static int setup_xattrs_namespace(struct archive_read_disk *,
107     struct archive_entry *, int *, int);
108 #endif
109 static int setup_xattrs(struct archive_read_disk *,
110     struct archive_entry *, int *fd);
111 static int setup_sparse(struct archive_read_disk *,
112     struct archive_entry *, int *fd);
113 #if defined(HAVE_LINUX_FIEMAP_H)
114 static int setup_sparse_fiemap(struct archive_read_disk *,
115     struct archive_entry *, int *fd);
116 #endif
117 
118 #if !ARCHIVE_ACL_SUPPORT
119 int
archive_read_disk_entry_setup_acls(struct archive_read_disk * a,struct archive_entry * entry,int * fd)120 archive_read_disk_entry_setup_acls(struct archive_read_disk *a,
121     struct archive_entry *entry, int *fd)
122 {
123 	(void)a;      /* UNUSED */
124 	(void)entry;  /* UNUSED */
125 	(void)fd;     /* UNUSED */
126 	return (ARCHIVE_OK);
127 }
128 #endif
129 
130 /*
131  * Enter working directory and return working pathname of archive_entry.
132  * If a pointer to an integer is provided and its value is below zero
133  * open a file descriptor on this pathname.
134  */
135 const char *
archive_read_disk_entry_setup_path(struct archive_read_disk * a,struct archive_entry * entry,int * fd)136 archive_read_disk_entry_setup_path(struct archive_read_disk *a,
137     struct archive_entry *entry, int *fd)
138 {
139 	const char *path;
140 
141 	path = archive_entry_sourcepath(entry);
142 
143 	if (path == NULL || (a->tree != NULL &&
144 	    a->tree_enter_working_dir(a->tree) != 0))
145 		path = archive_entry_pathname(entry);
146 	if (path == NULL) {
147 		archive_set_error(&a->archive, ARCHIVE_ERRNO_MISC,
148 		   "Couldn't determine path");
149 	} else if (fd != NULL && *fd < 0 && a->tree != NULL &&
150 	    (a->follow_symlinks || archive_entry_filetype(entry) != AE_IFLNK)) {
151 		*fd = a->open_on_current_dir(a->tree, path,
152 		    O_RDONLY | O_NONBLOCK);
153 	}
154 	return (path);
155 }
156 
157 int
archive_read_disk_entry_from_file(struct archive * _a,struct archive_entry * entry,int fd,const struct stat * st)158 archive_read_disk_entry_from_file(struct archive *_a,
159     struct archive_entry *entry,
160     int fd,
161     const struct stat *st)
162 {
163 	struct archive_read_disk *a = (struct archive_read_disk *)_a;
164 	const char *path, *name;
165 	struct stat s;
166 	int initial_fd = fd;
167 	int r, r1;
168 
169 	archive_check_magic(_a, ARCHIVE_READ_DISK_MAGIC, ARCHIVE_STATE_ANY,
170 		"archive_read_disk_entry_from_file");
171 
172 	archive_clear_error(_a);
173 	path = archive_entry_sourcepath(entry);
174 	if (path == NULL)
175 		path = archive_entry_pathname(entry);
176 
177 	if (a->tree == NULL) {
178 		if (st == NULL) {
179 #if HAVE_FSTAT
180 			if (fd >= 0) {
181 				if (fstat(fd, &s) != 0) {
182 					archive_set_error(&a->archive, errno,
183 					    "Can't fstat");
184 					return (ARCHIVE_FAILED);
185 				}
186 			} else
187 #endif
188 #if HAVE_LSTAT
189 			if (!a->follow_symlinks) {
190 				if (lstat(path, &s) != 0) {
191 					archive_set_error(&a->archive, errno,
192 					    "Can't lstat %s", path);
193 					return (ARCHIVE_FAILED);
194 				}
195 			} else
196 #endif
197 			if (la_stat(path, &s) != 0) {
198 				archive_set_error(&a->archive, errno,
199 				    "Can't stat %s", path);
200 				return (ARCHIVE_FAILED);
201 			}
202 			st = &s;
203 		}
204 		archive_entry_copy_stat(entry, st);
205 	}
206 
207 	/* Lookup uname/gname */
208 	name = archive_read_disk_uname(_a, archive_entry_uid(entry));
209 	if (name != NULL)
210 		archive_entry_copy_uname(entry, name);
211 	name = archive_read_disk_gname(_a, archive_entry_gid(entry));
212 	if (name != NULL)
213 		archive_entry_copy_gname(entry, name);
214 
215 #ifdef HAVE_STRUCT_STAT_ST_FLAGS
216 	/* On FreeBSD, we get flags for free with the stat. */
217 	/* TODO: Does this belong in copy_stat()? */
218 	if ((a->flags & ARCHIVE_READDISK_NO_FFLAGS) == 0 && st->st_flags != 0)
219 		archive_entry_set_fflags(entry, st->st_flags, 0);
220 #endif
221 
222 #if (defined(FS_IOC_GETFLAGS) && defined(HAVE_WORKING_FS_IOC_GETFLAGS)) || \
223     (defined(EXT2_IOC_GETFLAGS) && defined(HAVE_WORKING_EXT2_IOC_GETFLAGS))
224 	/* Linux requires an extra ioctl to pull the flags.  Although
225 	 * this is an extra step, it has a nice side-effect: We get an
226 	 * open file descriptor which we can use in the subsequent lookups. */
227 	if ((a->flags & ARCHIVE_READDISK_NO_FFLAGS) == 0 &&
228 	    (S_ISREG(st->st_mode) || S_ISDIR(st->st_mode))) {
229 		if (fd < 0) {
230 			if (a->tree != NULL)
231 				fd = a->open_on_current_dir(a->tree, path,
232 					O_RDONLY | O_NONBLOCK | O_CLOEXEC);
233 			else
234 				fd = open(path, O_RDONLY | O_NONBLOCK |
235 						O_CLOEXEC);
236 			__archive_ensure_cloexec_flag(fd);
237 		}
238 		if (fd >= 0) {
239 			int stflags;
240 			r = ioctl(fd,
241 #if defined(FS_IOC_GETFLAGS)
242 			    FS_IOC_GETFLAGS,
243 #else
244 			    EXT2_IOC_GETFLAGS,
245 #endif
246 			    &stflags);
247 			if (r == 0 && stflags != 0)
248 				archive_entry_set_fflags(entry, stflags, 0);
249 		}
250 	}
251 #endif
252 
253 #if defined(HAVE_READLINK) || defined(HAVE_READLINKAT)
254 	if (S_ISLNK(st->st_mode)) {
255 		size_t linkbuffer_len = st->st_size;
256 		char *linkbuffer;
257 		int lnklen;
258 
259 		linkbuffer = malloc(linkbuffer_len + 1);
260 		if (linkbuffer == NULL) {
261 			archive_set_error(&a->archive, ENOMEM,
262 			    "Couldn't read link data");
263 			return (ARCHIVE_FAILED);
264 		}
265 		if (a->tree != NULL) {
266 #ifdef HAVE_READLINKAT
267 			lnklen = readlinkat(a->tree_current_dir_fd(a->tree),
268 			    path, linkbuffer, linkbuffer_len);
269 #else
270 			if (a->tree_enter_working_dir(a->tree) != 0) {
271 				archive_set_error(&a->archive, errno,
272 				    "Couldn't read link data");
273 				free(linkbuffer);
274 				return (ARCHIVE_FAILED);
275 			}
276 			lnklen = readlink(path, linkbuffer, linkbuffer_len);
277 #endif /* HAVE_READLINKAT */
278 		} else
279 			lnklen = readlink(path, linkbuffer, linkbuffer_len);
280 		if (lnklen < 0) {
281 			archive_set_error(&a->archive, errno,
282 			    "Couldn't read link data");
283 			free(linkbuffer);
284 			return (ARCHIVE_FAILED);
285 		}
286 		linkbuffer[lnklen] = '\0';
287 		archive_entry_set_symlink(entry, linkbuffer);
288 		free(linkbuffer);
289 	}
290 #endif /* HAVE_READLINK || HAVE_READLINKAT */
291 
292 	r = 0;
293 	if ((a->flags & ARCHIVE_READDISK_NO_ACL) == 0)
294 		r = archive_read_disk_entry_setup_acls(a, entry, &fd);
295 	if ((a->flags & ARCHIVE_READDISK_NO_XATTR) == 0) {
296 		r1 = setup_xattrs(a, entry, &fd);
297 		if (r1 < r)
298 			r = r1;
299 	}
300 	if (a->flags & ARCHIVE_READDISK_MAC_COPYFILE) {
301 		r1 = setup_mac_metadata(a, entry, &fd);
302 		if (r1 < r)
303 			r = r1;
304 	}
305 	if ((a->flags & ARCHIVE_READDISK_NO_SPARSE) == 0) {
306 		r1 = setup_sparse(a, entry, &fd);
307 		if (r1 < r)
308 			r = r1;
309 	}
310 
311 	/* If we opened the file earlier in this function, close it. */
312 	if (initial_fd != fd)
313 		close(fd);
314 	return (r);
315 }
316 
317 #if defined(__APPLE__) && defined(HAVE_COPYFILE_H)
318 /*
319  * The Mac OS "copyfile()" API copies the extended metadata for a
320  * file into a separate file in AppleDouble format (see RFC 1740).
321  *
322  * Mac OS tar and cpio implementations store this extended
323  * metadata as a separate entry just before the regular entry
324  * with a "._" prefix added to the filename.
325  *
326  * Note that this is currently done unconditionally; the tar program has
327  * an option to discard this information before the archive is written.
328  *
329  * TODO: If there's a failure, report it and return ARCHIVE_WARN.
330  */
331 static int
setup_mac_metadata(struct archive_read_disk * a,struct archive_entry * entry,int * fd)332 setup_mac_metadata(struct archive_read_disk *a,
333     struct archive_entry *entry, int *fd)
334 {
335 	int tempfd = -1;
336 	int copyfile_flags = COPYFILE_NOFOLLOW | COPYFILE_ACL | COPYFILE_XATTR;
337 	struct stat copyfile_stat;
338 	int ret = ARCHIVE_OK;
339 	void *buff = NULL;
340 	int have_attrs;
341 	const char *name;
342 	struct archive_string tempfile;
343 
344 	(void)fd; /* UNUSED */
345 
346 	name = archive_read_disk_entry_setup_path(a, entry, NULL);
347 	if (name == NULL)
348 		return (ARCHIVE_WARN);
349 
350 	/* Short-circuit if there's nothing to do. */
351 	have_attrs = copyfile(name, NULL, 0, copyfile_flags | COPYFILE_CHECK);
352 	if (have_attrs == -1) {
353 		archive_set_error(&a->archive, errno,
354 			"Could not check extended attributes");
355 		return (ARCHIVE_WARN);
356 	}
357 	if (have_attrs == 0)
358 		return (ARCHIVE_OK);
359 
360 	archive_string_init(&tempfile);
361 	if (__archive_get_tempdir(&tempfile) != ARCHIVE_OK) {
362 		ret = ARCHIVE_WARN;
363 		goto cleanup;
364 	}
365 	archive_strcat(&tempfile, "tar.md.XXXXXX");
366 	tempfd = mkstemp(tempfile.s);
367 	if (tempfd < 0) {
368 		archive_set_error(&a->archive, errno,
369 		    "Could not open extended attribute file");
370 		ret = ARCHIVE_WARN;
371 		goto cleanup;
372 	}
373 	__archive_ensure_cloexec_flag(tempfd);
374 
375 	/* XXX I wish copyfile() could pack directly to a memory
376 	 * buffer; that would avoid the temp file here.  For that
377 	 * matter, it would be nice if fcopyfile() actually worked,
378 	 * that would reduce the many open/close races here. */
379 	if (copyfile(name, tempfile.s, 0, copyfile_flags | COPYFILE_PACK)) {
380 		archive_set_error(&a->archive, errno,
381 		    "Could not pack extended attributes");
382 		ret = ARCHIVE_WARN;
383 		goto cleanup;
384 	}
385 	if (fstat(tempfd, ©file_stat)) {
386 		archive_set_error(&a->archive, errno,
387 		    "Could not check size of extended attributes");
388 		ret = ARCHIVE_WARN;
389 		goto cleanup;
390 	}
391 	buff = malloc(copyfile_stat.st_size);
392 	if (buff == NULL) {
393 		archive_set_error(&a->archive, errno,
394 		    "Could not allocate memory for extended attributes");
395 		ret = ARCHIVE_WARN;
396 		goto cleanup;
397 	}
398 	if (copyfile_stat.st_size != read(tempfd, buff, copyfile_stat.st_size)) {
399 		archive_set_error(&a->archive, errno,
400 		    "Could not read extended attributes into memory");
401 		ret = ARCHIVE_WARN;
402 		goto cleanup;
403 	}
404 	archive_entry_copy_mac_metadata(entry, buff, copyfile_stat.st_size);
405 
406 cleanup:
407 	if (tempfd >= 0) {
408 		close(tempfd);
409 		unlink(tempfile.s);
410 	}
411 	archive_string_free(&tempfile);
412 	free(buff);
413 	return (ret);
414 }
415 
416 #else
417 
418 /*
419  * Stub implementation for non-Mac systems.
420  */
421 static int
setup_mac_metadata(struct archive_read_disk * a,struct archive_entry * entry,int * fd)422 setup_mac_metadata(struct archive_read_disk *a,
423     struct archive_entry *entry, int *fd)
424 {
425 	(void)a; /* UNUSED */
426 	(void)entry; /* UNUSED */
427 	(void)fd; /* UNUSED */
428 	return (ARCHIVE_OK);
429 }
430 #endif
431 
432 #if ARCHIVE_XATTR_LINUX || ARCHIVE_XATTR_DARWIN || ARCHIVE_XATTR_AIX
433 
434 /*
435  * Linux, Darwin and AIX extended attribute support.
436  *
437  * TODO:  By using a stack-allocated buffer for the first
438  * call to getxattr(), we might be able to avoid the second
439  * call entirely.  We only need the second call if the
440  * stack-allocated buffer is too small.  But a modest buffer
441  * of 1024 bytes or so will often be big enough.  Same applies
442  * to listxattr().
443  */
444 
445 
446 static int
setup_xattr(struct archive_read_disk * a,struct archive_entry * entry,const char * name,int fd,const char * accpath)447 setup_xattr(struct archive_read_disk *a,
448     struct archive_entry *entry, const char *name, int fd, const char *accpath)
449 {
450 	ssize_t size;
451 	void *value = NULL;
452 
453 
454 	if (fd >= 0) {
455 #if ARCHIVE_XATTR_LINUX
456 		size = fgetxattr(fd, name, NULL, 0);
457 #elif ARCHIVE_XATTR_DARWIN
458 		size = fgetxattr(fd, name, NULL, 0, 0, 0);
459 #elif ARCHIVE_XATTR_AIX
460 		size = fgetea(fd, name, NULL, 0);
461 #endif
462 	} else if (!a->follow_symlinks) {
463 #if ARCHIVE_XATTR_LINUX
464 		size = lgetxattr(accpath, name, NULL, 0);
465 #elif ARCHIVE_XATTR_DARWIN
466 		size = getxattr(accpath, name, NULL, 0, 0, XATTR_NOFOLLOW);
467 #elif ARCHIVE_XATTR_AIX
468 		size = lgetea(accpath, name, NULL, 0);
469 #endif
470 	} else {
471 #if ARCHIVE_XATTR_LINUX
472 		size = getxattr(accpath, name, NULL, 0);
473 #elif ARCHIVE_XATTR_DARWIN
474 		size = getxattr(accpath, name, NULL, 0, 0, 0);
475 #elif ARCHIVE_XATTR_AIX
476 		size = getea(accpath, name, NULL, 0);
477 #endif
478 	}
479 
480 	if (size == -1) {
481 		archive_set_error(&a->archive, errno,
482 		    "Couldn't query extended attribute");
483 		return (ARCHIVE_WARN);
484 	}
485 
486 	if (size > 0 && (value = malloc(size)) == NULL) {
487 		archive_set_error(&a->archive, errno, "Out of memory");
488 		return (ARCHIVE_FATAL);
489 	}
490 
491 
492 	if (fd >= 0) {
493 #if ARCHIVE_XATTR_LINUX
494 		size = fgetxattr(fd, name, value, size);
495 #elif ARCHIVE_XATTR_DARWIN
496 		size = fgetxattr(fd, name, value, size, 0, 0);
497 #elif ARCHIVE_XATTR_AIX
498 		size = fgetea(fd, name, value, size);
499 #endif
500 	} else if (!a->follow_symlinks) {
501 #if ARCHIVE_XATTR_LINUX
502 		size = lgetxattr(accpath, name, value, size);
503 #elif ARCHIVE_XATTR_DARWIN
504 		size = getxattr(accpath, name, value, size, 0, XATTR_NOFOLLOW);
505 #elif ARCHIVE_XATTR_AIX
506 		size = lgetea(accpath, name, value, size);
507 #endif
508 	} else {
509 #if ARCHIVE_XATTR_LINUX
510 		size = getxattr(accpath, name, value, size);
511 #elif ARCHIVE_XATTR_DARWIN
512 		size = getxattr(accpath, name, value, size, 0, 0);
513 #elif ARCHIVE_XATTR_AIX
514 		size = getea(accpath, name, value, size);
515 #endif
516 	}
517 
518 	if (size == -1) {
519 		archive_set_error(&a->archive, errno,
520 		    "Couldn't read extended attribute");
521 		free(value);
522 		return (ARCHIVE_WARN);
523 	}
524 
525 	archive_entry_xattr_add_entry(entry, name, value, size);
526 
527 	free(value);
528 	return (ARCHIVE_OK);
529 }
530 
531 static int
setup_xattrs(struct archive_read_disk * a,struct archive_entry * entry,int * fd)532 setup_xattrs(struct archive_read_disk *a,
533     struct archive_entry *entry, int *fd)
534 {
535 	char *list, *p;
536 	const char *path;
537 	ssize_t list_size;
538 
539 	path = NULL;
540 
541 	if (*fd < 0) {
542 		path = archive_read_disk_entry_setup_path(a, entry, fd);
543 		if (path == NULL)
544 			return (ARCHIVE_WARN);
545 	}
546 
547 	if (*fd >= 0) {
548 #if ARCHIVE_XATTR_LINUX
549 		list_size = flistxattr(*fd, NULL, 0);
550 #elif ARCHIVE_XATTR_DARWIN
551 		list_size = flistxattr(*fd, NULL, 0, 0);
552 #elif ARCHIVE_XATTR_AIX
553 		list_size = flistea(*fd, NULL, 0);
554 #endif
555 	} else if (!a->follow_symlinks) {
556 #if ARCHIVE_XATTR_LINUX
557 		list_size = llistxattr(path, NULL, 0);
558 #elif ARCHIVE_XATTR_DARWIN
559 		list_size = listxattr(path, NULL, 0, XATTR_NOFOLLOW);
560 #elif ARCHIVE_XATTR_AIX
561 		list_size = llistea(path, NULL, 0);
562 #endif
563 	} else {
564 #if ARCHIVE_XATTR_LINUX
565 		list_size = listxattr(path, NULL, 0);
566 #elif ARCHIVE_XATTR_DARWIN
567 		list_size = listxattr(path, NULL, 0, 0);
568 #elif ARCHIVE_XATTR_AIX
569 		list_size = listea(path, NULL, 0);
570 #endif
571 	}
572 
573 	if (list_size == -1) {
574 		if (errno == ENOTSUP || errno == ENOSYS)
575 			return (ARCHIVE_OK);
576 		archive_set_error(&a->archive, errno,
577 			"Couldn't list extended attributes");
578 		return (ARCHIVE_WARN);
579 	}
580 
581 	if (list_size == 0)
582 		return (ARCHIVE_OK);
583 
584 	if ((list = malloc(list_size)) == NULL) {
585 		archive_set_error(&a->archive, errno, "Out of memory");
586 		return (ARCHIVE_FATAL);
587 	}
588 
589 	if (*fd >= 0) {
590 #if ARCHIVE_XATTR_LINUX
591 		list_size = flistxattr(*fd, list, list_size);
592 #elif ARCHIVE_XATTR_DARWIN
593 		list_size = flistxattr(*fd, list, list_size, 0);
594 #elif ARCHIVE_XATTR_AIX
595 		list_size = flistea(*fd, list, list_size);
596 #endif
597 	} else if (!a->follow_symlinks) {
598 #if ARCHIVE_XATTR_LINUX
599 		list_size = llistxattr(path, list, list_size);
600 #elif ARCHIVE_XATTR_DARWIN
601 		list_size = listxattr(path, list, list_size, XATTR_NOFOLLOW);
602 #elif ARCHIVE_XATTR_AIX
603 		list_size = llistea(path, list, list_size);
604 #endif
605 	} else {
606 #if ARCHIVE_XATTR_LINUX
607 		list_size = listxattr(path, list, list_size);
608 #elif ARCHIVE_XATTR_DARWIN
609 		list_size = listxattr(path, list, list_size, 0);
610 #elif ARCHIVE_XATTR_AIX
611 		list_size = listea(path, list, list_size);
612 #endif
613 	}
614 
615 	if (list_size == -1) {
616 		archive_set_error(&a->archive, errno,
617 			"Couldn't retrieve extended attributes");
618 		free(list);
619 		return (ARCHIVE_WARN);
620 	}
621 
622 	for (p = list; (p - list) < list_size; p += strlen(p) + 1) {
623 #if ARCHIVE_XATTR_LINUX
624 		/* Linux: skip POSIX.1e ACL extended attributes */
625 		if (strncmp(p, "system.", 7) == 0 &&
626 		   (strcmp(p + 7, "posix_acl_access") == 0 ||
627 		    strcmp(p + 7, "posix_acl_default") == 0))
628 			continue;
629 		if (strncmp(p, "trusted.SGI_", 12) == 0 &&
630 		   (strcmp(p + 12, "ACL_DEFAULT") == 0 ||
631 		    strcmp(p + 12, "ACL_FILE") == 0))
632 			continue;
633 
634 		/* Linux: xfsroot namespace is obsolete and unsupported */
635 		if (strncmp(p, "xfsroot.", 8) == 0)
636 			continue;
637 #endif
638 		setup_xattr(a, entry, p, *fd, path);
639 	}
640 
641 	free(list);
642 	return (ARCHIVE_OK);
643 }
644 
645 #elif ARCHIVE_XATTR_FREEBSD
646 
647 /*
648  * FreeBSD extattr interface.
649  */
650 
/* The implementation below follows the Linux model above, but
 * with FreeBSD-specific system calls, of course.  It is careful
 * to not include the system extattrs that hold ACLs; we handle
 * those separately.
 */
656 static int
657 setup_xattr(struct archive_read_disk *a, struct archive_entry *entry,
658     int namespace, const char *name, const char *fullname, int fd,
659     const char *path);
660 
661 static int
setup_xattr(struct archive_read_disk * a,struct archive_entry * entry,int namespace,const char * name,const char * fullname,int fd,const char * accpath)662 setup_xattr(struct archive_read_disk *a, struct archive_entry *entry,
663     int namespace, const char *name, const char *fullname, int fd,
664     const char *accpath)
665 {
666 	ssize_t size;
667 	void *value = NULL;
668 
669 	if (fd >= 0)
670 		size = extattr_get_fd(fd, namespace, name, NULL, 0);
671 	else if (!a->follow_symlinks)
672 		size = extattr_get_link(accpath, namespace, name, NULL, 0);
673 	else
674 		size = extattr_get_file(accpath, namespace, name, NULL, 0);
675 
676 	if (size == -1) {
677 		archive_set_error(&a->archive, errno,
678 		    "Couldn't query extended attribute");
679 		return (ARCHIVE_WARN);
680 	}
681 
682 	if (size > 0 && (value = malloc(size)) == NULL) {
683 		archive_set_error(&a->archive, errno, "Out of memory");
684 		return (ARCHIVE_FATAL);
685 	}
686 
687 	if (fd >= 0)
688 		size = extattr_get_fd(fd, namespace, name, value, size);
689 	else if (!a->follow_symlinks)
690 		size = extattr_get_link(accpath, namespace, name, value, size);
691 	else
692 		size = extattr_get_file(accpath, namespace, name, value, size);
693 
694 	if (size == -1) {
695 		free(value);
696 		archive_set_error(&a->archive, errno,
697 		    "Couldn't read extended attribute");
698 		return (ARCHIVE_WARN);
699 	}
700 
701 	archive_entry_xattr_add_entry(entry, fullname, value, size);
702 
703 	free(value);
704 	return (ARCHIVE_OK);
705 }
706 
707 static int
setup_xattrs_namespace(struct archive_read_disk * a,struct archive_entry * entry,int * fd,int namespace)708 setup_xattrs_namespace(struct archive_read_disk *a,
709     struct archive_entry *entry, int *fd, int namespace)
710 {
711 	char buff[512];
712 	char *list, *p;
713 	ssize_t list_size;
714 	const char *path;
715 
716 	path = NULL;
717 
718 	if (*fd < 0) {
719 		path = archive_read_disk_entry_setup_path(a, entry, fd);
720 		if (path == NULL)
721 			return (ARCHIVE_WARN);
722 	}
723 
724 	if (*fd >= 0)
725 		list_size = extattr_list_fd(*fd, namespace, NULL, 0);
726 	else if (!a->follow_symlinks)
727 		list_size = extattr_list_link(path, namespace, NULL, 0);
728 	else
729 		list_size = extattr_list_file(path, namespace, NULL, 0);
730 
731 	if (list_size == -1 && errno == EOPNOTSUPP)
732 		return (ARCHIVE_OK);
733 	if (list_size == -1 && errno == EPERM)
734 		return (ARCHIVE_OK);
735 	if (list_size == -1) {
736 		archive_set_error(&a->archive, errno,
737 			"Couldn't list extended attributes");
738 		return (ARCHIVE_WARN);
739 	}
740 
741 	if (list_size == 0)
742 		return (ARCHIVE_OK);
743 
744 	if ((list = malloc(list_size)) == NULL) {
745 		archive_set_error(&a->archive, errno, "Out of memory");
746 		return (ARCHIVE_FATAL);
747 	}
748 
749 	if (*fd >= 0)
750 		list_size = extattr_list_fd(*fd, namespace, list, list_size);
751 	else if (!a->follow_symlinks)
752 		list_size = extattr_list_link(path, namespace, list, list_size);
753 	else
754 		list_size = extattr_list_file(path, namespace, list, list_size);
755 
756 	if (list_size == -1) {
757 		archive_set_error(&a->archive, errno,
758 			"Couldn't retrieve extended attributes");
759 		free(list);
760 		return (ARCHIVE_WARN);
761 	}
762 
763 	p = list;
764 	while ((p - list) < list_size) {
765 		size_t len = 255 & (int)*p;
766 		char *name;
767 
768 		if (namespace == EXTATTR_NAMESPACE_SYSTEM) {
769 			if (!strcmp(p + 1, "nfs4.acl") ||
770 			    !strcmp(p + 1, "posix1e.acl_access") ||
771 			    !strcmp(p + 1, "posix1e.acl_default")) {
772 				p += 1 + len;
773 				continue;
774 			}
775 			strcpy(buff, "system.");
776 		} else {
777 			strcpy(buff, "user.");
778 		}
779 		name = buff + strlen(buff);
780 		memcpy(name, p + 1, len);
781 		name[len] = '\0';
782 		setup_xattr(a, entry, namespace, name, buff, *fd, path);
783 		p += 1 + len;
784 	}
785 
786 	free(list);
787 	return (ARCHIVE_OK);
788 }
789 
790 static int
setup_xattrs(struct archive_read_disk * a,struct archive_entry * entry,int * fd)791 setup_xattrs(struct archive_read_disk *a,
792     struct archive_entry *entry, int *fd)
793 {
794 	int namespaces[2];
795 	int i, res;
796 
797 	namespaces[0] = EXTATTR_NAMESPACE_USER;
798 	namespaces[1] = EXTATTR_NAMESPACE_SYSTEM;
799 
800 	for (i = 0; i < 2; i++) {
801 		res = setup_xattrs_namespace(a, entry, fd,
802 		    namespaces[i]);
803 		switch (res) {
804 			case (ARCHIVE_OK):
805 			case (ARCHIVE_WARN):
806 				break;
807 			default:
808 				return (res);
809 		}
810 	}
811 
812 	return (ARCHIVE_OK);
813 }
814 
815 #else
816 
817 /*
818  * Generic (stub) extended attribute support.
819  */
820 static int
setup_xattrs(struct archive_read_disk * a,struct archive_entry * entry,int * fd)821 setup_xattrs(struct archive_read_disk *a,
822     struct archive_entry *entry, int *fd)
823 {
824 	(void)a;     /* UNUSED */
825 	(void)entry; /* UNUSED */
826 	(void)fd;    /* UNUSED */
827 	return (ARCHIVE_OK);
828 }
829 
830 #endif
831 
832 #if defined(HAVE_LINUX_FIEMAP_H)
833 
834 /*
835  * Linux FIEMAP sparse interface.
836  *
837  * The FIEMAP ioctl returns an "extent" for each physical allocation
838  * on disk.  We need to process those to generate a more compact list
839  * of logical file blocks.  We also need to be very careful to use
840  * FIEMAP_FLAG_SYNC here, since there are reports that Linux sometimes
841  * does not report allocations for newly-written data that hasn't
842  * been synced to disk.
843  *
844  * It's important to return a minimal sparse file list because we want
845  * to not trigger sparse file extensions if we don't have to, since
846  * not all readers support them.
847  */
848 
849 static int
setup_sparse_fiemap(struct archive_read_disk * a,struct archive_entry * entry,int * fd)850 setup_sparse_fiemap(struct archive_read_disk *a,
851     struct archive_entry *entry, int *fd)
852 {
853 	char buff[4096];
854 	struct fiemap *fm;
855 	struct fiemap_extent *fe;
856 	int64_t size;
857 	int count, do_fiemap, iters;
858 	int exit_sts = ARCHIVE_OK;
859 	const char *path;
860 
861 	if (archive_entry_filetype(entry) != AE_IFREG
862 	    || archive_entry_size(entry) <= 0
863 	    || archive_entry_hardlink(entry) != NULL)
864 		return (ARCHIVE_OK);
865 
866 	if (*fd < 0) {
867 		path = archive_read_disk_entry_setup_path(a, entry, NULL);
868 		if (path == NULL)
869 			return (ARCHIVE_FAILED);
870 
871 		if (a->tree != NULL)
872 			*fd = a->open_on_current_dir(a->tree, path,
873 				O_RDONLY | O_NONBLOCK | O_CLOEXEC);
874 		else
875 			*fd = open(path, O_RDONLY | O_NONBLOCK | O_CLOEXEC);
876 		if (*fd < 0) {
877 			archive_set_error(&a->archive, errno,
878 			    "Can't open `%s'", path);
879 			return (ARCHIVE_FAILED);
880 		}
881 		__archive_ensure_cloexec_flag(*fd);
882 	}
883 
884 	/* Initialize buffer to avoid the error valgrind complains about. */
885 	memset(buff, 0, sizeof(buff));
886 	count = (sizeof(buff) - sizeof(*fm))/sizeof(*fe);
887 	fm = (struct fiemap *)buff;
888 	fm->fm_start = 0;
889 	fm->fm_length = ~0ULL;
890 	fm->fm_flags = FIEMAP_FLAG_SYNC;
891 	fm->fm_extent_count = count;
892 	do_fiemap = 1;
893 	size = archive_entry_size(entry);
894 	for (iters = 0; ; ++iters) {
895 		int i, r;
896 
897 		r = ioctl(*fd, FS_IOC_FIEMAP, fm);
898 		if (r < 0) {
899 			/* When something error happens, it is better we
900 			 * should return ARCHIVE_OK because an earlier
901 			 * version(<2.6.28) cannot perform FS_IOC_FIEMAP. */
902 			goto exit_setup_sparse_fiemap;
903 		}
904 		if (fm->fm_mapped_extents == 0) {
905 			if (iters == 0) {
906 				/* Fully sparse file; insert a zero-length "data" entry */
907 				archive_entry_sparse_add_entry(entry, 0, 0);
908 			}
909 			break;
910 		}
911 		fe = fm->fm_extents;
912 		for (i = 0; i < (int)fm->fm_mapped_extents; i++, fe++) {
913 			if (!(fe->fe_flags & FIEMAP_EXTENT_UNWRITTEN)) {
914 				/* The fe_length of the last block does not
915 				 * adjust itself to its size files. */
916 				int64_t length = fe->fe_length;
917 				if (fe->fe_logical + length > (uint64_t)size)
918 					length -= fe->fe_logical + length - size;
919 				if (fe->fe_logical == 0 && length == size) {
920 					/* This is not sparse. */
921 					do_fiemap = 0;
922 					break;
923 				}
924 				if (length > 0)
925 					archive_entry_sparse_add_entry(entry,
926 					    fe->fe_logical, length);
927 			}
928 			if (fe->fe_flags & FIEMAP_EXTENT_LAST)
929 				do_fiemap = 0;
930 		}
931 		if (do_fiemap) {
932 			fe = fm->fm_extents + fm->fm_mapped_extents -1;
933 			fm->fm_start = fe->fe_logical + fe->fe_length;
934 		} else
935 			break;
936 	}
937 exit_setup_sparse_fiemap:
938 	return (exit_sts);
939 }
940 
941 #if !defined(SEEK_HOLE) || !defined(SEEK_DATA)
/*
 * Without SEEK_HOLE/SEEK_DATA, sparse detection is delegated entirely
 * to the FIEMAP implementation and its status is returned unchanged.
 */
static int
setup_sparse(struct archive_read_disk *a,
    struct archive_entry *entry, int *fd)
{
	int status;

	status = setup_sparse_fiemap(a, entry, fd);
	return (status);
}
948 #endif
949 #endif	/* defined(HAVE_LINUX_FIEMAP_H) */
950 
951 #if defined(SEEK_HOLE) && defined(SEEK_DATA)
952 
953 /*
954  * SEEK_HOLE sparse interface (FreeBSD, Linux, Solaris)
955  */
956 
957 static int
setup_sparse(struct archive_read_disk * a,struct archive_entry * entry,int * fd)958 setup_sparse(struct archive_read_disk *a,
959     struct archive_entry *entry, int *fd)
960 {
961 	int64_t size;
962 	off_t initial_off;
963 	off_t off_s, off_e;
964 	int exit_sts = ARCHIVE_OK;
965 	int check_fully_sparse = 0;
966 	const char *path;
967 
968 	if (archive_entry_filetype(entry) != AE_IFREG
969 	    || archive_entry_size(entry) <= 0
970 	    || archive_entry_hardlink(entry) != NULL)
971 		return (ARCHIVE_OK);
972 
973 	/* Does filesystem support the reporting of hole ? */
974 	if (*fd < 0)
975 		path = archive_read_disk_entry_setup_path(a, entry, fd);
976 	else
977 		path = NULL;
978 
979 	if (*fd >= 0) {
980 #ifdef _PC_MIN_HOLE_SIZE
981 		if (fpathconf(*fd, _PC_MIN_HOLE_SIZE) <= 0)
982 			return (ARCHIVE_OK);
983 #endif
984 		initial_off = lseek(*fd, 0, SEEK_CUR);
985 		if (initial_off != 0)
986 			lseek(*fd, 0, SEEK_SET);
987 	} else {
988 		if (path == NULL)
989 			return (ARCHIVE_FAILED);
990 #ifdef _PC_MIN_HOLE_SIZE
991 		if (pathconf(path, _PC_MIN_HOLE_SIZE) <= 0)
992 			return (ARCHIVE_OK);
993 #endif
994 		*fd = open(path, O_RDONLY | O_NONBLOCK | O_CLOEXEC);
995 		if (*fd < 0) {
996 			archive_set_error(&a->archive, errno,
997 			    "Can't open `%s'", path);
998 			return (ARCHIVE_FAILED);
999 		}
1000 		__archive_ensure_cloexec_flag(*fd);
1001 		initial_off = 0;
1002 	}
1003 
1004 #ifndef _PC_MIN_HOLE_SIZE
1005 	/* Check if the underlying filesystem supports seek hole */
1006 	off_s = lseek(*fd, 0, SEEK_HOLE);
1007 	if (off_s < 0)
1008 #if defined(HAVE_LINUX_FIEMAP_H)
1009 		return setup_sparse_fiemap(a, entry, fd);
1010 #else
1011 		goto exit_setup_sparse;
1012 #endif
1013 	else if (off_s > 0)
1014 		lseek(*fd, 0, SEEK_SET);
1015 #endif
1016 
1017 	off_s = 0;
1018 	size = archive_entry_size(entry);
1019 	while (off_s < size) {
1020 		off_s = lseek(*fd, off_s, SEEK_DATA);
1021 		if (off_s == (off_t)-1) {
1022 			if (errno == ENXIO) {
1023 				/* no more hole */
1024 				if (archive_entry_sparse_count(entry) == 0) {
1025 					/* Potentially a fully-sparse file. */
1026 					check_fully_sparse = 1;
1027 				}
1028 				break;
1029 			}
1030 			archive_set_error(&a->archive, errno,
1031 			    "lseek(SEEK_HOLE) failed");
1032 			exit_sts = ARCHIVE_FAILED;
1033 			goto exit_setup_sparse;
1034 		}
1035 		off_e = lseek(*fd, off_s, SEEK_HOLE);
1036 		if (off_e == (off_t)-1) {
1037 			if (errno == ENXIO) {
1038 				off_e = lseek(*fd, 0, SEEK_END);
1039 				if (off_e != (off_t)-1)
1040 					break;/* no more data */
1041 			}
1042 			archive_set_error(&a->archive, errno,
1043 			    "lseek(SEEK_DATA) failed");
1044 			exit_sts = ARCHIVE_FAILED;
1045 			goto exit_setup_sparse;
1046 		}
1047 		if (off_s == 0 && off_e == size)
1048 			break;/* This is not sparse. */
1049 		archive_entry_sparse_add_entry(entry, off_s,
1050 			off_e - off_s);
1051 		off_s = off_e;
1052 	}
1053 
1054 	if (check_fully_sparse) {
1055 		if (lseek(*fd, 0, SEEK_HOLE) == 0 &&
1056 			lseek(*fd, 0, SEEK_END) == size) {
1057 			/* Fully sparse file; insert a zero-length "data" entry */
1058 			archive_entry_sparse_add_entry(entry, 0, 0);
1059 		}
1060 	}
1061 exit_setup_sparse:
1062 	lseek(*fd, initial_off, SEEK_SET);
1063 	return (exit_sts);
1064 }
1065 
1066 #elif !defined(HAVE_LINUX_FIEMAP_H)
1067 
1068 /*
1069  * Generic (stub) sparse support.
1070  */
1071 static int
setup_sparse(struct archive_read_disk * a,struct archive_entry * entry,int * fd)1072 setup_sparse(struct archive_read_disk *a,
1073     struct archive_entry *entry, int *fd)
1074 {
1075 	(void)a;     /* UNUSED */
1076 	(void)entry; /* UNUSED */
1077 	(void)fd;    /* UNUSED */
1078 	return (ARCHIVE_OK);
1079 }
1080 
1081 #endif
1082 
1083 #endif /* !defined(_WIN32) || defined(__CYGWIN__) */
1084 
1085