xref: /freebsd/bin/pax/tar.c (revision afe61c15161c324a7af299a9b8457aba5afc92db)
1 /*-
2  * Copyright (c) 1992 Keith Muller.
3  * Copyright (c) 1992, 1993
4  *	The Regents of the University of California.  All rights reserved.
5  *
6  * This code is derived from software contributed to Berkeley by
7  * Keith Muller of the University of California, San Diego.
8  *
9  * Redistribution and use in source and binary forms, with or without
10  * modification, are permitted provided that the following conditions
11  * are met:
12  * 1. Redistributions of source code must retain the above copyright
13  *    notice, this list of conditions and the following disclaimer.
14  * 2. Redistributions in binary form must reproduce the above copyright
15  *    notice, this list of conditions and the following disclaimer in the
16  *    documentation and/or other materials provided with the distribution.
17  * 3. All advertising materials mentioning features or use of this software
18  *    must display the following acknowledgement:
19  *	This product includes software developed by the University of
20  *	California, Berkeley and its contributors.
21  * 4. Neither the name of the University nor the names of its contributors
22  *    may be used to endorse or promote products derived from this software
23  *    without specific prior written permission.
24  *
25  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
26  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
27  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
28  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
29  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
30  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
31  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
32  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
33  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
34  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
35  * SUCH DAMAGE.
36  */
37 
38 #ifndef lint
39 static char sccsid[] = "@(#)tar.c	8.2 (Berkeley) 4/18/94";
40 #endif /* not lint */
41 
42 #include <sys/types.h>
43 #include <sys/time.h>
44 #include <sys/stat.h>
45 #include <sys/param.h>
46 #include <string.h>
47 #include <stdio.h>
48 #include <ctype.h>
49 #include <unistd.h>
50 #include <stdlib.h>
51 #include "pax.h"
52 #include "extern.h"
53 #include "tar.h"
54 
55 /*
 * Routines for reading, writing and identifying the headers of the various
 * versions of tar
57  */
58 
/*
 * Forward declarations of the file-local helpers defined further down.
 * uqd_oct() only exists when NET2_STAT is not defined; in that build
 * tar_wr() and ustar_wr() convert the file size with it instead of ul_oct().
 */
static u_long tar_chksm __P((register char *, register int));
static char *name_split __P((register char *, register int));
static int ul_oct __P((u_long, register char *, register int, int));
#ifndef NET2_STAT
static int uqd_oct __P((u_quad_t, register char *, register int, int));
#endif

/*
 * Routines common to all versions of tar
 */

/*
 * set to 1 by tar_opt() when the TAR_OPTION=TAR_NODIR format option is
 * accepted; tar_wr() then returns without writing a header for PAX_DIR
 * entries.
 */
static int tar_nodir;			/* do not write dirs under old tar */
71 
72 /*
73  * tar_endwr()
74  *	add the tar trailer of two null blocks
75  * Return:
76  *	0 if ok, -1 otherwise (what wr_skip returns)
77  */
78 
79 #if __STDC__
80 int
81 tar_endwr(void)
82 #else
83 int
84 tar_endwr()
85 #endif
86 {
87 	return(wr_skip((off_t)(NULLCNT*BLKMULT)));
88 }
89 
90 /*
91  * tar_endrd()
92  *	no cleanup needed here, just return size of trailer (for append)
93  * Return:
94  *	size of trailer (2 * BLKMULT)
95  */
96 
97 #if __STDC__
98 off_t
99 tar_endrd(void)
100 #else
101 off_t
102 tar_endrd()
103 #endif
104 {
105 	return((off_t)(NULLCNT*BLKMULT));
106 }
107 
108 /*
109  * tar_trail()
110  *	Called to determine if a header block is a valid trailer. We are passed
111  *	the block, the in_sync flag (which tells us we are in resync mode;
112  *	looking for a valid header), and cnt (which starts at zero) which is
113  *	used to count the number of empty blocks we have seen so far.
114  * Return:
115  *	0 if a valid trailer, -1 if not a valid trailer, or 1 if the block
116  *	could never contain a header.
117  */
118 
119 #if __STDC__
120 int
121 tar_trail(register char *buf, register int in_resync, register int *cnt)
122 #else
123 int
124 tar_trail(buf, in_resync, cnt)
125 	register char *buf;
126 	register int in_resync;
127 	register int *cnt;
128 #endif
129 {
130 	register int i;
131 
132 	/*
133 	 * look for all zero, trailer is two consecutive blocks of zero
134 	 */
135 	for (i = 0; i < BLKMULT; ++i) {
136 		if (buf[i] != '\0')
137 			break;
138 	}
139 
140 	/*
141 	 * if not all zero it is not a trailer, but MIGHT be a header.
142 	 */
143 	if (i != BLKMULT)
144 		return(-1);
145 
146 	/*
147 	 * When given a zero block, we must be careful!
148 	 * If we are not in resync mode, check for the trailer. Have to watch
149 	 * out that we do not mis-identify file data as the trailer, so we do
150 	 * NOT try to id a trailer during resync mode. During resync mode we
151 	 * might as well throw this block out since a valid header can NEVER be
152 	 * a block of all 0 (we must have a valid file name).
153 	 */
154 	if (!in_resync && (++*cnt >= NULLCNT))
155 		return(0);
156 	return(1);
157 }
158 
/*
 * ul_oct()
 *	convert an unsigned long to an octal string. many oddball field
 *	termination characters are used by the various versions of tar in the
 *	different fields. term selects which kind to use:
 *		3	field ends with '\0'
 *		2	field ends with '\0' followed by ' '
 *		1	field ends with ' '
 *		0	(and any other value) field ends with ' ' followed
 *			by '\0'
 *	the digits are right justified in front of the terminator and str is
 *	BLANK padded at the front to len. we are unable to use only one
 *	format as many old tar readers are very cranky about this.
 *	If len cannot even hold the terminator nothing is written at all.
 * Return:
 *	0 if the number fit into the string, -1 otherwise
 */

#if __STDC__
static int
ul_oct(u_long val, register char *str, register int len, int term)
#else
static int
ul_oct(val, str, len, term)
	u_long val;
	register char *str;
	register int len;
	int term;
#endif
{
	register int pos;
	char last;		/* final byte of the field */
	char prev = '\0';	/* byte in front of it (2 byte terminators) */
	int tlen = 1;		/* number of terminator bytes */

	/*
	 * term selects the appropriate character(s) for the end of the string
	 */
	switch(term) {
	case 3:
		last = '\0';
		break;
	case 2:
		last = ' ';
		prev = '\0';
		tlen = 2;
		break;
	case 1:
		last = ' ';
		break;
	case 0:
	default:
		last = '\0';
		prev = ' ';
		tlen = 2;
		break;
	}

	/*
	 * refuse a field that is too short for its own terminator, storing
	 * it would write in front of str.
	 */
	if (len < tlen)
		return(-1);

	/*
	 * an index (not a pointer) walks the field from right to left, so we
	 * never have to form a pointer in front of str to end the loops.
	 */
	pos = len - 1;
	str[pos--] = last;
	if (tlen == 2)
		str[pos--] = prev;

	/*
	 * convert (least significant digit first) and blank pad if there is
	 * space
	 */
	while (pos >= 0) {
		str[pos--] = '0' + (char)(val & 0x7);
		if ((val = val >> 3) == (u_long)0)
			break;
	}

	while (pos >= 0)
		str[pos--] = ' ';

	/*
	 * digits left over means the value did not fit
	 */
	if (val != (u_long)0)
		return(-1);
	return(0);
}
221 
#ifndef NET2_STAT
/*
 * uqd_oct()
 *	convert an u_quad_t to an octal string. one of many oddball field
 *	termination characters are used by the various versions of tar in the
 *	different fields. term selects which kind to use:
 *		3	field ends with '\0'
 *		2	field ends with '\0' followed by ' '
 *		1	field ends with ' '
 *		0	(and any other value) field ends with ' ' followed
 *			by '\0'
 *	the digits are right justified in front of the terminator and str is
 *	BLANK padded at the front to len. we are unable to use only one
 *	format as many old tar readers are very cranky about this.
 *	If len cannot even hold the terminator nothing is written at all.
 * Return:
 *	0 if the number fit into the string, -1 otherwise
 */

#if __STDC__
static int
uqd_oct(u_quad_t val, register char *str, register int len, int term)
#else
static int
uqd_oct(val, str, len, term)
	u_quad_t val;
	register char *str;
	register int len;
	int term;
#endif
{
	register int pos;
	char last;		/* final byte of the field */
	char prev = '\0';	/* byte in front of it (2 byte terminators) */
	int tlen = 1;		/* number of terminator bytes */

	/*
	 * term selects the appropriate character(s) for the end of the string
	 */
	switch(term) {
	case 3:
		last = '\0';
		break;
	case 2:
		last = ' ';
		prev = '\0';
		tlen = 2;
		break;
	case 1:
		last = ' ';
		break;
	case 0:
	default:
		last = '\0';
		prev = ' ';
		tlen = 2;
		break;
	}

	/*
	 * refuse a field that is too short for its own terminator, storing
	 * it would write in front of str.
	 */
	if (len < tlen)
		return(-1);

	/*
	 * an index (not a pointer) walks the field from right to left, so we
	 * never have to form a pointer in front of str to end the loops.
	 */
	pos = len - 1;
	str[pos--] = last;
	if (tlen == 2)
		str[pos--] = prev;

	/*
	 * convert (least significant digit first) and blank pad if there is
	 * space
	 */
	while (pos >= 0) {
		str[pos--] = '0' + (char)(val & 0x7);
		if ((val = val >> 3) == 0)
			break;
	}

	while (pos >= 0)
		str[pos--] = ' ';

	/*
	 * digits left over means the value did not fit
	 */
	if (val != (u_quad_t)0)
		return(-1);
	return(0);
}
#endif
286 
287 /*
288  * tar_chksm()
289  *	calculate the checksum for a tar block counting the checksum field as
290  *	all blanks (BLNKSUM is that value pre-calculated, the sume of 8 blanks).
291  *	NOTE: we use len to short circuit summing 0's on write since we ALWAYS
292  *	pad headers with 0.
293  * Return:
294  *	unsigned long checksum
295  */
296 
297 #if __STDC__
298 static u_long
299 tar_chksm(register char *blk, register int len)
300 #else
301 static u_long
302 tar_chksm(blk, len)
303 	register char *blk;
304 	register int len;
305 #endif
306 {
307 	register char *stop;
308 	register char *pt;
309 	u_long chksm = BLNKSUM;	/* inital value is checksum field sum */
310 
311 	/*
312 	 * add the part of the block before the checksum field
313 	 */
314 	pt = blk;
315 	stop = blk + CHK_OFFSET;
316 	while (pt < stop)
317 		chksm += (u_long)(*pt++ & 0xff);
318 	/*
319 	 * move past the checksum field and keep going, spec counts the
320 	 * checksum field as the sum of 8 blanks (which is pre-computed as
321 	 * BLNKSUM).
322 	 * ASSUMED: len is greater than CHK_OFFSET. (len is where our 0 padding
323 	 * starts, no point in summing zero's)
324 	 */
325 	pt += CHK_LEN;
326 	stop = blk + len;
327 	while (pt < stop)
328 		chksm += (u_long)(*pt++ & 0xff);
329 	return(chksm);
330 }
331 
332 /*
333  * Routines for old BSD style tar (also made portable to sysV tar)
334  */
335 
336 /*
337  * tar_id()
338  *	determine if a block given to us is a valid tar header (and not a USTAR
339  *	header). We have to be on the lookout for those pesky blocks of	all
340  *	zero's.
341  * Return:
342  *	0 if a tar header, -1 otherwise
343  */
344 
345 #if __STDC__
346 int
347 tar_id(register char *blk, int size)
348 #else
349 int
350 tar_id(blk, size)
351 	register char *blk;
352 	int size;
353 #endif
354 {
355 	register HD_TAR *hd;
356 	register HD_USTAR *uhd;
357 
358 	if (size < BLKMULT)
359 		return(-1);
360 	hd = (HD_TAR *)blk;
361 	uhd = (HD_USTAR *)blk;
362 
363 	/*
364 	 * check for block of zero's first, a simple and fast test, then make
365 	 * sure this is not a ustar header by looking for the ustar magic
366 	 * cookie. We should use TMAGLEN, but some USTAR archive programs are
367 	 * wrong and create archives missing the \0. Last we check the
368 	 * checksum. If this is ok we have to assume it is a valid header.
369 	 */
370 	if (hd->name[0] == '\0')
371 		return(-1);
372 	if (strncmp(uhd->magic, TMAGIC, TMAGLEN - 1) == 0)
373 		return(-1);
374 	if (asc_ul(hd->chksum,sizeof(hd->chksum),OCT) != tar_chksm(blk,BLKMULT))
375 		return(-1);
376 	return(0);
377 }
378 
379 /*
380  * tar_opt()
381  *	handle tar format specific -o options
382  * Return:
383  *	0 if ok -1 otherwise
384  */
385 
386 #if __STDC__
387 int
388 tar_opt(void)
389 #else
390 int
391 tar_opt()
392 #endif
393 {
394 	OPLIST *opt;
395 
396 	while ((opt = opt_next()) != NULL) {
397 		if (strcmp(opt->name, TAR_OPTION) ||
398 		    strcmp(opt->value, TAR_NODIR)) {
399 			warn(1, "Unknown tar format -o option/value pair %s=%s",
400 			    opt->name, opt->value);
401 			warn(1,"%s=%s is the only supported tar format option",
402 			    TAR_OPTION, TAR_NODIR);
403 			return(-1);
404 		}
405 
406 		/*
407 		 * we only support one option, and only when writing
408 		 */
409 		if ((act != APPND) && (act != ARCHIVE)) {
410 			warn(1, "%s=%s is only supported when writing.",
411 			    opt->name, opt->value);
412 			return(-1);
413 		}
414 		tar_nodir = 1;
415 	}
416 	return(0);
417 }
418 
419 
420 /*
421  * tar_rd()
422  *	extract the values out of block already determined to be a tar header.
423  *	store the values in the ARCHD parameter.
424  * Return:
425  *	0
426  */
427 
428 #if __STDC__
429 int
430 tar_rd(register ARCHD *arcn, register char *buf)
431 #else
432 int
433 tar_rd(arcn, buf)
434 	register ARCHD *arcn;
435 	register char *buf;
436 #endif
437 {
438 	register HD_TAR *hd;
439 	register char *pt;
440 
441 	/*
442 	 * we only get proper sized buffers passed to us
443 	 */
444 	if (tar_id(buf, BLKMULT) < 0)
445 		return(-1);
446 	arcn->org_name = arcn->name;
447 	arcn->sb.st_nlink = 1;
448 	arcn->pat = NULL;
449 
450 	/*
451 	 * copy out the name and values in the stat buffer
452 	 */
453 	hd = (HD_TAR *)buf;
454 	arcn->nlen = l_strncpy(arcn->name, hd->name, sizeof(hd->name));
455 	arcn->name[arcn->nlen] = '\0';
456 	arcn->sb.st_mode = (mode_t)(asc_ul(hd->mode,sizeof(hd->mode),OCT) &
457 	    0xfff);
458 	arcn->sb.st_uid = (uid_t)asc_ul(hd->uid, sizeof(hd->uid), OCT);
459 	arcn->sb.st_gid = (gid_t)asc_ul(hd->gid, sizeof(hd->gid), OCT);
460 	arcn->sb.st_size = (size_t)asc_ul(hd->size, sizeof(hd->size), OCT);
461 	arcn->sb.st_mtime = (time_t)asc_ul(hd->mtime, sizeof(hd->mtime), OCT);
462 	arcn->sb.st_ctime = arcn->sb.st_atime = arcn->sb.st_mtime;
463 
464 	/*
465 	 * have to look at the last character, it may be a '/' and that is used
466 	 * to encode this as a directory
467 	 */
468 	pt = &(arcn->name[arcn->nlen - 1]);
469 	arcn->pad = 0;
470 	arcn->skip = 0;
471 	switch(hd->linkflag) {
472 	case SYMTYPE:
473 		/*
474 		 * symbolic link, need to get the link name and set the type in
475 		 * the st_mode so -v printing will look correct.
476 		 */
477 		arcn->type = PAX_SLK;
478 		arcn->ln_nlen = l_strncpy(arcn->ln_name, hd->linkname,
479 			sizeof(hd->linkname));
480 		arcn->ln_name[arcn->ln_nlen] = '\0';
481 		arcn->sb.st_mode |= S_IFLNK;
482 		break;
483 	case LNKTYPE:
484 		/*
485 		 * hard link, need to get the link name, set the type in the
486 		 * st_mode and st_nlink so -v printing will look better.
487 		 */
488 		arcn->type = PAX_HLK;
489 		arcn->sb.st_nlink = 2;
490 		arcn->ln_nlen = l_strncpy(arcn->ln_name, hd->linkname,
491 			sizeof(hd->linkname));
492 		arcn->ln_name[arcn->ln_nlen] = '\0';
493 
494 		/*
495 		 * no idea of what type this thing really points at, but
496 		 * we set something for printing only.
497 		 */
498 		arcn->sb.st_mode |= S_IFREG;
499 		break;
500 	case AREGTYPE:
501 	case REGTYPE:
502 	default:
503 		/*
504 		 * If we have a trailing / this is a directory and NOT a file.
505 		 */
506 		arcn->ln_name[0] = '\0';
507 		arcn->ln_nlen = 0;
508 		if (*pt == '/') {
509 			/*
510 			 * it is a directory, set the mode for -v printing
511 			 */
512 			arcn->type = PAX_DIR;
513 			arcn->sb.st_mode |= S_IFDIR;
514 			arcn->sb.st_nlink = 2;
515 		} else {
516 			/*
517 			 * have a file that will be followed by data. Set the
518 			 * skip value to the size field and caluculate the size
519 			 * of the padding.
520 			 */
521 			arcn->type = PAX_REG;
522 			arcn->sb.st_mode |= S_IFREG;
523 			arcn->pad = TAR_PAD(arcn->sb.st_size);
524 			arcn->skip = arcn->sb.st_size;
525 		}
526 		break;
527 	}
528 
529 	/*
530 	 * strip off any trailing slash.
531 	 */
532 	if (*pt == '/') {
533 		*pt = '\0';
534 		--arcn->nlen;
535 	}
536 	return(0);
537 }
538 
539 /*
540  * tar_wr()
541  *	write a tar header for the file specified in the ARCHD to the archive.
542  *	Have to check for file types that cannot be stored and file names that
543  *	are too long. Be careful of the term (last arg) to ul_oct, each field
544  *	of tar has it own spec for the termination character(s).
545  *	ASSUMED: space after header in header block is zero filled
546  * Return:
547  *	0 if file has data to be written after the header, 1 if file has NO
548  *	data to write after the header, -1 if archive write failed
549  */
550 
551 #if __STDC__
552 int
553 tar_wr(register ARCHD *arcn)
554 #else
555 int
556 tar_wr(arcn)
557 	register ARCHD *arcn;
558 #endif
559 {
560 	register HD_TAR *hd;
561 	int len;
562 	char hdblk[sizeof(HD_TAR)];
563 
564 	/*
565 	 * check for those file system types which tar cannot store
566 	 */
567 	switch(arcn->type) {
568 	case PAX_DIR:
569 		/*
570 		 * user asked that dirs not be written to the archive
571 		 */
572 		if (tar_nodir)
573 			return(1);
574 		break;
575 	case PAX_CHR:
576 		warn(1, "Tar cannot archive a character device %s",
577 		    arcn->org_name);
578 		return(1);
579 	case PAX_BLK:
580 		warn(1, "Tar cannot archive a block device %s", arcn->org_name);
581 		return(1);
582 	case PAX_SCK:
583 		warn(1, "Tar cannot archive a socket %s", arcn->org_name);
584 		return(1);
585 	case PAX_FIF:
586 		warn(1, "Tar cannot archive a fifo %s", arcn->org_name);
587 		return(1);
588 	case PAX_SLK:
589 	case PAX_HLK:
590 	case PAX_HRG:
591 		if (arcn->ln_nlen > sizeof(hd->linkname)) {
592 			warn(1,"Link name too long for tar %s", arcn->ln_name);
593 			return(1);
594 		}
595 		break;
596 	case PAX_REG:
597 	case PAX_CTG:
598 	default:
599 		break;
600 	}
601 
602 	/*
603 	 * check file name len, remember extra char for dirs (the / at the end)
604 	 */
605 	len = arcn->nlen;
606 	if (arcn->type == PAX_DIR)
607 		++len;
608 	if (len > sizeof(hd->name)) {
609 		warn(1, "File name too long for tar %s", arcn->name);
610 		return(1);
611 	}
612 
613 	/*
614 	 * copy the data out of the ARCHD into the tar header based on the type
615 	 * of the file. Remember many tar readers want the unused fields to be
616 	 * padded with zero. We set the linkflag field (type), the linkname
617 	 * (or zero if not used),the size, and set the padding (if any) to be
618 	 * added after the file data (0 for all other types, as they only have
619 	 * a header)
620 	 */
621 	hd = (HD_TAR *)hdblk;
622 	zf_strncpy(hd->name, arcn->name, sizeof(hd->name));
623 	arcn->pad = 0;
624 
625 	if (arcn->type == PAX_DIR) {
626 		/*
627 		 * directories are the same as files, except have a filename
628 		 * that ends with a /, we add the slash here. No data follows,
629 		 * dirs, so no pad.
630 		 */
631 		hd->linkflag = AREGTYPE;
632 		bzero(hd->linkname, sizeof(hd->linkname));
633 		hd->name[len-1] = '/';
634 		if (ul_oct((u_long)0L, hd->size, sizeof(hd->size), 1))
635 			goto out;
636 	} else if (arcn->type == PAX_SLK) {
637 		/*
638 		 * no data follows this file, so no pad
639 		 */
640 		hd->linkflag = SYMTYPE;
641 		zf_strncpy(hd->linkname,arcn->ln_name, sizeof(hd->linkname));
642 		if (ul_oct((u_long)0L, hd->size, sizeof(hd->size), 1))
643 			goto out;
644 	} else if ((arcn->type == PAX_HLK) || (arcn->type == PAX_HRG)) {
645 		/*
646 		 * no data follows this file, so no pad
647 		 */
648 		hd->linkflag = LNKTYPE;
649 		zf_strncpy(hd->linkname,arcn->ln_name, sizeof(hd->linkname));
650 		if (ul_oct((u_long)0L, hd->size, sizeof(hd->size), 1))
651 			goto out;
652 	} else {
653 		/*
654 		 * data follows this file, so set the pad
655 		 */
656 		hd->linkflag = AREGTYPE;
657 		bzero(hd->linkname, sizeof(hd->linkname));
658 #		ifdef NET2_STAT
659 		if (ul_oct((u_long)arcn->sb.st_size, hd->size,
660 		    sizeof(hd->size), 1)) {
661 #		else
662 		if (uqd_oct((u_quad_t)arcn->sb.st_size, hd->size,
663 		    sizeof(hd->size), 1)) {
664 #		endif
665 			warn(1,"File is too large for tar %s", arcn->org_name);
666 			return(1);
667 		}
668 		arcn->pad = TAR_PAD(arcn->sb.st_size);
669 	}
670 
671 	/*
672 	 * copy those fields that are independent of the type
673 	 */
674 	if (ul_oct((u_long)arcn->sb.st_mode, hd->mode, sizeof(hd->mode), 0) ||
675 	    ul_oct((u_long)arcn->sb.st_uid, hd->uid, sizeof(hd->uid), 0) ||
676 	    ul_oct((u_long)arcn->sb.st_gid, hd->gid, sizeof(hd->gid), 0) ||
677 	    ul_oct((u_long)arcn->sb.st_mtime, hd->mtime, sizeof(hd->mtime), 1))
678 		goto out;
679 
680 	/*
681 	 * calculate and add the checksum, then write the header. A return of
682 	 * 0 tells the caller to now write the file data, 1 says no data needs
683 	 * to be written
684 	 */
685 	if (ul_oct(tar_chksm(hdblk, sizeof(HD_TAR)), hd->chksum,
686 	    sizeof(hd->chksum), 2))
687 		goto out;
688 	if (wr_rdbuf(hdblk, sizeof(HD_TAR)) < 0)
689 		return(-1);
690 	if (wr_skip((off_t)(BLKMULT - sizeof(HD_TAR))) < 0)
691 		return(-1);
692 	if ((arcn->type == PAX_CTG) || (arcn->type == PAX_REG))
693 		return(0);
694 	return(1);
695 
696     out:
697 	/*
698 	 * header field is out of range
699 	 */
700 	warn(1, "Tar header field is too small for %s", arcn->org_name);
701 	return(1);
702 }
703 
704 /*
705  * Routines for POSIX ustar
706  */
707 
/*
 * ustar_strd()
 *	initialization for ustar read: usrtb_start() is run first and, when
 *	it succeeds, grptb_start().
 * Return:
 *	0 if ok, -1 otherwise
 */

#if __STDC__
int
ustar_strd(void)
#else
int
ustar_strd()
#endif
{
	if (usrtb_start() < 0)
		return(-1);
	if (grptb_start() < 0)
		return(-1);
	return(0);
}
727 
/*
 * ustar_stwr()
 *	initialization for ustar write: uidtb_start() is run first and, when
 *	it succeeds, gidtb_start().
 * Return:
 *	0 if ok, -1 otherwise
 */

#if __STDC__
int
ustar_stwr(void)
#else
int
ustar_stwr()
#endif
{
	if (uidtb_start() < 0)
		return(-1);
	if (gidtb_start() < 0)
		return(-1);
	return(0);
}
747 
748 /*
749  * ustar_id()
750  *	determine if a block given to us is a valid ustar header. We have to
751  *	be on the lookout for those pesky blocks of all zero's
752  * Return:
753  *	0 if a ustar header, -1 otherwise
754  */
755 
756 #if __STDC__
757 int
758 ustar_id(char *blk, int size)
759 #else
760 int
761 ustar_id(blk, size)
762 	char *blk;
763 	int size;
764 #endif
765 {
766 	register HD_USTAR *hd;
767 
768 	if (size < BLKMULT)
769 		return(-1);
770 	hd = (HD_USTAR *)blk;
771 
772 	/*
773 	 * check for block of zero's first, a simple and fast test then check
774 	 * ustar magic cookie. We should use TMAGLEN, but some USTAR archive
775 	 * programs are fouled up and create archives missing the \0. Last we
776 	 * check the checksum. If ok we have to assume it is a valid header.
777 	 */
778 	if (hd->name[0] == '\0')
779 		return(-1);
780 	if (strncmp(hd->magic, TMAGIC, TMAGLEN - 1) != 0)
781 		return(-1);
782 	if (asc_ul(hd->chksum,sizeof(hd->chksum),OCT) != tar_chksm(blk,BLKMULT))
783 		return(-1);
784 	return(0);
785 }
786 
787 /*
788  * ustar_rd()
789  *	extract the values out of block already determined to be a ustar header.
790  *	store the values in the ARCHD parameter.
791  * Return:
792  *	0
793  */
794 
795 #if __STDC__
796 int
797 ustar_rd(register ARCHD *arcn, register char *buf)
798 #else
799 int
800 ustar_rd(arcn, buf)
801 	register ARCHD *arcn;
802 	register char *buf;
803 #endif
804 {
805 	register HD_USTAR *hd;
806 	register char *dest;
807 	register int cnt = 0;
808 	dev_t devmajor;
809 	dev_t devminor;
810 
811 	/*
812 	 * we only get proper sized buffers
813 	 */
814 	if (ustar_id(buf, BLKMULT) < 0)
815 		return(-1);
816 	arcn->org_name = arcn->name;
817 	arcn->sb.st_nlink = 1;
818 	arcn->pat = NULL;
819 	hd = (HD_USTAR *)buf;
820 
821 	/*
822 	 * see if the filename is split into two parts. if, so joint the parts.
823 	 * we copy the prefix first and add a / between the prefix and name.
824 	 */
825 	dest = arcn->name;
826 	if (*(hd->prefix) != '\0') {
827 		cnt = l_strncpy(arcn->name, hd->prefix, sizeof(hd->prefix));
828 		dest = arcn->name + arcn->nlen;
829 		*dest++ = '/';
830 	}
831 	arcn->nlen = l_strncpy(dest, hd->name, sizeof(hd->name));
832 	arcn->nlen += cnt;
833 	arcn->name[arcn->nlen] = '\0';
834 
835 	/*
836 	 * follow the spec to the letter. we should only have mode bits, strip
837 	 * off all other crud we may be passed.
838 	 */
839 	arcn->sb.st_mode = (mode_t)(asc_ul(hd->mode, sizeof(hd->mode), OCT) &
840 	    0xfff);
841 	arcn->sb.st_size = (size_t)asc_ul(hd->size, sizeof(hd->size), OCT);
842 	arcn->sb.st_mtime = (time_t)asc_ul(hd->mtime, sizeof(hd->mtime), OCT);
843 	arcn->sb.st_ctime = arcn->sb.st_atime = arcn->sb.st_mtime;
844 
845 	/*
846 	 * If we can find the ascii names for gname and uname in the password
847 	 * and group files we will use the uid's and gid they bind. Otherwise
848 	 * we use the uid and gid values stored in the header. (This is what
849 	 * the posix spec wants).
850 	 */
851 	hd->gname[sizeof(hd->gname) - 1] = '\0';
852 	if (gid_name(hd->gname, &(arcn->sb.st_gid)) < 0)
853 		arcn->sb.st_gid = (gid_t)asc_ul(hd->gid, sizeof(hd->gid), OCT);
854 	hd->uname[sizeof(hd->uname) - 1] = '\0';
855 	if (uid_name(hd->uname, &(arcn->sb.st_uid)) < 0)
856 		arcn->sb.st_uid = (uid_t)asc_ul(hd->uid, sizeof(hd->uid), OCT);
857 
858 	/*
859 	 * set the defaults, these may be changed depending on the file type
860 	 */
861 	arcn->ln_name[0] = '\0';
862 	arcn->ln_nlen = 0;
863 	arcn->pad = 0;
864 	arcn->skip = 0;
865 	arcn->sb.st_rdev = (dev_t)0;
866 
867 	/*
868 	 * set the mode and PAX type according to the typeflag in the header
869 	 */
870 	switch(hd->typeflag) {
871 	case FIFOTYPE:
872 		arcn->type = PAX_FIF;
873 		arcn->sb.st_mode |= S_IFIFO;
874 		break;
875 	case DIRTYPE:
876 		arcn->type = PAX_DIR;
877 		arcn->sb.st_mode |= S_IFDIR;
878 		arcn->sb.st_nlink = 2;
879 
880 		/*
881 		 * Some programs that create ustar archives append a '/'
882 		 * to the pathname for directories. This clearly violates
883 		 * ustar specs, but we will silently strip it off anyway.
884 		 */
885 		if (arcn->name[arcn->nlen - 1] == '/')
886 			arcn->name[--arcn->nlen] = '\0';
887 		break;
888 	case BLKTYPE:
889 	case CHRTYPE:
890 		/*
891 		 * this type requires the rdev field to be set.
892 		 */
893 		if (hd->typeflag == BLKTYPE) {
894 			arcn->type = PAX_BLK;
895 			arcn->sb.st_mode |= S_IFBLK;
896 		} else {
897 			arcn->type = PAX_CHR;
898 			arcn->sb.st_mode |= S_IFCHR;
899 		}
900 		devmajor = (dev_t)asc_ul(hd->devmajor,sizeof(hd->devmajor),OCT);
901 		devminor = (dev_t)asc_ul(hd->devminor,sizeof(hd->devminor),OCT);
902 		arcn->sb.st_rdev = TODEV(devmajor, devminor);
903 		break;
904 	case SYMTYPE:
905 	case LNKTYPE:
906 		if (hd->typeflag == SYMTYPE) {
907 			arcn->type = PAX_SLK;
908 			arcn->sb.st_mode |= S_IFLNK;
909 		} else {
910 			arcn->type = PAX_HLK;
911 			/*
912 			 * so printing looks better
913 			 */
914 			arcn->sb.st_mode |= S_IFREG;
915 			arcn->sb.st_nlink = 2;
916 		}
917 		/*
918 		 * copy the link name
919 		 */
920 		arcn->ln_nlen = l_strncpy(arcn->ln_name, hd->linkname,
921 			sizeof(hd->linkname));
922 		arcn->ln_name[arcn->ln_nlen] = '\0';
923 		break;
924 	case CONTTYPE:
925 	case AREGTYPE:
926 	case REGTYPE:
927 	default:
928 		/*
929 		 * these types have file data that follows. Set the skip and
930 		 * pad fields.
931 		 */
932 		arcn->type = PAX_REG;
933 		arcn->pad = TAR_PAD(arcn->sb.st_size);
934 		arcn->skip = arcn->sb.st_size;
935 		arcn->sb.st_mode |= S_IFREG;
936 		break;
937 	}
938 	return(0);
939 }
940 
941 /*
942  * ustar_wr()
943  *	write a ustar header for the file specified in the ARCHD to the archive
944  *	Have to check for file types that cannot be stored and file names that
945  *	are too long. Be careful of the term (last arg) to ul_oct, we only use
946  *	'\0' for the termination character (this is different than picky tar)
947  *	ASSUMED: space after header in header block is zero filled
948  * Return:
949  *	0 if file has data to be written after the header, 1 if file has NO
950  *	data to write after the header, -1 if archive write failed
951  */
952 
953 #if __STDC__
954 int
955 ustar_wr(register ARCHD *arcn)
956 #else
957 int
958 ustar_wr(arcn)
959 	register ARCHD *arcn;
960 #endif
961 {
962 	register HD_USTAR *hd;
963 	register char *pt;
964 	char hdblk[sizeof(HD_USTAR)];
965 
966 	/*
967 	 * check for those file system types ustar cannot store
968 	 */
969 	if (arcn->type == PAX_SCK) {
970 		warn(1, "Ustar cannot archive a socket %s", arcn->org_name);
971 		return(1);
972 	}
973 
974 	/*
975 	 * check the length of the linkname
976 	 */
977 	if (((arcn->type == PAX_SLK) || (arcn->type == PAX_HLK) ||
978 	    (arcn->type == PAX_HRG)) && (arcn->ln_nlen > sizeof(hd->linkname))){
979 		warn(1, "Link name too long for ustar %s", arcn->ln_name);
980 		return(1);
981 	}
982 
983 	/*
984 	 * split the path name into prefix and name fields (if needed). if
985 	 * pt != arcn->name, the name has to be split
986 	 */
987 	if ((pt = name_split(arcn->name, arcn->nlen)) == NULL) {
988 		warn(1, "File name too long for ustar %s", arcn->name);
989 		return(1);
990 	}
991 	hd = (HD_USTAR *)hdblk;
992 	arcn->pad = 0L;
993 
994 	/*
995 	 * split the name, or zero out the prefix
996 	 */
997 	if (pt != arcn->name) {
998 		/*
999 		 * name was split, pt points at the / where the split is to
1000 		 * occur, we remove the / and copy the first part to the prefix
1001 		 */
1002 		*pt = '\0';
1003 		zf_strncpy(hd->prefix, arcn->name, sizeof(hd->prefix));
1004 		*pt++ = '/';
1005 	} else
1006 		bzero(hd->prefix, sizeof(hd->prefix));
1007 
1008 	/*
1009 	 * copy the name part. this may be the whole path or the part after
1010 	 * the prefix
1011 	 */
1012 	zf_strncpy(hd->name, pt, sizeof(hd->name));
1013 
1014 	/*
1015 	 * set the fields in the header that are type dependent
1016 	 */
1017 	switch(arcn->type) {
1018 	case PAX_DIR:
1019 		hd->typeflag = DIRTYPE;
1020 		bzero(hd->linkname, sizeof(hd->linkname));
1021 		bzero(hd->devmajor, sizeof(hd->devmajor));
1022 		bzero(hd->devminor, sizeof(hd->devminor));
1023 		if (ul_oct((u_long)0L, hd->size, sizeof(hd->size), 3))
1024 			goto out;
1025 		break;
1026 	case PAX_CHR:
1027 	case PAX_BLK:
1028 		if (arcn->type == PAX_CHR)
1029 			hd->typeflag = CHRTYPE;
1030 		else
1031 			hd->typeflag = BLKTYPE;
1032 		bzero(hd->linkname, sizeof(hd->linkname));
1033 		if (ul_oct((u_long)MAJOR(arcn->sb.st_rdev), hd->devmajor,
1034 		   sizeof(hd->devmajor), 3) ||
1035 		   ul_oct((u_long)MINOR(arcn->sb.st_rdev), hd->devminor,
1036 		   sizeof(hd->devminor), 3) ||
1037 		   ul_oct((u_long)0L, hd->size, sizeof(hd->size), 3))
1038 			goto out;
1039 		break;
1040 	case PAX_FIF:
1041 		hd->typeflag = FIFOTYPE;
1042 		bzero(hd->linkname, sizeof(hd->linkname));
1043 		bzero(hd->devmajor, sizeof(hd->devmajor));
1044 		bzero(hd->devminor, sizeof(hd->devminor));
1045 		if (ul_oct((u_long)0L, hd->size, sizeof(hd->size), 3))
1046 			goto out;
1047 		break;
1048 	case PAX_SLK:
1049 	case PAX_HLK:
1050 	case PAX_HRG:
1051 		if (arcn->type == PAX_SLK)
1052 			hd->typeflag = SYMTYPE;
1053 		else
1054 			hd->typeflag = LNKTYPE;
1055 		zf_strncpy(hd->linkname,arcn->ln_name, sizeof(hd->linkname));
1056 		bzero(hd->devmajor, sizeof(hd->devmajor));
1057 		bzero(hd->devminor, sizeof(hd->devminor));
1058 		if (ul_oct((u_long)0L, hd->size, sizeof(hd->size), 3))
1059 			goto out;
1060 		break;
1061 	case PAX_REG:
1062 	case PAX_CTG:
1063 	default:
1064 		/*
1065 		 * file data with this type, set the padding
1066 		 */
1067 		if (arcn->type == PAX_CTG)
1068 			hd->typeflag = CONTTYPE;
1069 		else
1070 			hd->typeflag = REGTYPE;
1071 		bzero(hd->linkname, sizeof(hd->linkname));
1072 		bzero(hd->devmajor, sizeof(hd->devmajor));
1073 		bzero(hd->devminor, sizeof(hd->devminor));
1074 		arcn->pad = TAR_PAD(arcn->sb.st_size);
1075 #		ifdef NET2_STAT
1076 		if (ul_oct((u_long)arcn->sb.st_size, hd->size,
1077 		    sizeof(hd->size), 3)) {
1078 #		else
1079 		if (uqd_oct((u_quad_t)arcn->sb.st_size, hd->size,
1080 		    sizeof(hd->size), 3)) {
1081 #		endif
1082 			warn(1,"File is too long for ustar %s",arcn->org_name);
1083 			return(1);
1084 		}
1085 		break;
1086 	}
1087 
1088 	zf_strncpy(hd->magic, TMAGIC, TMAGLEN);
1089 	zf_strncpy(hd->version, TVERSION, TVERSLEN);
1090 
1091 	/*
1092 	 * set the remaining fields. Some versions want all 16 bits of mode
1093 	 * we better humor them (they really do not meet spec though)....
1094 	 */
1095 	if (ul_oct((u_long)arcn->sb.st_mode, hd->mode, sizeof(hd->mode), 3) ||
1096 	    ul_oct((u_long)arcn->sb.st_uid, hd->uid, sizeof(hd->uid), 3)  ||
1097 	    ul_oct((u_long)arcn->sb.st_gid, hd->gid, sizeof(hd->gid), 3) ||
1098 	    ul_oct((u_long)arcn->sb.st_mtime,hd->mtime,sizeof(hd->mtime),3))
1099 		goto out;
1100 	zf_strncpy(hd->uname,name_uid(arcn->sb.st_uid, 0),sizeof(hd->uname));
1101 	zf_strncpy(hd->gname,name_gid(arcn->sb.st_gid, 0),sizeof(hd->gname));
1102 
1103 	/*
1104 	 * calculate and store the checksum write the header to the archive
1105 	 * return 0 tells the caller to now write the file data, 1 says no data
1106 	 * needs to be written
1107 	 */
1108 	if (ul_oct(tar_chksm(hdblk, sizeof(HD_USTAR)), hd->chksum,
1109 	   sizeof(hd->chksum), 3))
1110 		goto out;
1111 	if (wr_rdbuf(hdblk, sizeof(HD_USTAR)) < 0)
1112 		return(-1);
1113 	if (wr_skip((off_t)(BLKMULT - sizeof(HD_USTAR))) < 0)
1114 		return(-1);
1115 	if ((arcn->type == PAX_CTG) || (arcn->type == PAX_REG))
1116 		return(0);
1117 	return(1);
1118 
1119     out:
1120     	/*
1121 	 * header field is out of range
1122 	 */
1123 	warn(1, "Ustar header field is too small for %s", arcn->org_name);
1124 	return(1);
1125 }
1126 
1127 /*
1128  * name_split()
1129  *	see if the name has to be split for storage in a ustar header. We try
1130  *	to fit the entire name in the name field without splitting if we can.
1131  *	The split point is always at a /
1132  * Return
1133  *	character pointer to split point (always the / that is to be removed
1134  *	if the split is not needed, the points is set to the start of the file
1135  *	name (it would violate the spec to split there). A NULL is returned if
1136  *	the file name is too long
1137  */
1138 
1139 #if __STDC__
1140 static char *
1141 name_split(register char *name, register int len)
1142 #else
1143 static char *
1144 name_split(name, len)
1145 	register char *name;
1146 	register int len;
1147 #endif
1148 {
1149 	register char *start;
1150 
1151 	/*
1152 	 * check to see if the file name is small enough to fit in the name
1153 	 * field. if so just return a pointer to the name.
1154 	 */
1155 	if (len <= TNMSZ)
1156 		return(name);
1157 	if (len > (TPFSZ + TNMSZ + 1))
1158 		return(NULL);
1159 
1160 	/*
1161 	 * we start looking at the biggest sized piece that fits in the name
1162 	 * field. We walk foward looking for a slash to split at. The idea is
1163 	 * to find the biggest piece to fit in the name field (or the smallest
1164 	 * prefix we can find) (the -1 is correct the biggest piece would
1165 	 * include the slash between the two parts that gets thrown away)
1166 	 */
1167 	start = name + len - TNMSZ - 1;
1168 	while ((*start != '\0') && (*start != '/'))
1169 		++start;
1170 
1171 	/*
1172 	 * if we hit the end of the string, this name cannot be split, so we
1173 	 * cannot store this file.
1174 	 */
1175 	if (*start == '\0')
1176 		return(NULL);
1177 	len = start - name;
1178 
1179 	/*
1180 	 * NOTE: /str where the length of str == TNMSZ can not be stored under
1181 	 * the p1003.1-1990 spec for ustar. We could force a prefix of / and
1182 	 * the file would then expand on extract to //str. The len == 0 below
1183 	 * makes this special case follow the spec to the letter.
1184 	 */
1185 	if ((len > TPFSZ) || (len == 0))
1186 		return(NULL);
1187 
1188 	/*
1189 	 * ok have a split point, return it to the caller
1190 	 */
1191 	return(start);
1192 }
1193