tar.c revision 1.1 1 /*-
2 * Copyright (c) 1992 Keith Muller.
3 * Copyright (c) 1992, 1993
4 * The Regents of the University of California. All rights reserved.
5 *
6 * This code is derived from software contributed to Berkeley by
7 * Keith Muller of the University of California, San Diego.
8 *
9 * Redistribution and use in source and binary forms, with or without
10 * modification, are permitted provided that the following conditions
11 * are met:
12 * 1. Redistributions of source code must retain the above copyright
13 * notice, this list of conditions and the following disclaimer.
14 * 2. Redistributions in binary form must reproduce the above copyright
15 * notice, this list of conditions and the following disclaimer in the
16 * documentation and/or other materials provided with the distribution.
17 * 3. All advertising materials mentioning features or use of this software
18 * must display the following acknowledgement:
19 * This product includes software developed by the University of
20 * California, Berkeley and its contributors.
21 * 4. Neither the name of the University nor the names of its contributors
22 * may be used to endorse or promote products derived from this software
23 * without specific prior written permission.
24 *
25 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
26 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
27 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
28 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
29 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
30 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
31 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
32 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
33 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
34 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
35 * SUCH DAMAGE.
36 */
37
38 #ifndef lint
39 static char sccsid[] = "@(#)tar.c 8.2 (Berkeley) 4/18/94";
40 #endif /* not lint */
41
42 #include <sys/types.h>
43 #include <sys/time.h>
44 #include <sys/stat.h>
45 #include <sys/param.h>
46 #include <string.h>
47 #include <stdio.h>
48 #include <ctype.h>
49 #include <unistd.h>
50 #include <stdlib.h>
51 #include "pax.h"
52 #include "extern.h"
53 #include "tar.h"
54
55 /*
56 * Routines for reading, writing and header identify of various versions of tar
57 */
58
59 static u_long tar_chksm __P((register char *, register int));
60 static char *name_split __P((register char *, register int));
61 static int ul_oct __P((u_long, register char *, register int, int));
62 #ifndef NET2_STAT
63 static int uqd_oct __P((u_quad_t, register char *, register int, int));
64 #endif
65
66 /*
67 * Routines common to all versions of tar
68 */
69
70 static int tar_nodir; /* do not write dirs under old tar */
71
72 /*
73 * tar_endwr()
74 * add the tar trailer of two null blocks
75 * Return:
76 * 0 if ok, -1 otherwise (what wr_skip returns)
77 */
78
79 #if __STDC__
80 int
81 tar_endwr(void)
82 #else
83 int
84 tar_endwr()
85 #endif
86 {
87 return(wr_skip((off_t)(NULLCNT*BLKMULT)));
88 }
89
90 /*
91 * tar_endrd()
92 * no cleanup needed here, just return size of trailer (for append)
93 * Return:
94 * size of trailer (2 * BLKMULT)
95 */
96
97 #if __STDC__
98 off_t
99 tar_endrd(void)
100 #else
101 off_t
102 tar_endrd()
103 #endif
104 {
105 return((off_t)(NULLCNT*BLKMULT));
106 }
107
108 /*
109 * tar_trail()
110 * Called to determine if a header block is a valid trailer. We are passed
111 * the block, the in_sync flag (which tells us we are in resync mode;
112 * looking for a valid header), and cnt (which starts at zero) which is
113 * used to count the number of empty blocks we have seen so far.
114 * Return:
115 * 0 if a valid trailer, -1 if not a valid trailer, or 1 if the block
116 * could never contain a header.
117 */
118
119 #if __STDC__
120 int
121 tar_trail(register char *buf, register int in_resync, register int *cnt)
122 #else
123 int
124 tar_trail(buf, in_resync, cnt)
125 register char *buf;
126 register int in_resync;
127 register int *cnt;
128 #endif
129 {
130 register int i;
131
132 /*
133 * look for all zero, trailer is two consecutive blocks of zero
134 */
135 for (i = 0; i < BLKMULT; ++i) {
136 if (buf[i] != '\0')
137 break;
138 }
139
140 /*
141 * if not all zero it is not a trailer, but MIGHT be a header.
142 */
143 if (i != BLKMULT)
144 return(-1);
145
146 /*
147 * When given a zero block, we must be careful!
148 * If we are not in resync mode, check for the trailer. Have to watch
149 * out that we do not mis-identify file data as the trailer, so we do
150 * NOT try to id a trailer during resync mode. During resync mode we
151 * might as well throw this block out since a valid header can NEVER be
152 * a block of all 0 (we must have a valid file name).
153 */
154 if (!in_resync && (++*cnt >= NULLCNT))
155 return(0);
156 return(1);
157 }
158
159 /*
160 * ul_oct()
161 * convert an unsigned long to an octal string. many oddball field
162 * termination characters are used by the various versions of tar in the
163 * different fields. term selects which kind to use. str is BLANK padded
164 * at the front to len. we are unable to use only one format as many old
165 * tar readers are very cranky about this.
166 * Return:
167 * 0 if the number fit into the string, -1 otherwise
168 */
169
170 #if __STDC__
171 static int
172 ul_oct(u_long val, register char *str, register int len, int term)
173 #else
174 static int
175 ul_oct(val, str, len, term)
176 u_long val;
177 register char *str;
178 register int len;
179 int term;
180 #endif
181 {
182 register char *pt;
183
184 /*
185 * term selects the appropriate character(s) for the end of the string
186 */
187 pt = str + len - 1;
188 switch(term) {
189 case 3:
190 *pt-- = '\0';
191 break;
192 case 2:
193 *pt-- = ' ';
194 *pt-- = '\0';
195 break;
196 case 1:
197 *pt-- = ' ';
198 break;
199 case 0:
200 default:
201 *pt-- = '\0';
202 *pt-- = ' ';
203 break;
204 }
205
206 /*
207 * convert and blank pad if there is space
208 */
209 while (pt >= str) {
210 *pt-- = '0' + (char)(val & 0x7);
211 if ((val = val >> 3) == (u_long)0)
212 break;
213 }
214
215 while (pt >= str)
216 *pt-- = ' ';
217 if (val != (u_long)0)
218 return(-1);
219 return(0);
220 }
221
222 #ifndef NET2_STAT
223 /*
224 * uqd_oct()
225 * convert an u_quad_t to an octal string. one of many oddball field
226 * termination characters are used by the various versions of tar in the
227 * different fields. term selects which kind to use. str is BLANK padded
228 * at the front to len. we are unable to use only one format as many old
229 * tar readers are very cranky about this.
230 * Return:
231 * 0 if the number fit into the string, -1 otherwise
232 */
233
234 #if __STDC__
235 static int
236 uqd_oct(u_quad_t val, register char *str, register int len, int term)
237 #else
238 static int
239 uqd_oct(val, str, len, term)
240 u_quad_t val;
241 register char *str;
242 register int len;
243 int term;
244 #endif
245 {
246 register char *pt;
247
248 /*
249 * term selects the appropriate character(s) for the end of the string
250 */
251 pt = str + len - 1;
252 switch(term) {
253 case 3:
254 *pt-- = '\0';
255 break;
256 case 2:
257 *pt-- = ' ';
258 *pt-- = '\0';
259 break;
260 case 1:
261 *pt-- = ' ';
262 break;
263 case 0:
264 default:
265 *pt-- = '\0';
266 *pt-- = ' ';
267 break;
268 }
269
270 /*
271 * convert and blank pad if there is space
272 */
273 while (pt >= str) {
274 *pt-- = '0' + (char)(val & 0x7);
275 if ((val = val >> 3) == 0)
276 break;
277 }
278
279 while (pt >= str)
280 *pt-- = ' ';
281 if (val != (u_quad_t)0)
282 return(-1);
283 return(0);
284 }
285 #endif
286
287 /*
288 * tar_chksm()
289 * calculate the checksum for a tar block counting the checksum field as
290 * all blanks (BLNKSUM is that value pre-calculated, the sume of 8 blanks).
291 * NOTE: we use len to short circuit summing 0's on write since we ALWAYS
292 * pad headers with 0.
293 * Return:
294 * unsigned long checksum
295 */
296
297 #if __STDC__
298 static u_long
299 tar_chksm(register char *blk, register int len)
300 #else
301 static u_long
302 tar_chksm(blk, len)
303 register char *blk;
304 register int len;
305 #endif
306 {
307 register char *stop;
308 register char *pt;
309 u_long chksm = BLNKSUM; /* inital value is checksum field sum */
310
311 /*
312 * add the part of the block before the checksum field
313 */
314 pt = blk;
315 stop = blk + CHK_OFFSET;
316 while (pt < stop)
317 chksm += (u_long)(*pt++ & 0xff);
318 /*
319 * move past the checksum field and keep going, spec counts the
320 * checksum field as the sum of 8 blanks (which is pre-computed as
321 * BLNKSUM).
322 * ASSUMED: len is greater than CHK_OFFSET. (len is where our 0 padding
323 * starts, no point in summing zero's)
324 */
325 pt += CHK_LEN;
326 stop = blk + len;
327 while (pt < stop)
328 chksm += (u_long)(*pt++ & 0xff);
329 return(chksm);
330 }
331
332 /*
333 * Routines for old BSD style tar (also made portable to sysV tar)
334 */
335
336 /*
337 * tar_id()
338 * determine if a block given to us is a valid tar header (and not a USTAR
339 * header). We have to be on the lookout for those pesky blocks of all
340 * zero's.
341 * Return:
342 * 0 if a tar header, -1 otherwise
343 */
344
345 #if __STDC__
346 int
347 tar_id(register char *blk, int size)
348 #else
349 int
350 tar_id(blk, size)
351 register char *blk;
352 int size;
353 #endif
354 {
355 register HD_TAR *hd;
356 register HD_USTAR *uhd;
357
358 if (size < BLKMULT)
359 return(-1);
360 hd = (HD_TAR *)blk;
361 uhd = (HD_USTAR *)blk;
362
363 /*
364 * check for block of zero's first, a simple and fast test, then make
365 * sure this is not a ustar header by looking for the ustar magic
366 * cookie. We should use TMAGLEN, but some USTAR archive programs are
367 * wrong and create archives missing the \0. Last we check the
368 * checksum. If this is ok we have to assume it is a valid header.
369 */
370 if (hd->name[0] == '\0')
371 return(-1);
372 if (strncmp(uhd->magic, TMAGIC, TMAGLEN - 1) == 0)
373 return(-1);
374 if (asc_ul(hd->chksum,sizeof(hd->chksum),OCT) != tar_chksm(blk,BLKMULT))
375 return(-1);
376 return(0);
377 }
378
379 /*
380 * tar_opt()
381 * handle tar format specific -o options
382 * Return:
383 * 0 if ok -1 otherwise
384 */
385
386 #if __STDC__
387 int
388 tar_opt(void)
389 #else
390 int
391 tar_opt()
392 #endif
393 {
394 OPLIST *opt;
395
396 while ((opt = opt_next()) != NULL) {
397 if (strcmp(opt->name, TAR_OPTION) ||
398 strcmp(opt->value, TAR_NODIR)) {
399 warn(1, "Unknown tar format -o option/value pair %s=%s",
400 opt->name, opt->value);
401 warn(1,"%s=%s is the only supported tar format option",
402 TAR_OPTION, TAR_NODIR);
403 return(-1);
404 }
405
406 /*
407 * we only support one option, and only when writing
408 */
409 if ((act != APPND) && (act != ARCHIVE)) {
410 warn(1, "%s=%s is only supported when writing.",
411 opt->name, opt->value);
412 return(-1);
413 }
414 tar_nodir = 1;
415 }
416 return(0);
417 }
418
419
420 /*
421 * tar_rd()
422 * extract the values out of block already determined to be a tar header.
423 * store the values in the ARCHD parameter.
424 * Return:
425 * 0
426 */
427
428 #if __STDC__
429 int
430 tar_rd(register ARCHD *arcn, register char *buf)
431 #else
432 int
433 tar_rd(arcn, buf)
434 register ARCHD *arcn;
435 register char *buf;
436 #endif
437 {
438 register HD_TAR *hd;
439 register char *pt;
440
441 /*
442 * we only get proper sized buffers passed to us
443 */
444 if (tar_id(buf, BLKMULT) < 0)
445 return(-1);
446 arcn->org_name = arcn->name;
447 arcn->sb.st_nlink = 1;
448 arcn->pat = NULL;
449
450 /*
451 * copy out the name and values in the stat buffer
452 */
453 hd = (HD_TAR *)buf;
454 arcn->nlen = l_strncpy(arcn->name, hd->name, sizeof(hd->name));
455 arcn->name[arcn->nlen] = '\0';
456 arcn->sb.st_mode = (mode_t)(asc_ul(hd->mode,sizeof(hd->mode),OCT) &
457 0xfff);
458 arcn->sb.st_uid = (uid_t)asc_ul(hd->uid, sizeof(hd->uid), OCT);
459 arcn->sb.st_gid = (gid_t)asc_ul(hd->gid, sizeof(hd->gid), OCT);
460 arcn->sb.st_size = (size_t)asc_ul(hd->size, sizeof(hd->size), OCT);
461 arcn->sb.st_mtime = (time_t)asc_ul(hd->mtime, sizeof(hd->mtime), OCT);
462 arcn->sb.st_ctime = arcn->sb.st_atime = arcn->sb.st_mtime;
463
464 /*
465 * have to look at the last character, it may be a '/' and that is used
466 * to encode this as a directory
467 */
468 pt = &(arcn->name[arcn->nlen - 1]);
469 arcn->pad = 0;
470 arcn->skip = 0;
471 switch(hd->linkflag) {
472 case SYMTYPE:
473 /*
474 * symbolic link, need to get the link name and set the type in
475 * the st_mode so -v printing will look correct.
476 */
477 arcn->type = PAX_SLK;
478 arcn->ln_nlen = l_strncpy(arcn->ln_name, hd->linkname,
479 sizeof(hd->linkname));
480 arcn->ln_name[arcn->ln_nlen] = '\0';
481 arcn->sb.st_mode |= S_IFLNK;
482 break;
483 case LNKTYPE:
484 /*
485 * hard link, need to get the link name, set the type in the
486 * st_mode and st_nlink so -v printing will look better.
487 */
488 arcn->type = PAX_HLK;
489 arcn->sb.st_nlink = 2;
490 arcn->ln_nlen = l_strncpy(arcn->ln_name, hd->linkname,
491 sizeof(hd->linkname));
492 arcn->ln_name[arcn->ln_nlen] = '\0';
493
494 /*
495 * no idea of what type this thing really points at, but
496 * we set something for printing only.
497 */
498 arcn->sb.st_mode |= S_IFREG;
499 break;
500 case AREGTYPE:
501 case REGTYPE:
502 default:
503 /*
504 * If we have a trailing / this is a directory and NOT a file.
505 */
506 arcn->ln_name[0] = '\0';
507 arcn->ln_nlen = 0;
508 if (*pt == '/') {
509 /*
510 * it is a directory, set the mode for -v printing
511 */
512 arcn->type = PAX_DIR;
513 arcn->sb.st_mode |= S_IFDIR;
514 arcn->sb.st_nlink = 2;
515 } else {
516 /*
517 * have a file that will be followed by data. Set the
518 * skip value to the size field and caluculate the size
519 * of the padding.
520 */
521 arcn->type = PAX_REG;
522 arcn->sb.st_mode |= S_IFREG;
523 arcn->pad = TAR_PAD(arcn->sb.st_size);
524 arcn->skip = arcn->sb.st_size;
525 }
526 break;
527 }
528
529 /*
530 * strip off any trailing slash.
531 */
532 if (*pt == '/') {
533 *pt = '\0';
534 --arcn->nlen;
535 }
536 return(0);
537 }
538
539 /*
540 * tar_wr()
541 * write a tar header for the file specified in the ARCHD to the archive.
542 * Have to check for file types that cannot be stored and file names that
543 * are too long. Be careful of the term (last arg) to ul_oct, each field
544 * of tar has it own spec for the termination character(s).
545 * ASSUMED: space after header in header block is zero filled
546 * Return:
547 * 0 if file has data to be written after the header, 1 if file has NO
548 * data to write after the header, -1 if archive write failed
549 */
550
551 #if __STDC__
552 int
553 tar_wr(register ARCHD *arcn)
554 #else
555 int
556 tar_wr(arcn)
557 register ARCHD *arcn;
558 #endif
559 {
560 register HD_TAR *hd;
561 int len;
562 char hdblk[sizeof(HD_TAR)];
563
564 /*
565 * check for those file system types which tar cannot store
566 */
567 switch(arcn->type) {
568 case PAX_DIR:
569 /*
570 * user asked that dirs not be written to the archive
571 */
572 if (tar_nodir)
573 return(1);
574 break;
575 case PAX_CHR:
576 warn(1, "Tar cannot archive a character device %s",
577 arcn->org_name);
578 return(1);
579 case PAX_BLK:
580 warn(1, "Tar cannot archive a block device %s", arcn->org_name);
581 return(1);
582 case PAX_SCK:
583 warn(1, "Tar cannot archive a socket %s", arcn->org_name);
584 return(1);
585 case PAX_FIF:
586 warn(1, "Tar cannot archive a fifo %s", arcn->org_name);
587 return(1);
588 case PAX_SLK:
589 case PAX_HLK:
590 case PAX_HRG:
591 if (arcn->ln_nlen > sizeof(hd->linkname)) {
592 warn(1,"Link name too long for tar %s", arcn->ln_name);
593 return(1);
594 }
595 break;
596 case PAX_REG:
597 case PAX_CTG:
598 default:
599 break;
600 }
601
602 /*
603 * check file name len, remember extra char for dirs (the / at the end)
604 */
605 len = arcn->nlen;
606 if (arcn->type == PAX_DIR)
607 ++len;
608 if (len > sizeof(hd->name)) {
609 warn(1, "File name too long for tar %s", arcn->name);
610 return(1);
611 }
612
613 /*
614 * copy the data out of the ARCHD into the tar header based on the type
615 * of the file. Remember many tar readers want the unused fields to be
616 * padded with zero. We set the linkflag field (type), the linkname
617 * (or zero if not used),the size, and set the padding (if any) to be
618 * added after the file data (0 for all other types, as they only have
619 * a header)
620 */
621 hd = (HD_TAR *)hdblk;
622 zf_strncpy(hd->name, arcn->name, sizeof(hd->name));
623 arcn->pad = 0;
624
625 if (arcn->type == PAX_DIR) {
626 /*
627 * directories are the same as files, except have a filename
628 * that ends with a /, we add the slash here. No data follows,
629 * dirs, so no pad.
630 */
631 hd->linkflag = AREGTYPE;
632 bzero(hd->linkname, sizeof(hd->linkname));
633 hd->name[len-1] = '/';
634 if (ul_oct((u_long)0L, hd->size, sizeof(hd->size), 1))
635 goto out;
636 } else if (arcn->type == PAX_SLK) {
637 /*
638 * no data follows this file, so no pad
639 */
640 hd->linkflag = SYMTYPE;
641 zf_strncpy(hd->linkname,arcn->ln_name, sizeof(hd->linkname));
642 if (ul_oct((u_long)0L, hd->size, sizeof(hd->size), 1))
643 goto out;
644 } else if ((arcn->type == PAX_HLK) || (arcn->type == PAX_HRG)) {
645 /*
646 * no data follows this file, so no pad
647 */
648 hd->linkflag = LNKTYPE;
649 zf_strncpy(hd->linkname,arcn->ln_name, sizeof(hd->linkname));
650 if (ul_oct((u_long)0L, hd->size, sizeof(hd->size), 1))
651 goto out;
652 } else {
653 /*
654 * data follows this file, so set the pad
655 */
656 hd->linkflag = AREGTYPE;
657 bzero(hd->linkname, sizeof(hd->linkname));
658 # ifdef NET2_STAT
659 if (ul_oct((u_long)arcn->sb.st_size, hd->size,
660 sizeof(hd->size), 1)) {
661 # else
662 if (uqd_oct((u_quad_t)arcn->sb.st_size, hd->size,
663 sizeof(hd->size), 1)) {
664 # endif
665 warn(1,"File is too large for tar %s", arcn->org_name);
666 return(1);
667 }
668 arcn->pad = TAR_PAD(arcn->sb.st_size);
669 }
670
671 /*
672 * copy those fields that are independent of the type
673 */
674 if (ul_oct((u_long)arcn->sb.st_mode, hd->mode, sizeof(hd->mode), 0) ||
675 ul_oct((u_long)arcn->sb.st_uid, hd->uid, sizeof(hd->uid), 0) ||
676 ul_oct((u_long)arcn->sb.st_gid, hd->gid, sizeof(hd->gid), 0) ||
677 ul_oct((u_long)arcn->sb.st_mtime, hd->mtime, sizeof(hd->mtime), 1))
678 goto out;
679
680 /*
681 * calculate and add the checksum, then write the header. A return of
682 * 0 tells the caller to now write the file data, 1 says no data needs
683 * to be written
684 */
685 if (ul_oct(tar_chksm(hdblk, sizeof(HD_TAR)), hd->chksum,
686 sizeof(hd->chksum), 2))
687 goto out;
688 if (wr_rdbuf(hdblk, sizeof(HD_TAR)) < 0)
689 return(-1);
690 if (wr_skip((off_t)(BLKMULT - sizeof(HD_TAR))) < 0)
691 return(-1);
692 if ((arcn->type == PAX_CTG) || (arcn->type == PAX_REG))
693 return(0);
694 return(1);
695
696 out:
697 /*
698 * header field is out of range
699 */
700 warn(1, "Tar header field is too small for %s", arcn->org_name);
701 return(1);
702 }
703
704 /*
705 * Routines for POSIX ustar
706 */
707
708 /*
709 * ustar_strd()
710 * initialization for ustar read
711 * Return:
712 * 0 if ok, -1 otherwise
713 */
714
715 #if __STDC__
716 int
717 ustar_strd(void)
718 #else
719 int
720 ustar_strd()
721 #endif
722 {
723 if ((usrtb_start() < 0) || (grptb_start() < 0))
724 return(-1);
725 return(0);
726 }
727
728 /*
729 * ustar_stwr()
730 * initialization for ustar write
731 * Return:
732 * 0 if ok, -1 otherwise
733 */
734
735 #if __STDC__
736 int
737 ustar_stwr(void)
738 #else
739 int
740 ustar_stwr()
741 #endif
742 {
743 if ((uidtb_start() < 0) || (gidtb_start() < 0))
744 return(-1);
745 return(0);
746 }
747
748 /*
749 * ustar_id()
750 * determine if a block given to us is a valid ustar header. We have to
751 * be on the lookout for those pesky blocks of all zero's
752 * Return:
753 * 0 if a ustar header, -1 otherwise
754 */
755
756 #if __STDC__
757 int
758 ustar_id(char *blk, int size)
759 #else
760 int
761 ustar_id(blk, size)
762 char *blk;
763 int size;
764 #endif
765 {
766 register HD_USTAR *hd;
767
768 if (size < BLKMULT)
769 return(-1);
770 hd = (HD_USTAR *)blk;
771
772 /*
773 * check for block of zero's first, a simple and fast test then check
774 * ustar magic cookie. We should use TMAGLEN, but some USTAR archive
775 * programs are fouled up and create archives missing the \0. Last we
776 * check the checksum. If ok we have to assume it is a valid header.
777 */
778 if (hd->name[0] == '\0')
779 return(-1);
780 if (strncmp(hd->magic, TMAGIC, TMAGLEN - 1) != 0)
781 return(-1);
782 if (asc_ul(hd->chksum,sizeof(hd->chksum),OCT) != tar_chksm(blk,BLKMULT))
783 return(-1);
784 return(0);
785 }
786
787 /*
788 * ustar_rd()
789 * extract the values out of block already determined to be a ustar header.
790 * store the values in the ARCHD parameter.
791 * Return:
792 * 0
793 */
794
795 #if __STDC__
796 int
797 ustar_rd(register ARCHD *arcn, register char *buf)
798 #else
799 int
800 ustar_rd(arcn, buf)
801 register ARCHD *arcn;
802 register char *buf;
803 #endif
804 {
805 register HD_USTAR *hd;
806 register char *dest;
807 register int cnt = 0;
808 dev_t devmajor;
809 dev_t devminor;
810
811 /*
812 * we only get proper sized buffers
813 */
814 if (ustar_id(buf, BLKMULT) < 0)
815 return(-1);
816 arcn->org_name = arcn->name;
817 arcn->sb.st_nlink = 1;
818 arcn->pat = NULL;
819 hd = (HD_USTAR *)buf;
820
821 /*
822 * see if the filename is split into two parts. if, so joint the parts.
823 * we copy the prefix first and add a / between the prefix and name.
824 */
825 dest = arcn->name;
826 if (*(hd->prefix) != '\0') {
827 cnt = l_strncpy(arcn->name, hd->prefix, sizeof(hd->prefix));
828 dest = arcn->name + arcn->nlen;
829 *dest++ = '/';
830 }
831 arcn->nlen = l_strncpy(dest, hd->name, sizeof(hd->name));
832 arcn->nlen += cnt;
833 arcn->name[arcn->nlen] = '\0';
834
835 /*
836 * follow the spec to the letter. we should only have mode bits, strip
837 * off all other crud we may be passed.
838 */
839 arcn->sb.st_mode = (mode_t)(asc_ul(hd->mode, sizeof(hd->mode), OCT) &
840 0xfff);
841 arcn->sb.st_size = (size_t)asc_ul(hd->size, sizeof(hd->size), OCT);
842 arcn->sb.st_mtime = (time_t)asc_ul(hd->mtime, sizeof(hd->mtime), OCT);
843 arcn->sb.st_ctime = arcn->sb.st_atime = arcn->sb.st_mtime;
844
845 /*
846 * If we can find the ascii names for gname and uname in the password
847 * and group files we will use the uid's and gid they bind. Otherwise
848 * we use the uid and gid values stored in the header. (This is what
849 * the posix spec wants).
850 */
851 hd->gname[sizeof(hd->gname) - 1] = '\0';
852 if (gid_name(hd->gname, &(arcn->sb.st_gid)) < 0)
853 arcn->sb.st_gid = (gid_t)asc_ul(hd->gid, sizeof(hd->gid), OCT);
854 hd->uname[sizeof(hd->uname) - 1] = '\0';
855 if (uid_name(hd->uname, &(arcn->sb.st_uid)) < 0)
856 arcn->sb.st_uid = (uid_t)asc_ul(hd->uid, sizeof(hd->uid), OCT);
857
858 /*
859 * set the defaults, these may be changed depending on the file type
860 */
861 arcn->ln_name[0] = '\0';
862 arcn->ln_nlen = 0;
863 arcn->pad = 0;
864 arcn->skip = 0;
865 arcn->sb.st_rdev = (dev_t)0;
866
867 /*
868 * set the mode and PAX type according to the typeflag in the header
869 */
870 switch(hd->typeflag) {
871 case FIFOTYPE:
872 arcn->type = PAX_FIF;
873 arcn->sb.st_mode |= S_IFIFO;
874 break;
875 case DIRTYPE:
876 arcn->type = PAX_DIR;
877 arcn->sb.st_mode |= S_IFDIR;
878 arcn->sb.st_nlink = 2;
879
880 /*
881 * Some programs that create ustar archives append a '/'
882 * to the pathname for directories. This clearly violates
883 * ustar specs, but we will silently strip it off anyway.
884 */
885 if (arcn->name[arcn->nlen - 1] == '/')
886 arcn->name[--arcn->nlen] = '\0';
887 break;
888 case BLKTYPE:
889 case CHRTYPE:
890 /*
891 * this type requires the rdev field to be set.
892 */
893 if (hd->typeflag == BLKTYPE) {
894 arcn->type = PAX_BLK;
895 arcn->sb.st_mode |= S_IFBLK;
896 } else {
897 arcn->type = PAX_CHR;
898 arcn->sb.st_mode |= S_IFCHR;
899 }
900 devmajor = (dev_t)asc_ul(hd->devmajor,sizeof(hd->devmajor),OCT);
901 devminor = (dev_t)asc_ul(hd->devminor,sizeof(hd->devminor),OCT);
902 arcn->sb.st_rdev = TODEV(devmajor, devminor);
903 break;
904 case SYMTYPE:
905 case LNKTYPE:
906 if (hd->typeflag == SYMTYPE) {
907 arcn->type = PAX_SLK;
908 arcn->sb.st_mode |= S_IFLNK;
909 } else {
910 arcn->type = PAX_HLK;
911 /*
912 * so printing looks better
913 */
914 arcn->sb.st_mode |= S_IFREG;
915 arcn->sb.st_nlink = 2;
916 }
917 /*
918 * copy the link name
919 */
920 arcn->ln_nlen = l_strncpy(arcn->ln_name, hd->linkname,
921 sizeof(hd->linkname));
922 arcn->ln_name[arcn->ln_nlen] = '\0';
923 break;
924 case CONTTYPE:
925 case AREGTYPE:
926 case REGTYPE:
927 default:
928 /*
929 * these types have file data that follows. Set the skip and
930 * pad fields.
931 */
932 arcn->type = PAX_REG;
933 arcn->pad = TAR_PAD(arcn->sb.st_size);
934 arcn->skip = arcn->sb.st_size;
935 arcn->sb.st_mode |= S_IFREG;
936 break;
937 }
938 return(0);
939 }
940
941 /*
942 * ustar_wr()
943 * write a ustar header for the file specified in the ARCHD to the archive
944 * Have to check for file types that cannot be stored and file names that
945 * are too long. Be careful of the term (last arg) to ul_oct, we only use
946 * '\0' for the termination character (this is different than picky tar)
947 * ASSUMED: space after header in header block is zero filled
948 * Return:
949 * 0 if file has data to be written after the header, 1 if file has NO
950 * data to write after the header, -1 if archive write failed
951 */
952
953 #if __STDC__
954 int
955 ustar_wr(register ARCHD *arcn)
956 #else
957 int
958 ustar_wr(arcn)
959 register ARCHD *arcn;
960 #endif
961 {
962 register HD_USTAR *hd;
963 register char *pt;
964 char hdblk[sizeof(HD_USTAR)];
965
966 /*
967 * check for those file system types ustar cannot store
968 */
969 if (arcn->type == PAX_SCK) {
970 warn(1, "Ustar cannot archive a socket %s", arcn->org_name);
971 return(1);
972 }
973
974 /*
975 * check the length of the linkname
976 */
977 if (((arcn->type == PAX_SLK) || (arcn->type == PAX_HLK) ||
978 (arcn->type == PAX_HRG)) && (arcn->ln_nlen > sizeof(hd->linkname))){
979 warn(1, "Link name too long for ustar %s", arcn->ln_name);
980 return(1);
981 }
982
983 /*
984 * split the path name into prefix and name fields (if needed). if
985 * pt != arcn->name, the name has to be split
986 */
987 if ((pt = name_split(arcn->name, arcn->nlen)) == NULL) {
988 warn(1, "File name too long for ustar %s", arcn->name);
989 return(1);
990 }
991 hd = (HD_USTAR *)hdblk;
992 arcn->pad = 0L;
993
994 /*
995 * split the name, or zero out the prefix
996 */
997 if (pt != arcn->name) {
998 /*
999 * name was split, pt points at the / where the split is to
1000 * occur, we remove the / and copy the first part to the prefix
1001 */
1002 *pt = '\0';
1003 zf_strncpy(hd->prefix, arcn->name, sizeof(hd->prefix));
1004 *pt++ = '/';
1005 } else
1006 bzero(hd->prefix, sizeof(hd->prefix));
1007
1008 /*
1009 * copy the name part. this may be the whole path or the part after
1010 * the prefix
1011 */
1012 zf_strncpy(hd->name, pt, sizeof(hd->name));
1013
1014 /*
1015 * set the fields in the header that are type dependent
1016 */
1017 switch(arcn->type) {
1018 case PAX_DIR:
1019 hd->typeflag = DIRTYPE;
1020 bzero(hd->linkname, sizeof(hd->linkname));
1021 bzero(hd->devmajor, sizeof(hd->devmajor));
1022 bzero(hd->devminor, sizeof(hd->devminor));
1023 if (ul_oct((u_long)0L, hd->size, sizeof(hd->size), 3))
1024 goto out;
1025 break;
1026 case PAX_CHR:
1027 case PAX_BLK:
1028 if (arcn->type == PAX_CHR)
1029 hd->typeflag = CHRTYPE;
1030 else
1031 hd->typeflag = BLKTYPE;
1032 bzero(hd->linkname, sizeof(hd->linkname));
1033 if (ul_oct((u_long)MAJOR(arcn->sb.st_rdev), hd->devmajor,
1034 sizeof(hd->devmajor), 3) ||
1035 ul_oct((u_long)MINOR(arcn->sb.st_rdev), hd->devminor,
1036 sizeof(hd->devminor), 3) ||
1037 ul_oct((u_long)0L, hd->size, sizeof(hd->size), 3))
1038 goto out;
1039 break;
1040 case PAX_FIF:
1041 hd->typeflag = FIFOTYPE;
1042 bzero(hd->linkname, sizeof(hd->linkname));
1043 bzero(hd->devmajor, sizeof(hd->devmajor));
1044 bzero(hd->devminor, sizeof(hd->devminor));
1045 if (ul_oct((u_long)0L, hd->size, sizeof(hd->size), 3))
1046 goto out;
1047 break;
1048 case PAX_SLK:
1049 case PAX_HLK:
1050 case PAX_HRG:
1051 if (arcn->type == PAX_SLK)
1052 hd->typeflag = SYMTYPE;
1053 else
1054 hd->typeflag = LNKTYPE;
1055 zf_strncpy(hd->linkname,arcn->ln_name, sizeof(hd->linkname));
1056 bzero(hd->devmajor, sizeof(hd->devmajor));
1057 bzero(hd->devminor, sizeof(hd->devminor));
1058 if (ul_oct((u_long)0L, hd->size, sizeof(hd->size), 3))
1059 goto out;
1060 break;
1061 case PAX_REG:
1062 case PAX_CTG:
1063 default:
1064 /*
1065 * file data with this type, set the padding
1066 */
1067 if (arcn->type == PAX_CTG)
1068 hd->typeflag = CONTTYPE;
1069 else
1070 hd->typeflag = REGTYPE;
1071 bzero(hd->linkname, sizeof(hd->linkname));
1072 bzero(hd->devmajor, sizeof(hd->devmajor));
1073 bzero(hd->devminor, sizeof(hd->devminor));
1074 arcn->pad = TAR_PAD(arcn->sb.st_size);
1075 # ifdef NET2_STAT
1076 if (ul_oct((u_long)arcn->sb.st_size, hd->size,
1077 sizeof(hd->size), 3)) {
1078 # else
1079 if (uqd_oct((u_quad_t)arcn->sb.st_size, hd->size,
1080 sizeof(hd->size), 3)) {
1081 # endif
1082 warn(1,"File is too long for ustar %s",arcn->org_name);
1083 return(1);
1084 }
1085 break;
1086 }
1087
1088 zf_strncpy(hd->magic, TMAGIC, TMAGLEN);
1089 zf_strncpy(hd->version, TVERSION, TVERSLEN);
1090
1091 /*
1092 * set the remaining fields. Some versions want all 16 bits of mode
1093 * we better humor them (they really do not meet spec though)....
1094 */
1095 if (ul_oct((u_long)arcn->sb.st_mode, hd->mode, sizeof(hd->mode), 3) ||
1096 ul_oct((u_long)arcn->sb.st_uid, hd->uid, sizeof(hd->uid), 3) ||
1097 ul_oct((u_long)arcn->sb.st_gid, hd->gid, sizeof(hd->gid), 3) ||
1098 ul_oct((u_long)arcn->sb.st_mtime,hd->mtime,sizeof(hd->mtime),3))
1099 goto out;
1100 zf_strncpy(hd->uname,name_uid(arcn->sb.st_uid, 0),sizeof(hd->uname));
1101 zf_strncpy(hd->gname,name_gid(arcn->sb.st_gid, 0),sizeof(hd->gname));
1102
1103 /*
1104 * calculate and store the checksum write the header to the archive
1105 * return 0 tells the caller to now write the file data, 1 says no data
1106 * needs to be written
1107 */
1108 if (ul_oct(tar_chksm(hdblk, sizeof(HD_USTAR)), hd->chksum,
1109 sizeof(hd->chksum), 3))
1110 goto out;
1111 if (wr_rdbuf(hdblk, sizeof(HD_USTAR)) < 0)
1112 return(-1);
1113 if (wr_skip((off_t)(BLKMULT - sizeof(HD_USTAR))) < 0)
1114 return(-1);
1115 if ((arcn->type == PAX_CTG) || (arcn->type == PAX_REG))
1116 return(0);
1117 return(1);
1118
1119 out:
1120 /*
1121 * header field is out of range
1122 */
1123 warn(1, "Ustar header field is too small for %s", arcn->org_name);
1124 return(1);
1125 }
1126
1127 /*
1128 * name_split()
1129 * see if the name has to be split for storage in a ustar header. We try
1130 * to fit the entire name in the name field without splitting if we can.
1131 * The split point is always at a /
1132 * Return
1133 * character pointer to split point (always the / that is to be removed
1134 * if the split is not needed, the points is set to the start of the file
1135 * name (it would violate the spec to split there). A NULL is returned if
1136 * the file name is too long
1137 */
1138
1139 #if __STDC__
1140 static char *
1141 name_split(register char *name, register int len)
1142 #else
1143 static char *
1144 name_split(name, len)
1145 register char *name;
1146 register int len;
1147 #endif
1148 {
1149 register char *start;
1150
1151 /*
1152 * check to see if the file name is small enough to fit in the name
1153 * field. if so just return a pointer to the name.
1154 */
1155 if (len <= TNMSZ)
1156 return(name);
1157 if (len > (TPFSZ + TNMSZ + 1))
1158 return(NULL);
1159
1160 /*
1161 * we start looking at the biggest sized piece that fits in the name
1162 * field. We walk foward looking for a slash to split at. The idea is
1163 * to find the biggest piece to fit in the name field (or the smallest
1164 * prefix we can find) (the -1 is correct the biggest piece would
1165 * include the slash between the two parts that gets thrown away)
1166 */
1167 start = name + len - TNMSZ - 1;
1168 while ((*start != '\0') && (*start != '/'))
1169 ++start;
1170
1171 /*
1172 * if we hit the end of the string, this name cannot be split, so we
1173 * cannot store this file.
1174 */
1175 if (*start == '\0')
1176 return(NULL);
1177 len = start - name;
1178
1179 /*
1180 * NOTE: /str where the length of str == TNMSZ can not be stored under
1181 * the p1003.1-1990 spec for ustar. We could force a prefix of / and
1182 * the file would then expand on extract to //str. The len == 0 below
1183 * makes this special case follow the spec to the letter.
1184 */
1185 if ((len > TPFSZ) || (len == 0))
1186 return(NULL);
1187
1188 /*
1189 * ok have a split point, return it to the caller
1190 */
1191 return(start);
1192 }
1193