1 /* Create a tar archive.
3 Copyright (C) 1985, 1992, 1993, 1994, 1996, 1997, 1999, 2000, 2001,
4 2003, 2004, 2005 Free Software Foundation, Inc.
6 Written by John Gilmore, on 1985-08-25.
8 This program is free software; you can redistribute it and/or modify it
9 under the terms of the GNU General Public License as published by the
10 Free Software Foundation; either version 2, or (at your option) any later version.
13 This program is distributed in the hope that it will be useful, but
14 WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General
16 Public License for more details.
18 You should have received a copy of the GNU General Public License along
19 with this program; if not, write to the Free Software Foundation, Inc.,
20 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. */
38 /* The maximum uintmax_t value that can be represented with DIGITS digits,
39 assuming that each digit is BITS_PER_DIGIT wide. */
40 #define MAX_VAL_WITH_DIGITS(digits, bits_per_digit) \
41 ((digits) * (bits_per_digit) < sizeof (uintmax_t) * CHAR_BIT \
42 ? ((uintmax_t) 1 << ((digits) * (bits_per_digit))) - 1 \
45 /* The maximum uintmax_t value that can be represented with octal
46 digits and a trailing NUL in BUFFER. */
47 #define MAX_OCTAL_VAL(buffer) MAX_VAL_WITH_DIGITS (sizeof (buffer) - 1, LG_8)
49 /* Convert VALUE to an octal representation suitable for tar headers.
50 Output to buffer WHERE with size SIZE.
51 The result is undefined if SIZE is 0 or if VALUE is too large to fit. */
54 to_octal (uintmax_t value
, char *where
, size_t size
)
61 where
[--i
] = '0' + (v
& ((1 << LG_8
) - 1));
67 /* Copy at most LEN bytes from the string SRC to DST. Terminate with
68 NUL unless SRC is LEN or more bytes long. */
71 tar_copy_str (char *dst
, const char *src
, size_t len
)
/* Visit at most LEN byte positions of SRC.  */
74 for (i
= 0; i
< len
; i
++)
/* The assignment inside the test copies one byte and checks it for NUL
   in the same step, so the terminator itself is copied as well.
   NOTE(review): the statement controlled by this test is not visible
   in this view; presumably it ends the loop -- confirm.  */
75 if (! (dst
[i
] = src
[i
]))
79 /* Same as tar_copy_str, but always terminate with NUL if using OLDGNU format. */
/* Copy a name into a header field: DST receives at most LEN bytes of
   SRC via tar_copy_str, then OLDGNU format gets extra handling.  */
83 tar_name_copy_str (char *dst
, const char *src
, size_t len
)
/* Bounded copy first.  tar_copy_str leaves DST without a terminating
   NUL when SRC is LEN or more bytes long.  */
85 tar_copy_str (dst
, src
, len
);
/* NOTE(review): the statement run for OLDGNU format is not visible in
   this view; presumably it forces a NUL into DST -- confirm.  */
86 if (archive_format
== OLDGNU_FORMAT
)
90 /* Convert NEGATIVE VALUE to a base-256 representation suitable for
91 tar headers. NEGATIVE is 1 if VALUE was negative before being cast
92 to uintmax_t, 0 otherwise. Output to buffer WHERE with size SIZE.
93 The result is undefined if SIZE is 0 or if VALUE is too large to fit. */
/* Emit VALUE into WHERE as base-256 digits, filling from the highest
   index downwards.  NEGATIVE selects whether one bits are shifted in
   from the top as the value is consumed.  */
97 to_base256 (int negative
, uintmax_t value
, char *where
, size_t size
)
/* With NEGATIVE == 1, (uintmax_t) -1 shifted left by all but LG_256 bits
   keeps only the top LG_256 bits set; with NEGATIVE == 0 the mask is 0.
   NOTE(review): this assumes V has the width of uintmax_t; its
   declaration is not visible in this view.  */
100 uintmax_t propagated_sign_bits
=
101 ((uintmax_t) - negative
<< (CHAR_BIT
* sizeof v
- LG_256
));
/* Store the low LG_256 bits of V at the next lower index of WHERE.  */
106 where
[--i
] = v
& ((1 << LG_256
) - 1);
/* Drop the digit just written and OR the sign mask into the vacated
   top bits, so a negative value keeps its leading one bits.  */
107 v
= propagated_sign_bits
| (v
>> LG_256
);
112 /* Convert NEGATIVE VALUE (which was originally of size VALSIZE) to
113 external form, using SUBSTITUTE (...) if VALUE won't fit. Output
114 to buffer WHERE with size SIZE. NEGATIVE is 1 iff VALUE was
115 negative before being cast to uintmax_t; its original bitpattern
116 can be deduced from VALSIZE, its original size before casting.
117 TYPE is the kind of value being output (useful for diagnostics).
118 Prefer the POSIX format of SIZE - 1 octal digits (with leading zero
119 digits), followed by '\0'. If this won't work, and if GNU or
120 OLDGNU format is allowed, use '\200' followed by base-256, or (if
121 NEGATIVE is nonzero) '\377' followed by two's complement base-256.
122 If neither format works, use SUBSTITUTE (...) instead. Pass to
123 SUBSTITUTE the address of a 0-or-1 flag recording whether the
124 substitute value is negative. */
127 to_chars (int negative
, uintmax_t value
, size_t valsize
,
128 uintmax_t (*substitute
) (int *),
129 char *where
, size_t size
, const char *type
)
131 int base256_allowed
= (archive_format
== GNU_FORMAT
132 || archive_format
== OLDGNU_FORMAT
);
134 /* Generate the POSIX octal representation if the number fits. */
135 if (! negative
&& value
<= MAX_VAL_WITH_DIGITS (size
- 1, LG_8
))
137 where
[size
- 1] = '\0';
138 to_octal (value
, where
, size
- 1);
141 /* Otherwise, generate the base-256 representation if we are
142 generating an old or new GNU format and if the number fits. */
143 else if (((negative
? -1 - value
: value
)
144 <= MAX_VAL_WITH_DIGITS (size
- 1, LG_256
))
147 where
[0] = negative
? -1 : 1 << (LG_256
- 1);
148 to_base256 (negative
, value
, where
+ 1, size
- 1);
151 /* Otherwise, if the number is negative, and if it would not cause
152 ambiguity on this host by confusing positive with negative
153 values, then generate the POSIX octal representation of the value
154 modulo 2**(field bits). The resulting tar file is
155 machine-dependent, since it depends on the host word size. Yuck!
156 But this is the traditional behavior. */
157 else if (negative
&& valsize
* CHAR_BIT
<= (size
- 1) * LG_8
)
159 static int warned_once
;
163 WARN ((0, 0, _("Generating negative octal headers")));
165 where
[size
- 1] = '\0';
166 to_octal (value
& MAX_VAL_WITH_DIGITS (valsize
* CHAR_BIT
, 1),
170 /* Otherwise, output a substitute value if possible (with a
171 warning), and an error message if not. */
174 uintmax_t maxval
= (base256_allowed
175 ? MAX_VAL_WITH_DIGITS (size
- 1, LG_256
)
176 : MAX_VAL_WITH_DIGITS (size
- 1, LG_8
));
177 char valbuf
[UINTMAX_STRSIZE_BOUND
+ 1];
178 char maxbuf
[UINTMAX_STRSIZE_BOUND
];
179 char minbuf
[UINTMAX_STRSIZE_BOUND
+ 1];
180 char const *minval_string
;
181 char const *maxval_string
= STRINGIFY_BIGINT (maxval
, maxbuf
);
182 char const *value_string
;
186 uintmax_t m
= maxval
+ 1 ? maxval
+ 1 : maxval
/ 2 + 1;
187 char *p
= STRINGIFY_BIGINT (m
, minbuf
+ 1);
196 char *p
= STRINGIFY_BIGINT (- value
, valbuf
+ 1);
201 value_string
= STRINGIFY_BIGINT (value
, valbuf
);
206 uintmax_t sub
= substitute (&negsub
) & maxval
;
207 /* FIXME: This is the only place where GNU_FORMAT differs from
208 OLDGNU_FORMAT. Apart from this they are completely identical. */
209 uintmax_t s
= (negsub
&= archive_format
== GNU_FORMAT
) ? - sub
: sub
;
210 char subbuf
[UINTMAX_STRSIZE_BOUND
+ 1];
211 char *sub_string
= STRINGIFY_BIGINT (s
, subbuf
+ 1);
214 WARN ((0, 0, _("value %s out of %s range %s..%s; substituting %s"),
215 value_string
, type
, minval_string
, maxval_string
,
217 to_chars (negsub
, s
, valsize
, 0, where
, size
, type
);
220 ERROR ((0, 0, _("value %s out of %s range %s..%s"),
221 value_string
, type
, minval_string
, maxval_string
));
/* Substitute-value provider that gid_to_chars hands to to_chars.  The
   static below keeps the looked-up id between calls, and the "nobody"
   lookup is attempted only while that static is still zero.
   NOTE(review): what is stored through NEGATIVE and what is returned
   are not visible in this view.  */
226 gid_substitute (int *negative
)
232 static gid_t gid_nobody
;
233 if (!gid_nobody
&& !gname_to_gid ("nobody", &gid_nobody
))
/* Write group id V into the header field P of S bytes via to_chars.
   `v < 0' supplies the NEGATIVE flag, `sizeof v' the original width,
   and gid_substitute the replacement value used when V does not fit.  */
242 gid_to_chars (gid_t v
, char *p
, size_t s
)
244 to_chars (v
< 0, (uintmax_t) v
, sizeof v
, gid_substitute
, p
, s
, "gid_t");
/* Write device major number V into the header field P of S bytes via
   to_chars.  The SUBSTITUTE argument is 0, so no replacement value is
   offered if V does not fit.  */
248 major_to_chars (major_t v
, char *p
, size_t s
)
250 to_chars (v
< 0, (uintmax_t) v
, sizeof v
, 0, p
, s
, "major_t");
/* Write device minor number V into the header field P of S bytes via
   to_chars.  The SUBSTITUTE argument is 0, so no replacement value is
   offered if V does not fit.  */
254 minor_to_chars (minor_t v
, char *p
, size_t s
)
256 to_chars (v
< 0, (uintmax_t) v
, sizeof v
, 0, p
, s
, "minor_t");
260 mode_to_chars (mode_t v
, char *p
, size_t s
)
262 /* In the common case where the internal and external mode bits are the same,
263 and we are not using POSIX or GNU format,
264 propagate all unknown bits to the external mode.
265 This matches historical practice.
266 Otherwise, just copy the bits we know about. */
269 if (S_ISUID
== TSUID
&& S_ISGID
== TSGID
&& S_ISVTX
== TSVTX
270 && S_IRUSR
== TUREAD
&& S_IWUSR
== TUWRITE
&& S_IXUSR
== TUEXEC
271 && S_IRGRP
== TGREAD
&& S_IWGRP
== TGWRITE
&& S_IXGRP
== TGEXEC
272 && S_IROTH
== TOREAD
&& S_IWOTH
== TOWRITE
&& S_IXOTH
== TOEXEC
273 && archive_format
!= POSIX_FORMAT
274 && archive_format
!= USTAR_FORMAT
275 && archive_format
!= GNU_FORMAT
)
283 u
= ((v
& S_ISUID
? TSUID
: 0)
284 | (v
& S_ISGID
? TSGID
: 0)
285 | (v
& S_ISVTX
? TSVTX
: 0)
286 | (v
& S_IRUSR
? TUREAD
: 0)
287 | (v
& S_IWUSR
? TUWRITE
: 0)
288 | (v
& S_IXUSR
? TUEXEC
: 0)
289 | (v
& S_IRGRP
? TGREAD
: 0)
290 | (v
& S_IWGRP
? TGWRITE
: 0)
291 | (v
& S_IXGRP
? TGEXEC
: 0)
292 | (v
& S_IROTH
? TOREAD
: 0)
293 | (v
& S_IWOTH
? TOWRITE
: 0)
294 | (v
& S_IXOTH
? TOEXEC
: 0));
296 to_chars (negative
, u
, sizeof v
, 0, p
, s
, "mode_t");
/* Write file offset or size V into the header field P of S bytes via
   to_chars.  `v < 0' supplies the NEGATIVE flag; the SUBSTITUTE
   argument is 0, so no replacement value is offered if V does not fit.  */
300 off_to_chars (off_t v
, char *p
, size_t s
)
302 to_chars (v
< 0, (uintmax_t) v
, sizeof v
, 0, p
, s
, "off_t");
/* Write size V into the header field P of S bytes via to_chars.  The
   NEGATIVE flag is passed as the constant 0, and the SUBSTITUTE
   argument is 0 as well.  */
306 size_to_chars (size_t v
, char *p
, size_t s
)
308 to_chars (0, (uintmax_t) v
, sizeof v
, 0, p
, s
, "size_t");
/* Write time stamp V into the header field P of S bytes via to_chars.
   `v < 0' supplies the NEGATIVE flag; the SUBSTITUTE argument is 0, so
   no replacement value is offered if V does not fit.  */
312 time_to_chars (time_t v
, char *p
, size_t s
)
314 to_chars (v
< 0, (uintmax_t) v
, sizeof v
, 0, p
, s
, "time_t");
/* Substitute-value provider that uid_to_chars hands to to_chars.  The
   static below keeps the looked-up id between calls, and the "nobody"
   lookup is attempted only while that static is still zero.
   NOTE(review): what is stored through NEGATIVE and what is returned
   are not visible in this view.  */
318 uid_substitute (int *negative
)
324 static uid_t uid_nobody
;
325 if (!uid_nobody
&& !uname_to_uid ("nobody", &uid_nobody
))
/* Write user id V into the header field P of S bytes via to_chars.
   `v < 0' supplies the NEGATIVE flag, `sizeof v' the original width,
   and uid_substitute the replacement value used when V does not fit.  */
334 uid_to_chars (uid_t v
, char *p
, size_t s
)
336 to_chars (v
< 0, (uintmax_t) v
, sizeof v
, uid_substitute
, p
, s
, "uid_t");
/* Write the unsigned value V into the header field P of S bytes via
   to_chars.  The NEGATIVE flag is passed as the constant 0, and the
   SUBSTITUTE argument is 0 as well.  */
340 uintmax_to_chars (uintmax_t v
, char *p
, size_t s
)
342 to_chars (0, v
, sizeof v
, 0, p
, s
, "uintmax_t");
/* Copy the string STR into the header field P of S bytes using
   tar_copy_str, so the field ends up without a terminating NUL when
   STR is S or more bytes long.  */
346 string_to_chars (char const *str
, char *p
, size_t s
)
348 tar_copy_str (p
, str
, s
);
353 /* A file is considered dumpable if it is sparse and both --sparse and --totals
   are specified.
355 Otherwise, it is dumpable unless any of the following conditions occur:
357 a) it is empty *and* world-readable, or
358 b) current archive is /dev/null */
361 file_dumpable_p (struct tar_stat_info
*st
)
/* NOTE(review): the condition guarding this first return is not visible
   in this view; presumably it is the /dev/null check -- confirm.  */
364 return totals_option
&& sparse_option
&& sparse_file_p (st
);
/* False only when the archived size is zero and every bit of MODE_R is
   set in the file mode.  */
365 return !(st
->archive_file_size
== 0
366 && (st
->stat
.st_mode
& MODE_R
) == MODE_R
);
370 /* Writing routines. */
372 /* Write the EOT block(s). Zero at least two blocks, through the end
373 of the record. Old tar, like previous versions of GNU tar, writes
374 garbage after two zeroed blocks. */
378 union block
*pointer
= find_next_block ();
379 memset (pointer
->buffer
, 0, BLOCKSIZE
);
380 set_next_block_after (pointer
);
381 pointer
= find_next_block ();
382 memset (pointer
->buffer
, 0, available_space_after (pointer
));
383 set_next_block_after (pointer
);
386 /* Write a "private" header */
388 start_private_header (const char *name
, size_t size
)
391 union block
*header
= find_next_block ();
393 memset (header
->buffer
, 0, sizeof (union block
));
395 tar_name_copy_str (header
->header
.name
, name
, NAME_FIELD_SIZE
);
396 OFF_TO_CHARS (size
, header
->header
.size
);
399 TIME_TO_CHARS (t
, header
->header
.mtime
);
400 MODE_TO_CHARS (S_IFREG
|S_IRUSR
|S_IWUSR
|S_IRGRP
|S_IROTH
, header
->header
.mode
);
401 UID_TO_CHARS (getuid (), header
->header
.uid
);
402 GID_TO_CHARS (getgid (), header
->header
.gid
);
403 MAJOR_TO_CHARS (0, header
->header
.devmajor
);
404 MINOR_TO_CHARS (0, header
->header
.devminor
);
405 strncpy (header
->header
.magic
, TMAGIC
, TMAGLEN
);
406 strncpy (header
->header
.version
, TVERSION
, TVERSLEN
);
410 /* Create a new header and store there at most NAME_FIELD_SIZE bytes of the file name. */
/* Start a header block for ST whose name fits the name field.  */
414 write_short_name (struct tar_stat_info
*st
)
/* Take the next free block of the archive buffer for the header.  */
416 union block
*header
= find_next_block ();
/* Clear the whole block, so every field not written later stays zero.  */
417 memset (header
->buffer
, 0, sizeof (union block
));
/* Copy at most NAME_FIELD_SIZE bytes of the file name into the name
   field.  */
418 tar_name_copy_str (header
->header
.name
, st
->file_name
, NAME_FIELD_SIZE
);
422 #define FILL(field,byte) do { \
423 memset(field, byte, sizeof(field)-1); \
424 (field)[sizeof(field)-1] = 0; \
427 /* Write a GNUTYPE_LONGLINK or GNUTYPE_LONGNAME block. */
429 write_gnu_long_link (struct tar_stat_info
*st
, const char *p
, char type
)
431 size_t size
= strlen (p
) + 1;
436 header
= start_private_header ("././@LongLink", size
);
437 FILL(header
->header
.mtime
, '0');
438 FILL(header
->header
.mode
, '0');
439 FILL(header
->header
.uid
, '0');
440 FILL(header
->header
.gid
, '0');
441 FILL(header
->header
.devmajor
, 0);
442 FILL(header
->header
.devminor
, 0);
443 uid_to_uname (0, &tmpname
);
444 UNAME_TO_CHARS (tmpname
, header
->header
.uname
);
446 gid_to_gname (0, &tmpname
);
447 GNAME_TO_CHARS (tmpname
, header
->header
.gname
);
450 strcpy (header
->header
.magic
, OLDGNU_MAGIC
);
451 header
->header
.typeflag
= type
;
452 finish_header (st
, header
, -1);
454 header
= find_next_block ();
456 bufsize
= available_space_after (header
);
458 while (bufsize
< size
)
460 memcpy (header
->buffer
, p
, bufsize
);
463 set_next_block_after (header
+ (bufsize
- 1) / BLOCKSIZE
);
464 header
= find_next_block ();
465 bufsize
= available_space_after (header
);
467 memcpy (header
->buffer
, p
, size
);
468 memset (header
->buffer
+ size
, 0, bufsize
- size
);
469 set_next_block_after (header
+ (size
- 1) / BLOCKSIZE
);
/* Search NAME backwards for a slash at which to split it.  LENGTH is
   the length of NAME.
   NOTE(review): the loop's exit and the returned value are not visible
   in this view; write_ustar_long_name uses the result as the number of
   bytes copied into the prefix field.  */
473 split_long_name (const char *name
, size_t length
)
/* Limit how far from the start of NAME the scan begins.
   NOTE(review): the clamp is PREFIX_FIELD_SIZE + 2, so the scan starts
   at index PREFIX_FIELD_SIZE + 1 and can stop at a slash whose index is
   larger than PREFIX_FIELD_SIZE.  Check that against the memcpy into
   header.prefix in write_ustar_long_name.  */
477 if (length
> PREFIX_FIELD_SIZE
)
478 length
= PREFIX_FIELD_SIZE
+2;
/* Scan from the end towards the start; index 0 is never tested.  */
479 for (i
= length
- 1; i
> 0; i
--)
480 if (ISSLASH (name
[i
]))
486 write_ustar_long_name (const char *name
)
488 size_t length
= strlen (name
);
492 if (length
> PREFIX_FIELD_SIZE
+ NAME_FIELD_SIZE
+ 1)
494 ERROR ((0, 0, _("%s: file name is too long (max %d); not dumped"),
495 quotearg_colon (name
),
496 PREFIX_FIELD_SIZE
+ NAME_FIELD_SIZE
+ 1));
500 i
= split_long_name (name
, length
);
501 if (i
== 0 || length
- i
- 1 > NAME_FIELD_SIZE
)
504 _("%s: file name is too long (cannot be split); not dumped"),
505 quotearg_colon (name
)));
509 header
= find_next_block ();
510 memset (header
->buffer
, 0, sizeof (header
->buffer
));
511 memcpy (header
->header
.prefix
, name
, i
);
512 memcpy (header
->header
.name
, name
+ i
+ 1, length
- i
- 1);
517 /* Write a long link name, depending on the current archive format */
519 write_long_link (struct tar_stat_info
*st
)
521 switch (archive_format
)
524 xheader_store ("linkpath", st
, NULL
);
527 case V7_FORMAT
: /* old V7 tar format */
531 _("%s: link name is too long; not dumped"),
532 quotearg_colon (st
->link_name
)));
537 write_gnu_long_link (st
, st
->link_name
, GNUTYPE_LONGLINK
);
546 write_long_name (struct tar_stat_info
*st
)
548 switch (archive_format
)
551 xheader_store ("path", st
, NULL
);
555 if (strlen (st
->file_name
) > NAME_FIELD_SIZE
-1)
557 ERROR ((0, 0, _("%s: file name is too long (max %d); not dumped"),
558 quotearg_colon (st
->file_name
),
559 NAME_FIELD_SIZE
- 1));
566 return write_ustar_long_name (st
->file_name
);
570 write_gnu_long_link (st
, st
->file_name
, GNUTYPE_LONGNAME
);
576 return write_short_name (st
);
580 write_extended (char type
, struct tar_stat_info
*st
, union block
*old_header
)
582 union block
*header
, hp
;
585 if (extended_header
.buffer
|| extended_header
.stk
== NULL
)
588 xheader_finish (&extended_header
);
589 memcpy (hp
.buffer
, old_header
, sizeof (hp
));
590 p
= xheader_xhdr_name (st
);
591 xheader_write (type
, p
, &extended_header
);
593 header
= find_next_block ();
594 memcpy (header
, &hp
.buffer
, sizeof (hp
.buffer
));
/* Pick how the file name of ST is written and return the result of
   the chosen writer: write_short_name or write_long_name.  */
599 write_header_name (struct tar_stat_info
*st
)
/* POSIX format with a name that fails string_ascii_p: record it under
   the "path" extended-header keyword and still emit a short-name
   header.  */
601 if (archive_format
== POSIX_FORMAT
&& !string_ascii_p (st
->file_name
))
603 xheader_store ("path", st
, NULL
);
604 return write_short_name (st
);
/* The comparison `archive_format == OLDGNU_FORMAT' is 1 or 0, so the
   limit is one byte shorter for OLDGNU format.  Longer names go to
   write_long_name.  */
606 else if (NAME_FIELD_SIZE
- (archive_format
== OLDGNU_FORMAT
)
607 < strlen (st
->file_name
))
608 return write_long_name (st
);
/* The name fits in the name field.  */
610 return write_short_name (st
);
614 /* Header handling. */
616 /* Make a header block for the file whose stat info is st,
617 and return its address. */
620 start_header (struct tar_stat_info
*st
)
624 header
= write_header_name (st
);
628 /* Override some stat fields, if requested to do so. */
630 if (owner_option
!= (uid_t
) -1)
631 st
->stat
.st_uid
= owner_option
;
632 if (group_option
!= (gid_t
) -1)
633 st
->stat
.st_gid
= group_option
;
636 ((st
->stat
.st_mode
& ~MODE_ALL
)
637 | mode_adjust (st
->stat
.st_mode
, mode_option
, initial_umask
));
639 /* Paul Eggert tried the trivial test ($WRITER cf a b; $READER tvf a)
640 for a few tars and came up with the following interoperability matrix:
644 1 2 3 4 5 6 7 8 9 READER
645 . . . . . . . . . 1 = SunOS 4.2 tar
646 # . . # # . . # # 2 = NEC SVR4.0.2 tar
647 . . . # # . . # . 3 = Solaris 2.1 tar
648 . . . . . . . . . 4 = GNU tar 1.11.1
649 . . . . . . . . . 5 = HP-UX 8.07 tar
650 . . . . . . . . . 6 = Ultrix 4.1
651 . . . . . . . . . 7 = AIX 3.2
652 . . . . . . . . . 8 = Hitachi HI-UX 1.03
653 . . . . . . . . . 9 = Omron UNIOS-B 4.3BSD 1.60Beta
656 # = ``impossible file type''
658 The following mask for old archive removes the `#'s in column 4
659 above, thus making GNU tar both a universal donor and a universal
660 acceptor for Paul's test. */
662 if (archive_format
== V7_FORMAT
|| archive_format
== USTAR_FORMAT
)
663 MODE_TO_CHARS (st
->stat
.st_mode
& MODE_ALL
, header
->header
.mode
);
665 MODE_TO_CHARS (st
->stat
.st_mode
, header
->header
.mode
);
668 uid_t uid
= st
->stat
.st_uid
;
669 if (archive_format
== POSIX_FORMAT
670 && MAX_OCTAL_VAL (header
->header
.uid
) < uid
)
672 xheader_store ("uid", st
, NULL
);
675 UID_TO_CHARS (uid
, header
->header
.uid
);
679 gid_t gid
= st
->stat
.st_gid
;
680 if (archive_format
== POSIX_FORMAT
681 && MAX_OCTAL_VAL (header
->header
.gid
) < gid
)
683 xheader_store ("gid", st
, NULL
);
686 GID_TO_CHARS (gid
, header
->header
.gid
);
690 off_t size
= st
->stat
.st_size
;
691 if (archive_format
== POSIX_FORMAT
692 && MAX_OCTAL_VAL (header
->header
.size
) < size
)
694 xheader_store ("size", st
, NULL
);
697 OFF_TO_CHARS (size
, header
->header
.size
);
701 struct timespec mtime
= st
->mtime
;
702 if (archive_format
== POSIX_FORMAT
)
704 if (MAX_OCTAL_VAL (header
->header
.mtime
) < mtime
.tv_sec
705 || mtime
.tv_nsec
!= 0)
706 xheader_store ("mtime", st
, NULL
);
707 if (MAX_OCTAL_VAL (header
->header
.mtime
) < mtime
.tv_sec
)
710 TIME_TO_CHARS (mtime
.tv_sec
, header
->header
.mtime
);
714 if (S_ISCHR (st
->stat
.st_mode
)
715 || S_ISBLK (st
->stat
.st_mode
))
717 major_t devmajor
= major (st
->stat
.st_rdev
);
718 minor_t devminor
= minor (st
->stat
.st_rdev
);
720 if (archive_format
== POSIX_FORMAT
721 && MAX_OCTAL_VAL (header
->header
.devmajor
) < devmajor
)
723 xheader_store ("devmajor", st
, NULL
);
726 MAJOR_TO_CHARS (devmajor
, header
->header
.devmajor
);
728 if (archive_format
== POSIX_FORMAT
729 && MAX_OCTAL_VAL (header
->header
.devminor
) < devminor
)
731 xheader_store ("devminor", st
, NULL
);
734 MINOR_TO_CHARS (devminor
, header
->header
.devminor
);
736 else if (archive_format
!= GNU_FORMAT
&& archive_format
!= OLDGNU_FORMAT
)
738 MAJOR_TO_CHARS (0, header
->header
.devmajor
);
739 MINOR_TO_CHARS (0, header
->header
.devminor
);
742 if (archive_format
== POSIX_FORMAT
)
744 xheader_store ("atime", st
, NULL
);
745 xheader_store ("ctime", st
, NULL
);
747 else if (incremental_option
)
748 if (archive_format
== OLDGNU_FORMAT
|| archive_format
== GNU_FORMAT
)
750 TIME_TO_CHARS (st
->atime
.tv_sec
, header
->oldgnu_header
.atime
);
751 TIME_TO_CHARS (st
->ctime
.tv_sec
, header
->oldgnu_header
.ctime
);
754 header
->header
.typeflag
= archive_format
== V7_FORMAT
? AREGTYPE
: REGTYPE
;
756 switch (archive_format
)
762 case GNU_FORMAT
: /*FIXME?*/
763 /* Overwrite header->header.magic and header.version in one blow. */
764 strcpy (header
->header
.magic
, OLDGNU_MAGIC
);
769 strncpy (header
->header
.magic
, TMAGIC
, TMAGLEN
);
770 strncpy (header
->header
.version
, TVERSION
, TVERSLEN
);
777 if (archive_format
== V7_FORMAT
|| numeric_owner_option
)
779 /* header->header.[ug]name are left as the empty string. */
783 uid_to_uname (st
->stat
.st_uid
, &st
->uname
);
784 gid_to_gname (st
->stat
.st_gid
, &st
->gname
);
786 if (archive_format
== POSIX_FORMAT
787 && (strlen (st
->uname
) > UNAME_FIELD_SIZE
788 || !string_ascii_p (st
->uname
)))
789 xheader_store ("uname", st
, NULL
);
790 UNAME_TO_CHARS (st
->uname
, header
->header
.uname
);
792 if (archive_format
== POSIX_FORMAT
793 && (strlen (st
->gname
) > GNAME_FIELD_SIZE
794 || !string_ascii_p (st
->gname
)))
795 xheader_store ("gname", st
, NULL
);
796 GNAME_TO_CHARS (st
->gname
, header
->header
.gname
);
/* Compute and store the checksum of HEADER, then mark the block as
   used.  */
803 simple_finish_header (union block
*header
)
/* Put CHKBLANKS into the checksum field before summing; the loop below
   runs over the whole block, this field included.  */
809 memcpy (header
->header
.chksum
, CHKBLANKS
, sizeof header
->header
.chksum
);
/* Count down over every byte of the block.
   NOTE(review): the loop body is not visible in this view.  */
813 for (i
= sizeof *header
; i
-- != 0; )
814 /* We can't use unsigned char here because of old compilers, e.g. V7. */
817 /* Fill in the checksum field. It's formatted differently from the
818 other fields: it has [6] digits, a null, then a space -- rather than
819 digits, then a null. We use to_chars.
820 The final space is already there, from
821 checksumming, and to_chars doesn't modify it.
823 This is a fast way to do:
825 sprintf(header->header.chksum, "%06o", sum);
   (to_chars pads the octal digits with leading zeros, not spaces). */
/* A size of 7 covers the six digits and the null only.  */
827 uintmax_to_chars ((uintmax_t) sum
, header
->header
.chksum
, 7);
829 set_next_block_after (header
);
832 /* Finish off a filled-in header block and write it out. We also
833 print the file name and/or full info if verbose is on. If BLOCK_ORDINAL
834 is not negative, it is the block ordinal of the first record for this
835 file, which may be a preceding long name or long link record. */
837 finish_header (struct tar_stat_info
*st
,
838 union block
*header
, off_t block_ordinal
)
840 /* Note: It is important to do this before the call to write_extended(),
841 so that the actual ustar header is printed */
/* Long-name, long-link and extended-header blocks are excluded from
   printing.
   NOTE(review): the first operand of this condition is not visible in
   this view.  */
843 && header
->header
.typeflag
!= GNUTYPE_LONGLINK
844 && header
->header
.typeflag
!= GNUTYPE_LONGNAME
845 && header
->header
.typeflag
!= XHDTYPE
846 && header
->header
.typeflag
!= XGLTYPE
)
848 /* These globals are parameters to print_header, sigh. */
850 current_header
= header
;
851 current_format
= archive_format
;
852 print_header (st
, block_ordinal
);
/* write_extended returns the block to finish from here on, so HEADER
   is replaced by its result before the checksum is computed.  */
855 header
= write_extended (XHDTYPE
, st
, header
);
856 simple_finish_header (header
);
/* Write zero-filled blocks to the archive until SIZE_LEFT is no longer
   positive.  */
861 pad_archive (off_t size_left
)
864 while (size_left
> 0)
/* Report the remaining byte count on every pass.
   NOTE(review): presumably multi-volume bookkeeping -- confirm.  */
866 mv_size_left (size_left
);
/* One pass zeroes exactly one BLOCKSIZE block and marks it used.  */
867 blk
= find_next_block ();
868 memset (blk
->buffer
, 0, BLOCKSIZE
);
869 set_next_block_after (blk
);
870 size_left
-= BLOCKSIZE
;
874 static enum dump_status
875 dump_regular_file (int fd
, struct tar_stat_info
*st
)
877 off_t size_left
= st
->stat
.st_size
;
881 block_ordinal
= current_block_ordinal ();
882 blk
= start_header (st
);
884 return dump_status_fail
;
886 /* Mark contiguous files, if we support them. */
887 if (archive_format
!= V7_FORMAT
&& S_ISCTG (st
->stat
.st_mode
))
888 blk
->header
.typeflag
= CONTTYPE
;
890 finish_header (st
, blk
, block_ordinal
);
893 while (size_left
> 0)
895 size_t bufsize
, count
;
897 mv_size_left (size_left
);
899 blk
= find_next_block ();
901 bufsize
= available_space_after (blk
);
903 if (size_left
< bufsize
)
905 /* Last read -- zero out area beyond. */
907 count
= bufsize
% BLOCKSIZE
;
909 memset (blk
->buffer
+ size_left
, 0, BLOCKSIZE
- count
);
912 count
= (fd
< 0) ? bufsize
: safe_read (fd
, blk
->buffer
, bufsize
);
913 if (count
== SAFE_READ_ERROR
)
915 read_diag_details (st
->orig_file_name
,
916 st
->stat
.st_size
- size_left
, bufsize
);
917 pad_archive (size_left
);
918 return dump_status_short
;
922 set_next_block_after (blk
+ (bufsize
- 1) / BLOCKSIZE
);
924 if (count
!= bufsize
)
926 char buf
[UINTMAX_STRSIZE_BOUND
];
927 memset (blk
->buffer
+ count
, 0, bufsize
- count
);
929 ngettext ("%s: File shrank by %s byte; padding with zeros",
930 "%s: File shrank by %s bytes; padding with zeros",
932 quotearg_colon (st
->orig_file_name
),
933 STRINGIFY_BIGINT (size_left
, buf
)));
934 if (! ignore_failed_read_option
)
935 exit_status
= TAREXIT_FAILURE
;
936 pad_archive (size_left
- (bufsize
-count
));
937 return dump_status_short
;
940 return dump_status_ok
;
944 dump_regular_finish (int fd
, struct tar_stat_info
*st
,
945 struct timespec original_ctime
)
949 struct stat final_stat
;
950 if (fstat (fd
, &final_stat
) != 0)
952 stat_diag (st
->orig_file_name
);
954 else if (timespec_cmp (get_stat_ctime (&final_stat
), original_ctime
)
957 WARN ((0, 0, _("%s: file changed as we read it"),
958 quotearg_colon (st
->orig_file_name
)));
962 close_diag (st
->orig_file_name
);
965 if (remove_files_option
)
967 if (unlink (st
->orig_file_name
) == -1)
968 unlink_error (st
->orig_file_name
);
972 /* Look in directory DIRNAME for a cache directory tag file
973 with the magic name "CACHEDIR.TAG" and a standard header, as described at:
975 http://www.brynosaurus.com/cachedir
976 Applications can write this file into directories they create
977 for use as caches containing purely regenerable, non-precious data,
978 allowing us to avoid archiving them if --exclude-caches is specified. */
980 #define CACHEDIR_SIGNATURE "Signature: 8a477f597d28d172789f06886806bc55"
981 #define CACHEDIR_SIGNATURE_SIZE (sizeof CACHEDIR_SIGNATURE - 1)
/* Test whether directory DIRNAME holds a tag file named "CACHEDIR.TAG"
   that begins with CACHEDIR_SIGNATURE.  */
984 check_cache_directory (char *dirname
)
986 static char tagname
[] = "CACHEDIR.TAG";
989 int tag_present
= false;
/* The path is DIRNAME immediately followed by the tag name, with no
   separator added here, so DIRNAME has to end in a slash already.  */
991 tagpath
= xmalloc (strlen (dirname
) + strlen (tagname
) + 1);
992 strcpy (tagpath
, dirname
);
993 strcat (tagpath
, tagname
);
995 fd
= open (tagpath
, O_RDONLY
);
/* Only the first CACHEDIR_SIGNATURE_SIZE bytes of the file are read
   and compared.  */
998 static char tagbuf
[CACHEDIR_SIGNATURE_SIZE
];
/* A short read or any difference from the signature fails the test.
   NOTE(review): the statement run on a match, and the cleanup of FD and
   TAGPATH, are not visible in this view.  */
1000 if (read (fd
, tagbuf
, CACHEDIR_SIGNATURE_SIZE
)
1001 == CACHEDIR_SIGNATURE_SIZE
1002 && memcmp (tagbuf
, CACHEDIR_SIGNATURE
, CACHEDIR_SIGNATURE_SIZE
) == 0)
1014 dump_dir0 (char *directory
,
1015 struct tar_stat_info
*st
, int top_level
, dev_t parent_device
)
1017 dev_t our_device
= st
->stat
.st_dev
;
1019 if (!is_avoided_name (st
->orig_file_name
))
1021 union block
*blk
= NULL
;
1022 off_t block_ordinal
= current_block_ordinal ();
1023 st
->stat
.st_size
= 0; /* force 0 size on dir */
1025 blk
= start_header (st
);
1029 if (incremental_option
&& archive_format
!= POSIX_FORMAT
)
1030 blk
->header
.typeflag
= GNUTYPE_DUMPDIR
;
1031 else /* if (standard_option) */
1032 blk
->header
.typeflag
= DIRTYPE
;
1034 /* If we're gnudumping, we aren't done yet so don't close it. */
1036 if (!incremental_option
)
1037 finish_header (st
, blk
, block_ordinal
);
1038 else if (gnu_list_name
->dir_contents
)
1040 if (archive_format
== POSIX_FORMAT
)
1042 xheader_store ("GNU.dumpdir", st
, gnu_list_name
->dir_contents
);
1043 finish_header (st
, blk
, block_ordinal
);
1051 const char *buffer
, *p_buffer
;
1053 block_ordinal
= current_block_ordinal ();
1054 buffer
= gnu_list_name
->dir_contents
;
1056 totsize
= dumpdir_size (buffer
);
1059 OFF_TO_CHARS (totsize
, blk
->header
.size
);
1060 finish_header (st
, blk
, block_ordinal
);
1062 size_left
= totsize
;
1065 mv_total_size (totsize
);
1066 while (size_left
> 0)
1068 mv_size_left (size_left
);
1069 blk
= find_next_block ();
1070 bufsize
= available_space_after (blk
);
1071 if (size_left
< bufsize
)
1073 bufsize
= size_left
;
1074 count
= bufsize
% BLOCKSIZE
;
1076 memset (blk
->buffer
+ size_left
, 0, BLOCKSIZE
- count
);
1078 memcpy (blk
->buffer
, p_buffer
, bufsize
);
1079 size_left
-= bufsize
;
1080 p_buffer
+= bufsize
;
1081 set_next_block_after (blk
+ (bufsize
- 1) / BLOCKSIZE
);
1089 if (!recursion_option
)
1092 if (one_file_system_option
1094 && parent_device
!= st
->stat
.st_dev
)
1098 _("%s: file is on a different filesystem; not dumped"),
1099 quotearg_colon (st
->orig_file_name
)));
1103 if (exclude_caches_option
1104 && check_cache_directory(st
->orig_file_name
))
1108 _("%s: contains a cache directory tag; not dumped"),
1109 quotearg_colon (st
->orig_file_name
)));
1116 char *name_buf
= xstrdup (st
->orig_file_name
);
1117 size_t name_size
= strlen (name_buf
);
1118 size_t name_len
= name_size
;
1120 /* Now output all the files in the directory. */
1121 /* FIXME: Should speed this up by cd-ing into the dir. */
1123 for (entry
= directory
; (entry_len
= strlen (entry
)) != 0;
1124 entry
+= entry_len
+ 1)
1126 if (name_size
< name_len
+ entry_len
)
1128 name_size
= name_len
+ entry_len
;
1129 name_buf
= xrealloc (name_buf
, name_size
+ 1);
1131 strcpy (name_buf
+ name_len
, entry
);
1132 if (!excluded_name (name_buf
))
1133 dump_file (name_buf
, 0, our_device
);
1140 /* Ensure exactly one trailing slash. */
1142 ensure_slash (char **pstr
)
1144 size_t len
= strlen (*pstr
);
/* Look at the last character while it is a slash.
   NOTE(review): the loop body is not visible in this view; presumably
   it shortens LEN past each trailing slash -- confirm.  */
1145 while (len
>= 1 && ISSLASH ((*pstr
)[len
- 1]))
/* If the character at LEN is not a slash, the string is grown to
   LEN + 2 bytes, room for the slash and the NUL written below.  */
1147 if (!ISSLASH ((*pstr
)[len
]))
1148 *pstr
= xrealloc (*pstr
, len
+ 2);
/* Write the single slash and terminate right after it.  */
1149 (*pstr
)[len
++] = '/';
1150 (*pstr
)[len
] = '\0';
/* Dump the directory described by ST: read its entries with savedir,
   give both of its names a trailing slash, and hand over to dump_dir0.  */
1154 dump_dir (struct tar_stat_info
*st
, int top_level
, dev_t parent_device
)
1158 directory
= savedir (st
->orig_file_name
);
/* NOTE(review): the test that leads to this diagnostic is not visible
   in this view; presumably it is reached when savedir fails.  */
1161 savedir_diag (st
->orig_file_name
);
/* dump_dir0 appends entry names directly to orig_file_name, so the
   names need their trailing slash before it runs.  */
1165 ensure_slash (&st
->orig_file_name
);
1166 ensure_slash (&st
->file_name
);
1168 dump_dir0 (directory
, st
, top_level
, parent_device
);
1175 /* Main functions of this module. */
1178 create_archive (void)
1182 open_archive (ACCESS_WRITE
);
1183 xheader_write_global ();
1185 if (incremental_option
)
1187 size_t buffer_size
= 1000;
1188 char *buffer
= xmalloc (buffer_size
);
1191 collect_and_sort_names ();
1193 while ((p
= name_from_list ()) != NULL
)
1194 if (!excluded_name (p
))
1195 dump_file (p
, -1, (dev_t
) 0);
1198 while ((p
= name_from_list ()) != NULL
)
1199 if (!excluded_name (p
))
1201 size_t plen
= strlen (p
);
1202 if (buffer_size
<= plen
)
1204 while ((buffer_size
*= 2) <= plen
)
1206 buffer
= xrealloc (buffer
, buffer_size
);
1208 memcpy (buffer
, p
, plen
);
1209 if (! ISSLASH (buffer
[plen
- 1]))
1210 buffer
[plen
++] = '/';
1211 q
= gnu_list_name
->dir_contents
;
1215 size_t qlen
= strlen (q
);
1218 if (buffer_size
< plen
+ qlen
)
1220 while ((buffer_size
*=2 ) < plen
+ qlen
)
1222 buffer
= xrealloc (buffer
, buffer_size
);
1224 strcpy (buffer
+ plen
, q
+ 1);
1225 dump_file (buffer
, -1, (dev_t
) 0);
1234 while ((p
= name_next (1)) != NULL
)
1235 if (!excluded_name (p
))
1236 dump_file (p
, 1, (dev_t
) 0);
1242 if (listed_incremental_option
)
1243 write_directory_file ();
1247 /* Calculate the hash of a link. */
/* ENTRY points to a struct link; N_BUCKETS is the modulus applied to
   the result.  */
1249 hash_link (void const *entry
, size_t n_buckets
)
1251 struct link
const *l
= entry
;
/* Combine the device and inode numbers with XOR.  */
1252 uintmax_t num
= l
->dev
^ l
->ino
;
1253 return num
% n_buckets
;
1256 /* Compare two links for equality. */
/* ENTRY1 and ENTRY2 point to struct link objects.  The result is
   nonzero when both their dev and ino members are equal.  */
1258 compare_links (void const *entry1
, void const *entry2
)
1260 struct link
const *link1
= entry1
;
1261 struct link
const *link2
= entry2
;
/* Each XOR is zero only for equal members, and the OR of the two is
   zero only when both XORs are.  */
1262 return ((link1
->dev
^ link2
->dev
) | (link1
->ino
^ link2
->ino
)) == 0;
/* Warn that the file named P has an unknown type and is being ignored.
   Unless ignore_failed_read_option is set, also record the failure by
   setting exit_status to TAREXIT_FAILURE.  */
1266 unknown_file_error (char *p
)
1268 WARN ((0, 0, _("%s: Unknown file type; file ignored"),
1269 quotearg_colon (p
)));
1270 if (!ignore_failed_read_option
)
1271 exit_status
= TAREXIT_FAILURE
;
1275 /* Handling of hard links */
1277 /* Table of all non-directories that we've written so far. Any time
1278 we see another, we check the table and avoid dumping the data
1279 again if we've done it once already.
   The table is created with hash_initialize in file_count_links,
   consulted with hash_lookup in dump_hard_link, and is still null
   until the first creation (dump_hard_link tests for that).  */
1280 static Hash_table
*link_table
;
1282 /* Try to dump ST as a hard link to another file in the archive.
1283 Return true on success. */
/* ST describes the file being dumped.  Nothing is attempted unless
   link_table exists and the file has more than one link.
   NOTE(review): this listing omits some original lines (the return
   type, braces, the declarations of LP and BLK, and the return
   statements), so the comments below cover only what is visible.  */
1285 dump_hard_link (struct tar_stat_info
*st
)
1287 if (link_table
&& st
->stat
.st_nlink
> 1)
1290 struct link
*duplicate
;
1291 off_t block_ordinal
;
/* Build a lookup key from the inode and device numbers.  */
1294 lp
.ino
= st
->stat
.st_ino
;
1295 lp
.dev
= st
->stat
.st_dev
;
1297 if ((duplicate
= hash_lookup (link_table
, &lp
)))
1299 /* We found a link. */
1300 char const *link_name
= safer_name_suffix (duplicate
->name
, true,
1301 absolute_names_option
);
1305 block_ordinal
= current_block_ordinal ();
1306 assign_string (&st
->link_name
, link_name
);
/* A link name longer than the header field is written separately by
   write_long_link; the limit is one byte smaller when archive_format
   is OLDGNU_FORMAT.  */
1307 if (NAME_FIELD_SIZE
- (archive_format
== OLDGNU_FORMAT
)
1308 < strlen (link_name
))
1309 write_long_link (st
);
/* The header for a hard link carries a size of zero.  */
1311 st
->stat
.st_size
= 0;
1312 blk
= start_header (st
);
/* tar_copy_str copies at most NAME_FIELD_SIZE bytes and leaves the
   field without a terminating NUL when the name fills it.  */
1315 tar_copy_str (blk
->header
.linkname
, link_name
, NAME_FIELD_SIZE
);
1317 blk
->header
.typeflag
= LNKTYPE
;
1318 finish_header (st
, blk
, block_ordinal
);
/* When remove_files_option is set the original file is unlinked and
   a failure is reported through unlink_error.  */
1320 if (remove_files_option
&& unlink (st
->orig_file_name
) != 0)
1321 unlink_error (st
->orig_file_name
);
/* Record the file described by ST in link_table when it has more than
   one link, so that later files with the same device and inode can be
   found by dump_hard_link.
   NOTE(review): this listing omits some original lines (the return
   type, braces, the start of the condition that creates the table,
   the remaining hash_initialize arguments and the statements executed
   when insertion fails or finds an existing entry), so the comments
   below cover only what is visible.  */
1330 file_count_links (struct tar_stat_info
*st
)
1332 if (st
->stat
.st_nlink
> 1)
1334 struct link
*duplicate
;
/* Allocate the entry with room for the name, which is stored
   starting at the NAME member, plus its terminating NUL.  */
1335 struct link
*lp
= xmalloc (offsetof (struct link
, name
)
1336 + strlen (st
->orig_file_name
) + 1);
1337 lp
->ino
= st
->stat
.st_ino
;
1338 lp
->dev
= st
->stat
.st_dev
;
1339 lp
->nlink
= st
->stat
.st_nlink
;
1340 strcpy (lp
->name
, st
->orig_file_name
);
/* The table is created with hash_link as its hash function and LP is
   then inserted; presumably the missing left operand of || tests for
   an already existing table -- confirm.  */
1343 || (link_table
= hash_initialize (0, 0, hash_link
,
1345 && (duplicate
= hash_insert (link_table
, lp
))))
/* hash_insert returned an entry other than LP; presumably an entry
   with the same device and inode was already present -- confirm.  */
1348 if (duplicate
!= lp
)
1354 /* For each dumped file, check if all its links were dumped. Emit
1355 warnings if it is not so.
   The visible statements walk every entry of link_table with
   hash_get_first/hash_get_next and warn using the entry's name.
   NOTE(review): this listing omits the function header, the
   declaration of LP and the test guarding the warning.  */
1364 for (lp
= hash_get_first (link_table
); lp
;
1365 lp
= hash_get_next (link_table
, lp
))
/* NOTE(review): this is the only WARN message in this part of the
   file that ends in "\n"; if WARN already terminates the line, the
   output gets an extra blank line -- confirm.  */
1369 WARN ((0, 0, _("Missing links to %s.\n"), quote (lp
->name
)));
1375 /* Dump a single file, recursing on directories. P is the file name
1376 to dump. TOP_LEVEL tells whether this is a top-level call; zero
1377 means no, positive means yes, and negative means the top level
1378 of an incremental dump. PARENT_DEVICE is the device of P's
1379 parent directory; it is examined only if TOP_LEVEL is zero. */
1381 /* FIXME: One should make sure that for *every* path leading to setting
1382 exit_status to failure, a clear diagnostic has been issued. */
/* ST is the caller-supplied stat record.  The visible statements fill
   in its orig_file_name, file_name, stat, archive_file_size and time
   members, apply the skip tests, and then dispatch on the file type:
   directory, hard link to an already dumped file, regular or
   contiguous file, symbolic link, or special file.
   NOTE(review): this listing omits many original lines (the return
   type, braces, return/break statements, else keywords, and the
   declarations of FD, SIZE, BUFFER and TYPE among others), so the
   comments below cover only what is visible.  */
1385 dump_file0 (struct tar_stat_info
*st
, char *p
,
1386 int top_level
, dev_t parent_device
)
1388 union block
*header
;
1390 struct timespec original_ctime
;
1391 struct timespec restore_times
[2];
1392 off_t block_ordinal
= -1;
/* When interactive_option is set, ask the user to confirm adding P.  */
1394 if (interactive_option
&& !confirm ("add", p
))
/* Record the name as given and the member name produced from it by
   safer_name_suffix.  */
1397 assign_string (&st
->orig_file_name
, p
);
1398 assign_string (&st
->file_name
,
1399 safer_name_suffix (p
, false, absolute_names_option
));
/* Obtain the file status; dereference_option is passed through to
   deref_stat.  */
1401 if (deref_stat (dereference_option
, p
, &st
->stat
) != 0)
/* Remember the size and the timestamps.  restore_times keeps the
   access and modification times for the utimens calls below;
   original_ctime is later handed to dump_regular_finish.  */
1406 st
->archive_file_size
= st
->stat
.st_size
;
1407 st
->atime
= restore_times
[0] = get_stat_atime (&st
->stat
);
1408 st
->mtime
= restore_times
[1] = get_stat_mtime (&st
->stat
);
1409 st
->ctime
= original_ctime
= get_stat_ctime (&st
->stat
);
/* For a file that S_ISHIDDEN recognizes, a stack buffer two bytes
   longer than strlen (P) is allocated.  NOTE(review): the statements
   using it are not visible in this listing.  */
1412 if (S_ISHIDDEN (st
->stat
.st_mode
))
1414 char *new = (char *) alloca (strlen (p
) + 2);
1424 /* See if we want only new files, and check if this one is too old to
   be dumped.
1427 This check is omitted if incremental_option is set *and* the
1428 requested file is not explicitly listed on the command line. */
1430 if (!(incremental_option
&& !is_individual_file (p
))
1431 && !S_ISDIR (st
->stat
.st_mode
)
1432 && OLDER_TAR_STAT_TIME (*st
, m
)
1433 && (!after_date_option
|| OLDER_TAR_STAT_TIME (*st
, c
)))
/* The warning is issued only in verbose, non-incremental runs.  */
1435 if (!incremental_option
&& verbose_option
)
1436 WARN ((0, 0, _("%s: file is unchanged; not dumped"),
1437 quotearg_colon (p
)));
1441 /* See if we are trying to dump the archive. */
1442 if (sys_file_is_archive (st
))
1444 WARN ((0, 0, _("%s: file is the archive; not dumped"),
1445 quotearg_colon (p
)));
1449 if (is_avoided_name (p
))
/* Directories are handled by dump_dir; afterwards the saved access and
   modification times are restored when atime_preserve_option is
   set.  */
1451 if (S_ISDIR (st
->stat
.st_mode
))
1453 dump_dir (st
, top_level
, parent_device
);
1454 if (atime_preserve_option
)
1455 utimens (p
, restore_times
);
1460 /* Check for multiple links. */
1461 if (dump_hard_link (st
))
1464 /* This is not a link to a previously dumped file, so dump it. */
1466 if (S_ISREG (st
->stat
.st_mode
)
1467 || S_ISCTG (st
->stat
.st_mode
))
1470 enum dump_status status
;
/* The file is opened only when file_dumpable_p accepts it.  */
1472 if (file_dumpable_p (st
))
1474 fd
= open (st
->orig_file_name
,
1475 O_RDONLY
| O_BINARY
);
/* A file below the top level that no longer exists (ENOENT) only
   produces a warning; open_diag reports an open failure, presumably in
   the remaining cases -- confirm.  */
1478 if (!top_level
&& errno
== ENOENT
)
1479 WARN ((0, 0, _("%s: File removed before we read it"),
1480 quotearg_colon (st
->orig_file_name
)));
1482 open_diag (st
->orig_file_name
);
/* Try the sparse dumper first when sparse_option is set and the file
   qualifies; fall back to dump_regular_file when it reports
   dump_status_not_implemented.  */
1489 if (fd
!= -1 && sparse_option
&& sparse_file_p (st
))
1491 status
= sparse_dump_file (fd
, st
);
1492 if (status
== dump_status_not_implemented
)
1493 status
= dump_regular_file (fd
, st
);
1496 status
= dump_regular_file (fd
, st
);
/* Dispatch on the resulting status; only the dump_status_ok action is
   visible here.  */
1500 case dump_status_ok
:
1502 dump_regular_finish (fd
, st
, original_ctime
);
1505 case dump_status_short
:
1510 case dump_status_fail
:
1514 case dump_status_not_implemented
:
/* Restore the saved times if requested, then record the file in the
   hard-link table.  */
1518 if (atime_preserve_option
)
1519 utimens (st
->orig_file_name
, restore_times
);
1520 file_count_links (st
);
1523 #ifdef HAVE_READLINK
1524 else if (S_ISLNK (st
->stat
.st_mode
))
/* Detect a link size that does not fit in size_t, or for which
   linklen + 1 would wrap to zero.  */
1528 size_t linklen
= st
->stat
.st_size
;
1529 if (linklen
!= st
->stat
.st_size
|| linklen
+ 1 == 0)
1531 buffer
= (char *) alloca (linklen
+ 1);
1532 size
= readlink (p
, buffer
, linklen
+ 1);
/* NOTE(review): BUFFER holds linklen + 1 bytes and readlink may return
   up to linklen + 1 (for instance if the link target grew after the
   stat), in which case buffer[size] is one byte past the end --
   verify.  */
1538 buffer
[size
] = '\0';
1539 assign_string (&st
->link_name
, buffer
);
/* A target longer than the header field is written separately by
   write_long_link; the limit is one byte smaller when archive_format
   is OLDGNU_FORMAT.  */
1540 if (NAME_FIELD_SIZE
- (archive_format
== OLDGNU_FORMAT
) < size
)
1541 write_long_link (st
);
1543 block_ordinal
= current_block_ordinal ();
1544 st
->stat
.st_size
= 0; /* force 0 size on symlink */
1545 header
= start_header (st
);
1548 tar_copy_str (header
->header
.linkname
, buffer
, NAME_FIELD_SIZE
);
1549 header
->header
.typeflag
= SYMTYPE
;
1550 finish_header (st
, header
, block_ordinal
);
1551 /* nothing more to do to it */
1553 if (remove_files_option
)
1555 if (unlink (p
) == -1)
1558 file_count_links (st
);
/* Special files.  NOTE(review): the statements selecting TYPE for
   character devices, block devices and FIFOs are not visible in this
   listing.  Sockets and doors are only warned about.  */
1562 else if (S_ISCHR (st
->stat
.st_mode
))
1564 else if (S_ISBLK (st
->stat
.st_mode
))
1566 else if (S_ISFIFO (st
->stat
.st_mode
))
1568 else if (S_ISSOCK (st
->stat
.st_mode
))
1570 WARN ((0, 0, _("%s: socket ignored"), quotearg_colon (p
)));
1573 else if (S_ISDOOR (st
->stat
.st_mode
))
1575 WARN ((0, 0, _("%s: door ignored"), quotearg_colon (p
)));
1580 unknown_file_error (p
);
/* With V7_FORMAT the file is reported through unknown_file_error.  */
1585 if (archive_format
== V7_FORMAT
)
1587 unknown_file_error (p
);
/* Write a header-only member for the special file.  */
1591 block_ordinal
= current_block_ordinal ();
1592 st
->stat
.st_size
= 0; /* force 0 size */
1593 header
= start_header (st
);
1596 header
->header
.typeflag
= type
;
/* Device numbers are stored for every type except FIFOTYPE.  */
1598 if (type
!= FIFOTYPE
)
1600 MAJOR_TO_CHARS (major (st
->stat
.st_rdev
),
1601 header
->header
.devmajor
);
1602 MINOR_TO_CHARS (minor (st
->stat
.st_rdev
),
1603 header
->header
.devminor
);
1606 finish_header (st
, header
, block_ordinal
);
1607 if (remove_files_option
)
1609 if (unlink (p
) == -1)
/* Dump the file named P.  A local tar_stat_info is initialized, passed
   to dump_file0 together with P, TOP_LEVEL and PARENT_DEVICE, and
   destroyed afterwards.  When listed_incremental_option is set,
   update_parent_directory is called for P after the dump.  */
1615 dump_file (char *p
, int top_level
, dev_t parent_device
)
1617 struct tar_stat_info st
;
1618 tar_stat_init (&st
);
1619 dump_file0 (&st
, p
, top_level
, parent_device
);
1620 if (listed_incremental_option
)
1621 update_parent_directory (p
);
1622 tar_stat_destroy (&st
);