1 /* Various processing of names.
3 Copyright (C) 1988, 1992, 1994, 1996, 1997, 1998, 1999, 2000, 2001,
4 2003, 2004, 2005 Free Software Foundation, Inc.
6 This program is free software; you can redistribute it and/or modify it
7 under the terms of the GNU General Public License as published by the
8 Free Software Foundation; either version 2, or (at your option) any later
11 This program is distributed in the hope that it will be useful, but
12 WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General
14 Public License for more details.
16 You should have received a copy of the GNU General Public License along
17 with this program; if not, write to the Free Software Foundation, Inc.,
18 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. */
/* User and group names.  */

/* Old-style (unprototyped) declarations of the password and group
   database lookups used below.  getgrnam and getpwnam are always
   declared; getpwuid and getgrgid are declared only when the matching
   HAVE_DECL_ macro is zero or undefined.  Each conditional group is
   closed by its own #endif.  */
struct group *getgrnam ();
struct passwd *getpwnam ();
#if ! HAVE_DECL_GETPWUID
struct passwd *getpwuid ();
#endif
#if ! HAVE_DECL_GETGRGID
struct group *getgrgid ();
#endif
/* Make sure you link with the proper libraries if you are running the
   Yellow Peril (thanks for the good laugh, Ian J.!), or, euh... NIS.
   This code should also be modified for non-UNIX systems to do something
   reasonable.  */

/* Result of the most recent successful user lookup.  cached_uid is
   meaningful only once cached_uname has been set.  */
static char *cached_uname;
static uid_t cached_uid;

/* Result of the most recent successful group lookup.  cached_gid is
   meaningful only once cached_gname has been set.  */
static char *cached_gname;
static gid_t cached_gid;

/* Most recent names whose lookup failed.  These variables are valid
   only if nonempty.  */
static char *cached_no_such_uname;
static char *cached_no_such_gname;

/* Most recent IDs whose lookup failed.  These variables are valid only
   if nonzero.  It's not worth optimizing the case for weird systems
   where 0 is not a valid uid or gid.  */
static uid_t cached_no_such_uid;
static gid_t cached_no_such_gid;

/* Defined further down; declared here because name_next calls it.  */
static void register_individual_file (char const *name);
61 /* Given UID, find the corresponding UNAME. */
63 uid_to_uname (uid_t uid
, char **uname
)
65 struct passwd
*passwd
;
67 if (uid
!= 0 && uid
== cached_no_such_uid
)
69 *uname
= xstrdup ("");
73 if (!cached_uname
|| uid
!= cached_uid
)
75 passwd
= getpwuid (uid
);
79 assign_string (&cached_uname
, passwd
->pw_name
);
83 cached_no_such_uid
= uid
;
84 *uname
= xstrdup ("");
88 *uname
= xstrdup (cached_uname
);
91 /* Given GID, find the corresponding GNAME. */
93 gid_to_gname (gid_t gid
, char **gname
)
97 if (gid
!= 0 && gid
== cached_no_such_gid
)
99 *gname
= xstrdup ("");
103 if (!cached_gname
|| gid
!= cached_gid
)
105 group
= getgrgid (gid
);
109 assign_string (&cached_gname
, group
->gr_name
);
113 cached_no_such_gid
= gid
;
114 *gname
= xstrdup ("");
118 *gname
= xstrdup (cached_gname
);
121 /* Given UNAME, set the corresponding UID and return 1, or else, return 0. */
123 uname_to_uid (char const *uname
, uid_t
*uidp
)
125 struct passwd
*passwd
;
127 if (cached_no_such_uname
128 && strcmp (uname
, cached_no_such_uname
) == 0)
132 || uname
[0] != cached_uname
[0]
133 || strcmp (uname
, cached_uname
) != 0)
135 passwd
= getpwnam (uname
);
138 cached_uid
= passwd
->pw_uid
;
139 assign_string (&cached_uname
, passwd
->pw_name
);
143 assign_string (&cached_no_such_uname
, uname
);
151 /* Given GNAME, set the corresponding GID and return 1, or else, return 0. */
153 gname_to_gid (char const *gname
, gid_t
*gidp
)
157 if (cached_no_such_gname
158 && strcmp (gname
, cached_no_such_gname
) == 0)
162 || gname
[0] != cached_gname
[0]
163 || strcmp (gname
, cached_gname
) != 0)
165 group
= getgrnam (gname
);
168 cached_gid
= group
->gr_gid
;
169 assign_string (&cached_gname
, gname
);
173 assign_string (&cached_no_such_gname
, gname
);
/* Names from the command call.  */

/* Linked list of names: NAMELIST is its first entry, if any, and
   NAMETAIL points at the link where the next entry gets attached.  */
static struct name *namelist;
static struct name **nametail = &namelist;

/* Array of names filled by name_add and consumed by name_next.  */
static const char **name_array;	/* the stored names */
static int allocated_names;	/* how big is the array? */
static int names;		/* how many entries does it have? */
static int name_index;		/* how many of the entries have we scanned? */
191 /* Initialize structures. */
195 allocated_names
= 10;
196 name_array
= xmalloc (sizeof (const char *) * allocated_names
);
200 /* Add NAME at end of name_array, reallocating it as necessary. */
202 name_add (const char *name
)
204 if (names
== allocated_names
)
206 allocated_names
*= 2;
208 xrealloc (name_array
, sizeof (const char *) * allocated_names
);
210 name_array
[names
++] = name
;
/* Names from external name file.  */

/* Scratch buffer that name_next fills and returns.  It is allocated
   with two bytes more than name_buffer_length.  */
static char *name_buffer;		/* holds the current file name */
static size_t name_buffer_length;	/* allocated length of name_buffer */
/* FIXME: I should better check more closely.  It seems at first glance that
   is_pattern is only used when reading a file, and ignored for all
   command line arguments.  */

/* Return true if STRING contains any of the globbing characters
   '*', '[' or '?'.  A single strpbrk scan replaces three separate
   strchr passes over the string.  */
bool
is_pattern (const char *string)
{
  return strpbrk (string, "*[?") != NULL;
}
228 /* Set up to gather file names for tar. They can either come from a
229 file or were saved from decoding arguments. */
233 name_buffer
= xmalloc (NAME_FIELD_SIZE
+ 2);
234 name_buffer_length
= NAME_FIELD_SIZE
;
244 /* Get the next name from ARGV or the file of names. Result is in
245 static storage and can't be relied upon across two calls.
247 If CHANGE_DIRS is true, treat a filename of the form "-C" as
248 meaning that the next filename is the name of a directory to change
249 to. If filename_terminator is NUL, CHANGE_DIRS is effectively
252 name_next (int change_dirs
)
258 if (filename_terminator
== '\0')
261 while (name_index
!= names
)
264 source
= name_array
[name_index
++];
265 source_len
= strlen (source
);
266 if (name_buffer_length
< source_len
)
270 name_buffer_length
*= 2;
271 if (! name_buffer_length
)
274 while (name_buffer_length
< source_len
);
277 name_buffer
= xmalloc (name_buffer_length
+ 2);
279 strcpy (name_buffer
, source
);
281 /* Zap trailing slashes. */
283 cursor
= name_buffer
+ strlen (name_buffer
) - 1;
284 while (cursor
> name_buffer
&& ISSLASH (*cursor
))
289 if (chdir (name_buffer
) < 0)
290 chdir_fatal (name_buffer
);
293 else if (change_dirs
&& strcmp (name_buffer
, "-C") == 0)
298 unquote_string (name_buffer
);
299 if (incremental_option
)
300 register_individual_file (name_buffer
);
308 /* Gather names in a list for scanning. Could hash them later if we
311 If the names are already sorted to match the archive, we just read
312 them one by one. name_gather reads the first one, and it is called
313 by name_match as appropriate to read the next ones. At EOF, the
314 last name read is just left in the buffer. This option lets users
315 of small machines extract an arbitrary number of files by doing
316 "tar t" and editing down the list of files. */
321 /* Buffer able to hold a single name. */
322 static struct name
*buffer
;
323 static size_t allocated_size
;
327 if (same_order_option
)
329 static int change_dir
;
331 if (allocated_size
== 0)
333 allocated_size
= offsetof (struct name
, name
) + NAME_FIELD_SIZE
+ 1;
334 buffer
= xmalloc (allocated_size
);
335 /* FIXME: This memset is overkill, and ugly... */
336 memset (buffer
, 0, allocated_size
);
339 while ((name
= name_next (0)) && strcmp (name
, "-C") == 0)
341 char const *dir
= name_next (0);
343 FATAL_ERROR ((0, 0, _("Missing file name after -C")));
344 change_dir
= chdir_arg (xstrdup (dir
));
350 buffer
->length
= strlen (name
);
351 needed_size
= offsetof (struct name
, name
) + buffer
->length
+ 1;
352 if (allocated_size
< needed_size
)
357 if (! allocated_size
)
360 while (allocated_size
< needed_size
);
362 buffer
= xrealloc (buffer
, allocated_size
);
364 buffer
->change_dir
= change_dir
;
365 strcpy (buffer
->name
, name
);
367 buffer
->found_count
= 0;
370 nametail
= &namelist
->next
;
373 addname (0, change_dir
);
377 /* Non sorted names -- read them all in. */
382 int change_dir0
= change_dir
;
383 while ((name
= name_next (0)) && strcmp (name
, "-C") == 0)
385 char const *dir
= name_next (0);
387 FATAL_ERROR ((0, 0, _("Missing file name after -C")));
388 change_dir
= chdir_arg (xstrdup (dir
));
391 addname (name
, change_dir
);
394 if (change_dir
!= change_dir0
)
395 addname (0, change_dir
);
402 /* Add a name to the namelist. */
404 addname (char const *string
, int change_dir
)
406 size_t length
= string
? strlen (string
) : 0;
407 struct name
*name
= xmalloc (offsetof (struct name
, name
) + length
+ 1);
412 strcpy (name
->name
, string
);
418 /* FIXME: This initialization (and the byte of memory that it
419 initializes) is probably not needed, but we are currently in
420 bug-fix mode so we'll leave it in for now. */
425 name
->length
= length
;
426 name
->found_count
= 0;
427 name
->regexp
= 0; /* assume not a regular expression */
428 name
->firstch
= 1; /* assume first char is literal */
429 name
->change_dir
= change_dir
;
430 name
->dir_contents
= 0;
432 if (string
&& is_pattern (string
))
435 if (string
[0] == '*' || string
[0] == '[' || string
[0] == '?')
440 nametail
= &name
->next
;
444 /* Find a match for FILE_NAME (whose string length is LENGTH) in the name
447 namelist_match (char const *file_name
, size_t length
)
451 for (p
= namelist
; p
; p
= p
->next
)
453 /* If first chars don't match, quick skip. */
455 if (p
->firstch
&& p
->name
[0] != file_name
[0])
459 ? fnmatch (p
->name
, file_name
, recursion_option
) == 0
460 : (p
->length
<= length
461 && (file_name
[p
->length
] == '\0'
462 || (ISSLASH (file_name
[p
->length
]) && recursion_option
))
463 && memcmp (file_name
, p
->name
, p
->length
) == 0))
470 /* Return true if and only if name FILE_NAME (from an archive) matches any
471 name from the namelist. */
473 name_match (const char *file_name
)
475 size_t length
= strlen (file_name
);
479 struct name
*cursor
= namelist
;
486 chdir_do (cursor
->change_dir
);
488 nametail
= &namelist
;
492 cursor
= namelist_match (file_name
, length
);
495 if (!(ISSLASH (file_name
[cursor
->length
]) && recursion_option
)
496 || cursor
->found_count
== 0)
497 cursor
->found_count
++; /* remember it matched */
498 if (starting_file_option
)
502 nametail
= &namelist
;
504 chdir_do (cursor
->change_dir
);
506 /* We got a match. */
507 return ISFOUND (cursor
);
510 /* Filename from archive not found in namelist. If we have the whole
511 namelist here, just return 0. Otherwise, read the next name in and
512 compare it. If this was the last name, namelist->found_count will
513 remain on. If not, we loop to compare the newly read name. */
515 if (same_order_option
&& namelist
->found_count
)
517 name_gather (); /* read one more */
518 if (namelist
->found_count
)
526 /* Returns true if all names from the namelist were processed.
527 P is the stat_info of the most recently processed entry.
528 The decision is postponed until the next entry is read if:
530 1) P ended with a slash (i.e. it was a directory)
531 2) P matches any entry from the namelist *and* represents a subdirectory
532 or a file lying under this entry (in the terms of directory structure).
534 This is necessary to handle contents of directories. */
536 all_names_found (struct tar_stat_info
*p
)
538 struct name
const *cursor
;
541 if (test_label_option
)
543 if (!p
->file_name
|| occurrence_option
== 0 || p
->had_trailing_slash
)
545 len
= strlen (p
->file_name
);
546 for (cursor
= namelist
; cursor
; cursor
= cursor
->next
)
549 || (!WASFOUND(cursor
) && !cursor
->fake
)
550 || (len
>= cursor
->length
&& ISSLASH (p
->file_name
[cursor
->length
])))
556 /* Print the names of things in the namelist that were not matched. */
558 names_notfound (void)
560 struct name
const *cursor
;
562 for (cursor
= namelist
; cursor
; cursor
= cursor
->next
)
563 if (!WASFOUND(cursor
) && !cursor
->fake
)
565 if (cursor
->found_count
== 0)
566 ERROR ((0, 0, _("%s: Not found in archive"),
567 quotearg_colon (cursor
->name
)));
569 ERROR ((0, 0, _("%s: Required occurrence not found in archive"),
570 quotearg_colon (cursor
->name
)));
573 /* Don't bother freeing the name list; we're about to exit. */
575 nametail
= &namelist
;
577 if (same_order_option
)
581 while ((name
= name_next (1)) != NULL
)
582 ERROR ((0, 0, _("%s: Not found in archive"),
583 quotearg_colon (name
)));
587 /* Sorting name lists. */
589 /* Sort linked LIST of names, of given LENGTH, using COMPARE to order
590 names. Return the sorted list. Apart from the type `struct name'
591 and the definition of SUCCESSOR, this is a generic list-sorting
592 function, but it's too painful to make it both generic and portable
596 merge_sort (struct name
*list
, int length
,
597 int (*compare
) (struct name
const*, struct name
const*))
599 struct name
*first_list
;
600 struct name
*second_list
;
604 struct name
**merge_point
;
608 # define SUCCESSOR(name) ((name)->next)
615 if ((*compare
) (list
, SUCCESSOR (list
)) > 0)
617 result
= SUCCESSOR (list
);
618 SUCCESSOR (result
) = list
;
619 SUCCESSOR (list
) = 0;
626 first_length
= (length
+ 1) / 2;
627 second_length
= length
/ 2;
628 for (cursor
= list
, counter
= first_length
- 1;
630 cursor
= SUCCESSOR (cursor
), counter
--)
632 second_list
= SUCCESSOR (cursor
);
633 SUCCESSOR (cursor
) = 0;
635 first_list
= merge_sort (first_list
, first_length
, compare
);
636 second_list
= merge_sort (second_list
, second_length
, compare
);
638 merge_point
= &result
;
639 while (first_list
&& second_list
)
640 if ((*compare
) (first_list
, second_list
) < 0)
642 cursor
= SUCCESSOR (first_list
);
643 *merge_point
= first_list
;
644 merge_point
= &SUCCESSOR (first_list
);
649 cursor
= SUCCESSOR (second_list
);
650 *merge_point
= second_list
;
651 merge_point
= &SUCCESSOR (second_list
);
652 second_list
= cursor
;
655 *merge_point
= first_list
;
657 *merge_point
= second_list
;
664 /* A comparison function for sorting names. Put found names last;
665 break ties by string comparison. */
668 compare_names (struct name
const *n1
, struct name
const *n2
)
670 int found_diff
= WASFOUND(n2
) - WASFOUND(n1
);
671 return found_diff
? found_diff
: strcmp (n1
->name
, n2
->name
);
674 /* Add all the dirs under NAME, which names a directory, to the namelist.
675 If any of the files is a directory, recurse on the subdirectory.
676 DEVICE is the device not to leave, if the -l option is specified. */
679 add_hierarchy_to_namelist (struct name
*name
, dev_t device
)
681 char *file_name
= name
->name
;
682 char *buffer
= get_directory_contents (file_name
, device
);
685 name
->dir_contents
= "\0\0\0\0";
688 size_t name_length
= name
->length
;
689 size_t allocated_length
= (name_length
>= NAME_FIELD_SIZE
690 ? name_length
+ NAME_FIELD_SIZE
692 char *namebuf
= xmalloc (allocated_length
+ 1);
693 /* FIXME: + 2 above? */
695 size_t string_length
;
696 int change_dir
= name
->change_dir
;
698 name
->dir_contents
= buffer
;
699 strcpy (namebuf
, file_name
);
700 if (! ISSLASH (namebuf
[name_length
- 1]))
702 namebuf
[name_length
++] = '/';
703 namebuf
[name_length
] = '\0';
706 for (string
= buffer
; *string
; string
+= string_length
+ 1)
708 string_length
= strlen (string
);
711 if (allocated_length
<= name_length
+ string_length
)
715 allocated_length
*= 2;
716 if (! allocated_length
)
719 while (allocated_length
<= name_length
+ string_length
);
721 namebuf
= xrealloc (namebuf
, allocated_length
+ 1);
723 strcpy (namebuf
+ name_length
, string
+ 1);
724 add_hierarchy_to_namelist (addname (namebuf
, change_dir
),
733 /* Collect all the names from argv[] (or whatever), expand them into a
734 directory tree, and sort them. This gets only subdirectories, not
738 collect_and_sort_names (void)
741 struct name
*next_name
;
747 if (listed_incremental_option
)
748 read_directory_file ();
753 for (name
= namelist
; name
; name
= next_name
)
755 next_name
= name
->next
;
756 if (name
->found_count
|| name
->dir_contents
)
758 if (name
->regexp
) /* FIXME: just skip regexps for now */
760 chdir_do (name
->change_dir
);
764 if (deref_stat (dereference_option
, name
->name
, &statbuf
) != 0)
766 stat_diag (name
->name
);
769 if (S_ISDIR (statbuf
.st_mode
))
772 add_hierarchy_to_namelist (name
, statbuf
.st_dev
);
777 for (name
= namelist
; name
; name
= name
->next
)
779 namelist
= merge_sort (namelist
, num_names
, compare_names
);
781 for (name
= namelist
; name
; name
= name
->next
)
782 name
->found_count
= 0;
785 /* This is like name_match, except that it returns a pointer to the
786 name it matched, and doesn't set FOUND in structure. The caller
787 will have to do that if it wants to. Oh, and if the namelist is
788 empty, it returns null, unlike name_match, which returns TRUE. */
790 name_scan (const char *file_name
)
792 size_t length
= strlen (file_name
);
796 struct name
*cursor
= namelist_match (file_name
, length
);
800 /* Filename from archive not found in namelist. If we have the whole
801 namelist here, just return 0. Otherwise, read the next name in and
802 compare it. If this was the last name, namelist->found_count will
803 remain on. If not, we loop to compare the newly read name. */
805 if (same_order_option
&& namelist
&& namelist
->found_count
)
807 name_gather (); /* read one more */
808 if (namelist
->found_count
)
816 /* This returns a name from the namelist which doesn't have ->found
817 set. It sets ->found before returning, so successive calls will
818 find and return all the non-found names in the namelist. */
819 struct name
*gnu_list_name
;
822 name_from_list (void)
825 gnu_list_name
= namelist
;
826 while (gnu_list_name
&& (gnu_list_name
->found_count
|| gnu_list_name
->fake
))
827 gnu_list_name
= gnu_list_name
->next
;
830 gnu_list_name
->found_count
++;
831 chdir_do (gnu_list_name
->change_dir
);
832 return gnu_list_name
->name
;
838 blank_name_list (void)
843 for (name
= namelist
; name
; name
= name
->next
)
844 name
->found_count
= 0;
/* Yield a newly allocated file name consisting of FILE_NAME concatenated to
   NAME, with an intervening slash if FILE_NAME does not already end in one.
   No slash is inserted when FILE_NAME is empty.  The result comes from
   xmalloc.  */
char *
new_name (const char *file_name, const char *name)
{
  size_t prefix_len = strlen (file_name);
  size_t name_size = strlen (name) + 1;	/* includes the terminating NUL */
  int need_slash = prefix_len && ! ISSLASH (file_name[prefix_len - 1]);
  char *result = xmalloc (prefix_len + need_slash + name_size);
  char *tail = result + prefix_len;

  memcpy (result, file_name, prefix_len);
  if (need_slash)
    *tail++ = '/';
  memcpy (tail, name, name_size);
  return result;
}
862 /* Return nonzero if file NAME is excluded. */
864 excluded_name (char const *name
)
866 return excluded_file_name (excluded
, name
+ FILE_SYSTEM_PREFIX_LEN (name
));
869 /* Names to avoid dumping. */
870 static Hash_table
*avoided_name_table
;
872 /* Remember to not archive NAME. */
874 add_avoided_name (char const *name
)
876 hash_string_insert (&avoided_name_table
, name
);
879 /* Should NAME be avoided when archiving? */
881 is_avoided_name (char const *name
)
883 return hash_string_lookup (avoided_name_table
, name
);
887 static Hash_table
*individual_file_table
;
890 register_individual_file (char const *name
)
894 if (deref_stat (dereference_option
, name
, &st
) != 0)
895 return; /* Will be complained about later */
896 if (S_ISDIR (st
.st_mode
))
899 hash_string_insert (&individual_file_table
, name
);
903 is_individual_file (char const *name
)
905 return hash_string_lookup (individual_file_table
, name
);
/* Return the size of the prefix of FILE_NAME that is removed after
   stripping NUM leading file name components.  NUM must be
   positive.  If FILE_NAME runs out before NUM components have been
   passed, the result is (size_t) -1.

   The file system prefix and any slashes directly after it are skipped
   before counting starts.  */
size_t
stripped_prefix_len (char const *file_name, size_t num)
{
  char const *p = file_name + FILE_SYSTEM_PREFIX_LEN (file_name);

  while (ISSLASH (*p))
    p++;

  for (; *p; )
    {
      /* Test before advancing; ISSLASH is a macro, so its argument is
         kept free of side effects.  */
      bool slash = ISSLASH (*p);
      p++;
      if (! slash)
        continue;

      /* P is now just past the slash that ends a component.  */
      if (--num == 0)
        return p - file_name;
      while (ISSLASH (*p))
        p++;
    }
  return -1;
}
/* Return nonzero if NAME contains ".." as a file name component.
   The file system prefix of NAME is skipped first.  */
bool
contains_dot_dot (char const *name)
{
  char const *p = name + FILE_SYSTEM_PREFIX_LEN (name);

  for (;;)
    {
      /* P is at the start of a component here.  */
      if (p[0] == '.' && p[1] == '.' && (ISSLASH (p[2]) || !p[2]))
        return true;

      /* Advance to the next slash; reaching the end of the string
         first means no ".." component exists.  */
      do
        {
          if (*p == '\0')
            return false;
          p++;
        }
      while (! ISSLASH (*p));

      /* Step over that slash to the next component.  */
      p++;
    }
}