]> Dogcows Code - chaz/tar/blob - src/names.c
* src/names.c (file_list_name): Properly prototype.
[chaz/tar] / src / names.c
1 /* Various processing of names.
2
3 Copyright 1988, 1992, 1994, 1996-2001, 2003-2007, 2009, 2013 Free
4 Software Foundation, Inc.
5
6 This program is free software; you can redistribute it and/or modify it
7 under the terms of the GNU General Public License as published by the
8 Free Software Foundation; either version 3, or (at your option) any later
9 version.
10
11 This program is distributed in the hope that it will be useful, but
12 WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General
14 Public License for more details.
15
16 You should have received a copy of the GNU General Public License along
17 with this program. If not, see <http://www.gnu.org/licenses/>. */
18
19 #include <system.h>
20
21 #include <fnmatch.h>
22 #include <hash.h>
23 #include <quotearg.h>
24 #include <wordsplit.h>
25
26 #include "common.h"
27 \f
28 /* User and group names. */
29
30 /* Make sure you link with the proper libraries if you are running the
31 Yellow Peril (thanks for the good laugh, Ian J.!), or, euh... NIS.
32 This code should also be modified for non-UNIX systems to do something
33 reasonable. */
34
35 static char *cached_uname;
36 static char *cached_gname;
37
38 static uid_t cached_uid; /* valid only if cached_uname is not empty */
39 static gid_t cached_gid; /* valid only if cached_gname is not empty */
40
41 /* These variables are valid only if nonempty. */
42 static char *cached_no_such_uname;
43 static char *cached_no_such_gname;
44
45 /* These variables are valid only if nonzero. It's not worth optimizing
46 the case for weird systems where 0 is not a valid uid or gid. */
47 static uid_t cached_no_such_uid;
48 static gid_t cached_no_such_gid;
49
50 /* Given UID, find the corresponding UNAME. */
51 void
52 uid_to_uname (uid_t uid, char **uname)
53 {
54 struct passwd *passwd;
55
56 if (uid != 0 && uid == cached_no_such_uid)
57 {
58 *uname = xstrdup ("");
59 return;
60 }
61
62 if (!cached_uname || uid != cached_uid)
63 {
64 passwd = getpwuid (uid);
65 if (passwd)
66 {
67 cached_uid = uid;
68 assign_string (&cached_uname, passwd->pw_name);
69 }
70 else
71 {
72 cached_no_such_uid = uid;
73 *uname = xstrdup ("");
74 return;
75 }
76 }
77 *uname = xstrdup (cached_uname);
78 }
79
80 /* Given GID, find the corresponding GNAME. */
81 void
82 gid_to_gname (gid_t gid, char **gname)
83 {
84 struct group *group;
85
86 if (gid != 0 && gid == cached_no_such_gid)
87 {
88 *gname = xstrdup ("");
89 return;
90 }
91
92 if (!cached_gname || gid != cached_gid)
93 {
94 group = getgrgid (gid);
95 if (group)
96 {
97 cached_gid = gid;
98 assign_string (&cached_gname, group->gr_name);
99 }
100 else
101 {
102 cached_no_such_gid = gid;
103 *gname = xstrdup ("");
104 return;
105 }
106 }
107 *gname = xstrdup (cached_gname);
108 }
109
110 /* Given UNAME, set the corresponding UID and return 1, or else, return 0. */
111 int
112 uname_to_uid (char const *uname, uid_t *uidp)
113 {
114 struct passwd *passwd;
115
116 if (cached_no_such_uname
117 && strcmp (uname, cached_no_such_uname) == 0)
118 return 0;
119
120 if (!cached_uname
121 || uname[0] != cached_uname[0]
122 || strcmp (uname, cached_uname) != 0)
123 {
124 passwd = getpwnam (uname);
125 if (passwd)
126 {
127 cached_uid = passwd->pw_uid;
128 assign_string (&cached_uname, passwd->pw_name);
129 }
130 else
131 {
132 assign_string (&cached_no_such_uname, uname);
133 return 0;
134 }
135 }
136 *uidp = cached_uid;
137 return 1;
138 }
139
140 /* Given GNAME, set the corresponding GID and return 1, or else, return 0. */
141 int
142 gname_to_gid (char const *gname, gid_t *gidp)
143 {
144 struct group *group;
145
146 if (cached_no_such_gname
147 && strcmp (gname, cached_no_such_gname) == 0)
148 return 0;
149
150 if (!cached_gname
151 || gname[0] != cached_gname[0]
152 || strcmp (gname, cached_gname) != 0)
153 {
154 group = getgrnam (gname);
155 if (group)
156 {
157 cached_gid = group->gr_gid;
158 assign_string (&cached_gname, gname);
159 }
160 else
161 {
162 assign_string (&cached_no_such_gname, gname);
163 return 0;
164 }
165 }
166 *gidp = cached_gid;
167 return 1;
168 }
169
170 \f
171 static struct name *
172 make_name (const char *file_name)
173 {
174 struct name *p = xzalloc (sizeof (*p));
175 if (!file_name)
176 file_name = "";
177 p->name = xstrdup (file_name);
178 p->length = strlen (p->name);
179 return p;
180 }
181
182 static void
183 free_name (struct name *p)
184 {
185 if (p)
186 {
187 free (p->name);
188 free (p->caname);
189 free (p);
190 }
191 }
192
193 \f
194 /* Names from the command call. */
195
196 static struct name *namelist; /* first name in list, if any */
197 static struct name *nametail; /* end of name list */
198
199 /* File name arguments are processed in two stages: first a
200 name element list (see below) is filled, then the names from it
201 are moved into the namelist.
202
203 This awkward process is needed only to implement --same-order option,
204 which is meant to help process large archives on machines with
205 limited memory. With this option on, namelist contains at most one
206 entry, which diminishes the memory consumption.
207
208 However, I very much doubt if we still need this -- Sergey */
209
210 /* A name_list element contains entries of three types: */
211
212 #define NELT_NAME 0 /* File name */
213 #define NELT_CHDIR 1 /* Change directory request */
214 #define NELT_FMASK 2 /* Change fnmatch options request */
215 #define NELT_FILE 3 /* Read file names from that file */
216 #define NELT_NOOP 4 /* No operation */
217
218 struct name_elt /* A name_array element. */
219 {
220 struct name_elt *next, *prev;
221 char type; /* Element type, see NELT_* constants above */
222 union
223 {
224 const char *name; /* File or directory name */
225 int matching_flags;/* fnmatch options if type == NELT_FMASK */
226 struct /* File, if type == NELT_FILE */
227 {
228 const char *name;/* File name */
229 int term; /* File name terminator in the list */
230 FILE *fp;
231 } file;
232 } v;
233 };
234
235 static struct name_elt *name_head; /* store a list of names */
236 size_t name_count; /* how many of the entries are names? */
237
238 static struct name_elt *
239 name_elt_alloc (void)
240 {
241 struct name_elt *elt;
242
243 elt = xmalloc (sizeof (*elt));
244 if (!name_head)
245 {
246 name_head = elt;
247 name_head->prev = name_head->next = NULL;
248 name_head->type = NELT_NOOP;
249 elt = xmalloc (sizeof (*elt));
250 }
251
252 elt->prev = name_head->prev;
253 if (name_head->prev)
254 name_head->prev->next = elt;
255 elt->next = name_head;
256 name_head->prev = elt;
257 return elt;
258 }
259
260 static void
261 name_list_adjust (void)
262 {
263 if (name_head)
264 while (name_head->prev)
265 name_head = name_head->prev;
266 }
267
268 static void
269 name_list_advance (void)
270 {
271 struct name_elt *elt = name_head;
272 name_head = elt->next;
273 if (name_head)
274 name_head->prev = NULL;
275 free (elt);
276 }
277
278 /* Add to name_array the file NAME with fnmatch options MATCHING_FLAGS */
279 void
280 name_add_name (const char *name, int matching_flags)
281 {
282 static int prev_flags = 0; /* FIXME: Or EXCLUDE_ANCHORED? */
283 struct name_elt *ep = name_elt_alloc ();
284
285 if (prev_flags != matching_flags)
286 {
287 ep->type = NELT_FMASK;
288 ep->v.matching_flags = matching_flags;
289 prev_flags = matching_flags;
290 ep = name_elt_alloc ();
291 }
292 ep->type = NELT_NAME;
293 ep->v.name = name;
294 name_count++;
295 }
296
297 /* Add to name_array a chdir request for the directory NAME */
298 void
299 name_add_dir (const char *name)
300 {
301 struct name_elt *ep = name_elt_alloc ();
302 ep->type = NELT_CHDIR;
303 ep->v.name = name;
304 }
305
306 void
307 name_add_file (const char *name, int term)
308 {
309 struct name_elt *ep = name_elt_alloc ();
310 ep->type = NELT_FILE;
311 ep->v.file.name = name;
312 ep->v.file.term = term;
313 ep->v.file.fp = NULL;
314 }
315 \f
316 /* Names from external name file. */
317
318 static char *name_buffer; /* buffer to hold the current file name */
319 static size_t name_buffer_length; /* allocated length of name_buffer */
320
321 /* Set up to gather file names for tar. They can either come from a
322 file or were saved from decoding arguments. */
323 void
324 name_init (void)
325 {
326 name_buffer = xmalloc (NAME_FIELD_SIZE + 2);
327 name_buffer_length = NAME_FIELD_SIZE;
328 name_list_adjust ();
329 }
330
331 void
332 name_term (void)
333 {
334 free (name_buffer);
335 }
336 \f
337 /* Prevent recursive inclusion of the same file */
338 struct file_id_list
339 {
340 struct file_id_list *next;
341 ino_t ino;
342 dev_t dev;
343 const char *from_file;
344 };
345
346 static struct file_id_list *file_id_list;
347
348 /* Return the name of the file from which the file names and options
349 are being read.
350 */
351 static const char *
352 file_list_name (void)
353 {
354 struct name_elt *elt;
355
356 for (elt = name_head; elt; elt = elt->next)
357 if (elt->type == NELT_FILE && elt->v.file.fp)
358 return elt->v.file.name;
359 return _("command line");
360 }
361
362 static int
363 add_file_id (const char *filename)
364 {
365 struct file_id_list *p;
366 struct stat st;
367 const char *reading_from;
368
369 if (stat (filename, &st))
370 stat_fatal (filename);
371 reading_from = file_list_name ();
372 for (p = file_id_list; p; p = p->next)
373 if (p->ino == st.st_ino && p->dev == st.st_dev)
374 {
375 int oldc = set_char_quoting (NULL, ':', 1);
376 ERROR ((0, 0,
377 _("%s: file list requested from %s already read from %s"),
378 quotearg_n (0, filename),
379 reading_from, p->from_file));
380 set_char_quoting (NULL, ':', oldc);
381 return 1;
382 }
383 p = xmalloc (sizeof *p);
384 p->next = file_id_list;
385 p->ino = st.st_ino;
386 p->dev = st.st_dev;
387 p->from_file = reading_from;
388 file_id_list = p;
389 return 0;
390 }
391 \f
392 enum read_file_list_state /* Result of reading file name from the list file */
393 {
394 file_list_success, /* OK, name read successfully */
395 file_list_end, /* End of list file */
396 file_list_zero, /* Zero separator encountered where it should not */
397 file_list_skip /* Empty (zero-length) entry encountered, skip it */
398 };
399
400 /* Read from FP a sequence of characters up to TERM and put them
401 into STK.
402 */
403 static enum read_file_list_state
404 read_name_from_file (struct name_elt *ent)
405 {
406 int c;
407 size_t counter = 0;
408 FILE *fp = ent->v.file.fp;
409 int term = ent->v.file.term;
410
411 for (c = getc (fp); c != EOF && c != term; c = getc (fp))
412 {
413 if (counter == name_buffer_length)
414 name_buffer = x2realloc (name_buffer, &name_buffer_length);
415 name_buffer[counter++] = c;
416 if (c == 0)
417 {
418 /* We have read a zero separator. The file possibly is
419 zero-separated */
420 return file_list_zero;
421 }
422 }
423
424 if (counter == 0 && c != EOF)
425 return file_list_skip;
426
427 if (counter == name_buffer_length)
428 name_buffer = x2realloc (name_buffer, &name_buffer_length);
429 name_buffer[counter] = 0;
430
431 return (counter == 0 && c == EOF) ? file_list_end : file_list_success;
432 }
433
434 static int
435 handle_option (const char *str)
436 {
437 struct wordsplit ws;
438 int i;
439
440 while (*str && isspace (*str))
441 ;
442 if (*str != '-')
443 return 1;
444
445 ws.ws_offs = 1;
446 if (wordsplit (str, &ws, WRDSF_DEFFLAGS|WRDSF_DOOFFS))
447 FATAL_ERROR ((0, 0, _("cannot split string '%s': %s"),
448 str, wordsplit_strerror (&ws)));
449 ws.ws_wordv[0] = program_invocation_short_name;
450 more_options (ws.ws_wordc+ws.ws_offs, ws.ws_wordv);
451 for (i = 0; i < ws.ws_wordc+ws.ws_offs; i++)
452 ws.ws_wordv[i] = NULL;
453
454 wordsplit_free (&ws);
455 return 0;
456 }
457
458 static int
459 read_next_name (struct name_elt *ent, struct name_elt *ret)
460 {
461 if (!ent->v.file.fp)
462 {
463 if (!strcmp (ent->v.file.name, "-"))
464 {
465 request_stdin ("-T");
466 ent->v.file.fp = stdin;
467 }
468 else
469 {
470 if (add_file_id (ent->v.file.name))
471 {
472 name_list_advance ();
473 return 1;
474 }
475 if ((ent->v.file.fp = fopen (ent->v.file.name, "r")) == NULL)
476 open_fatal (ent->v.file.name);
477 }
478 }
479
480 while (1)
481 {
482 switch (read_name_from_file (ent))
483 {
484 case file_list_skip:
485 continue;
486
487 case file_list_zero:
488 WARNOPT (WARN_FILENAME_WITH_NULS,
489 (0, 0, N_("%s: file name read contains nul character"),
490 quotearg_colon (ent->v.file.name)));
491 ent->v.file.term = 0;
492 /* fall through */
493 case file_list_success:
494 if (handle_option (name_buffer) == 0)
495 {
496 name_list_adjust ();
497 return 1;
498 }
499 ret->type = NELT_NAME;
500 ret->v.name = name_buffer;
501 return 0;
502
503 case file_list_end:
504 if (strcmp (ent->v.file.name, "-"))
505 fclose (ent->v.file.fp);
506 ent->v.file.fp = NULL;
507 name_list_advance ();
508 return 1;
509 }
510 }
511 }
512 \f
513 static void
514 copy_name (struct name_elt *ep)
515 {
516 const char *source;
517 size_t source_len;
518 char *cursor;
519
520 source = ep->v.name;
521 source_len = strlen (source);
522 if (name_buffer_length < source_len)
523 {
524 do
525 {
526 name_buffer_length *= 2;
527 if (! name_buffer_length)
528 xalloc_die ();
529 }
530 while (name_buffer_length < source_len);
531
532 free (name_buffer);
533 name_buffer = xmalloc(name_buffer_length + 2);
534 }
535 strcpy (name_buffer, source);
536
537 /* Zap trailing slashes. */
538 cursor = name_buffer + strlen (name_buffer) - 1;
539 while (cursor > name_buffer && ISSLASH (*cursor))
540 *cursor-- = '\0';
541 }
542
543 \f
544 static int matching_flags; /* exclude_fnmatch options */
545
546 /* Get the next NELT_NAME element from name_array. Result is in
547 static storage and can't be relied upon across two calls.
548
549 If CHANGE_DIRS is true, treat any entries of type NELT_CHDIR as
550 the request to change to the given directory.
551
552 Entries of type NELT_FMASK cause updates of the matching_flags
553 value. */
554 static struct name_elt *
555 name_next_elt (int change_dirs)
556 {
557 static struct name_elt entry;
558 struct name_elt *ep;
559
560 while ((ep = name_head) != NULL)
561 {
562 switch (ep->type)
563 {
564 case NELT_NOOP:
565 name_list_advance ();
566 break;
567
568 case NELT_FMASK:
569 matching_flags = ep->v.matching_flags;
570 name_list_advance ();
571 continue;
572
573 case NELT_FILE:
574 if (read_next_name (ep, &entry) == 0)
575 return &entry;
576 continue;
577
578 case NELT_CHDIR:
579 if (change_dirs)
580 {
581 copy_name (ep);
582 if (chdir (name_buffer) < 0)
583 chdir_fatal (name_buffer);
584 name_list_advance ();
585 break;
586 }
587 /* fall trhough */
588 case NELT_NAME:
589 copy_name (ep);
590 if (unquote_option)
591 unquote_string (name_buffer);
592 entry.type = ep->type;
593 entry.v.name = name_buffer;
594 name_list_advance ();
595 return &entry;
596 }
597 }
598
599 return NULL;
600 }
601
602 const char *
603 name_next (int change_dirs)
604 {
605 struct name_elt *nelt = name_next_elt (change_dirs);
606 return nelt ? nelt->v.name : NULL;
607 }
608
609 /* Gather names in a list for scanning. Could hash them later if we
610 really care.
611
612 If the names are already sorted to match the archive, we just read
613 them one by one. name_gather reads the first one, and it is called
614 by name_match as appropriate to read the next ones. At EOF, the
615 last name read is just left in the buffer. This option lets users
616 of small machines extract an arbitrary number of files by doing
617 "tar t" and editing down the list of files. */
618
619 void
620 name_gather (void)
621 {
622 /* Buffer able to hold a single name. */
623 static struct name *buffer = NULL;
624
625 struct name_elt *ep;
626
627 if (same_order_option)
628 {
629 static int change_dir;
630
631 while ((ep = name_next_elt (0)) && ep->type == NELT_CHDIR)
632 change_dir = chdir_arg (xstrdup (ep->v.name));
633
634 if (ep)
635 {
636 free_name (buffer);
637 buffer = make_name (ep->v.name);
638 buffer->change_dir = change_dir;
639 buffer->next = 0;
640 buffer->found_count = 0;
641 buffer->matching_flags = matching_flags;
642 buffer->directory = NULL;
643 buffer->parent = NULL;
644 buffer->cmdline = true;
645
646 namelist = nametail = buffer;
647 }
648 else if (change_dir)
649 addname (0, change_dir, false, NULL);
650 }
651 else
652 {
653 /* Non sorted names -- read them all in. */
654 int change_dir = 0;
655
656 for (;;)
657 {
658 int change_dir0 = change_dir;
659 while ((ep = name_next_elt (0)) && ep->type == NELT_CHDIR)
660 change_dir = chdir_arg (xstrdup (ep->v.name));
661
662 if (ep)
663 addname (ep->v.name, change_dir, true, NULL);
664 else
665 {
666 if (change_dir != change_dir0)
667 addname (NULL, change_dir, false, NULL);
668 break;
669 }
670 }
671 }
672 }
673
674 /* Add a name to the namelist. */
675 struct name *
676 addname (char const *string, int change_dir, bool cmdline, struct name *parent)
677 {
678 struct name *name = make_name (string);
679
680 name->prev = nametail;
681 name->next = NULL;
682 name->found_count = 0;
683 name->matching_flags = matching_flags;
684 name->change_dir = change_dir;
685 name->directory = NULL;
686 name->parent = parent;
687 name->cmdline = cmdline;
688
689 if (nametail)
690 nametail->next = name;
691 else
692 namelist = name;
693 nametail = name;
694 return name;
695 }
696
697 /* Find a match for FILE_NAME (whose string length is LENGTH) in the name
698 list. */
699 static struct name *
700 namelist_match (char const *file_name, size_t length)
701 {
702 struct name *p;
703
704 for (p = namelist; p; p = p->next)
705 {
706 if (p->name[0]
707 && exclude_fnmatch (p->name, file_name, p->matching_flags))
708 return p;
709 }
710
711 return NULL;
712 }
713
714 void
715 remname (struct name *name)
716 {
717 struct name *p;
718
719 if ((p = name->prev) != NULL)
720 p->next = name->next;
721 else
722 namelist = name->next;
723
724 if ((p = name->next) != NULL)
725 p->prev = name->prev;
726 else
727 nametail = name->prev;
728 }
729
730 /* Return true if and only if name FILE_NAME (from an archive) matches any
731 name from the namelist. */
732 bool
733 name_match (const char *file_name)
734 {
735 size_t length = strlen (file_name);
736
737 while (1)
738 {
739 struct name *cursor = namelist;
740
741 if (!cursor)
742 return true;
743
744 if (cursor->name[0] == 0)
745 {
746 chdir_do (cursor->change_dir);
747 namelist = NULL;
748 nametail = NULL;
749 return true;
750 }
751
752 cursor = namelist_match (file_name, length);
753 if (cursor)
754 {
755 if (!(ISSLASH (file_name[cursor->length]) && recursion_option)
756 || cursor->found_count == 0)
757 cursor->found_count++; /* remember it matched */
758 if (starting_file_option)
759 {
760 free (namelist);
761 namelist = NULL;
762 nametail = NULL;
763 }
764 chdir_do (cursor->change_dir);
765
766 /* We got a match. */
767 return ISFOUND (cursor);
768 }
769
770 /* Filename from archive not found in namelist. If we have the whole
771 namelist here, just return 0. Otherwise, read the next name in and
772 compare it. If this was the last name, namelist->found_count will
773 remain on. If not, we loop to compare the newly read name. */
774
775 if (same_order_option && namelist->found_count)
776 {
777 name_gather (); /* read one more */
778 if (namelist->found_count)
779 return false;
780 }
781 else
782 return false;
783 }
784 }
785
786 /* Returns true if all names from the namelist were processed.
787 P is the stat_info of the most recently processed entry.
788 The decision is postponed until the next entry is read if:
789
790 1) P ended with a slash (i.e. it was a directory)
791 2) P matches any entry from the namelist *and* represents a subdirectory
792 or a file lying under this entry (in the terms of directory structure).
793
794 This is necessary to handle contents of directories. */
795 bool
796 all_names_found (struct tar_stat_info *p)
797 {
798 struct name const *cursor;
799 size_t len;
800
801 if (!p->file_name || occurrence_option == 0 || p->had_trailing_slash)
802 return false;
803 len = strlen (p->file_name);
804 for (cursor = namelist; cursor; cursor = cursor->next)
805 {
806 if ((cursor->name[0] && !WASFOUND (cursor))
807 || (len >= cursor->length && ISSLASH (p->file_name[cursor->length])))
808 return false;
809 }
810 return true;
811 }
812
813 static int
814 regex_usage_warning (const char *name)
815 {
816 static int warned_once = 0;
817
818 if (warn_regex_usage && fnmatch_pattern_has_wildcards (name, 0))
819 {
820 warned_once = 1;
821 WARN ((0, 0,
822 _("Pattern matching characters used in file names")));
823 WARN ((0, 0,
824 _("Use --wildcards to enable pattern matching,"
825 " or --no-wildcards to suppress this warning")));
826 }
827 return warned_once;
828 }
829
830 /* Print the names of things in the namelist that were not matched. */
831 void
832 names_notfound (void)
833 {
834 struct name const *cursor;
835
836 for (cursor = namelist; cursor; cursor = cursor->next)
837 if (!WASFOUND (cursor) && cursor->name[0])
838 {
839 regex_usage_warning (cursor->name);
840 ERROR ((0, 0,
841 (cursor->found_count == 0) ?
842 _("%s: Not found in archive") :
843 _("%s: Required occurrence not found in archive"),
844 quotearg_colon (cursor->name)));
845 }
846
847 /* Don't bother freeing the name list; we're about to exit. */
848 namelist = NULL;
849 nametail = NULL;
850
851 if (same_order_option)
852 {
853 const char *name;
854
855 while ((name = name_next (1)) != NULL)
856 {
857 regex_usage_warning (name);
858 ERROR ((0, 0, _("%s: Not found in archive"),
859 quotearg_colon (name)));
860 }
861 }
862 }
863
864 void
865 label_notfound (void)
866 {
867 struct name const *cursor;
868
869 if (!namelist)
870 return;
871
872 for (cursor = namelist; cursor; cursor = cursor->next)
873 if (WASFOUND (cursor))
874 return;
875
876 if (verbose_option)
877 error (0, 0, _("Archive label mismatch"));
878 set_exit_status (TAREXIT_DIFFERS);
879
880 for (cursor = namelist; cursor; cursor = cursor->next)
881 {
882 if (regex_usage_warning (cursor->name))
883 break;
884 }
885
886 /* Don't bother freeing the name list; we're about to exit. */
887 namelist = NULL;
888 nametail = NULL;
889
890 if (same_order_option)
891 {
892 const char *name;
893
894 while ((name = name_next (1)) != NULL
895 && regex_usage_warning (name) == 0)
896 ;
897 }
898 }
899 \f
900 /* Sorting name lists. */
901
902 /* Sort *singly* linked LIST of names, of given LENGTH, using COMPARE
903 to order names. Return the sorted list. Note that after calling
904 this function, the 'prev' links in list elements are messed up.
905
906 Apart from the type 'struct name' and the definition of SUCCESSOR,
907 this is a generic list-sorting function, but it's too painful to
908 make it both generic and portable
909 in C. */
910
911 static struct name *
912 merge_sort_sll (struct name *list, int length,
913 int (*compare) (struct name const*, struct name const*))
914 {
915 struct name *first_list;
916 struct name *second_list;
917 int first_length;
918 int second_length;
919 struct name *result;
920 struct name **merge_point;
921 struct name *cursor;
922 int counter;
923
924 # define SUCCESSOR(name) ((name)->next)
925
926 if (length == 1)
927 return list;
928
929 if (length == 2)
930 {
931 if ((*compare) (list, SUCCESSOR (list)) > 0)
932 {
933 result = SUCCESSOR (list);
934 SUCCESSOR (result) = list;
935 SUCCESSOR (list) = 0;
936 return result;
937 }
938 return list;
939 }
940
941 first_list = list;
942 first_length = (length + 1) / 2;
943 second_length = length / 2;
944 for (cursor = list, counter = first_length - 1;
945 counter;
946 cursor = SUCCESSOR (cursor), counter--)
947 continue;
948 second_list = SUCCESSOR (cursor);
949 SUCCESSOR (cursor) = 0;
950
951 first_list = merge_sort_sll (first_list, first_length, compare);
952 second_list = merge_sort_sll (second_list, second_length, compare);
953
954 merge_point = &result;
955 while (first_list && second_list)
956 if ((*compare) (first_list, second_list) < 0)
957 {
958 cursor = SUCCESSOR (first_list);
959 *merge_point = first_list;
960 merge_point = &SUCCESSOR (first_list);
961 first_list = cursor;
962 }
963 else
964 {
965 cursor = SUCCESSOR (second_list);
966 *merge_point = second_list;
967 merge_point = &SUCCESSOR (second_list);
968 second_list = cursor;
969 }
970 if (first_list)
971 *merge_point = first_list;
972 else
973 *merge_point = second_list;
974
975 return result;
976
977 #undef SUCCESSOR
978 }
979
980 /* Sort doubly linked LIST of names, of given LENGTH, using COMPARE
981 to order names. Return the sorted list. */
982 static struct name *
983 merge_sort (struct name *list, int length,
984 int (*compare) (struct name const*, struct name const*))
985 {
986 struct name *head, *p, *prev;
987 head = merge_sort_sll (list, length, compare);
988 /* Fixup prev pointers */
989 for (prev = NULL, p = head; p; prev = p, p = p->next)
990 p->prev = prev;
991 return head;
992 }
993
994 /* A comparison function for sorting names. Put found names last;
995 break ties by string comparison. */
996
997 static int
998 compare_names_found (struct name const *n1, struct name const *n2)
999 {
1000 int found_diff = WASFOUND (n2) - WASFOUND (n1);
1001 return found_diff ? found_diff : strcmp (n1->name, n2->name);
1002 }
1003
1004 /* Simple comparison by names. */
1005 static int
1006 compare_names (struct name const *n1, struct name const *n2)
1007 {
1008 return strcmp (n1->name, n2->name);
1009 }
1010
1011 \f
1012 /* Add all the dirs under ST to the namelist NAME, descending the
1013 directory hierarchy recursively. */
1014
1015 static void
1016 add_hierarchy_to_namelist (struct tar_stat_info *st, struct name *name)
1017 {
1018 const char *buffer;
1019
1020 name->directory = scan_directory (st);
1021 buffer = directory_contents (name->directory);
1022 if (buffer)
1023 {
1024 struct name *child_head = NULL, *child_tail = NULL;
1025 size_t name_length = name->length;
1026 size_t allocated_length = (name_length >= NAME_FIELD_SIZE
1027 ? name_length + NAME_FIELD_SIZE
1028 : NAME_FIELD_SIZE);
1029 char *namebuf = xmalloc (allocated_length + 1);
1030 /* FIXME: + 2 above? */
1031 const char *string;
1032 size_t string_length;
1033 int change_dir = name->change_dir;
1034
1035 strcpy (namebuf, name->name);
1036 if (! ISSLASH (namebuf[name_length - 1]))
1037 {
1038 namebuf[name_length++] = '/';
1039 namebuf[name_length] = '\0';
1040 }
1041
1042 for (string = buffer; *string; string += string_length + 1)
1043 {
1044 string_length = strlen (string);
1045 if (*string == 'D')
1046 {
1047 struct name *np;
1048 struct tar_stat_info subdir;
1049 int subfd;
1050
1051 if (allocated_length <= name_length + string_length)
1052 {
1053 do
1054 {
1055 allocated_length *= 2;
1056 if (! allocated_length)
1057 xalloc_die ();
1058 }
1059 while (allocated_length <= name_length + string_length);
1060
1061 namebuf = xrealloc (namebuf, allocated_length + 1);
1062 }
1063 strcpy (namebuf + name_length, string + 1);
1064 np = addname (namebuf, change_dir, false, name);
1065 if (!child_head)
1066 child_head = np;
1067 else
1068 child_tail->sibling = np;
1069 child_tail = np;
1070
1071 tar_stat_init (&subdir);
1072 subdir.parent = st;
1073 if (st->fd < 0)
1074 {
1075 subfd = -1;
1076 errno = - st->fd;
1077 }
1078 else
1079 subfd = subfile_open (st, string + 1,
1080 open_read_flags | O_DIRECTORY);
1081 if (subfd < 0)
1082 open_diag (namebuf);
1083 else
1084 {
1085 subdir.fd = subfd;
1086 if (fstat (subfd, &subdir.stat) != 0)
1087 stat_diag (namebuf);
1088 else if (! (O_DIRECTORY || S_ISDIR (subdir.stat.st_mode)))
1089 {
1090 errno = ENOTDIR;
1091 open_diag (namebuf);
1092 }
1093 else
1094 {
1095 subdir.orig_file_name = xstrdup (namebuf);
1096 add_hierarchy_to_namelist (&subdir, np);
1097 restore_parent_fd (&subdir);
1098 }
1099 }
1100
1101 tar_stat_destroy (&subdir);
1102 }
1103 }
1104
1105 free (namebuf);
1106 name->child = child_head;
1107 }
1108 }
1109 \f
1110 /* Auxiliary functions for hashed table of struct name's. */
1111
1112 static size_t
1113 name_hash (void const *entry, size_t n_buckets)
1114 {
1115 struct name const *name = entry;
1116 return hash_string (name->caname, n_buckets);
1117 }
1118
1119 /* Compare two directories for equality of their names. */
1120 static bool
1121 name_compare (void const *entry1, void const *entry2)
1122 {
1123 struct name const *name1 = entry1;
1124 struct name const *name2 = entry2;
1125 return strcmp (name1->caname, name2->caname) == 0;
1126 }
1127
1128 \f
1129 /* Rebase 'name' member of CHILD and all its siblings to
1130 the new PARENT. */
1131 static void
1132 rebase_child_list (struct name *child, struct name *parent)
1133 {
1134 size_t old_prefix_len = child->parent->length;
1135 size_t new_prefix_len = parent->length;
1136 char *new_prefix = parent->name;
1137
1138 for (; child; child = child->sibling)
1139 {
1140 size_t size = child->length - old_prefix_len + new_prefix_len;
1141 char *newp = xmalloc (size + 1);
1142 strcpy (newp, new_prefix);
1143 strcat (newp, child->name + old_prefix_len);
1144 free (child->name);
1145 child->name = newp;
1146 child->length = size;
1147
1148 rebase_directory (child->directory,
1149 child->parent->name, old_prefix_len,
1150 new_prefix, new_prefix_len);
1151 }
1152 }
1153
1154 /* Collect all the names from argv[] (or whatever), expand them into a
1155 directory tree, and sort them. This gets only subdirectories, not
1156 all files. */
1157
1158 void
1159 collect_and_sort_names (void)
1160 {
1161 struct name *name;
1162 struct name *next_name, *prev_name = NULL;
1163 int num_names;
1164 Hash_table *nametab;
1165
1166 name_gather ();
1167
1168 if (!namelist)
1169 addname (".", 0, false, NULL);
1170
1171 if (listed_incremental_option)
1172 {
1173 switch (chdir_count ())
1174 {
1175 case 0:
1176 break;
1177
1178 case 1:
1179 if (namelist->change_dir == 0)
1180 USAGE_ERROR ((0, 0,
1181 _("Using -C option inside file list is not "
1182 "allowed with --listed-incremental")));
1183 break;
1184
1185 default:
1186 USAGE_ERROR ((0, 0,
1187 _("Only one -C option is allowed with "
1188 "--listed-incremental")));
1189 }
1190
1191 read_directory_file ();
1192 }
1193
1194 num_names = 0;
1195 for (name = namelist; name; name = name->next, num_names++)
1196 {
1197 struct tar_stat_info st;
1198
1199 if (name->found_count || name->directory)
1200 continue;
1201 if (name->matching_flags & EXCLUDE_WILDCARDS)
1202 /* NOTE: EXCLUDE_ANCHORED is not relevant here */
1203 /* FIXME: just skip regexps for now */
1204 continue;
1205 chdir_do (name->change_dir);
1206
1207 if (name->name[0] == 0)
1208 continue;
1209
1210 tar_stat_init (&st);
1211
1212 if (deref_stat (name->name, &st.stat) != 0)
1213 {
1214 stat_diag (name->name);
1215 continue;
1216 }
1217 if (S_ISDIR (st.stat.st_mode))
1218 {
1219 int dir_fd = openat (chdir_fd, name->name,
1220 open_read_flags | O_DIRECTORY);
1221 if (dir_fd < 0)
1222 open_diag (name->name);
1223 else
1224 {
1225 st.fd = dir_fd;
1226 if (fstat (dir_fd, &st.stat) != 0)
1227 stat_diag (name->name);
1228 else if (O_DIRECTORY || S_ISDIR (st.stat.st_mode))
1229 {
1230 st.orig_file_name = xstrdup (name->name);
1231 name->found_count++;
1232 add_hierarchy_to_namelist (&st, name);
1233 }
1234 }
1235 }
1236
1237 tar_stat_destroy (&st);
1238 }
1239
1240 namelist = merge_sort (namelist, num_names, compare_names);
1241
1242 num_names = 0;
1243 nametab = hash_initialize (0, 0,
1244 name_hash,
1245 name_compare, NULL);
1246 for (name = namelist; name; name = next_name)
1247 {
1248 next_name = name->next;
1249 name->caname = normalize_filename (name->name);
1250 if (prev_name)
1251 {
1252 struct name *p = hash_lookup (nametab, name);
1253 if (p)
1254 {
1255 /* Keep the one listed in the command line */
1256 if (!name->parent)
1257 {
1258 if (p->child)
1259 rebase_child_list (p->child, name);
1260 hash_delete (nametab, name);
1261 /* FIXME: remove_directory (p->caname); ? */
1262 remname (p);
1263 free_name (p);
1264 num_names--;
1265 }
1266 else
1267 {
1268 if (name->child)
1269 rebase_child_list (name->child, p);
1270 /* FIXME: remove_directory (name->caname); ? */
1271 remname (name);
1272 free_name (name);
1273 continue;
1274 }
1275 }
1276 }
1277 name->found_count = 0;
1278 if (!hash_insert (nametab, name))
1279 xalloc_die ();
1280 prev_name = name;
1281 num_names++;
1282 }
1283 nametail = prev_name;
1284 hash_free (nametab);
1285
1286 namelist = merge_sort (namelist, num_names, compare_names_found);
1287
1288 if (listed_incremental_option)
1289 {
1290 for (name = namelist; name && name->name[0] == 0; name++)
1291 ;
1292 if (name)
1293 append_incremental_renames (name->directory);
1294 }
1295 }
1296
1297 /* This is like name_match, except that
1298 1. It returns a pointer to the name it matched, and doesn't set FOUND
1299 in structure. The caller will have to do that if it wants to.
1300 2. If the namelist is empty, it returns null, unlike name_match, which
1301 returns TRUE. */
1302 struct name *
1303 name_scan (const char *file_name)
1304 {
1305 size_t length = strlen (file_name);
1306
1307 while (1)
1308 {
1309 struct name *cursor = namelist_match (file_name, length);
1310 if (cursor)
1311 return cursor;
1312
1313 /* Filename from archive not found in namelist. If we have the whole
1314 namelist here, just return 0. Otherwise, read the next name in and
1315 compare it. If this was the last name, namelist->found_count will
1316 remain on. If not, we loop to compare the newly read name. */
1317
1318 if (same_order_option && namelist && namelist->found_count)
1319 {
1320 name_gather (); /* read one more */
1321 if (namelist->found_count)
1322 return 0;
1323 }
1324 else
1325 return 0;
1326 }
1327 }
1328
1329 /* This returns a name from the namelist which doesn't have ->found
1330 set. It sets ->found before returning, so successive calls will
1331 find and return all the non-found names in the namelist. */
1332 struct name *gnu_list_name;
1333
1334 struct name const *
1335 name_from_list (void)
1336 {
1337 if (!gnu_list_name)
1338 gnu_list_name = namelist;
1339 while (gnu_list_name
1340 && (gnu_list_name->found_count || gnu_list_name->name[0] == 0))
1341 gnu_list_name = gnu_list_name->next;
1342 if (gnu_list_name)
1343 {
1344 gnu_list_name->found_count++;
1345 chdir_do (gnu_list_name->change_dir);
1346 return gnu_list_name;
1347 }
1348 return NULL;
1349 }
1350
1351 void
1352 blank_name_list (void)
1353 {
1354 struct name *name;
1355
1356 gnu_list_name = 0;
1357 for (name = namelist; name; name = name->next)
1358 name->found_count = 0;
1359 }
1360
1361 /* Yield a newly allocated file name consisting of FILE_NAME concatenated to
1362 NAME, with an intervening slash if FILE_NAME does not already end in one. */
1363 char *
1364 new_name (const char *file_name, const char *name)
1365 {
1366 size_t file_name_len = strlen (file_name);
1367 size_t namesize = strlen (name) + 1;
1368 int slash = file_name_len && ! ISSLASH (file_name[file_name_len - 1]);
1369 char *buffer = xmalloc (file_name_len + slash + namesize);
1370 memcpy (buffer, file_name, file_name_len);
1371 buffer[file_name_len] = '/';
1372 memcpy (buffer + file_name_len + slash, name, namesize);
1373 return buffer;
1374 }
1375
1376 /* Return nonzero if file NAME is excluded. */
1377 bool
1378 excluded_name (char const *name)
1379 {
1380 return excluded_file_name (excluded, name + FILE_SYSTEM_PREFIX_LEN (name));
1381 }
1382 \f
1383
1384 /* Return the size of the prefix of FILE_NAME that is removed after
1385 stripping NUM leading file name components. NUM must be
1386 positive. */
1387
1388 size_t
1389 stripped_prefix_len (char const *file_name, size_t num)
1390 {
1391 char const *p = file_name + FILE_SYSTEM_PREFIX_LEN (file_name);
1392 while (ISSLASH (*p))
1393 p++;
1394 while (*p)
1395 {
1396 bool slash = ISSLASH (*p);
1397 p++;
1398 if (slash)
1399 {
1400 if (--num == 0)
1401 return p - file_name;
1402 while (ISSLASH (*p))
1403 p++;
1404 }
1405 }
1406 return -1;
1407 }
1408 \f
1409 /* Return nonzero if NAME contains ".." as a file name component. */
1410 bool
1411 contains_dot_dot (char const *name)
1412 {
1413 char const *p = name + FILE_SYSTEM_PREFIX_LEN (name);
1414
1415 for (;; p++)
1416 {
1417 if (p[0] == '.' && p[1] == '.' && (ISSLASH (p[2]) || !p[2]))
1418 return 1;
1419
1420 while (! ISSLASH (*p))
1421 {
1422 if (! *p++)
1423 return 0;
1424 }
1425 }
1426 }
This page took 0.094516 seconds and 4 git commands to generate.