]> Dogcows Code - chaz/tar/blob - src/extract.c
Further rewrite
[chaz/tar] / src / extract.c
1 /* Extract files from a tar archive.
2
3 Copyright (C) 1988, 1992, 1993, 1994, 1996, 1997, 1998, 1999, 2000,
4 2001, 2003, 2004 Free Software Foundation, Inc.
5
6 Written by John Gilmore, on 1985-11-19.
7
8 This program is free software; you can redistribute it and/or modify it
9 under the terms of the GNU General Public License as published by the
10 Free Software Foundation; either version 2, or (at your option) any later
11 version.
12
13 This program is distributed in the hope that it will be useful, but
14 WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General
16 Public License for more details.
17
18 You should have received a copy of the GNU General Public License along
19 with this program; if not, write to the Free Software Foundation, Inc.,
20 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. */
21
22 #include <system.h>
23 #include <quotearg.h>
24 #include <errno.h>
25 #include <xgetcwd.h>
26
#if HAVE_UTIME_H
# include <utime.h>
#else
/* Replacement for hosts lacking <utime.h>: the pair of time stamps
   (access time, modification time) that is handed to utime.  */
struct utimbuf
{
  long actime;
  long modtime;
};
#endif
36
37 #include "common.h"
38
/* True if our effective uid is 0.  */
bool we_are_root;

/* Umask applied when creating new directories.  */
static mode_t newdir_umask;

/* Current umask (which is set to 0 if -p).  */
static mode_t current_umask;
42
/* What we know about the permissions of a file being extracted.  */
enum permstatus
{
  /* The file may have existed before extraction, so its permissions
     are unknown.  */
  UNKNOWN_PERMSTATUS,

  /* We created the file ourselves, using the permissions recorded in
     the archive.  */
  ARCHIVED_PERMSTATUS,

  /* The file is an intermediate directory for which the archive
     specified no permissions.  */
  INTERDIR_PERMSTATUS
};
56
57 /* List of directories whose statuses we need to extract after we've
58 finished extracting their subsidiary files. If you consider each
59 contiguous subsequence of elements of the form [D]?[^D]*, where [D]
60 represents an element where AFTER_SYMLINKS is nonzero and [^D]
61 represents an element where AFTER_SYMLINKS is zero, then the head
62 of the subsequence has the longest name, and each non-head element
63 in the prefix is an ancestor (in the directory hierarchy) of the
64 preceding element. */
65
66 struct delayed_set_stat
67 {
68 struct delayed_set_stat *next;
69 struct stat stat_info;
70 size_t file_name_len;
71 mode_t invert_permissions;
72 enum permstatus permstatus;
73 bool after_symlinks;
74 char file_name[1];
75 };
76
77 static struct delayed_set_stat *delayed_set_stat_head;
78
/* A symbolic link whose creation has been postponed; a placeholder
   file stands in for it until extraction is finished.  */
struct delayed_symlink
{
  /* Next postponed symbolic link, or null.  */
  struct delayed_symlink *next;

  /* Identity of the placeholder: its device, inode number and
     last-modified time.  */
  dev_t dev;
  ino_t ino;
  time_t mtime;

  /* Owner and group that the symbolic link should end up with.  */
  uid_t uid;
  gid_t gid;

  /* Names under which this link is to appear.  All of them are to be
     hard-linked together.  */
  struct string_list *sources;

  /* What the link should point to; the structure is over-allocated
     to hold the whole string.  */
  char target[1];
};

/* Head of the list of postponed symbolic links.  */
static struct delayed_symlink *delayed_symlink_head;
103
/* Singly linked list of strings.  Each node is over-allocated so that
   STRING holds the whole null-terminated text.  */
struct string_list
{
  /* Next node, or null at the end of the list.  */
  struct string_list *next;

  /* The string itself.  */
  char string[1];
};
109
110 /* Set up to extract files. */
111 void
112 extr_init (void)
113 {
114 we_are_root = geteuid () == 0;
115 same_permissions_option += we_are_root;
116 same_owner_option += we_are_root;
117
118 /* Save 'root device' to avoid purging mount points.
119 FIXME: Should the same be done after handling -C option ? */
120 if (one_file_system_option)
121 {
122 struct stat st;
123 char *dir = xgetcwd ();
124
125 if (deref_stat (true, dir, &st))
126 stat_diag (dir);
127 else
128 root_device = st.st_dev;
129 }
130
131 /* Option -p clears the kernel umask, so it does not affect proper
132 restoration of file permissions. New intermediate directories will
133 comply with umask at start of program. */
134
135 newdir_umask = umask (0);
136 if (0 < same_permissions_option)
137 current_umask = 0;
138 else
139 {
140 umask (newdir_umask); /* restore the kernel umask */
141 current_umask = newdir_umask;
142 }
143 }
144
145 /* If restoring permissions, restore the mode for FILE_NAME from
146 information given in *STAT_INFO (where *CUR_INFO gives
147 the current status if CUR_INFO is nonzero); otherwise invert the
148 INVERT_PERMISSIONS bits from the file's current permissions.
149 PERMSTATUS specifies the status of the file's permissions.
150 TYPEFLAG specifies the type of the file. */
151 static void
152 set_mode (char const *file_name,
153 struct stat const *stat_info,
154 struct stat const *cur_info,
155 mode_t invert_permissions, enum permstatus permstatus,
156 char typeflag)
157 {
158 mode_t mode;
159
160 if (0 < same_permissions_option
161 && permstatus != INTERDIR_PERMSTATUS)
162 {
163 mode = stat_info->st_mode;
164
165 /* If we created the file and it has a usual mode, then its mode
166 is normally set correctly already. But on many hosts, some
167 directories inherit the setgid bits from their parents, so we
168 we must set directories' modes explicitly. */
169 if (permstatus == ARCHIVED_PERMSTATUS
170 && ! (mode & ~ MODE_RWX)
171 && typeflag != DIRTYPE
172 && typeflag != GNUTYPE_DUMPDIR)
173 return;
174 }
175 else if (! invert_permissions)
176 return;
177 else
178 {
179 /* We must inspect a directory's current permissions, since the
180 directory may have inherited its setgid bit from its parent.
181
182 INVERT_PERMISSIONS happens to be nonzero only for directories
183 that we created, so there's no point optimizing this code for
184 other cases. */
185 struct stat st;
186 if (! cur_info)
187 {
188 if (stat (file_name, &st) != 0)
189 {
190 stat_error (file_name);
191 return;
192 }
193 cur_info = &st;
194 }
195 mode = cur_info->st_mode ^ invert_permissions;
196 }
197
198 if (chmod (file_name, mode) != 0)
199 chmod_error_details (file_name, mode);
200 }
201
202 /* Check time after successfully setting FILE_NAME's time stamp to T. */
203 static void
204 check_time (char const *file_name, time_t t)
205 {
206 time_t now;
207 if (t <= 0)
208 WARN ((0, 0, _("%s: implausibly old time stamp %s"),
209 file_name, tartime (t)));
210 else if (start_time < t && (now = time (0)) < t)
211 WARN ((0, 0, _("%s: time stamp %s is %lu s in the future"),
212 file_name, tartime (t), (unsigned long) (t - now)));
213 }
214
215 /* Restore stat attributes (owner, group, mode and times) for
216 FILE_NAME, using information given in *STAT_INFO.
217 If CUR_INFO is nonzero, *CUR_INFO is the
218 file's currernt status.
219 If not restoring permissions, invert the
220 INVERT_PERMISSIONS bits from the file's current permissions.
221 PERMSTATUS specifies the status of the file's permissions.
222 TYPEFLAG specifies the type of the file. */
223
224 /* FIXME: About proper restoration of symbolic link attributes, we still do
225 not have it right. Pretesters' reports tell us we need further study and
226 probably more configuration. For now, just use lchown if it exists, and
227 punt for the rest. Sigh! */
228
229 static void
230 set_stat (char const *file_name,
231 struct stat const *stat_info,
232 struct stat const *cur_info,
233 mode_t invert_permissions, enum permstatus permstatus,
234 char typeflag)
235 {
236 struct utimbuf utimbuf;
237
238 if (typeflag != SYMTYPE)
239 {
240 /* We do the utime before the chmod because some versions of utime are
241 broken and trash the modes of the file. */
242
243 if (! touch_option && permstatus != INTERDIR_PERMSTATUS)
244 {
245 /* We set the accessed time to `now', which is really the time we
246 started extracting files, unless incremental_option is used, in
247 which case .st_atime is used. */
248
249 /* FIXME: incremental_option should set ctime too, but how? */
250
251 if (incremental_option)
252 utimbuf.actime = stat_info->st_atime;
253 else
254 utimbuf.actime = start_time;
255
256 utimbuf.modtime = stat_info->st_mtime;
257
258 if (utime (file_name, &utimbuf) < 0)
259 utime_error (file_name);
260 else
261 {
262 check_time (file_name, utimbuf.actime);
263 check_time (file_name, utimbuf.modtime);
264 }
265 }
266
267 /* Some systems allow non-root users to give files away. Once this
268 done, it is not possible anymore to change file permissions, so we
269 have to set permissions prior to possibly giving files away. */
270
271 set_mode (file_name, stat_info, cur_info,
272 invert_permissions, permstatus, typeflag);
273 }
274
275 if (0 < same_owner_option && permstatus != INTERDIR_PERMSTATUS)
276 {
277 /* When lchown exists, it should be used to change the attributes of
278 the symbolic link itself. In this case, a mere chown would change
279 the attributes of the file the symbolic link is pointing to, and
280 should be avoided. */
281
282 if (typeflag == SYMTYPE)
283 {
284 #if HAVE_LCHOWN
285 if (lchown (file_name, stat_info->st_uid, stat_info->st_gid) < 0)
286 chown_error_details (file_name,
287 stat_info->st_uid, stat_info->st_gid);
288 #endif
289 }
290 else
291 {
292 if (chown (file_name, stat_info->st_uid, stat_info->st_gid) < 0)
293 chown_error_details (file_name,
294 stat_info->st_uid, stat_info->st_gid);
295
296 /* On a few systems, and in particular, those allowing to give files
297 away, changing the owner or group destroys the suid or sgid bits.
298 So let's attempt setting these bits once more. */
299 if (stat_info->st_mode & (S_ISUID | S_ISGID | S_ISVTX))
300 set_mode (file_name, stat_info, 0,
301 invert_permissions, permstatus, typeflag);
302 }
303 }
304 }
305
306 /* Remember to restore stat attributes (owner, group, mode and times)
307 for the directory FILE_NAME, using information given in *STAT_INFO,
308 once we stop extracting files into that directory.
309 If not restoring permissions, remember to invert the
310 INVERT_PERMISSIONS bits from the file's current permissions.
311 PERMSTATUS specifies the status of the file's permissions. */
312 static void
313 delay_set_stat (char const *file_name, struct stat const *stat_info,
314 mode_t invert_permissions, enum permstatus permstatus)
315 {
316 size_t file_name_len = strlen (file_name);
317 struct delayed_set_stat *data =
318 xmalloc (offsetof (struct delayed_set_stat, file_name)
319 + file_name_len + 1);
320 data->file_name_len = file_name_len;
321 strcpy (data->file_name, file_name);
322 data->invert_permissions = invert_permissions;
323 data->permstatus = permstatus;
324 data->after_symlinks = 0;
325 data->stat_info = *stat_info;
326 data->next = delayed_set_stat_head;
327 delayed_set_stat_head = data;
328 }
329
330 /* Update the delayed_set_stat info for an intermediate directory
331 created within the file name of DIR. The intermediate directory turned
332 out to be the same as this directory, e.g. due to ".." or symbolic
333 links. *DIR_STAT_INFO is the status of the directory. */
334 static void
335 repair_delayed_set_stat (char const *dir,
336 struct stat const *dir_stat_info)
337 {
338 struct delayed_set_stat *data;
339 for (data = delayed_set_stat_head; data; data = data->next)
340 {
341 struct stat st;
342 if (stat (data->file_name, &st) != 0)
343 {
344 stat_error (data->file_name);
345 return;
346 }
347
348 if (st.st_dev == dir_stat_info->st_dev
349 && st.st_ino == dir_stat_info->st_ino)
350 {
351 data->stat_info = current_stat_info.stat;
352 data->invert_permissions =
353 (MODE_RWX & (current_stat_info.stat.st_mode ^ st.st_mode));
354 data->permstatus = ARCHIVED_PERMSTATUS;
355 return;
356 }
357 }
358
359 ERROR ((0, 0, _("%s: Unexpected inconsistency when making directory"),
360 quotearg_colon (dir)));
361 }
362
363 /* After a file/link/symlink/directory creation has failed, see if
364 it's because some required directory was not present, and if so,
365 create all required directories. Return non-zero if a directory
366 was created. */
367 static int
368 make_directories (char *file_name)
369 {
370 char *cursor0 = file_name + FILE_SYSTEM_PREFIX_LEN (file_name);
371 char *cursor; /* points into the file name */
372 int did_something = 0; /* did we do anything yet? */
373 int mode;
374 int invert_permissions;
375 int status;
376
377
378 for (cursor = cursor0; *cursor; cursor++)
379 {
380 if (! ISSLASH (*cursor))
381 continue;
382
383 /* Avoid mkdir of empty string, if leading or double '/'. */
384
385 if (cursor == cursor0 || ISSLASH (cursor[-1]))
386 continue;
387
388 /* Avoid mkdir where last part of file name is "." or "..". */
389
390 if (cursor[-1] == '.'
391 && (cursor == cursor0 + 1 || ISSLASH (cursor[-2])
392 || (cursor[-2] == '.'
393 && (cursor == cursor0 + 2 || ISSLASH (cursor[-3])))))
394 continue;
395
396 *cursor = '\0'; /* truncate the name there */
397 mode = MODE_RWX & ~ newdir_umask;
398 invert_permissions = we_are_root ? 0 : MODE_WXUSR & ~ mode;
399 status = mkdir (file_name, mode ^ invert_permissions);
400
401 if (status == 0)
402 {
403 /* Create a struct delayed_set_stat even if
404 invert_permissions is zero, because
405 repair_delayed_set_stat may need to update the struct. */
406 delay_set_stat (file_name,
407 &current_stat_info.stat /* ignored */,
408 invert_permissions, INTERDIR_PERMSTATUS);
409
410 print_for_mkdir (file_name, cursor - file_name, mode);
411 did_something = 1;
412
413 *cursor = '/';
414 continue;
415 }
416
417 *cursor = '/';
418
419 if (errno == EEXIST)
420 continue; /* Directory already exists. */
421 else if ((errno == ENOSYS /* Automounted dirs on Solaris return
422 this. Reported by Warren Hyde
423 <Warren.Hyde@motorola.com> */
424 || ERRNO_IS_EACCES) /* Turbo C mkdir gives a funny errno. */
425 && access (file_name, W_OK) == 0)
426 continue;
427
428 /* Some other error in the mkdir. We return to the caller. */
429 break;
430 }
431
432 return did_something; /* tell them to retry if we made one */
433 }
434
435 static bool
436 file_newer_p (const char *file_name, struct tar_stat_info *tar_stat)
437 {
438 struct stat st;
439
440 if (stat (file_name, &st))
441 {
442 stat_warn (file_name);
443 return true; /* Be on the safe side */
444 }
445 if (!S_ISDIR (st.st_mode)
446 && st.st_mtime >= tar_stat->stat.st_mtime)
447 {
448 return true;
449 }
450 return false;
451 }
452
453 /* Attempt repairing what went wrong with the extraction. Delete an
454 already existing file or create missing intermediate directories.
455 Return nonzero if we somewhat increased our chances at a successful
456 extraction. errno is properly restored on zero return. */
457 static int
458 maybe_recoverable (char *file_name, int *interdir_made)
459 {
460 int e = errno;
461
462 if (*interdir_made)
463 return 0;
464
465 switch (errno)
466 {
467 case EEXIST:
468 /* Remove an old file, if the options allow this. */
469
470 switch (old_files_option)
471 {
472 case KEEP_OLD_FILES:
473 return 0;
474
475 case KEEP_NEWER_FILES:
476 if (file_newer_p (file_name, &current_stat_info))
477 {
478 errno = e;
479 return 0;
480 }
481 /* FALL THROUGH */
482
483 case DEFAULT_OLD_FILES:
484 case NO_OVERWRITE_DIR_OLD_FILES:
485 case OVERWRITE_OLD_FILES:
486 {
487 int r = remove_any_file (file_name, ORDINARY_REMOVE_OPTION);
488 errno = EEXIST;
489 return r;
490 }
491
492 case UNLINK_FIRST_OLD_FILES:
493 break;
494 }
495
496 case ENOENT:
497 /* Attempt creating missing intermediate directories. */
498 if (! make_directories (file_name))
499 {
500 errno = ENOENT;
501 return 0;
502 }
503 *interdir_made = 1;
504 return 1;
505
506 default:
507 /* Just say we can't do anything about it... */
508
509 return 0;
510 }
511 }
512
513 /* Fix the statuses of all directories whose statuses need fixing, and
514 which are not ancestors of FILE_NAME. If AFTER_SYMLINKS is
515 nonzero, do this for all such directories; otherwise, stop at the
516 first directory that is marked to be fixed up only after delayed
517 symlinks are applied. */
518 static void
519 apply_nonancestor_delayed_set_stat (char const *file_name, bool after_symlinks)
520 {
521 size_t file_name_len = strlen (file_name);
522 bool check_for_renamed_directories = 0;
523
524 while (delayed_set_stat_head)
525 {
526 struct delayed_set_stat *data = delayed_set_stat_head;
527 bool skip_this_one = 0;
528 struct stat st;
529 struct stat const *cur_info = 0;
530
531 check_for_renamed_directories |= data->after_symlinks;
532
533 if (after_symlinks < data->after_symlinks
534 || (data->file_name_len < file_name_len
535 && file_name[data->file_name_len]
536 && (ISSLASH (file_name[data->file_name_len])
537 || ISSLASH (file_name[data->file_name_len - 1]))
538 && memcmp (file_name, data->file_name, data->file_name_len) == 0))
539 break;
540
541 if (check_for_renamed_directories)
542 {
543 cur_info = &st;
544 if (stat (data->file_name, &st) != 0)
545 {
546 stat_error (data->file_name);
547 skip_this_one = 1;
548 }
549 else if (! (st.st_dev == data->stat_info.st_dev
550 && (st.st_ino == data->stat_info.st_ino)))
551 {
552 ERROR ((0, 0,
553 _("%s: Directory renamed before its status could be extracted"),
554 quotearg_colon (data->file_name)));
555 skip_this_one = 1;
556 }
557 }
558
559 if (! skip_this_one)
560 set_stat (data->file_name, &data->stat_info, cur_info,
561 data->invert_permissions, data->permstatus, DIRTYPE);
562
563 delayed_set_stat_head = data->next;
564 free (data);
565 }
566 }
567
568 \f
569
570 /* Extractor functions for various member types */
571
572 static int
573 extract_dir (char *file_name, int typeflag)
574 {
575 int status;
576 mode_t mode;
577 int interdir_made = 0;
578
579 if (incremental_option)
580 /* Read the entry and delete files that aren't listed in the archive. */
581 purge_directory (file_name);
582 else if (typeflag == GNUTYPE_DUMPDIR)
583 skip_member ();
584
585 mode = (current_stat_info.stat.st_mode | (we_are_root ? 0 : MODE_WXUSR)) & MODE_RWX;
586
587 while ((status = mkdir (file_name, mode)))
588 {
589 if (errno == EEXIST
590 && (interdir_made
591 || old_files_option == DEFAULT_OLD_FILES
592 || old_files_option == OVERWRITE_OLD_FILES))
593 {
594 struct stat st;
595 if (stat (file_name, &st) == 0)
596 {
597 if (interdir_made)
598 {
599 repair_delayed_set_stat (file_name, &st);
600 return 0;
601 }
602 if (S_ISDIR (st.st_mode))
603 {
604 mode = st.st_mode & ~ current_umask;
605 break;
606 }
607 }
608 errno = EEXIST;
609 }
610
611 if (maybe_recoverable (file_name, &interdir_made))
612 continue;
613
614 if (errno != EEXIST)
615 {
616 mkdir_error (file_name);
617 return 1;
618 }
619 break;
620 }
621
622 if (status == 0
623 || old_files_option == DEFAULT_OLD_FILES
624 || old_files_option == OVERWRITE_OLD_FILES)
625 delay_set_stat (file_name, &current_stat_info.stat,
626 MODE_RWX & (mode ^ current_stat_info.stat.st_mode),
627 (status == 0
628 ? ARCHIVED_PERMSTATUS
629 : UNKNOWN_PERMSTATUS));
630
631 return status;
632 }
633
634
635 static int
636 open_output_file (char *file_name, int typeflag)
637 {
638 int fd;
639 int openflag = (O_WRONLY | O_BINARY | O_CREAT
640 | (old_files_option == OVERWRITE_OLD_FILES
641 ? O_TRUNC
642 : O_EXCL));
643 mode_t mode = current_stat_info.stat.st_mode & MODE_RWX & ~ current_umask;
644
645 #if O_CTG
646 /* Contiguous files (on the Masscomp) have to specify the size in
647 the open call that creates them. */
648
649 if (typeflag == CONTTYPE)
650 fd = open (file_name, openflag | O_CTG, mode, current_stat_info.stat.st_size);
651 else
652 fd = open (file_name, openflag, mode);
653
654 #else /* not O_CTG */
655 if (typeflag == CONTTYPE)
656 {
657 static int conttype_diagnosed;
658
659 if (!conttype_diagnosed)
660 {
661 conttype_diagnosed = 1;
662 WARN ((0, 0, _("Extracting contiguous files as regular files")));
663 }
664 }
665 fd = open (file_name, openflag, mode);
666
667 #endif /* not O_CTG */
668
669 return fd;
670 }
671
672 static int
673 extract_file (char *file_name, int typeflag)
674 {
675 int fd;
676 off_t size;
677 union block *data_block;
678 int status;
679 size_t count;
680 size_t written;
681 int interdir_made = 0;
682
683 /* FIXME: deal with protection issues. */
684
685 if (to_stdout_option)
686 fd = STDOUT_FILENO;
687 else
688 {
689 do
690 fd = open_output_file (file_name, typeflag);
691 while (fd < 0 && maybe_recoverable (file_name, &interdir_made));
692
693 if (fd < 0)
694 {
695 open_error (file_name);
696 return 1;
697 }
698 }
699
700 if (current_stat_info.is_sparse)
701 sparse_extract_file (fd, &current_stat_info, &size);
702 else
703 for (size = current_stat_info.stat.st_size; size > 0; )
704 {
705 if (multi_volume_option)
706 {
707 assign_string (&save_name, current_stat_info.file_name);
708 save_totsize = current_stat_info.stat.st_size;
709 save_sizeleft = size;
710 }
711
712 /* Locate data, determine max length writeable, write it,
713 block that we have used the data, then check if the write
714 worked. */
715
716 data_block = find_next_block ();
717 if (! data_block)
718 {
719 ERROR ((0, 0, _("Unexpected EOF in archive")));
720 break; /* FIXME: What happens, then? */
721 }
722
723 written = available_space_after (data_block);
724
725 if (written > size)
726 written = size;
727 errno = 0;
728 count = full_write (fd, data_block->buffer, written);
729 size -= count;
730
731 set_next_block_after ((union block *)
732 (data_block->buffer + written - 1));
733 if (count != written)
734 {
735 write_error_details (file_name, count, written); /* FIXME: shouldn't we
736 restore from backup? */
737 break;
738 }
739 }
740
741 skip_file (size);
742
743 if (multi_volume_option)
744 assign_string (&save_name, 0);
745
746 /* If writing to stdout, don't try to do anything to the filename;
747 it doesn't exist, or we don't want to touch it anyway. */
748
749 if (to_stdout_option)
750 return 0;
751
752 status = close (fd);
753 if (status < 0)
754 close_error (file_name);
755
756 set_stat (file_name, &current_stat_info.stat, 0, 0,
757 (old_files_option == OVERWRITE_OLD_FILES ?
758 UNKNOWN_PERMSTATUS : ARCHIVED_PERMSTATUS),
759 typeflag);
760
761 return status;
762 }
763
764 static int
765 extract_link (char *file_name, int typeflag)
766 {
767 char const *link_name = safer_name_suffix (current_stat_info.link_name, true);
768 int interdir_made = 0;
769
770 do
771 {
772 struct stat st1, st2;
773 int e;
774 int status = link (link_name, file_name);
775 e = errno;
776
777 if (status == 0)
778 {
779 struct delayed_symlink *ds = delayed_symlink_head;
780 if (ds && lstat (link_name, &st1) == 0)
781 for (; ds; ds = ds->next)
782 if (ds->dev == st1.st_dev
783 && ds->ino == st1.st_ino
784 && ds->mtime == st1.st_mtime)
785 {
786 struct string_list *p = xmalloc (offsetof (struct string_list, string)
787 + strlen (file_name) + 1);
788 strcpy (p->string, file_name);
789 p->next = ds->sources;
790 ds->sources = p;
791 break;
792 }
793 return 0;
794 }
795 else if ((e == EEXIST && strcmp (link_name, file_name) == 0)
796 || (lstat (link_name, &st1) == 0
797 && lstat (file_name, &st2) == 0
798 && st1.st_dev == st2.st_dev
799 && st1.st_ino == st2.st_ino))
800 return 0;
801
802 errno = e;
803 }
804 while (maybe_recoverable (file_name, &interdir_made));
805
806 if (!(incremental_option && errno == EEXIST))
807 {
808 link_error (link_name, file_name);
809 return 1;
810 }
811 return 0;
812 }
813
/* Extract the symbolic-link member FILE_NAME.

   Where symlinks are available, a link whose target is neither
   absolute nor contains ".." (or any link, when absolute_names_option
   is set) is created at once.  Any other link is considered
   potentially dangerous: an empty placeholder file is created in its
   place and the real link is recorded on the delayed_symlink list.
   Where symlinks are not available, the member is extracted as a hard
   link instead.  Return 0 on success, nonzero on failure.  */
static int
extract_symlink (char *file_name, int typeflag)
{
#ifdef HAVE_SYMLINK
  int status;
  int interdir_made = 0;

  if (absolute_names_option
      || (! IS_ABSOLUTE_FILE_NAME (current_stat_info.link_name)
          && ! contains_dot_dot (current_stat_info.link_name)))
    {
      do
        status = symlink (current_stat_info.link_name, file_name);
      while (status && maybe_recoverable (file_name, &interdir_made));

      if (status != 0)
        symlink_error (current_stat_info.link_name, file_name);
      else
        set_stat (file_name, &current_stat_info.stat, 0, 0, 0, SYMTYPE);
    }
  else
    {
      /* This symbolic link is potentially dangerous.  Don't
         create it now; instead, create a placeholder file, which
         will be replaced after other extraction is done.  */
      struct stat placeholder;
      int fd;

      do
        fd = open (file_name, O_WRONLY | O_CREAT | O_EXCL, 0);
      while (fd < 0 && maybe_recoverable (file_name, &interdir_made));

      status = -1;
      if (fd < 0)
        open_error (file_name);
      else if (fstat (fd, &placeholder) != 0)
        {
          stat_error (file_name);
          close (fd);
        }
      else if (close (fd) != 0)
        close_error (file_name);
      else
        {
          struct delayed_set_stat *h;
          size_t target_size = strlen (current_stat_info.link_name) + 1;
          size_t source_size = strlen (file_name) + 1;
          struct delayed_symlink *p
            = xmalloc (offsetof (struct delayed_symlink, target)
                       + target_size);

          p->next = delayed_symlink_head;
          delayed_symlink_head = p;
          p->dev = placeholder.st_dev;
          p->ino = placeholder.st_ino;
          p->mtime = placeholder.st_mtime;
          p->uid = current_stat_info.stat.st_uid;
          p->gid = current_stat_info.stat.st_gid;
          p->sources = xmalloc (offsetof (struct string_list, string)
                                + source_size);
          p->sources->next = 0;
          strcpy (p->sources->string, file_name);
          strcpy (p->target, current_stat_info.link_name);

          /* If the most recently queued directory directly contains
             the placeholder, mark it and the entries after it, up to
             the first one already marked, to be fixed up only after
             the delayed symlinks are applied, recording their current
             device and inode numbers.  */
          h = delayed_set_stat_head;
          if (h && ! h->after_symlinks
              && strncmp (file_name, h->file_name, h->file_name_len) == 0
              && ISSLASH (file_name[h->file_name_len])
              && (base_name (file_name) == file_name + h->file_name_len + 1))
            {
              do
                {
                  struct stat dir_st;

                  h->after_symlinks = 1;

                  if (stat (h->file_name, &dir_st) != 0)
                    stat_error (h->file_name);
                  else
                    {
                      h->stat_info.st_dev = dir_st.st_dev;
                      h->stat_info.st_ino = dir_st.st_ino;
                    }

                  h = h->next;
                }
              while (h && ! h->after_symlinks);
            }

          status = 0;
        }
    }

  return status;

#else
  /* Issue the warning only once per run.  */
  static int warned_once;

  if (!warned_once)
    {
      warned_once = 1;
      WARN ((0, 0, _("Attempting extraction of symbolic links as hard links")));
    }
  return extract_link (file_name, typeflag);
#endif
}
912
#if S_IFCHR || S_IFBLK
/* Extract the device-node member FILE_NAME with mknod, using the
   mode and device number of the member being extracted, and restore
   its attributes on success.  Return the status of the last mknod
   call.  */
static int
extract_node (char *file_name, int typeflag)
{
  int status;
  int interdir_made = 0;

  for (;;)
    {
      status = mknod (file_name, current_stat_info.stat.st_mode,
                      current_stat_info.stat.st_rdev);
      if (status == 0)
        break;
      if (! maybe_recoverable (file_name, &interdir_made))
        break;
    }

  if (status == 0)
    set_stat (file_name, &current_stat_info.stat, 0, 0,
              ARCHIVED_PERMSTATUS, typeflag);
  else
    mknod_error (file_name);

  return status;
}
#endif
932
#if HAVE_MKFIFO || defined mkfifo
/* Extract the FIFO member FILE_NAME with mkfifo, using the mode of
   the member being extracted, and restore its attributes on success.
   Return the status of the last mkfifo call.  */
static int
extract_fifo (char *file_name, int typeflag)
{
  int status;
  int interdir_made = 0;

  do
    status = mkfifo (file_name, current_stat_info.stat.st_mode);
  while (status && maybe_recoverable (file_name, &interdir_made));

  if (status != 0)
    mkfifo_error (file_name);
  else
    set_stat (file_name, &current_stat_info.stat, NULL, 0,
              ARCHIVED_PERMSTATUS, typeflag);

  return status;
}
#endif
952
/* Adapter giving extract_mangle the extractor signature.  Neither
   FILE_NAME nor TYPEFLAG is used.  Always return 0.  */
static int
extract_mangle_wrapper (char *file_name, int typeflag)
{
  (void) file_name;
  (void) typeflag;

  extract_mangle ();
  return 0;
}
959
960
/* Extractor for members that cannot be extracted.  Neither FILE_NAME
   nor TYPEFLAG is used.  Always return 1, i.e. failure.  */
static int
extract_failure (char *file_name, int typeflag)
{
  (void) file_name;
  (void) typeflag;

  return 1;
}
966
/* Type of the functions that extract one archive member: they take
   the member's file name and type flag, and return nonzero if the
   extraction failed.  */
typedef int (*tar_extractor_t) (char *file_name, int typeflag);
968
969 \f
970
971 /* Prepare to extract a file. Find extractor function.
972 Return zero if extraction should not proceed. */
973
974 static int
975 prepare_to_extract (char const *file_name, int typeflag, tar_extractor_t *fun)
976 {
977 int rc = 1;
978
979 if (to_stdout_option)
980 rc = 0;
981
982 /* Select the extractor */
983 switch (typeflag)
984 {
985 case GNUTYPE_SPARSE:
986 *fun = extract_file;
987 rc = 1;
988 break;
989
990 case AREGTYPE:
991 case REGTYPE:
992 case CONTTYPE:
993 /* Appears to be a file. But BSD tar uses the convention that a slash
994 suffix means a directory. */
995 if (current_stat_info.had_trailing_slash)
996 *fun = extract_dir;
997 else
998 {
999 *fun = extract_file;
1000 rc = 1;
1001 }
1002 break;
1003
1004 case SYMTYPE:
1005 *fun = extract_symlink;
1006 break;
1007
1008 case LNKTYPE:
1009 *fun = extract_link;
1010 break;
1011
1012 #if S_IFCHR
1013 case CHRTYPE:
1014 current_stat_info.stat.st_mode |= S_IFCHR;
1015 *fun = extract_node;
1016 break;
1017 #endif
1018
1019 #if S_IFBLK
1020 case BLKTYPE:
1021 current_stat_info.stat.st_mode |= S_IFBLK;
1022 *fun = extract_node;
1023 break;
1024 #endif
1025
1026 #if HAVE_MKFIFO || defined mkfifo
1027 case FIFOTYPE:
1028 *fun = extract_fifo;
1029 break;
1030 #endif
1031
1032 case DIRTYPE:
1033 case GNUTYPE_DUMPDIR:
1034 *fun = extract_dir;
1035 break;
1036
1037 case GNUTYPE_VOLHDR:
1038 if (verbose_option)
1039 fprintf (stdlis, _("Reading %s\n"), quote (current_stat_info.file_name));
1040 *fun = NULL;
1041 break;
1042
1043 case GNUTYPE_NAMES:
1044 *fun = extract_mangle_wrapper;
1045 break;
1046
1047 case GNUTYPE_MULTIVOL:
1048 ERROR ((0, 0,
1049 _("%s: Cannot extract -- file is continued from another volume"),
1050 quotearg_colon (current_stat_info.file_name)));
1051 *fun = extract_failure;
1052 break;
1053
1054 case GNUTYPE_LONGNAME:
1055 case GNUTYPE_LONGLINK:
1056 ERROR ((0, 0, _("Unexpected long name header")));
1057 *fun = extract_failure;
1058 break;
1059
1060 default:
1061 WARN ((0, 0,
1062 _("%s: Unknown file type '%c', extracted as normal file"),
1063 quotearg_colon (file_name), typeflag));
1064 *fun = extract_file;
1065 }
1066
1067 /* Determine whether the extraction should proceed */
1068 if (rc == 0)
1069 return 0;
1070
1071 switch (old_files_option)
1072 {
1073 case UNLINK_FIRST_OLD_FILES:
1074 if (!remove_any_file (file_name,
1075 recursive_unlink_option ? RECURSIVE_REMOVE_OPTION
1076 : ORDINARY_REMOVE_OPTION)
1077 && errno && errno != ENOENT)
1078 {
1079 unlink_error (file_name);
1080 return 0;
1081 }
1082 break;
1083
1084 case KEEP_NEWER_FILES:
1085 if (file_newer_p (file_name, &current_stat_info))
1086 {
1087 WARN ((0, 0, _("Current %s is newer"), quote (file_name)));
1088 return 0;
1089 }
1090 break;
1091
1092 default:
1093 break;
1094 }
1095
1096 return 1;
1097 }
1098
1099 /* Extract a file from the archive. */
1100 void
1101 extract_archive (void)
1102 {
1103 char typeflag;
1104 char *file_name;
1105 tar_extractor_t fun;
1106
1107 set_next_block_after (current_header);
1108 decode_header (current_header, &current_stat_info, &current_format, 1);
1109
1110 if (interactive_option && !confirm ("extract", current_stat_info.file_name))
1111 {
1112 skip_member ();
1113 return;
1114 }
1115
1116 /* Print the block from current_header and current_stat. */
1117
1118 if (verbose_option)
1119 print_header (&current_stat_info, -1);
1120
1121 file_name = safer_name_suffix (current_stat_info.file_name, false);
1122 if (strip_name_components)
1123 {
1124 size_t prefix_len = stripped_prefix_len (file_name, strip_name_components);
1125 if (prefix_len == (size_t) -1)
1126 {
1127 skip_member ();
1128 return;
1129 }
1130 file_name += prefix_len;
1131 }
1132
1133 apply_nonancestor_delayed_set_stat (file_name, 0);
1134
1135 /* Take a safety backup of a previously existing file. */
1136
1137 if (backup_option && !to_stdout_option)
1138 if (!maybe_backup_file (file_name, 0))
1139 {
1140 int e = errno;
1141 ERROR ((0, e, _("%s: Was unable to backup this file"),
1142 quotearg_colon (file_name)));
1143 skip_member ();
1144 return;
1145 }
1146
1147 /* Extract the archive entry according to its type. */
1148
1149 /* KLUDGE */
1150 typeflag = sparse_member_p (&current_stat_info) ?
1151 GNUTYPE_SPARSE : current_header->header.typeflag;
1152
1153 if (prepare_to_extract (file_name, typeflag, &fun))
1154 {
1155 if (fun && (*fun) (file_name, typeflag) && backup_option)
1156 undo_last_backup ();
1157 }
1158 else
1159 skip_member ();
1160
1161 }
1162
1163 /* Extract the symbolic links whose final extraction were delayed. */
1164 static void
1165 apply_delayed_symlinks (void)
1166 {
1167 struct delayed_symlink *ds;
1168
1169 for (ds = delayed_symlink_head; ds; )
1170 {
1171 struct string_list *sources = ds->sources;
1172 char const *valid_source = 0;
1173
1174 for (sources = ds->sources; sources; sources = sources->next)
1175 {
1176 char const *source = sources->string;
1177 struct stat st;
1178
1179 /* Make sure the placeholder file is still there. If not,
1180 don't create a symlink, as the placeholder was probably
1181 removed by a later extraction. */
1182 if (lstat (source, &st) == 0
1183 && st.st_dev == ds->dev
1184 && st.st_ino == ds->ino
1185 && st.st_mtime == ds->mtime)
1186 {
1187 /* Unlink the placeholder, then create a hard link if possible,
1188 a symbolic link otherwise. */
1189 if (unlink (source) != 0)
1190 unlink_error (source);
1191 else if (valid_source && link (valid_source, source) == 0)
1192 ;
1193 else if (symlink (ds->target, source) != 0)
1194 symlink_error (ds->target, source);
1195 else
1196 {
1197 valid_source = source;
1198 st.st_uid = ds->uid;
1199 st.st_gid = ds->gid;
1200 set_stat (source, &st, 0, 0, 0, SYMTYPE);
1201 }
1202 }
1203 }
1204
1205 for (sources = ds->sources; sources; )
1206 {
1207 struct string_list *next = sources->next;
1208 free (sources);
1209 sources = next;
1210 }
1211
1212 {
1213 struct delayed_symlink *next = ds->next;
1214 free (ds);
1215 ds = next;
1216 }
1217 }
1218
1219 delayed_symlink_head = 0;
1220 }
1221
/* Finish the extraction of an archive by carrying out all the work
   that was postponed while members were being extracted.  */
void
extract_finish (void)
{
  /* Step 1: fix the status of the ordinary directories that are
     still waiting for it.  */
  apply_nonancestor_delayed_set_stat ("", 0);

  /* Step 2: create the delayed symlinks.  Doing this only now keeps
     them from affecting the status-setting of step 1.  */
  apply_delayed_symlinks ();

  /* Step 3: fix the status of the directories that are ancestors of
     delayed symlinks.  */
  apply_nonancestor_delayed_set_stat ("", 1);
}
1237
1238 void
1239 fatal_exit (void)
1240 {
1241 extract_finish ();
1242 error (TAREXIT_FAILURE, 0, _("Error is not recoverable: exiting now"));
1243 abort ();
1244 }
1245
/* Report that memory is exhausted, then hand over to fatal_exit.  */
void
xalloc_die (void)
{
  error (0, 0, "%s", _("memory exhausted"));
  fatal_exit ();
}
This page took 0.094516 seconds and 5 git commands to generate.