]> Dogcows Code - chaz/tar/blob - src/extract.c
Fix dead loop on extracting existing symlinks with the -k option.
[chaz/tar] / src / extract.c
1 /* Extract files from a tar archive.
2
3 Copyright (C) 1988, 1992, 1993, 1994, 1996, 1997, 1998, 1999, 2000,
4 2001, 2003, 2004, 2005, 2006, 2007, 2010 Free Software Foundation, Inc.
5
6 Written by John Gilmore, on 1985-11-19.
7
8 This program is free software; you can redistribute it and/or modify it
9 under the terms of the GNU General Public License as published by the
10 Free Software Foundation; either version 3, or (at your option) any later
11 version.
12
13 This program is distributed in the hope that it will be useful, but
14 WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General
16 Public License for more details.
17
18 You should have received a copy of the GNU General Public License along
19 with this program; if not, write to the Free Software Foundation, Inc.,
20 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. */
21
22 #include <system.h>
23 #include <quotearg.h>
24 #include <utimens.h>
25 #include <errno.h>
26 #include <xgetcwd.h>
27 #include <priv-set.h>
28
29 #include "common.h"
30
31 static bool we_are_root; /* true if our effective uid == 0 */
32 static mode_t newdir_umask; /* umask when creating new directories */
33 static mode_t current_umask; /* current umask (which is set to 0 if -p) */
34
35 /* Status of the permissions of a file that we are extracting. */
36 enum permstatus
37 {
38 /* This file may have existed already; its permissions are unknown. */
39 UNKNOWN_PERMSTATUS,
40
41 /* This file was created using the permissions from the archive,
42 except with S_IRWXG | S_IRWXO masked out if 0 < same_owner_option. */
43 ARCHIVED_PERMSTATUS,
44
45 /* This is an intermediate directory; the archive did not specify
46 its permissions. */
47 INTERDIR_PERMSTATUS
48 };
49
50 /* List of directories whose statuses we need to extract after we've
51 finished extracting their subsidiary files. If you consider each
52 contiguous subsequence of elements of the form [D]?[^D]*, where [D]
53 represents an element where AFTER_LINKS is nonzero and [^D]
54 represents an element where AFTER_LINKS is zero, then the head
55 of the subsequence has the longest name, and each non-head element
56 in the prefix is an ancestor (in the directory hierarchy) of the
57 preceding element. */
58
59 struct delayed_set_stat
60 {
61 struct delayed_set_stat *next;
62 dev_t dev;
63 ino_t ino;
64 mode_t mode;
65 uid_t uid;
66 gid_t gid;
67 struct timespec atime;
68 struct timespec mtime;
69 size_t file_name_len;
70 mode_t invert_permissions;
71 enum permstatus permstatus;
72 bool after_links;
73 char file_name[1];
74 };
75
76 static struct delayed_set_stat *delayed_set_stat_head;
77
78 /* List of links whose creation we have delayed. */
79 struct delayed_link
80 {
81 /* The next delayed link in the list. */
82 struct delayed_link *next;
83
84 /* The device, inode number and last-modified time of the placeholder. */
85 dev_t dev;
86 ino_t ino;
87 struct timespec mtime;
88
89 /* True if the link is symbolic. */
90 bool is_symlink;
91
92 /* The desired owner and group of the link, if it is a symlink. */
93 uid_t uid;
94 gid_t gid;
95
96 /* A list of sources for this link. The sources are all to be
97 hard-linked together. */
98 struct string_list *sources;
99
100 /* The desired target of the desired link. */
101 char target[1];
102 };
103
104 static struct delayed_link *delayed_link_head;
105
106 struct string_list
107 {
108 struct string_list *next;
109 char string[1];
110 };
111
112 /* Set up to extract files. */
113 void
114 extr_init (void)
115 {
116 we_are_root = geteuid () == 0;
117 same_permissions_option += we_are_root;
118 same_owner_option += we_are_root;
119
120 /* Option -p clears the kernel umask, so it does not affect proper
121 restoration of file permissions. New intermediate directories will
122 comply with umask at start of program. */
123
124 newdir_umask = umask (0);
125 if (0 < same_permissions_option)
126 current_umask = 0;
127 else
128 {
129 umask (newdir_umask); /* restore the kernel umask */
130 current_umask = newdir_umask;
131 }
132 }
133
134 /* If restoring permissions, restore the mode for FILE_NAME from
135 information given in *STAT_INFO (where *CUR_INFO gives
136 the current status if CUR_INFO is nonzero); otherwise invert the
137 INVERT_PERMISSIONS bits from the file's current permissions.
138 PERMSTATUS specifies the status of the file's permissions.
139 TYPEFLAG specifies the type of the file. */
140 static void
141 set_mode (char const *file_name,
142 struct stat const *stat_info,
143 struct stat const *cur_info,
144 mode_t invert_permissions, enum permstatus permstatus,
145 char typeflag)
146 {
147 mode_t mode;
148 bool failed;
149
150 if (0 < same_permissions_option
151 && permstatus != INTERDIR_PERMSTATUS)
152 {
153 mode = stat_info->st_mode;
154
155 /* If we created the file and it has a mode that we set already
156 with O_CREAT, then its mode is often set correctly already.
157 But if we are changing ownership, the mode's group and and
158 other permission bits were omitted originally, so it's less
159 likely that the mode is OK now. Also, on many hosts, some
160 directories inherit the setgid bits from their parents, so we
161 we must set directories' modes explicitly. */
162 if ((permstatus == ARCHIVED_PERMSTATUS
163 && ! (mode & ~ (0 < same_owner_option ? S_IRWXU : MODE_RWX)))
164 && typeflag != DIRTYPE
165 && typeflag != GNUTYPE_DUMPDIR)
166 return;
167 }
168 else if (! invert_permissions)
169 return;
170 else
171 {
172 /* We must inspect a directory's current permissions, since the
173 directory may have inherited its setgid bit from its parent.
174
175 INVERT_PERMISSIONS happens to be nonzero only for directories
176 that we created, so there's no point optimizing this code for
177 other cases. */
178 struct stat st;
179 if (! cur_info)
180 {
181 if (stat (file_name, &st) != 0)
182 {
183 stat_error (file_name);
184 return;
185 }
186 cur_info = &st;
187 }
188 mode = cur_info->st_mode ^ invert_permissions;
189 }
190
191 failed = chmod (file_name, mode) != 0;
192 if (failed && errno == EPERM)
193 {
194 /* On Solaris, chmod may fail if we don't have PRIV_ALL. */
195 if (priv_set_restore_linkdir () == 0)
196 {
197 failed = chmod (file_name, mode) != 0;
198 priv_set_remove_linkdir ();
199 }
200 }
201 if (failed)
202 chmod_error_details (file_name, mode);
203 }
204
205 /* Check time after successfully setting FILE_NAME's time stamp to T. */
206 static void
207 check_time (char const *file_name, struct timespec t)
208 {
209 if (t.tv_sec <= 0)
210 WARNOPT (WARN_TIMESTAMP,
211 (0, 0, _("%s: implausibly old time stamp %s"),
212 file_name, tartime (t, true)));
213 else if (timespec_cmp (volume_start_time, t) < 0)
214 {
215 struct timespec now;
216 gettime (&now);
217 if (timespec_cmp (now, t) < 0)
218 {
219 char buf[TIMESPEC_STRSIZE_BOUND];
220 struct timespec diff;
221 diff.tv_sec = t.tv_sec - now.tv_sec;
222 diff.tv_nsec = t.tv_nsec - now.tv_nsec;
223 if (diff.tv_nsec < 0)
224 {
225 diff.tv_nsec += BILLION;
226 diff.tv_sec--;
227 }
228 WARNOPT (WARN_TIMESTAMP,
229 (0, 0, _("%s: time stamp %s is %s s in the future"),
230 file_name, tartime (t, true), code_timespec (diff, buf)));
231 }
232 }
233 }
234
235 /* Restore stat attributes (owner, group, mode and times) for
236 FILE_NAME, using information given in *ST.
237 If CUR_INFO is nonzero, *CUR_INFO is the
238 file's current status.
239 If not restoring permissions, invert the
240 INVERT_PERMISSIONS bits from the file's current permissions.
241 PERMSTATUS specifies the status of the file's permissions.
242 TYPEFLAG specifies the type of the file. */
243
244 /* FIXME: About proper restoration of symbolic link attributes, we still do
245 not have it right. Pretesters' reports tell us we need further study and
246 probably more configuration. For now, just use lchown if it exists, and
247 punt for the rest. Sigh! */
248
249 static void
250 set_stat (char const *file_name,
251 struct tar_stat_info const *st,
252 struct stat const *cur_info,
253 mode_t invert_permissions, enum permstatus permstatus,
254 char typeflag)
255 {
256 if (typeflag != SYMTYPE)
257 {
258 /* We do the utime before the chmod because some versions of utime are
259 broken and trash the modes of the file. */
260
261 if (! touch_option && permstatus != INTERDIR_PERMSTATUS)
262 {
263 /* We set the accessed time to `now', which is really the time we
264 started extracting files, unless incremental_option is used, in
265 which case .st_atime is used. */
266
267 /* FIXME: incremental_option should set ctime too, but how? */
268
269 struct timespec ts[2];
270 if (incremental_option)
271 ts[0] = st->atime;
272 else
273 ts[0] = start_time;
274 ts[1] = st->mtime;
275
276 if (utimens (file_name, ts) != 0)
277 utime_error (file_name);
278 else
279 {
280 check_time (file_name, ts[0]);
281 check_time (file_name, ts[1]);
282 }
283 }
284
285 /* Some systems allow non-root users to give files away. Once this
286 done, it is not possible anymore to change file permissions.
287 However, setting file permissions now would be incorrect, since
288 they would apply to the wrong user, and there would be a race
289 condition. So, don't use systems that allow non-root users to
290 give files away. */
291 }
292
293 if (0 < same_owner_option && permstatus != INTERDIR_PERMSTATUS)
294 {
295 /* When lchown exists, it should be used to change the attributes of
296 the symbolic link itself. In this case, a mere chown would change
297 the attributes of the file the symbolic link is pointing to, and
298 should be avoided. */
299 int chown_result = 1;
300
301 if (typeflag == SYMTYPE)
302 {
303 #if HAVE_LCHOWN
304 chown_result = lchown (file_name, st->stat.st_uid, st->stat.st_gid);
305 #endif
306 }
307 else
308 {
309 chown_result = chown (file_name, st->stat.st_uid, st->stat.st_gid);
310 }
311
312 if (chown_result == 0)
313 {
314 /* Changing the owner can flip st_mode bits in some cases, so
315 ignore cur_info if it might be obsolete now. */
316 if (cur_info
317 && cur_info->st_mode & S_IXUGO
318 && cur_info->st_mode & (S_ISUID | S_ISGID))
319 cur_info = NULL;
320 }
321 else if (chown_result < 0)
322 chown_error_details (file_name,
323 st->stat.st_uid, st->stat.st_gid);
324 }
325
326 if (typeflag != SYMTYPE)
327 set_mode (file_name, &st->stat, cur_info,
328 invert_permissions, permstatus, typeflag);
329 }
330
331 /* Remember to restore stat attributes (owner, group, mode and times)
332 for the directory FILE_NAME, using information given in *ST,
333 once we stop extracting files into that directory.
334 If not restoring permissions, remember to invert the
335 INVERT_PERMISSIONS bits from the file's current permissions.
336 PERMSTATUS specifies the status of the file's permissions.
337
338 NOTICE: this works only if the archive has usual member order, i.e.
339 directory, then the files in that directory. Incremental archive have
340 somewhat reversed order: first go subdirectories, then all other
341 members. To help cope with this case the variable
342 delay_directory_restore_option is set by prepare_to_extract.
343
344 If an archive was explicitely created so that its member order is
345 reversed, some directory timestamps can be restored incorrectly,
346 e.g.:
347 tar --no-recursion -cf archive dir dir/file1 foo dir/file2
348 */
349 static void
350 delay_set_stat (char const *file_name, struct tar_stat_info const *st,
351 mode_t invert_permissions, enum permstatus permstatus)
352 {
353 size_t file_name_len = strlen (file_name);
354 struct delayed_set_stat *data =
355 xmalloc (offsetof (struct delayed_set_stat, file_name)
356 + file_name_len + 1);
357 data->next = delayed_set_stat_head;
358 data->dev = st->stat.st_dev;
359 data->ino = st->stat.st_ino;
360 data->mode = st->stat.st_mode;
361 data->uid = st->stat.st_uid;
362 data->gid = st->stat.st_gid;
363 data->atime = st->atime;
364 data->mtime = st->mtime;
365 data->file_name_len = file_name_len;
366 data->invert_permissions = invert_permissions;
367 data->permstatus = permstatus;
368 data->after_links = 0;
369 strcpy (data->file_name, file_name);
370 delayed_set_stat_head = data;
371 }
372
373 /* Update the delayed_set_stat info for an intermediate directory
374 created within the file name of DIR. The intermediate directory turned
375 out to be the same as this directory, e.g. due to ".." or symbolic
376 links. *DIR_STAT_INFO is the status of the directory. */
377 static void
378 repair_delayed_set_stat (char const *dir,
379 struct stat const *dir_stat_info)
380 {
381 struct delayed_set_stat *data;
382 for (data = delayed_set_stat_head; data; data = data->next)
383 {
384 struct stat st;
385 if (stat (data->file_name, &st) != 0)
386 {
387 stat_error (data->file_name);
388 return;
389 }
390
391 if (st.st_dev == dir_stat_info->st_dev
392 && st.st_ino == dir_stat_info->st_ino)
393 {
394 data->dev = current_stat_info.stat.st_dev;
395 data->ino = current_stat_info.stat.st_ino;
396 data->mode = current_stat_info.stat.st_mode;
397 data->uid = current_stat_info.stat.st_uid;
398 data->gid = current_stat_info.stat.st_gid;
399 data->atime = current_stat_info.atime;
400 data->mtime = current_stat_info.mtime;
401 data->invert_permissions =
402 ((current_stat_info.stat.st_mode ^ st.st_mode)
403 & MODE_RWX & ~ current_umask);
404 data->permstatus = ARCHIVED_PERMSTATUS;
405 return;
406 }
407 }
408
409 ERROR ((0, 0, _("%s: Unexpected inconsistency when making directory"),
410 quotearg_colon (dir)));
411 }
412
413 /* After a file/link/directory creation has failed, see if
414 it's because some required directory was not present, and if so,
415 create all required directories. Return non-zero if a directory
416 was created. */
417 static int
418 make_directories (char *file_name)
419 {
420 char *cursor0 = file_name + FILE_SYSTEM_PREFIX_LEN (file_name);
421 char *cursor; /* points into the file name */
422 int did_something = 0; /* did we do anything yet? */
423 int mode;
424 int invert_permissions;
425 int status;
426
427 for (cursor = cursor0; *cursor; cursor++)
428 {
429 if (! ISSLASH (*cursor))
430 continue;
431
432 /* Avoid mkdir of empty string, if leading or double '/'. */
433
434 if (cursor == cursor0 || ISSLASH (cursor[-1]))
435 continue;
436
437 /* Avoid mkdir where last part of file name is "." or "..". */
438
439 if (cursor[-1] == '.'
440 && (cursor == cursor0 + 1 || ISSLASH (cursor[-2])
441 || (cursor[-2] == '.'
442 && (cursor == cursor0 + 2 || ISSLASH (cursor[-3])))))
443 continue;
444
445 *cursor = '\0'; /* truncate the name there */
446 mode = MODE_RWX & ~ newdir_umask;
447 invert_permissions = we_are_root ? 0 : MODE_WXUSR & ~ mode;
448 status = mkdir (file_name, mode ^ invert_permissions);
449
450 if (status == 0)
451 {
452 /* Create a struct delayed_set_stat even if
453 invert_permissions is zero, because
454 repair_delayed_set_stat may need to update the struct. */
455 delay_set_stat (file_name,
456 &current_stat_info,
457 invert_permissions, INTERDIR_PERMSTATUS);
458
459 print_for_mkdir (file_name, cursor - file_name, mode);
460 did_something = 1;
461
462 *cursor = '/';
463 continue;
464 }
465
466 *cursor = '/';
467
468 if (errno == EEXIST)
469 continue; /* Directory already exists. */
470 else if ((errno == ENOSYS /* Automounted dirs on Solaris return
471 this. Reported by Warren Hyde
472 <Warren.Hyde@motorola.com> */
473 || ERRNO_IS_EACCES) /* Turbo C mkdir gives a funny errno. */
474 && access (file_name, W_OK) == 0)
475 continue;
476
477 /* Some other error in the mkdir. We return to the caller. */
478 break;
479 }
480
481 return did_something; /* tell them to retry if we made one */
482 }
483
484 static bool
485 file_newer_p (const char *file_name, struct tar_stat_info *tar_stat)
486 {
487 struct stat st;
488
489 if (stat (file_name, &st))
490 {
491 if (errno != ENOENT)
492 {
493 stat_warn (file_name);
494 /* Be on the safe side: if the file does exist assume it is newer */
495 return true;
496 }
497 return false;
498 }
499 if (!S_ISDIR (st.st_mode)
500 && tar_timespec_cmp (tar_stat->mtime, get_stat_mtime (&st)) <= 0)
501 {
502 return true;
503 }
504 return false;
505 }
506
507 #define RECOVER_NO 0
508 #define RECOVER_OK 1
509 #define RECOVER_SKIP 2
510
511 /* Attempt repairing what went wrong with the extraction. Delete an
512 already existing file or create missing intermediate directories.
513 Return RECOVER_OK if we somewhat increased our chances at a successful
514 extraction, RECOVER_NO if there are no chances, and RECOVER_SKIP if the
515 caller should skip extraction of that member. The value of errno is
516 properly restored on returning RECOVER_NO. */
517
518 static int
519 maybe_recoverable (char *file_name, int *interdir_made)
520 {
521 int e = errno;
522
523 if (*interdir_made)
524 return RECOVER_NO;
525
526 switch (errno)
527 {
528 case EEXIST:
529 /* Remove an old file, if the options allow this. */
530
531 switch (old_files_option)
532 {
533 case KEEP_OLD_FILES:
534 return RECOVER_SKIP;
535
536 case KEEP_NEWER_FILES:
537 if (file_newer_p (file_name, &current_stat_info))
538 {
539 errno = e;
540 return RECOVER_NO;
541 }
542 /* FALL THROUGH */
543
544 case DEFAULT_OLD_FILES:
545 case NO_OVERWRITE_DIR_OLD_FILES:
546 case OVERWRITE_OLD_FILES:
547 {
548 int r = remove_any_file (file_name, ORDINARY_REMOVE_OPTION);
549 errno = EEXIST;
550 return r > 0 ? RECOVER_OK : RECOVER_NO;
551 }
552
553 case UNLINK_FIRST_OLD_FILES:
554 break;
555 }
556
557 case ENOENT:
558 /* Attempt creating missing intermediate directories. */
559 if (! make_directories (file_name))
560 {
561 errno = ENOENT;
562 return RECOVER_NO;
563 }
564 *interdir_made = 1;
565 return RECOVER_OK;
566
567 default:
568 /* Just say we can't do anything about it... */
569
570 return RECOVER_NO;
571 }
572 }
573
574 /* Fix the statuses of all directories whose statuses need fixing, and
575 which are not ancestors of FILE_NAME. If AFTER_LINKS is
576 nonzero, do this for all such directories; otherwise, stop at the
577 first directory that is marked to be fixed up only after delayed
578 links are applied. */
579 static void
580 apply_nonancestor_delayed_set_stat (char const *file_name, bool after_links)
581 {
582 size_t file_name_len = strlen (file_name);
583 bool check_for_renamed_directories = 0;
584
585 while (delayed_set_stat_head)
586 {
587 struct delayed_set_stat *data = delayed_set_stat_head;
588 bool skip_this_one = 0;
589 struct stat st;
590 struct stat const *cur_info = 0;
591
592 check_for_renamed_directories |= data->after_links;
593
594 if (after_links < data->after_links
595 || (data->file_name_len < file_name_len
596 && file_name[data->file_name_len]
597 && (ISSLASH (file_name[data->file_name_len])
598 || ISSLASH (file_name[data->file_name_len - 1]))
599 && memcmp (file_name, data->file_name, data->file_name_len) == 0))
600 break;
601
602 if (check_for_renamed_directories)
603 {
604 cur_info = &st;
605 if (stat (data->file_name, &st) != 0)
606 {
607 stat_error (data->file_name);
608 skip_this_one = 1;
609 }
610 else if (! (st.st_dev == data->dev && st.st_ino == data->ino))
611 {
612 ERROR ((0, 0,
613 _("%s: Directory renamed before its status could be extracted"),
614 quotearg_colon (data->file_name)));
615 skip_this_one = 1;
616 }
617 }
618
619 if (! skip_this_one)
620 {
621 struct tar_stat_info sb;
622 sb.stat.st_mode = data->mode;
623 sb.stat.st_uid = data->uid;
624 sb.stat.st_gid = data->gid;
625 sb.atime = data->atime;
626 sb.mtime = data->mtime;
627 set_stat (data->file_name, &sb, cur_info,
628 data->invert_permissions, data->permstatus, DIRTYPE);
629 }
630
631 delayed_set_stat_head = data->next;
632 free (data);
633 }
634 }
635
636 \f
637
638 /* Extractor functions for various member types */
639
640 static int
641 extract_dir (char *file_name, int typeflag)
642 {
643 int status;
644 mode_t mode;
645 int interdir_made = 0;
646
647 /* Save 'root device' to avoid purging mount points. */
648 if (one_file_system_option && root_device == 0)
649 {
650 struct stat st;
651 char *dir = xgetcwd ();
652
653 if (deref_stat (true, dir, &st))
654 stat_diag (dir);
655 else
656 root_device = st.st_dev;
657 free (dir);
658 }
659
660 if (incremental_option)
661 /* Read the entry and delete files that aren't listed in the archive. */
662 purge_directory (file_name);
663 else if (typeflag == GNUTYPE_DUMPDIR)
664 skip_member ();
665
666 mode = current_stat_info.stat.st_mode | (we_are_root ? 0 : MODE_WXUSR);
667 if (0 < same_owner_option || current_stat_info.stat.st_mode & ~ MODE_RWX)
668 mode &= S_IRWXU;
669
670 while ((status = mkdir (file_name, mode)))
671 {
672 if (errno == EEXIST
673 && (interdir_made
674 || old_files_option == DEFAULT_OLD_FILES
675 || old_files_option == OVERWRITE_OLD_FILES))
676 {
677 struct stat st;
678 if (stat (file_name, &st) == 0)
679 {
680 if (interdir_made)
681 {
682 repair_delayed_set_stat (file_name, &st);
683 return 0;
684 }
685 if (S_ISDIR (st.st_mode))
686 {
687 status = 0;
688 mode = st.st_mode;
689 break;
690 }
691 }
692 errno = EEXIST;
693 }
694
695 switch (maybe_recoverable (file_name, &interdir_made))
696 {
697 case RECOVER_OK:
698 continue;
699
700 case RECOVER_SKIP:
701 break;
702
703 case RECOVER_NO:
704 if (errno != EEXIST)
705 {
706 mkdir_error (file_name);
707 return 1;
708 }
709 break;
710 }
711 break;
712 }
713
714 if (status == 0
715 || old_files_option == DEFAULT_OLD_FILES
716 || old_files_option == OVERWRITE_OLD_FILES)
717 {
718 if (status == 0)
719 delay_set_stat (file_name, &current_stat_info,
720 ((mode ^ current_stat_info.stat.st_mode)
721 & MODE_RWX & ~ current_umask),
722 ARCHIVED_PERMSTATUS);
723 else /* For an already existing directory, invert_perms must be 0 */
724 delay_set_stat (file_name, &current_stat_info,
725 0,
726 UNKNOWN_PERMSTATUS);
727 }
728 return status;
729 }
730
731
732 static int
733 open_output_file (char *file_name, int typeflag, mode_t mode)
734 {
735 int fd;
736 int openflag = (O_WRONLY | O_BINARY | O_CREAT
737 | (old_files_option == OVERWRITE_OLD_FILES
738 ? O_TRUNC
739 : O_EXCL));
740
741 #if O_CTG
742 /* Contiguous files (on the Masscomp) have to specify the size in
743 the open call that creates them. */
744
745 if (typeflag == CONTTYPE)
746 fd = open (file_name, openflag | O_CTG, mode, current_stat_info.stat.st_size);
747 else
748 fd = open (file_name, openflag, mode);
749
750 #else /* not O_CTG */
751 if (typeflag == CONTTYPE)
752 {
753 static int conttype_diagnosed;
754
755 if (!conttype_diagnosed)
756 {
757 conttype_diagnosed = 1;
758 WARNOPT (WARN_CONTIGUOUS_CAST,
759 (0, 0, _("Extracting contiguous files as regular files")));
760 }
761 }
762 fd = open (file_name, openflag, mode);
763
764 #endif /* not O_CTG */
765
766 return fd;
767 }
768
769 static int
770 extract_file (char *file_name, int typeflag)
771 {
772 int fd;
773 off_t size;
774 union block *data_block;
775 int status;
776 size_t count;
777 size_t written;
778 int interdir_made = 0;
779 mode_t mode = current_stat_info.stat.st_mode & MODE_RWX & ~ current_umask;
780 mode_t invert_permissions =
781 0 < same_owner_option ? mode & (S_IRWXG | S_IRWXO) : 0;
782
783 /* FIXME: deal with protection issues. */
784
785 if (to_stdout_option)
786 fd = STDOUT_FILENO;
787 else if (to_command_option)
788 {
789 fd = sys_exec_command (file_name, 'f', &current_stat_info);
790 if (fd < 0)
791 {
792 skip_member ();
793 return 0;
794 }
795 }
796 else
797 {
798 int recover = RECOVER_NO;
799 do
800 fd = open_output_file (file_name, typeflag, mode ^ invert_permissions);
801 while (fd < 0
802 && (recover = maybe_recoverable (file_name, &interdir_made))
803 == RECOVER_OK);
804
805 if (fd < 0)
806 {
807 skip_member ();
808 if (recover == RECOVER_SKIP)
809 return 0;
810 open_error (file_name);
811 return 1;
812 }
813 }
814
815 mv_begin (&current_stat_info);
816 if (current_stat_info.is_sparse)
817 sparse_extract_file (fd, &current_stat_info, &size);
818 else
819 for (size = current_stat_info.stat.st_size; size > 0; )
820 {
821 mv_size_left (size);
822
823 /* Locate data, determine max length writeable, write it,
824 block that we have used the data, then check if the write
825 worked. */
826
827 data_block = find_next_block ();
828 if (! data_block)
829 {
830 ERROR ((0, 0, _("Unexpected EOF in archive")));
831 break; /* FIXME: What happens, then? */
832 }
833
834 written = available_space_after (data_block);
835
836 if (written > size)
837 written = size;
838 errno = 0;
839 count = full_write (fd, data_block->buffer, written);
840 size -= written;
841
842 set_next_block_after ((union block *)
843 (data_block->buffer + written - 1));
844 if (count != written)
845 {
846 if (!to_command_option)
847 write_error_details (file_name, count, written);
848 /* FIXME: shouldn't we restore from backup? */
849 break;
850 }
851 }
852
853 skip_file (size);
854
855 mv_end ();
856
857 /* If writing to stdout, don't try to do anything to the filename;
858 it doesn't exist, or we don't want to touch it anyway. */
859
860 if (to_stdout_option)
861 return 0;
862
863 status = close (fd);
864 if (status < 0)
865 close_error (file_name);
866
867 if (to_command_option)
868 sys_wait_command ();
869 else
870 set_stat (file_name, &current_stat_info, NULL, invert_permissions,
871 (old_files_option == OVERWRITE_OLD_FILES ?
872 UNKNOWN_PERMSTATUS : ARCHIVED_PERMSTATUS),
873 typeflag);
874
875 return status;
876 }
877
878 /* Create a placeholder file with name FILE_NAME, which will be
879 replaced after other extraction is done by a symbolic link if
880 IS_SYMLINK is true, and by a hard link otherwise. Set
881 *INTERDIR_MADE if an intermediate directory is made in the
882 process. */
883
884 static int
885 create_placeholder_file (char *file_name, bool is_symlink, int *interdir_made)
886 {
887 int fd;
888 struct stat st;
889
890 while ((fd = open (file_name, O_WRONLY | O_CREAT | O_EXCL, 0)) < 0)
891 {
892 switch (maybe_recoverable (file_name, interdir_made))
893 {
894 case RECOVER_OK:
895 continue;
896
897 case RECOVER_SKIP:
898 return 0;
899
900 case RECOVER_NO:
901 open_error (file_name);
902 return -1;
903 }
904 }
905
906 if (fstat (fd, &st) != 0)
907 {
908 stat_error (file_name);
909 close (fd);
910 }
911 else if (close (fd) != 0)
912 close_error (file_name);
913 else
914 {
915 struct delayed_set_stat *h;
916 struct delayed_link *p =
917 xmalloc (offsetof (struct delayed_link, target)
918 + strlen (current_stat_info.link_name)
919 + 1);
920 p->next = delayed_link_head;
921 delayed_link_head = p;
922 p->dev = st.st_dev;
923 p->ino = st.st_ino;
924 p->mtime = get_stat_mtime (&st);
925 p->is_symlink = is_symlink;
926 if (is_symlink)
927 {
928 p->uid = current_stat_info.stat.st_uid;
929 p->gid = current_stat_info.stat.st_gid;
930 }
931 p->sources = xmalloc (offsetof (struct string_list, string)
932 + strlen (file_name) + 1);
933 p->sources->next = 0;
934 strcpy (p->sources->string, file_name);
935 strcpy (p->target, current_stat_info.link_name);
936
937 h = delayed_set_stat_head;
938 if (h && ! h->after_links
939 && strncmp (file_name, h->file_name, h->file_name_len) == 0
940 && ISSLASH (file_name[h->file_name_len])
941 && (last_component (file_name) == file_name + h->file_name_len + 1))
942 {
943 do
944 {
945 h->after_links = 1;
946
947 if (stat (h->file_name, &st) != 0)
948 stat_error (h->file_name);
949 else
950 {
951 h->dev = st.st_dev;
952 h->ino = st.st_ino;
953 }
954 }
955 while ((h = h->next) && ! h->after_links);
956 }
957
958 return 0;
959 }
960
961 return -1;
962 }
963
964 static int
965 extract_link (char *file_name, int typeflag)
966 {
967 int interdir_made = 0;
968 char const *link_name;
969 int rc;
970
971 link_name = current_stat_info.link_name;
972
973 if (! absolute_names_option && contains_dot_dot (link_name))
974 return create_placeholder_file (file_name, false, &interdir_made);
975
976 do
977 {
978 struct stat st1, st2;
979 int e;
980 int status = link (link_name, file_name);
981 e = errno;
982
983 if (status == 0)
984 {
985 struct delayed_link *ds = delayed_link_head;
986 if (ds && lstat (link_name, &st1) == 0)
987 for (; ds; ds = ds->next)
988 if (ds->dev == st1.st_dev
989 && ds->ino == st1.st_ino
990 && timespec_cmp (ds->mtime, get_stat_mtime (&st1)) == 0)
991 {
992 struct string_list *p = xmalloc (offsetof (struct string_list, string)
993 + strlen (file_name) + 1);
994 strcpy (p->string, file_name);
995 p->next = ds->sources;
996 ds->sources = p;
997 break;
998 }
999 return 0;
1000 }
1001 else if ((e == EEXIST && strcmp (link_name, file_name) == 0)
1002 || (lstat (link_name, &st1) == 0
1003 && lstat (file_name, &st2) == 0
1004 && st1.st_dev == st2.st_dev
1005 && st1.st_ino == st2.st_ino))
1006 return 0;
1007
1008 errno = e;
1009 }
1010 while ((rc = maybe_recoverable (file_name, &interdir_made)) == RECOVER_OK);
1011
1012 if (rc == RECOVER_SKIP)
1013 return 0;
1014 if (!(incremental_option && errno == EEXIST))
1015 {
1016 link_error (link_name, file_name);
1017 return 1;
1018 }
1019 return 0;
1020 }
1021
1022 static int
1023 extract_symlink (char *file_name, int typeflag)
1024 {
1025 #ifdef HAVE_SYMLINK
1026 int interdir_made = 0;
1027
1028 if (! absolute_names_option
1029 && (IS_ABSOLUTE_FILE_NAME (current_stat_info.link_name)
1030 || contains_dot_dot (current_stat_info.link_name)))
1031 return create_placeholder_file (file_name, true, &interdir_made);
1032
1033 while (symlink (current_stat_info.link_name, file_name))
1034 switch (maybe_recoverable (file_name, &interdir_made))
1035 {
1036 case RECOVER_OK:
1037 continue;
1038
1039 case RECOVER_SKIP:
1040 return 0;
1041
1042 case RECOVER_NO:
1043 symlink_error (current_stat_info.link_name, file_name);
1044 return -1;
1045 }
1046
1047 set_stat (file_name, &current_stat_info, NULL, 0, 0, SYMTYPE);
1048 return 0;
1049
1050 #else
1051 static int warned_once;
1052
1053 if (!warned_once)
1054 {
1055 warned_once = 1;
1056 WARNOPT (WARN_SYMBOLIC_CAST,
1057 (0, 0,
1058 _("Attempting extraction of symbolic links as hard links")));
1059 }
1060 return extract_link (file_name, typeflag);
1061 #endif
1062 }
1063
1064 #if S_IFCHR || S_IFBLK
1065 static int
1066 extract_node (char *file_name, int typeflag)
1067 {
1068 int status;
1069 int interdir_made = 0;
1070 mode_t mode = current_stat_info.stat.st_mode & ~ current_umask;
1071 mode_t invert_permissions =
1072 0 < same_owner_option ? mode & (S_IRWXG | S_IRWXO) : 0;
1073
1074 while (mknod (file_name, mode ^ invert_permissions,
1075 current_stat_info.stat.st_rdev))
1076 switch (maybe_recoverable (file_name, &interdir_made))
1077 {
1078 case RECOVER_OK:
1079 continue;
1080
1081 case RECOVER_SKIP:
1082 return 0;
1083
1084 case RECOVER_NO:
1085 mknod_error (file_name);
1086 return -1;
1087 }
1088
1089 set_stat (file_name, &current_stat_info, NULL, invert_permissions,
1090 ARCHIVED_PERMSTATUS, typeflag);
1091 return status;
1092 }
1093 #endif
1094
1095 #if HAVE_MKFIFO || defined mkfifo
1096 static int
1097 extract_fifo (char *file_name, int typeflag)
1098 {
1099 int status;
1100 int interdir_made = 0;
1101 mode_t mode = current_stat_info.stat.st_mode & ~ current_umask;
1102 mode_t invert_permissions =
1103 0 < same_owner_option ? mode & (S_IRWXG | S_IRWXO) : 0;
1104
1105 while ((status = mkfifo (file_name, mode)) != 0)
1106 switch (maybe_recoverable (file_name, &interdir_made))
1107 {
1108 case RECOVER_OK:
1109 continue;
1110
1111 case RECOVER_SKIP:
1112 return 0;
1113
1114 case RECOVER_NO:
1115 mkfifo_error (file_name);
1116 return -1;
1117 }
1118
1119 set_stat (file_name, &current_stat_info, NULL, invert_permissions,
1120 ARCHIVED_PERMSTATUS, typeflag);
1121 return 0;
1122 }
1123 #endif
1124
1125 static int
1126 extract_volhdr (char *file_name, int typeflag)
1127 {
1128 skip_member ();
1129 return 0;
1130 }
1131
1132 static int
1133 extract_failure (char *file_name, int typeflag)
1134 {
1135 return 1;
1136 }
1137
1138 typedef int (*tar_extractor_t) (char *file_name, int typeflag);
1139
1140 \f
1141
1142 /* Prepare to extract a file. Find extractor function.
1143 Return zero if extraction should not proceed. */
1144
1145 static int
1146 prepare_to_extract (char const *file_name, int typeflag, tar_extractor_t *fun)
1147 {
1148 int rc = 1;
1149
1150 if (EXTRACT_OVER_PIPE)
1151 rc = 0;
1152
1153 /* Select the extractor */
1154 switch (typeflag)
1155 {
1156 case GNUTYPE_SPARSE:
1157 *fun = extract_file;
1158 rc = 1;
1159 break;
1160
1161 case AREGTYPE:
1162 case REGTYPE:
1163 case CONTTYPE:
1164 /* Appears to be a file. But BSD tar uses the convention that a slash
1165 suffix means a directory. */
1166 if (current_stat_info.had_trailing_slash)
1167 *fun = extract_dir;
1168 else
1169 {
1170 *fun = extract_file;
1171 rc = 1;
1172 }
1173 break;
1174
1175 case SYMTYPE:
1176 *fun = extract_symlink;
1177 break;
1178
1179 case LNKTYPE:
1180 *fun = extract_link;
1181 break;
1182
1183 #if S_IFCHR
1184 case CHRTYPE:
1185 current_stat_info.stat.st_mode |= S_IFCHR;
1186 *fun = extract_node;
1187 break;
1188 #endif
1189
1190 #if S_IFBLK
1191 case BLKTYPE:
1192 current_stat_info.stat.st_mode |= S_IFBLK;
1193 *fun = extract_node;
1194 break;
1195 #endif
1196
1197 #if HAVE_MKFIFO || defined mkfifo
1198 case FIFOTYPE:
1199 *fun = extract_fifo;
1200 break;
1201 #endif
1202
1203 case DIRTYPE:
1204 case GNUTYPE_DUMPDIR:
1205 *fun = extract_dir;
1206 if (current_stat_info.is_dumpdir)
1207 delay_directory_restore_option = true;
1208 break;
1209
1210 case GNUTYPE_VOLHDR:
1211 *fun = extract_volhdr;
1212 break;
1213
1214 case GNUTYPE_MULTIVOL:
1215 ERROR ((0, 0,
1216 _("%s: Cannot extract -- file is continued from another volume"),
1217 quotearg_colon (current_stat_info.file_name)));
1218 *fun = extract_failure;
1219 break;
1220
1221 case GNUTYPE_LONGNAME:
1222 case GNUTYPE_LONGLINK:
1223 ERROR ((0, 0, _("Unexpected long name header")));
1224 *fun = extract_failure;
1225 break;
1226
1227 default:
1228 WARNOPT (WARN_UNKNOWN_CAST,
1229 (0, 0,
1230 _("%s: Unknown file type `%c', extracted as normal file"),
1231 quotearg_colon (file_name), typeflag));
1232 *fun = extract_file;
1233 }
1234
1235 /* Determine whether the extraction should proceed */
1236 if (rc == 0)
1237 return 0;
1238
1239 switch (old_files_option)
1240 {
1241 case UNLINK_FIRST_OLD_FILES:
1242 if (!remove_any_file (file_name,
1243 recursive_unlink_option ? RECURSIVE_REMOVE_OPTION
1244 : ORDINARY_REMOVE_OPTION)
1245 && errno && errno != ENOENT)
1246 {
1247 unlink_error (file_name);
1248 return 0;
1249 }
1250 break;
1251
1252 case KEEP_NEWER_FILES:
1253 if (file_newer_p (file_name, &current_stat_info))
1254 {
1255 WARNOPT (WARN_IGNORE_NEWER,
1256 (0, 0, _("Current %s is newer or same age"),
1257 quote (file_name)));
1258 return 0;
1259 }
1260 break;
1261
1262 default:
1263 break;
1264 }
1265
1266 return 1;
1267 }
1268
1269 /* Extract a file from the archive. */
1270 void
1271 extract_archive (void)
1272 {
1273 char typeflag;
1274 tar_extractor_t fun;
1275
1276 fatal_exit_hook = extract_finish;
1277
1278 /* Try to disable the ability to unlink a directory. */
1279 priv_set_remove_linkdir ();
1280
1281 set_next_block_after (current_header);
1282 decode_header (current_header, &current_stat_info, &current_format, 1);
1283 if (!current_stat_info.file_name[0]
1284 || (interactive_option
1285 && !confirm ("extract", current_stat_info.file_name)))
1286 {
1287 skip_member ();
1288 return;
1289 }
1290
1291 /* Print the block from current_header and current_stat. */
1292 if (verbose_option)
1293 print_header (&current_stat_info, current_header, -1);
1294
1295 /* Restore stats for all non-ancestor directories, unless
1296 it is an incremental archive.
1297 (see NOTICE in the comment to delay_set_stat above) */
1298 if (!delay_directory_restore_option)
1299 apply_nonancestor_delayed_set_stat (current_stat_info.file_name, 0);
1300
1301 /* Take a safety backup of a previously existing file. */
1302
1303 if (backup_option)
1304 if (!maybe_backup_file (current_stat_info.file_name, 0))
1305 {
1306 int e = errno;
1307 ERROR ((0, e, _("%s: Was unable to backup this file"),
1308 quotearg_colon (current_stat_info.file_name)));
1309 skip_member ();
1310 return;
1311 }
1312
1313 /* Extract the archive entry according to its type. */
1314 /* KLUDGE */
1315 typeflag = sparse_member_p (&current_stat_info) ?
1316 GNUTYPE_SPARSE : current_header->header.typeflag;
1317
1318 if (prepare_to_extract (current_stat_info.file_name, typeflag, &fun))
1319 {
1320 if (fun && (*fun) (current_stat_info.file_name, typeflag)
1321 && backup_option)
1322 undo_last_backup ();
1323 }
1324 else
1325 skip_member ();
1326
1327 }
1328
1329 /* Extract the symbolic links whose final extraction were delayed. */
1330 static void
1331 apply_delayed_links (void)
1332 {
1333 struct delayed_link *ds;
1334
1335 for (ds = delayed_link_head; ds; )
1336 {
1337 struct string_list *sources = ds->sources;
1338 char const *valid_source = 0;
1339
1340 for (sources = ds->sources; sources; sources = sources->next)
1341 {
1342 char const *source = sources->string;
1343 struct stat st;
1344
1345 /* Make sure the placeholder file is still there. If not,
1346 don't create a link, as the placeholder was probably
1347 removed by a later extraction. */
1348 if (lstat (source, &st) == 0
1349 && st.st_dev == ds->dev
1350 && st.st_ino == ds->ino
1351 && timespec_cmp (get_stat_mtime (&st), ds->mtime) == 0)
1352 {
1353 /* Unlink the placeholder, then create a hard link if possible,
1354 a symbolic link otherwise. */
1355 if (unlink (source) != 0)
1356 unlink_error (source);
1357 else if (valid_source && link (valid_source, source) == 0)
1358 ;
1359 else if (!ds->is_symlink)
1360 {
1361 if (link (ds->target, source) != 0)
1362 link_error (ds->target, source);
1363 }
1364 else if (symlink (ds->target, source) != 0)
1365 symlink_error (ds->target, source);
1366 else
1367 {
1368 struct tar_stat_info st1;
1369 st1.stat.st_uid = ds->uid;
1370 st1.stat.st_gid = ds->gid;
1371 set_stat (source, &st1, NULL, 0, 0, SYMTYPE);
1372 valid_source = source;
1373 }
1374 }
1375 }
1376
1377 for (sources = ds->sources; sources; )
1378 {
1379 struct string_list *next = sources->next;
1380 free (sources);
1381 sources = next;
1382 }
1383
1384 {
1385 struct delayed_link *next = ds->next;
1386 free (ds);
1387 ds = next;
1388 }
1389 }
1390
1391 delayed_link_head = 0;
1392 }
1393
1394 /* Finish the extraction of an archive. */
1395 void
1396 extract_finish (void)
1397 {
1398 /* First, fix the status of ordinary directories that need fixing. */
1399 apply_nonancestor_delayed_set_stat ("", 0);
1400
1401 /* Then, apply delayed links, so that they don't affect delayed
1402 directory status-setting for ordinary directories. */
1403 apply_delayed_links ();
1404
1405 /* Finally, fix the status of directories that are ancestors
1406 of delayed links. */
1407 apply_nonancestor_delayed_set_stat ("", 1);
1408 }
1409
1410 bool
1411 rename_directory (char *src, char *dst)
1412 {
1413 if (rename (src, dst))
1414 {
1415 int e = errno;
1416
1417 switch (e)
1418 {
1419 case ENOENT:
1420 if (make_directories (dst))
1421 {
1422 if (rename (src, dst) == 0)
1423 return true;
1424 e = errno;
1425 }
1426 break;
1427
1428 case EXDEV:
1429 /* FIXME: Fall back to recursive copying */
1430
1431 default:
1432 break;
1433 }
1434
1435 ERROR ((0, e, _("Cannot rename %s to %s"),
1436 quote_n (0, src),
1437 quote_n (1, dst)));
1438 return false;
1439 }
1440 return true;
1441 }
This page took 0.107271 seconds and 5 git commands to generate.