Optimize searches for directory structures by keeping a pointer to struct directory...
[tar/ericb.git] / src / extract.c
blob3c92e53d6d1e3f686e939c419e0df03159bb480b
1 /* Extract files from a tar archive.
3 Copyright (C) 1988, 1992, 1993, 1994, 1996, 1997, 1998, 1999, 2000,
4 2001, 2003, 2004, 2005, 2006, 2007 Free Software Foundation, Inc.
6 Written by John Gilmore, on 1985-11-19.
8 This program is free software; you can redistribute it and/or modify it
9 under the terms of the GNU General Public License as published by the
10 Free Software Foundation; either version 3, or (at your option) any later
11 version.
13 This program is distributed in the hope that it will be useful, but
14 WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General
16 Public License for more details.
18 You should have received a copy of the GNU General Public License along
19 with this program; if not, write to the Free Software Foundation, Inc.,
20 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. */
22 #include <system.h>
23 #include <quotearg.h>
24 #include <utimens.h>
25 #include <errno.h>
26 #include <xgetcwd.h>
27 #include <priv-set.h>
29 #include "common.h"
/* True if our effective uid is 0; set by extr_init.  */
static bool we_are_root;

/* The umask used when creating new directories.  */
static mode_t newdir_umask;

/* The current umask (which is set to 0 if -p is given).  */
static mode_t current_umask;
/* What we know about the permissions of a file being extracted.  */
enum permstatus
{
  /* The file may have existed before extraction, so its permissions
     are unknown.  */
  UNKNOWN_PERMSTATUS,

  /* The file was created with the permissions recorded in the archive,
     except that S_IRWXG | S_IRWXO are masked out if
     0 < same_owner_option.  */
  ARCHIVED_PERMSTATUS,

  /* The file is an intermediate directory; the archive did not
     specify its permissions.  */
  INTERDIR_PERMSTATUS
};
50 /* List of directories whose statuses we need to extract after we've
51 finished extracting their subsidiary files. If you consider each
52 contiguous subsequence of elements of the form [D]?[^D]*, where [D]
53 represents an element where AFTER_LINKS is nonzero and [^D]
54 represents an element where AFTER_LINKS is zero, then the head
55 of the subsequence has the longest name, and each non-head element
56 in the prefix is an ancestor (in the directory hierarchy) of the
57 preceding element. */
59 struct delayed_set_stat
61 struct delayed_set_stat *next;
62 dev_t dev;
63 ino_t ino;
64 mode_t mode;
65 uid_t uid;
66 gid_t gid;
67 struct timespec atime;
68 struct timespec mtime;
69 size_t file_name_len;
70 mode_t invert_permissions;
71 enum permstatus permstatus;
72 bool after_links;
73 char file_name[1];
76 static struct delayed_set_stat *delayed_set_stat_head;
/* List of links whose creation we have delayed.  */
struct delayed_link
{
  /* The next delayed link in the list.  */
  struct delayed_link *next;

  /* The device, inode number and last-modified time of the
     placeholder file.  */
  dev_t dev;
  ino_t ino;
  struct timespec mtime;

  /* True if the link is symbolic.  */
  bool is_symlink;

  /* The desired owner and group of the link, if it is a symlink.  */
  uid_t uid;
  gid_t gid;

  /* A list of sources for this link.  The sources are all to be
     hard-linked together.  */
  struct string_list *sources;

  /* The desired target of the desired link; the entry is allocated
     large enough to hold the whole string.  */
  char target[1];
};

static struct delayed_link *delayed_link_head;
/* A singly linked list of strings.  Each node is allocated large
   enough to hold its whole string, including the terminating NUL.  */
struct string_list
{
  struct string_list *next;
  char string[1];
};
112 /* Set up to extract files. */
113 void
114 extr_init (void)
116 we_are_root = geteuid () == 0;
117 same_permissions_option += we_are_root;
118 same_owner_option += we_are_root;
120 /* Option -p clears the kernel umask, so it does not affect proper
121 restoration of file permissions. New intermediate directories will
122 comply with umask at start of program. */
124 newdir_umask = umask (0);
125 if (0 < same_permissions_option)
126 current_umask = 0;
127 else
129 umask (newdir_umask); /* restore the kernel umask */
130 current_umask = newdir_umask;
134 /* If restoring permissions, restore the mode for FILE_NAME from
135 information given in *STAT_INFO (where *CUR_INFO gives
136 the current status if CUR_INFO is nonzero); otherwise invert the
137 INVERT_PERMISSIONS bits from the file's current permissions.
138 PERMSTATUS specifies the status of the file's permissions.
139 TYPEFLAG specifies the type of the file. */
140 static void
141 set_mode (char const *file_name,
142 struct stat const *stat_info,
143 struct stat const *cur_info,
144 mode_t invert_permissions, enum permstatus permstatus,
145 char typeflag)
147 mode_t mode;
148 bool failed;
150 if (0 < same_permissions_option
151 && permstatus != INTERDIR_PERMSTATUS)
153 mode = stat_info->st_mode;
155 /* If we created the file and it has a mode that we set already
156 with O_CREAT, then its mode is often set correctly already.
157 But if we are changing ownership, the mode's group and and
158 other permission bits were omitted originally, so it's less
159 likely that the mode is OK now. Also, on many hosts, some
160 directories inherit the setgid bits from their parents, so we
161 we must set directories' modes explicitly. */
162 if ((permstatus == ARCHIVED_PERMSTATUS
163 && ! (mode & ~ (0 < same_owner_option ? S_IRWXU : MODE_RWX)))
164 && typeflag != DIRTYPE
165 && typeflag != GNUTYPE_DUMPDIR)
166 return;
168 else if (! invert_permissions)
169 return;
170 else
172 /* We must inspect a directory's current permissions, since the
173 directory may have inherited its setgid bit from its parent.
175 INVERT_PERMISSIONS happens to be nonzero only for directories
176 that we created, so there's no point optimizing this code for
177 other cases. */
178 struct stat st;
179 if (! cur_info)
181 if (stat (file_name, &st) != 0)
183 stat_error (file_name);
184 return;
186 cur_info = &st;
188 mode = cur_info->st_mode ^ invert_permissions;
191 failed = chmod (file_name, mode) != 0;
192 if (failed && errno == EPERM)
194 /* On Solaris, chmod may fail if we don't have PRIV_ALL. */
195 if (priv_set_restore_linkdir () == 0)
197 failed = chmod (file_name, mode) != 0;
198 priv_set_remove_linkdir ();
201 if (failed)
202 chmod_error_details (file_name, mode);
205 /* Check time after successfully setting FILE_NAME's time stamp to T. */
206 static void
207 check_time (char const *file_name, struct timespec t)
209 if (t.tv_sec <= 0)
210 WARNOPT (WARN_TIMESTAMP,
211 (0, 0, _("%s: implausibly old time stamp %s"),
212 file_name, tartime (t, true)));
213 else if (timespec_cmp (volume_start_time, t) < 0)
215 struct timespec now;
216 gettime (&now);
217 if (timespec_cmp (now, t) < 0)
219 char buf[TIMESPEC_STRSIZE_BOUND];
220 struct timespec diff;
221 diff.tv_sec = t.tv_sec - now.tv_sec;
222 diff.tv_nsec = t.tv_nsec - now.tv_nsec;
223 if (diff.tv_nsec < 0)
225 diff.tv_nsec += BILLION;
226 diff.tv_sec--;
228 WARNOPT (WARN_TIMESTAMP,
229 (0, 0, _("%s: time stamp %s is %s s in the future"),
230 file_name, tartime (t, true), code_timespec (diff, buf)));
235 /* Restore stat attributes (owner, group, mode and times) for
236 FILE_NAME, using information given in *ST.
237 If CUR_INFO is nonzero, *CUR_INFO is the
238 file's current status.
239 If not restoring permissions, invert the
240 INVERT_PERMISSIONS bits from the file's current permissions.
241 PERMSTATUS specifies the status of the file's permissions.
242 TYPEFLAG specifies the type of the file. */
244 /* FIXME: About proper restoration of symbolic link attributes, we still do
245 not have it right. Pretesters' reports tell us we need further study and
246 probably more configuration. For now, just use lchown if it exists, and
247 punt for the rest. Sigh! */
249 static void
250 set_stat (char const *file_name,
251 struct tar_stat_info const *st,
252 struct stat const *cur_info,
253 mode_t invert_permissions, enum permstatus permstatus,
254 char typeflag)
256 if (typeflag != SYMTYPE)
258 /* We do the utime before the chmod because some versions of utime are
259 broken and trash the modes of the file. */
261 if (! touch_option && permstatus != INTERDIR_PERMSTATUS)
263 /* We set the accessed time to `now', which is really the time we
264 started extracting files, unless incremental_option is used, in
265 which case .st_atime is used. */
267 /* FIXME: incremental_option should set ctime too, but how? */
269 struct timespec ts[2];
270 if (incremental_option)
271 ts[0] = st->atime;
272 else
273 ts[0] = start_time;
274 ts[1] = st->mtime;
276 if (utimens (file_name, ts) != 0)
277 utime_error (file_name);
278 else
280 check_time (file_name, ts[0]);
281 check_time (file_name, ts[1]);
285 /* Some systems allow non-root users to give files away. Once this
286 done, it is not possible anymore to change file permissions.
287 However, setting file permissions now would be incorrect, since
288 they would apply to the wrong user, and there would be a race
289 condition. So, don't use systems that allow non-root users to
290 give files away. */
293 if (0 < same_owner_option && permstatus != INTERDIR_PERMSTATUS)
295 /* When lchown exists, it should be used to change the attributes of
296 the symbolic link itself. In this case, a mere chown would change
297 the attributes of the file the symbolic link is pointing to, and
298 should be avoided. */
299 int chown_result = 1;
301 if (typeflag == SYMTYPE)
303 #if HAVE_LCHOWN
304 chown_result = lchown (file_name, st->stat.st_uid, st->stat.st_gid);
305 #endif
307 else
309 chown_result = chown (file_name, st->stat.st_uid, st->stat.st_gid);
312 if (chown_result == 0)
314 /* Changing the owner can flip st_mode bits in some cases, so
315 ignore cur_info if it might be obsolete now. */
316 if (cur_info
317 && cur_info->st_mode & S_IXUGO
318 && cur_info->st_mode & (S_ISUID | S_ISGID))
319 cur_info = NULL;
321 else if (chown_result < 0)
322 chown_error_details (file_name,
323 st->stat.st_uid, st->stat.st_gid);
326 if (typeflag != SYMTYPE)
327 set_mode (file_name, &st->stat, cur_info,
328 invert_permissions, permstatus, typeflag);
331 /* Remember to restore stat attributes (owner, group, mode and times)
332 for the directory FILE_NAME, using information given in *ST,
333 once we stop extracting files into that directory.
334 If not restoring permissions, remember to invert the
335 INVERT_PERMISSIONS bits from the file's current permissions.
336 PERMSTATUS specifies the status of the file's permissions.
338 NOTICE: this works only if the archive has usual member order, i.e.
339 directory, then the files in that directory. Incremental archive have
340 somewhat reversed order: first go subdirectories, then all other
341 members. To help cope with this case the variable
342 delay_directory_restore_option is set by prepare_to_extract.
344 If an archive was explicitely created so that its member order is
345 reversed, some directory timestamps can be restored incorrectly,
346 e.g.:
347 tar --no-recursion -cf archive dir dir/file1 foo dir/file2
349 static void
350 delay_set_stat (char const *file_name, struct tar_stat_info const *st,
351 mode_t invert_permissions, enum permstatus permstatus)
353 size_t file_name_len = strlen (file_name);
354 struct delayed_set_stat *data =
355 xmalloc (offsetof (struct delayed_set_stat, file_name)
356 + file_name_len + 1);
357 data->next = delayed_set_stat_head;
358 data->dev = st->stat.st_dev;
359 data->ino = st->stat.st_ino;
360 data->mode = st->stat.st_mode;
361 data->uid = st->stat.st_uid;
362 data->gid = st->stat.st_gid;
363 data->atime = st->atime;
364 data->mtime = st->mtime;
365 data->file_name_len = file_name_len;
366 data->invert_permissions = invert_permissions;
367 data->permstatus = permstatus;
368 data->after_links = 0;
369 strcpy (data->file_name, file_name);
370 delayed_set_stat_head = data;
373 /* Update the delayed_set_stat info for an intermediate directory
374 created within the file name of DIR. The intermediate directory turned
375 out to be the same as this directory, e.g. due to ".." or symbolic
376 links. *DIR_STAT_INFO is the status of the directory. */
377 static void
378 repair_delayed_set_stat (char const *dir,
379 struct stat const *dir_stat_info)
381 struct delayed_set_stat *data;
382 for (data = delayed_set_stat_head; data; data = data->next)
384 struct stat st;
385 if (stat (data->file_name, &st) != 0)
387 stat_error (data->file_name);
388 return;
391 if (st.st_dev == dir_stat_info->st_dev
392 && st.st_ino == dir_stat_info->st_ino)
394 data->dev = current_stat_info.stat.st_dev;
395 data->ino = current_stat_info.stat.st_ino;
396 data->mode = current_stat_info.stat.st_mode;
397 data->uid = current_stat_info.stat.st_uid;
398 data->gid = current_stat_info.stat.st_gid;
399 data->atime = current_stat_info.atime;
400 data->mtime = current_stat_info.mtime;
401 data->invert_permissions =
402 ((current_stat_info.stat.st_mode ^ st.st_mode)
403 & MODE_RWX & ~ current_umask);
404 data->permstatus = ARCHIVED_PERMSTATUS;
405 return;
409 ERROR ((0, 0, _("%s: Unexpected inconsistency when making directory"),
410 quotearg_colon (dir)));
413 /* After a file/link/directory creation has failed, see if
414 it's because some required directory was not present, and if so,
415 create all required directories. Return non-zero if a directory
416 was created. */
417 static int
418 make_directories (char *file_name)
420 char *cursor0 = file_name + FILE_SYSTEM_PREFIX_LEN (file_name);
421 char *cursor; /* points into the file name */
422 int did_something = 0; /* did we do anything yet? */
423 int mode;
424 int invert_permissions;
425 int status;
427 for (cursor = cursor0; *cursor; cursor++)
429 if (! ISSLASH (*cursor))
430 continue;
432 /* Avoid mkdir of empty string, if leading or double '/'. */
434 if (cursor == cursor0 || ISSLASH (cursor[-1]))
435 continue;
437 /* Avoid mkdir where last part of file name is "." or "..". */
439 if (cursor[-1] == '.'
440 && (cursor == cursor0 + 1 || ISSLASH (cursor[-2])
441 || (cursor[-2] == '.'
442 && (cursor == cursor0 + 2 || ISSLASH (cursor[-3])))))
443 continue;
445 *cursor = '\0'; /* truncate the name there */
446 mode = MODE_RWX & ~ newdir_umask;
447 invert_permissions = we_are_root ? 0 : MODE_WXUSR & ~ mode;
448 status = mkdir (file_name, mode ^ invert_permissions);
450 if (status == 0)
452 /* Create a struct delayed_set_stat even if
453 invert_permissions is zero, because
454 repair_delayed_set_stat may need to update the struct. */
455 delay_set_stat (file_name,
456 &current_stat_info,
457 invert_permissions, INTERDIR_PERMSTATUS);
459 print_for_mkdir (file_name, cursor - file_name, mode);
460 did_something = 1;
462 *cursor = '/';
463 continue;
466 *cursor = '/';
468 if (errno == EEXIST)
469 continue; /* Directory already exists. */
470 else if ((errno == ENOSYS /* Automounted dirs on Solaris return
471 this. Reported by Warren Hyde
472 <Warren.Hyde@motorola.com> */
473 || ERRNO_IS_EACCES) /* Turbo C mkdir gives a funny errno. */
474 && access (file_name, W_OK) == 0)
475 continue;
477 /* Some other error in the mkdir. We return to the caller. */
478 break;
481 return did_something; /* tell them to retry if we made one */
484 static bool
485 file_newer_p (const char *file_name, struct tar_stat_info *tar_stat)
487 struct stat st;
489 if (stat (file_name, &st))
491 if (errno != ENOENT)
493 stat_warn (file_name);
494 /* Be on the safe side: if the file does exist assume it is newer */
495 return true;
497 return false;
499 if (!S_ISDIR (st.st_mode)
500 && tar_timespec_cmp (tar_stat->mtime, get_stat_mtime (&st)) <= 0)
502 return true;
504 return false;
507 #define RECOVER_NO 0
508 #define RECOVER_OK 1
509 #define RECOVER_SKIP 2
511 /* Attempt repairing what went wrong with the extraction. Delete an
512 already existing file or create missing intermediate directories.
513 Return RECOVER_OK if we somewhat increased our chances at a successful
514 extraction, RECOVER_NO if there are no chances, and RECOVER_SKIP if the
515 caller should skip extraction of that member. The value of errno is
516 properly restored on returning RECOVER_NO. */
518 static int
519 maybe_recoverable (char *file_name, int *interdir_made)
521 int e = errno;
523 if (*interdir_made)
524 return RECOVER_NO;
526 switch (errno)
528 case EEXIST:
529 /* Remove an old file, if the options allow this. */
531 switch (old_files_option)
533 case KEEP_OLD_FILES:
534 return RECOVER_SKIP;
536 case KEEP_NEWER_FILES:
537 if (file_newer_p (file_name, &current_stat_info))
539 errno = e;
540 return RECOVER_NO;
542 /* FALL THROUGH */
544 case DEFAULT_OLD_FILES:
545 case NO_OVERWRITE_DIR_OLD_FILES:
546 case OVERWRITE_OLD_FILES:
548 int r = remove_any_file (file_name, ORDINARY_REMOVE_OPTION);
549 errno = EEXIST;
550 return r > 0 ? RECOVER_OK : RECOVER_NO;
553 case UNLINK_FIRST_OLD_FILES:
554 break;
557 case ENOENT:
558 /* Attempt creating missing intermediate directories. */
559 if (! make_directories (file_name))
561 errno = ENOENT;
562 return RECOVER_NO;
564 *interdir_made = 1;
565 return RECOVER_OK;
567 default:
568 /* Just say we can't do anything about it... */
570 return RECOVER_NO;
574 /* Fix the statuses of all directories whose statuses need fixing, and
575 which are not ancestors of FILE_NAME. If AFTER_LINKS is
576 nonzero, do this for all such directories; otherwise, stop at the
577 first directory that is marked to be fixed up only after delayed
578 links are applied. */
579 static void
580 apply_nonancestor_delayed_set_stat (char const *file_name, bool after_links)
582 size_t file_name_len = strlen (file_name);
583 bool check_for_renamed_directories = 0;
585 while (delayed_set_stat_head)
587 struct delayed_set_stat *data = delayed_set_stat_head;
588 bool skip_this_one = 0;
589 struct stat st;
590 struct stat const *cur_info = 0;
592 check_for_renamed_directories |= data->after_links;
594 if (after_links < data->after_links
595 || (data->file_name_len < file_name_len
596 && file_name[data->file_name_len]
597 && (ISSLASH (file_name[data->file_name_len])
598 || ISSLASH (file_name[data->file_name_len - 1]))
599 && memcmp (file_name, data->file_name, data->file_name_len) == 0))
600 break;
602 if (check_for_renamed_directories)
604 cur_info = &st;
605 if (stat (data->file_name, &st) != 0)
607 stat_error (data->file_name);
608 skip_this_one = 1;
610 else if (! (st.st_dev == data->dev && st.st_ino == data->ino))
612 ERROR ((0, 0,
613 _("%s: Directory renamed before its status could be extracted"),
614 quotearg_colon (data->file_name)));
615 skip_this_one = 1;
619 if (! skip_this_one)
621 struct tar_stat_info sb;
622 sb.stat.st_mode = data->mode;
623 sb.stat.st_uid = data->uid;
624 sb.stat.st_gid = data->gid;
625 sb.atime = data->atime;
626 sb.mtime = data->mtime;
627 set_stat (data->file_name, &sb, cur_info,
628 data->invert_permissions, data->permstatus, DIRTYPE);
631 delayed_set_stat_head = data->next;
632 free (data);
638 /* Extractor functions for various member types */
640 static int
641 extract_dir (char *file_name, int typeflag)
643 int status;
644 mode_t mode;
645 int interdir_made = 0;
647 /* Save 'root device' to avoid purging mount points. */
648 if (one_file_system_option && root_device == 0)
650 struct stat st;
651 char *dir = xgetcwd ();
653 if (deref_stat (true, dir, &st))
654 stat_diag (dir);
655 else
656 root_device = st.st_dev;
657 free (dir);
660 if (incremental_option)
661 /* Read the entry and delete files that aren't listed in the archive. */
662 purge_directory (file_name);
663 else if (typeflag == GNUTYPE_DUMPDIR)
664 skip_member ();
666 mode = current_stat_info.stat.st_mode | (we_are_root ? 0 : MODE_WXUSR);
667 if (0 < same_owner_option || current_stat_info.stat.st_mode & ~ MODE_RWX)
668 mode &= S_IRWXU;
670 while ((status = mkdir (file_name, mode)))
672 if (errno == EEXIST
673 && (interdir_made
674 || old_files_option == DEFAULT_OLD_FILES
675 || old_files_option == OVERWRITE_OLD_FILES))
677 struct stat st;
678 if (stat (file_name, &st) == 0)
680 if (interdir_made)
682 repair_delayed_set_stat (file_name, &st);
683 return 0;
685 if (S_ISDIR (st.st_mode))
687 status = 0;
688 mode = st.st_mode;
689 break;
692 errno = EEXIST;
695 switch (maybe_recoverable (file_name, &interdir_made))
697 case RECOVER_OK:
698 continue;
700 case RECOVER_SKIP:
701 break;
703 case RECOVER_NO:
704 if (errno != EEXIST)
706 mkdir_error (file_name);
707 return 1;
709 break;
711 break;
714 if (status == 0
715 || old_files_option == DEFAULT_OLD_FILES
716 || old_files_option == OVERWRITE_OLD_FILES)
718 if (status == 0)
719 delay_set_stat (file_name, &current_stat_info,
720 ((mode ^ current_stat_info.stat.st_mode)
721 & MODE_RWX & ~ current_umask),
722 ARCHIVED_PERMSTATUS);
723 else /* For an already existing directory, invert_perms must be 0 */
724 delay_set_stat (file_name, &current_stat_info,
726 UNKNOWN_PERMSTATUS);
728 return status;
732 static int
733 open_output_file (char *file_name, int typeflag, mode_t mode)
735 int fd;
736 int openflag = (O_WRONLY | O_BINARY | O_CREAT
737 | (old_files_option == OVERWRITE_OLD_FILES
738 ? O_TRUNC
739 : O_EXCL));
741 #if O_CTG
742 /* Contiguous files (on the Masscomp) have to specify the size in
743 the open call that creates them. */
745 if (typeflag == CONTTYPE)
746 fd = open (file_name, openflag | O_CTG, mode, current_stat_info.stat.st_size);
747 else
748 fd = open (file_name, openflag, mode);
750 #else /* not O_CTG */
751 if (typeflag == CONTTYPE)
753 static int conttype_diagnosed;
755 if (!conttype_diagnosed)
757 conttype_diagnosed = 1;
758 WARNOPT (WARN_CONTIGUOUS_CAST,
759 (0, 0, _("Extracting contiguous files as regular files")));
762 fd = open (file_name, openflag, mode);
764 #endif /* not O_CTG */
766 return fd;
769 static int
770 extract_file (char *file_name, int typeflag)
772 int fd;
773 off_t size;
774 union block *data_block;
775 int status;
776 size_t count;
777 size_t written;
778 int interdir_made = 0;
779 mode_t mode = current_stat_info.stat.st_mode & MODE_RWX & ~ current_umask;
780 mode_t invert_permissions =
781 0 < same_owner_option ? mode & (S_IRWXG | S_IRWXO) : 0;
783 /* FIXME: deal with protection issues. */
785 if (to_stdout_option)
786 fd = STDOUT_FILENO;
787 else if (to_command_option)
789 fd = sys_exec_command (file_name, 'f', &current_stat_info);
790 if (fd < 0)
792 skip_member ();
793 return 0;
796 else
798 int recover = RECOVER_NO;
800 fd = open_output_file (file_name, typeflag, mode ^ invert_permissions);
801 while (fd < 0
802 && (recover = maybe_recoverable (file_name, &interdir_made))
803 == RECOVER_OK);
805 if (fd < 0)
807 skip_member ();
808 if (recover == RECOVER_SKIP)
809 return 0;
810 open_error (file_name);
811 return 1;
815 mv_begin (&current_stat_info);
816 if (current_stat_info.is_sparse)
817 sparse_extract_file (fd, &current_stat_info, &size);
818 else
819 for (size = current_stat_info.stat.st_size; size > 0; )
821 mv_size_left (size);
823 /* Locate data, determine max length writeable, write it,
824 block that we have used the data, then check if the write
825 worked. */
827 data_block = find_next_block ();
828 if (! data_block)
830 ERROR ((0, 0, _("Unexpected EOF in archive")));
831 break; /* FIXME: What happens, then? */
834 written = available_space_after (data_block);
836 if (written > size)
837 written = size;
838 errno = 0;
839 count = full_write (fd, data_block->buffer, written);
840 size -= written;
842 set_next_block_after ((union block *)
843 (data_block->buffer + written - 1));
844 if (count != written)
846 if (!to_command_option)
847 write_error_details (file_name, count, written);
848 /* FIXME: shouldn't we restore from backup? */
849 break;
853 skip_file (size);
855 mv_end ();
857 /* If writing to stdout, don't try to do anything to the filename;
858 it doesn't exist, or we don't want to touch it anyway. */
860 if (to_stdout_option)
861 return 0;
863 status = close (fd);
864 if (status < 0)
865 close_error (file_name);
867 if (to_command_option)
868 sys_wait_command ();
869 else
870 set_stat (file_name, &current_stat_info, NULL, invert_permissions,
871 (old_files_option == OVERWRITE_OLD_FILES ?
872 UNKNOWN_PERMSTATUS : ARCHIVED_PERMSTATUS),
873 typeflag);
875 return status;
878 /* Create a placeholder file with name FILE_NAME, which will be
879 replaced after other extraction is done by a symbolic link if
880 IS_SYMLINK is true, and by a hard link otherwise. Set
881 *INTERDIR_MADE if an intermediate directory is made in the
882 process. */
884 static int
885 create_placeholder_file (char *file_name, bool is_symlink, int *interdir_made)
887 int fd;
888 struct stat st;
890 while ((fd = open (file_name, O_WRONLY | O_CREAT | O_EXCL, 0)) < 0)
891 if (! maybe_recoverable (file_name, interdir_made))
892 break;
894 if (fd < 0)
895 open_error (file_name);
896 else if (fstat (fd, &st) != 0)
898 stat_error (file_name);
899 close (fd);
901 else if (close (fd) != 0)
902 close_error (file_name);
903 else
905 struct delayed_set_stat *h;
906 struct delayed_link *p =
907 xmalloc (offsetof (struct delayed_link, target)
908 + strlen (current_stat_info.link_name)
909 + 1);
910 p->next = delayed_link_head;
911 delayed_link_head = p;
912 p->dev = st.st_dev;
913 p->ino = st.st_ino;
914 p->mtime = get_stat_mtime (&st);
915 p->is_symlink = is_symlink;
916 if (is_symlink)
918 p->uid = current_stat_info.stat.st_uid;
919 p->gid = current_stat_info.stat.st_gid;
921 p->sources = xmalloc (offsetof (struct string_list, string)
922 + strlen (file_name) + 1);
923 p->sources->next = 0;
924 strcpy (p->sources->string, file_name);
925 strcpy (p->target, current_stat_info.link_name);
927 h = delayed_set_stat_head;
928 if (h && ! h->after_links
929 && strncmp (file_name, h->file_name, h->file_name_len) == 0
930 && ISSLASH (file_name[h->file_name_len])
931 && (last_component (file_name) == file_name + h->file_name_len + 1))
935 h->after_links = 1;
937 if (stat (h->file_name, &st) != 0)
938 stat_error (h->file_name);
939 else
941 h->dev = st.st_dev;
942 h->ino = st.st_ino;
945 while ((h = h->next) && ! h->after_links);
948 return 0;
951 return -1;
954 static int
955 extract_link (char *file_name, int typeflag)
957 int interdir_made = 0;
958 char const *link_name;
960 link_name = current_stat_info.link_name;
962 if (! absolute_names_option && contains_dot_dot (link_name))
963 return create_placeholder_file (file_name, false, &interdir_made);
967 struct stat st1, st2;
968 int e;
969 int status = link (link_name, file_name);
970 e = errno;
972 if (status == 0)
974 struct delayed_link *ds = delayed_link_head;
975 if (ds && lstat (link_name, &st1) == 0)
976 for (; ds; ds = ds->next)
977 if (ds->dev == st1.st_dev
978 && ds->ino == st1.st_ino
979 && timespec_cmp (ds->mtime, get_stat_mtime (&st1)) == 0)
981 struct string_list *p = xmalloc (offsetof (struct string_list, string)
982 + strlen (file_name) + 1);
983 strcpy (p->string, file_name);
984 p->next = ds->sources;
985 ds->sources = p;
986 break;
988 return 0;
990 else if ((e == EEXIST && strcmp (link_name, file_name) == 0)
991 || (lstat (link_name, &st1) == 0
992 && lstat (file_name, &st2) == 0
993 && st1.st_dev == st2.st_dev
994 && st1.st_ino == st2.st_ino))
995 return 0;
997 errno = e;
999 while (maybe_recoverable (file_name, &interdir_made));
1001 if (!(incremental_option && errno == EEXIST))
1003 link_error (link_name, file_name);
1004 return 1;
1006 return 0;
1009 static int
1010 extract_symlink (char *file_name, int typeflag)
1012 #ifdef HAVE_SYMLINK
1013 int status;
1014 int interdir_made = 0;
1016 if (! absolute_names_option
1017 && (IS_ABSOLUTE_FILE_NAME (current_stat_info.link_name)
1018 || contains_dot_dot (current_stat_info.link_name)))
1019 return create_placeholder_file (file_name, true, &interdir_made);
1021 while ((status = symlink (current_stat_info.link_name, file_name)))
1022 if (!maybe_recoverable (file_name, &interdir_made))
1023 break;
1025 if (status == 0)
1026 set_stat (file_name, &current_stat_info, NULL, 0, 0, SYMTYPE);
1027 else
1028 symlink_error (current_stat_info.link_name, file_name);
1029 return status;
1031 #else
1032 static int warned_once;
1034 if (!warned_once)
1036 warned_once = 1;
1037 WARNOPT (WARN_SYMBOLIC_CAST,
1038 (0, 0,
1039 _("Attempting extraction of symbolic links as hard links")));
1041 return extract_link (file_name, typeflag);
1042 #endif
#if S_IFCHR || S_IFBLK
/* Extract the character- or block-special member FILE_NAME of type
   TYPEFLAG with mknod, then restore its attributes.  Return 0 on
   success or when the member is skipped, nonzero otherwise.  */
static int
extract_node (char *file_name, int typeflag)
{
  int status;
  int interdir_made = 0;
  mode_t mode = current_stat_info.stat.st_mode & ~ current_umask;
  mode_t invert_permissions =
    0 < same_owner_option ? mode & (S_IRWXG | S_IRWXO) : 0;

  while ((status = mknod (file_name, mode ^ invert_permissions,
                          current_stat_info.stat.st_rdev)) != 0)
    {
      /* maybe_recoverable has two nonzero results.  Only RECOVER_OK
         warrants a retry; retrying on RECOVER_SKIP would repeat the
         same failing mknod forever.  */
      int recover = maybe_recoverable (file_name, &interdir_made);
      if (recover == RECOVER_SKIP)
        return 0;
      if (recover != RECOVER_OK)
        break;
    }

  if (status != 0)
    mknod_error (file_name);
  else
    set_stat (file_name, &current_stat_info, NULL, invert_permissions,
              ARCHIVED_PERMSTATUS, typeflag);
  return status;
}
#endif
#if HAVE_MKFIFO || defined mkfifo
/* Extract the FIFO member FILE_NAME of type TYPEFLAG with mkfifo,
   then restore its attributes.  Return 0 on success or when the
   member is skipped, nonzero otherwise.  */
static int
extract_fifo (char *file_name, int typeflag)
{
  int status;
  int interdir_made = 0;
  mode_t mode = current_stat_info.stat.st_mode & ~ current_umask;
  mode_t invert_permissions =
    0 < same_owner_option ? mode & (S_IRWXG | S_IRWXO) : 0;

  /* Create the FIFO with the INVERT_PERMISSIONS bits already flipped,
     as extract_file and extract_node do.  set_stat is later told to
     invert those same bits, so creating the FIFO with plain MODE
     would leave the group and other bits wrong afterwards.  */
  while ((status = mkfifo (file_name, mode ^ invert_permissions)) != 0)
    {
      /* maybe_recoverable has two nonzero results.  Only RECOVER_OK
         warrants a retry; retrying on RECOVER_SKIP would repeat the
         same failing mkfifo forever.  */
      int recover = maybe_recoverable (file_name, &interdir_made);
      if (recover == RECOVER_SKIP)
        return 0;
      if (recover != RECOVER_OK)
        break;
    }

  if (status == 0)
    set_stat (file_name, &current_stat_info, NULL, invert_permissions,
              ARCHIVED_PERMSTATUS, typeflag);
  else
    mkfifo_error (file_name);
  return status;
}
#endif
1092 static int
1093 extract_volhdr (char *file_name, int typeflag)
1095 if (verbose_option)
1096 fprintf (stdlis, _("Reading %s\n"), quote (current_stat_info.file_name));
1097 skip_member ();
1098 return 0;
/* Extractor used for members that cannot be extracted.  FILE_NAME and
   TYPEFLAG are unused.  Always return 1 to signal failure.  */
static int
extract_failure (char *file_name, int typeflag)
{
  int const failure_status = 1;

  return failure_status;
}
1107 typedef int (*tar_extractor_t) (char *file_name, int typeflag);
1111 /* Prepare to extract a file. Find extractor function.
1112 Return zero if extraction should not proceed. */
1114 static int
1115 prepare_to_extract (char const *file_name, int typeflag, tar_extractor_t *fun)
1117 int rc = 1;
1119 if (EXTRACT_OVER_PIPE)
1120 rc = 0;
1122 /* Select the extractor */
1123 switch (typeflag)
1125 case GNUTYPE_SPARSE:
1126 *fun = extract_file;
1127 rc = 1;
1128 break;
1130 case AREGTYPE:
1131 case REGTYPE:
1132 case CONTTYPE:
1133 /* Appears to be a file. But BSD tar uses the convention that a slash
1134 suffix means a directory. */
1135 if (current_stat_info.had_trailing_slash)
1136 *fun = extract_dir;
1137 else
1139 *fun = extract_file;
1140 rc = 1;
1142 break;
1144 case SYMTYPE:
1145 *fun = extract_symlink;
1146 break;
1148 case LNKTYPE:
1149 *fun = extract_link;
1150 break;
1152 #if S_IFCHR
1153 case CHRTYPE:
1154 current_stat_info.stat.st_mode |= S_IFCHR;
1155 *fun = extract_node;
1156 break;
1157 #endif
1159 #if S_IFBLK
1160 case BLKTYPE:
1161 current_stat_info.stat.st_mode |= S_IFBLK;
1162 *fun = extract_node;
1163 break;
1164 #endif
1166 #if HAVE_MKFIFO || defined mkfifo
1167 case FIFOTYPE:
1168 *fun = extract_fifo;
1169 break;
1170 #endif
1172 case DIRTYPE:
1173 case GNUTYPE_DUMPDIR:
1174 *fun = extract_dir;
1175 if (current_stat_info.is_dumpdir)
1176 delay_directory_restore_option = true;
1177 break;
1179 case GNUTYPE_VOLHDR:
1180 *fun = extract_volhdr;
1181 break;
1183 case GNUTYPE_MULTIVOL:
1184 ERROR ((0, 0,
1185 _("%s: Cannot extract -- file is continued from another volume"),
1186 quotearg_colon (current_stat_info.file_name)));
1187 *fun = extract_failure;
1188 break;
1190 case GNUTYPE_LONGNAME:
1191 case GNUTYPE_LONGLINK:
1192 ERROR ((0, 0, _("Unexpected long name header")));
1193 *fun = extract_failure;
1194 break;
1196 default:
1197 WARNOPT (WARN_UNKNOWN_CAST,
1198 (0, 0,
1199 _("%s: Unknown file type `%c', extracted as normal file"),
1200 quotearg_colon (file_name), typeflag));
1201 *fun = extract_file;
1204 /* Determine whether the extraction should proceed */
1205 if (rc == 0)
1206 return 0;
1208 switch (old_files_option)
1210 case UNLINK_FIRST_OLD_FILES:
1211 if (!remove_any_file (file_name,
1212 recursive_unlink_option ? RECURSIVE_REMOVE_OPTION
1213 : ORDINARY_REMOVE_OPTION)
1214 && errno && errno != ENOENT)
1216 unlink_error (file_name);
1217 return 0;
1219 break;
1221 case KEEP_NEWER_FILES:
1222 if (file_newer_p (file_name, &current_stat_info))
1224 WARNOPT (WARN_IGNORE_NEWER,
1225 (0, 0, _("Current %s is newer or same age"),
1226 quote (file_name)));
1227 return 0;
1229 break;
1231 default:
1232 break;
1235 return 1;
1238 /* Extract a file from the archive. */
1239 void
1240 extract_archive (void)
1242 char typeflag;
1243 tar_extractor_t fun;
1245 /* Try to disable the ability to unlink a directory. */
1246 priv_set_remove_linkdir ();
1248 set_next_block_after (current_header);
1249 decode_header (current_header, &current_stat_info, &current_format, 1);
1250 if (!current_stat_info.file_name[0]
1251 || (interactive_option
1252 && !confirm ("extract", current_stat_info.file_name)))
1254 skip_member ();
1255 return;
1258 /* Print the block from current_header and current_stat. */
1259 if (verbose_option)
1260 print_header (&current_stat_info, -1);
1262 /* Restore stats for all non-ancestor directories, unless
1263 it is an incremental archive.
1264 (see NOTICE in the comment to delay_set_stat above) */
1265 if (!delay_directory_restore_option)
1266 apply_nonancestor_delayed_set_stat (current_stat_info.file_name, 0);
1268 /* Take a safety backup of a previously existing file. */
1270 if (backup_option)
1271 if (!maybe_backup_file (current_stat_info.file_name, 0))
1273 int e = errno;
1274 ERROR ((0, e, _("%s: Was unable to backup this file"),
1275 quotearg_colon (current_stat_info.file_name)));
1276 skip_member ();
1277 return;
1280 /* Extract the archive entry according to its type. */
1281 /* KLUDGE */
1282 typeflag = sparse_member_p (&current_stat_info) ?
1283 GNUTYPE_SPARSE : current_header->header.typeflag;
1285 if (prepare_to_extract (current_stat_info.file_name, typeflag, &fun))
1287 if (fun && (*fun) (current_stat_info.file_name, typeflag)
1288 && backup_option)
1289 undo_last_backup ();
1291 else
1292 skip_member ();
1296 /* Extract the symbolic links whose final extraction were delayed. */
1297 static void
1298 apply_delayed_links (void)
1300 struct delayed_link *ds;
1302 for (ds = delayed_link_head; ds; )
1304 struct string_list *sources = ds->sources;
1305 char const *valid_source = 0;
1307 for (sources = ds->sources; sources; sources = sources->next)
1309 char const *source = sources->string;
1310 struct stat st;
1312 /* Make sure the placeholder file is still there. If not,
1313 don't create a link, as the placeholder was probably
1314 removed by a later extraction. */
1315 if (lstat (source, &st) == 0
1316 && st.st_dev == ds->dev
1317 && st.st_ino == ds->ino
1318 && timespec_cmp (get_stat_mtime (&st), ds->mtime) == 0)
1320 /* Unlink the placeholder, then create a hard link if possible,
1321 a symbolic link otherwise. */
1322 if (unlink (source) != 0)
1323 unlink_error (source);
1324 else if (valid_source && link (valid_source, source) == 0)
1326 else if (!ds->is_symlink)
1328 if (link (ds->target, source) != 0)
1329 link_error (ds->target, source);
1331 else if (symlink (ds->target, source) != 0)
1332 symlink_error (ds->target, source);
1333 else
1335 struct tar_stat_info st1;
1336 st1.stat.st_uid = ds->uid;
1337 st1.stat.st_gid = ds->gid;
1338 set_stat (source, &st1, NULL, 0, 0, SYMTYPE);
1339 valid_source = source;
1344 for (sources = ds->sources; sources; )
1346 struct string_list *next = sources->next;
1347 free (sources);
1348 sources = next;
1352 struct delayed_link *next = ds->next;
1353 free (ds);
1354 ds = next;
1358 delayed_link_head = 0;
/* Finish the extraction of an archive.  The three steps below must run
   in this order.  */
void
extract_finish (void)
{
  /* Step 1: fix the status of the ordinary directories that still need
     it.  */
  apply_nonancestor_delayed_set_stat ("", 0);

  /* Step 2: create the delayed links.  Doing it only now keeps them from
     affecting the status-setting of the ordinary directories above.  */
  apply_delayed_links ();

  /* Step 3: fix the status of the directories that are ancestors of
     delayed links.  */
  apply_nonancestor_delayed_set_stat ("", 1);
}
/* Rename directory SRC to DST.  Return true on success.  On failure,
   report the error and return false.  When the first attempt fails with
   ENOENT, make_directories is called on DST and, if it returns nonzero,
   the rename is tried once more.  */
bool
rename_directory (char *src, char *dst)
{
  int err;

  if (rename (src, dst) == 0)
    return true;

  /* Save errno before any further call can overwrite it.  */
  err = errno;

  if (err == ENOENT)
    {
      if (make_directories (dst))
        {
          if (rename (src, dst) == 0)
            return true;
          /* Report the failure of the retry, not of the first attempt.  */
          err = errno;
        }
    }
  /* EXDEV gets no special treatment yet.
     FIXME: Fall back to recursive copying */

  ERROR ((0, err, _("Cannot rename %s to %s"),
          quote_n (0, src),
          quote_n (1, dst)));
  return false;
}
1410 void
1411 fatal_exit (void)
1413 extract_finish ();
1414 error (TAREXIT_FAILURE, 0, _("Error is not recoverable: exiting now"));
1415 abort ();
/* Report memory exhaustion, then leave through fatal_exit.  */
void
xalloc_die (void)
{
  /* Status 0 here, so the message is printed by error () and the exit
     itself is left to fatal_exit.  */
  error (0, 0, "%s", _("memory exhausted"));
  fatal_exit ();
}