2 * Copyright (c) 2003-2007 Tim Kientzle
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions
8 * 1. Redistributions of source code must retain the above copyright
9 * notice, this list of conditions and the following disclaimer.
10 * 2. Redistributions in binary form must reproduce the above copyright
11 * notice, this list of conditions and the following disclaimer in the
12 * documentation and/or other materials provided with the distribution.
14 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR(S) ``AS IS'' AND ANY EXPRESS OR
15 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
16 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
17 * IN NO EVENT SHALL THE AUTHOR(S) BE LIABLE FOR ANY DIRECT, INDIRECT,
18 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
19 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
20 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
21 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
22 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
23 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26 #include "bsdtar_platform.h"
27 __FBSDID("$FreeBSD: src/usr.bin/tar/util.c,v 1.20 2008/06/09 14:03:55 cperciva Exp $");
29 #ifdef HAVE_SYS_STAT_H
32 #ifdef HAVE_SYS_TYPES_H
33 #include <sys/types.h> /* Linux doesn't define mode_t, etc. in sys/stat.h. */
52 static void bsdtar_vwarnc(struct bsdtar
*, int code
,
53 const char *fmt
, va_list ap
);
56 * Print a string, taking care with any non-printable characters.
60 safe_fprintf(FILE *f
, const char *fmt
, ...)
72 /* Use a stack-allocated buffer if we can, for speed and safety. */
74 buff_length
= sizeof(buff_stack
);
78 length
= vsnprintf(buff
, buff_length
, fmt
, ap
);
80 /* If the result is too large, allocate a buffer on the heap. */
81 if (length
>= buff_length
) {
82 buff_length
= length
+1;
83 buff_heap
= malloc(buff_length
);
84 /* Failsafe: use the truncated string if malloc fails. */
85 if (buff_heap
!= NULL
) {
88 length
= vsnprintf(buff
, buff_length
, fmt
, ap
);
93 /* Write data, expanding unprintable characters. */
97 unsigned char c
= *p
++;
99 if (isprint(c
) && c
!= '\\')
102 copy_buff
[i
++] = '\\';
104 case '\a': copy_buff
[i
++] = 'a'; break;
105 case '\b': copy_buff
[i
++] = 'b'; break;
106 case '\f': copy_buff
[i
++] = 'f'; break;
107 case '\n': copy_buff
[i
++] = 'n'; break;
109 /* On some platforms, \n and \r are the same. */
110 case '\r': copy_buff
[i
++] = 'r'; break;
112 case '\t': copy_buff
[i
++] = 't'; break;
113 case '\v': copy_buff
[i
++] = 'v'; break;
114 case '\\': copy_buff
[i
++] = '\\'; break;
116 sprintf(copy_buff
+ i
, "%03o", c
);
121 /* If our temp buffer is full, dump it and keep going. */
122 if (i
> (sizeof(copy_buff
) - 8)) {
123 copy_buff
[i
++] = '\0';
124 fprintf(f
, "%s", copy_buff
);
128 copy_buff
[i
++] = '\0';
129 fprintf(f
, "%s", copy_buff
);
131 /* If we allocated a heap-based buffer, free it now. */
132 if (buff_heap
!= NULL
)
137 bsdtar_vwarnc(struct bsdtar
*bsdtar
, int code
, const char *fmt
, va_list ap
)
139 fprintf(stderr
, "%s: ", bsdtar
->progname
);
140 vfprintf(stderr
, fmt
, ap
);
142 fprintf(stderr
, ": %s", strerror(code
));
143 fprintf(stderr
, "\n");
147 bsdtar_warnc(struct bsdtar
*bsdtar
, int code
, const char *fmt
, ...)
152 bsdtar_vwarnc(bsdtar
, code
, fmt
, ap
);
157 bsdtar_errc(struct bsdtar
*bsdtar
, int eval
, int code
, const char *fmt
, ...)
162 bsdtar_vwarnc(bsdtar
, code
, fmt
, ap
);
168 yes(const char *fmt
, ...)
176 vfprintf(stderr
, fmt
, ap
);
178 fprintf(stderr
, " (y/N)? ");
181 l
= read(2, buff
, sizeof(buff
) - 1);
186 for (p
= buff
; *p
!= '\0'; p
++) {
187 if (isspace(0xff & (int)*p
))
203 * Read lines from file and do something with each one. If option_null
204 * is set, lines are terminated with zero bytes; otherwise, they're
205 * terminated with newlines.
207 * This uses a self-sizing buffer to handle arbitrarily-long lines.
208 * If the "process" function returns non-zero for any line, this
209 * function will return non-zero after attempting to process all remaining lines.
213 process_lines(struct bsdtar
*bsdtar
, const char *pathname
,
214 int (*process
)(struct bsdtar
*, const char *))
217 char *buff
, *buff_end
, *line_start
, *line_end
, *p
;
218 size_t buff_length
, new_buff_length
, bytes_read
, bytes_wanted
;
222 separator
= bsdtar
->option_null
? '\0' : '\n';
225 if (strcmp(pathname
, "-") == 0)
228 f
= fopen(pathname
, "r");
230 bsdtar_errc(bsdtar
, 1, errno
, "Couldn't open %s", pathname
);
232 buff
= malloc(buff_length
);
234 bsdtar_errc(bsdtar
, 1, ENOMEM
, "Can't read %s", pathname
);
235 line_start
= line_end
= buff_end
= buff
;
237 /* Get some more data into the buffer. */
238 bytes_wanted
= buff
+ buff_length
- buff_end
;
239 bytes_read
= fread(buff_end
, 1, bytes_wanted
, f
);
240 buff_end
+= bytes_read
;
241 /* Process all complete lines in the buffer. */
242 while (line_end
< buff_end
) {
243 if (*line_end
== separator
) {
245 if ((*process
)(bsdtar
, line_start
) != 0)
247 line_start
= line_end
+ 1;
248 line_end
= line_start
;
255 bsdtar_errc(bsdtar
, 1, errno
,
256 "Can't read %s", pathname
);
257 if (line_start
> buff
) {
258 /* Move a leftover fractional line to the beginning. */
259 memmove(buff
, line_start
, buff_end
- line_start
);
260 buff_end
-= line_start
- buff
;
261 line_end
-= line_start
- buff
;
264 /* Line is too big; enlarge the buffer. */
265 new_buff_length
= buff_length
* 2;
266 if (new_buff_length
<= buff_length
)
267 bsdtar_errc(bsdtar
, 1, ENOMEM
,
268 "Line too long in %s", pathname
);
269 buff_length
= new_buff_length
;
270 p
= realloc(buff
, buff_length
);
272 bsdtar_errc(bsdtar
, 1, ENOMEM
,
273 "Line too long in %s", pathname
);
274 buff_end
= p
+ (buff_end
- buff
);
275 line_end
= p
+ (line_end
- buff
);
276 line_start
= buff
= p
;
279 /* At end-of-file, handle the final line. */
280 if (line_end
> line_start
) {
282 if ((*process
)(bsdtar
, line_start
) != 0)
292 * The logic here for -C <dir> attempts to avoid
293 * chdir() as long as possible. For example:
294 * "-C /foo -C /bar file" needs chdir("/bar") but not chdir("/foo")
295 * "-C /foo -C bar file" needs chdir("/foo/bar")
296 * "-C /foo -C bar /file1" does not need chdir()
297 * "-C /foo -C bar /file1 file2" needs chdir("/foo/bar") before file2
299 * The only correct way to handle this is to record a "pending" chdir
300 * request and combine multiple requests intelligently until we
301 * need to process a non-absolute file. set_chdir() adds the new dir
302 * to the pending list; do_chdir() actually executes any pending chdir.
304 * This way, programs that build tar command lines don't have to worry
305 * about -C with non-existent directories; such requests will only
306 * fail if the directory must be accessed.
309 set_chdir(struct bsdtar
*bsdtar
, const char *newdir
)
311 if (newdir
[0] == '/') {
312 /* The -C /foo -C /bar case; dump first one. */
313 free(bsdtar
->pending_chdir
);
314 bsdtar
->pending_chdir
= NULL
;
316 if (bsdtar
->pending_chdir
== NULL
)
317 /* Easy case: no previously-saved dir. */
318 bsdtar
->pending_chdir
= strdup(newdir
);
320 /* The -C /foo -C bar case; concatenate */
321 char *old_pending
= bsdtar
->pending_chdir
;
322 size_t old_len
= strlen(old_pending
);
323 bsdtar
->pending_chdir
= malloc(old_len
+ strlen(newdir
) + 2);
324 if (old_pending
[old_len
- 1] == '/')
325 old_pending
[old_len
- 1] = '\0';
326 if (bsdtar
->pending_chdir
!= NULL
)
327 sprintf(bsdtar
->pending_chdir
, "%s/%s",
328 old_pending
, newdir
);
331 if (bsdtar
->pending_chdir
== NULL
)
332 bsdtar_errc(bsdtar
, 1, errno
, "No memory");
336 do_chdir(struct bsdtar
*bsdtar
)
338 if (bsdtar
->pending_chdir
== NULL
)
341 if (chdir(bsdtar
->pending_chdir
) != 0) {
342 bsdtar_errc(bsdtar
, 1, 0, "could not chdir to '%s'\n",
343 bsdtar
->pending_chdir
);
345 free(bsdtar
->pending_chdir
);
346 bsdtar
->pending_chdir
= NULL
;
350 * Handle --strip-components and any future path-rewriting options.
351 * Returns non-zero if the pathname should not be extracted.
353 * TODO: Support pax-style regex path rewrites.
356 edit_pathname(struct bsdtar
*bsdtar
, struct archive_entry
*entry
)
358 const char *name
= archive_entry_pathname(entry
);
365 r
= apply_substitution(bsdtar
, name
, &subst_name
, 0);
367 bsdtar_warnc(bsdtar
, 0, "Invalid substituion, skipping entry");
371 archive_entry_copy_pathname(entry
, subst_name
);
372 if (*subst_name
== '\0') {
377 name
= archive_entry_pathname(entry
);
380 if (archive_entry_hardlink(entry
)) {
381 r
= apply_substitution(bsdtar
, archive_entry_hardlink(entry
), &subst_name
, 1);
383 bsdtar_warnc(bsdtar
, 0, "Invalid substituion, skipping entry");
387 archive_entry_copy_hardlink(entry
, subst_name
);
391 if (archive_entry_symlink(entry
) != NULL
) {
392 r
= apply_substitution(bsdtar
, archive_entry_symlink(entry
), &subst_name
, 1);
394 bsdtar_warnc(bsdtar
, 0, "Invalid substituion, skipping entry");
398 archive_entry_copy_symlink(entry
, subst_name
);
404 /* Strip leading dir names as per --strip-components option. */
405 if ((r
= bsdtar
->strip_components
) > 0) {
406 const char *p
= name
;
415 /* Path is too short, skip it. */
425 /* Strip redundant leading '/' characters. */
426 while (name
[0] == '/' && name
[1] == '/')
429 /* Strip leading '/' unless user has asked us not to. */
430 if (name
[0] == '/' && !bsdtar
->option_absolute_paths
) {
431 /* Generate a warning the first time this happens. */
432 if (!bsdtar
->warned_lead_slash
) {
433 bsdtar_warnc(bsdtar
, 0,
434 "Removing leading '/' from member names");
435 bsdtar
->warned_lead_slash
= 1;
438 /* Special case: Stripping leading '/' from "/" yields ".". */
443 /* Safely replace name in archive_entry. */
444 if (name
!= archive_entry_pathname(entry
)) {
445 char *q
= strdup(name
);
446 archive_entry_copy_pathname(entry
, q
);
/*
 * Like strcmp(), but try to be a little more aware of the fact that
 * we're comparing two paths.  Right now, it just handles leading
 * "./" and trailing '/' specially, so that "a/b/" == "./a/b".
 * Repeated leading "./" components and runs of trailing '/' are
 * handled too, so "././a//" == "a".
 *
 * Returns 0 when the paths are considered equal; otherwise the
 * difference of the first mismatching bytes (compared as unsigned
 * char), which has the same sign strcmp() would give.
 *
 * TODO: Make this better, so that "./a//b/./c/" == "a/b/c"
 * TODO: After this works, push it down into libarchive.
 * TODO: Publish the path normalization routines in libarchive so
 * that bsdtar can normalize paths and use fast strcmp() instead
 * of this.
 */
int
pathcmp(const char *a, const char *b)
{
	/*
	 * Skip leading "./" components.  The a[2] != '\0' test keeps a
	 * bare "./" intact instead of reducing it to the empty string.
	 */
	while (a[0] == '.' && a[1] == '/' && a[2] != '\0')
		a += 2;
	while (b[0] == '.' && b[1] == '/' && b[2] != '\0')
		b += 2;
	/* Find the first difference, or return (0) if none. */
	while (*a == *b) {
		if (*a == '\0')
			return (0);
		a++;
		b++;
	}
	/*
	 * If one path has ended and the other has nothing but '/'
	 * characters left, they're the same.  *a != *b here, so at
	 * most one of them is at its terminator.
	 */
	if (*a == '\0' || *b == '\0') {
		const char *rest = (*a == '\0') ? b : a;

		while (*rest == '/')
			rest++;
		if (*rest == '\0')
			return (0);
	}
	/* They're really different, return the correct sign. */
	return (*(const unsigned char *)a - *(const unsigned char *)b);
}