gzip: Use 0x%04x instead of %x when printing 16-bit checksums
[gzip.git] / gzip.c
blobd42bfa857e1dc70f45a6fcd3d106cc5e43c5c126
1 /* gzip (GNU zip) -- compress files with zip algorithm and 'compress' interface
3 Copyright (C) 1999, 2001-2002, 2006-2007, 2009-2010 Free Software
4 Foundation, Inc.
5 Copyright (C) 1992-1993 Jean-loup Gailly
7 This program is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 3, or (at your option)
10 any later version.
12 This program is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with this program; if not, write to the Free Software Foundation,
19 Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. */
22 * The unzip code was written and put in the public domain by Mark Adler.
23 * Portions of the lzw code are derived from the public domain 'compress'
24 * written by Spencer Thomas, Joe Orost, James Woods, Jim McKie, Steve Davies,
25 * Ken Turkowski, Dave Mack and Peter Jannesen.
27 * See the license_msg below and the file COPYING for the software license.
28 * See the file algorithm.doc for the compression algorithms and file formats.
/* Lines printed by license(), one per output line.  The table ends with
   a null pointer written as a plain 0: it is defined ahead of every
   #include in this file, so NULL is not yet available here.
   NOTE(review): the leading integers are line numbers from the web
   listing this copy was taken from, and runs of spaces inside the
   literals may have been collapsed -- compare with a pristine gzip.c
   before relying on the exact wording.  */
31 static char const *const license_msg[] = {
32 "Copyright (C) 2007, 2010 Free Software Foundation, Inc.",
33 "Copyright (C) 1993 Jean-loup Gailly.",
34 "This is free software. You may redistribute copies of it under the terms of",
35 "the GNU General Public License <http://www.gnu.org/licenses/gpl.html>.",
36 "There is NO WARRANTY, to the extent permitted by law.",
37 0};
39 /* Compress files with zip algorithm and 'compress' interface.
40 * See help() function below for all options.
41 * Outputs:
42 * file.gz: compressed file with same mode, owner, and utimes
43 * or stdout with -c option or if stdin used as input.
44 * If the output file name had to be truncated, the original name is kept
45 * in the compressed file.
46 * On MSDOS, file.tmp -> file.tmz. On VMS, file.tmp -> file.tmp-gz.
48 * Using gz on MSDOS would create too many file name conflicts. For
49 * example, foo.txt -> foo.tgz (.tgz must be reserved as shorthand for
50 * tar.gz). Similarly, foo.dir and foo.doc would both be mapped to foo.dgz.
51 * I also considered 12345678.txt -> 12345txt.gz but this truncates the name
52 * too heavily. There is no ideal solution given the MSDOS 8+3 limitation.
54 * For the meaning of all compilation flags, see comments in Makefile.in.
57 #include <config.h>
58 #include <ctype.h>
59 #include <sys/types.h>
60 #include <signal.h>
61 #include <stdbool.h>
62 #include <sys/stat.h>
63 #include <errno.h>
65 #include "closein.h"
66 #include "tailor.h"
67 #include "gzip.h"
68 #include "lzw.h"
69 #include "revision.h"
70 #include "timespec.h"
72 #include "fcntl-safer.h"
73 #include "getopt.h"
74 #include "ignore-value.h"
75 #include "stat-time.h"
76 #include "version.h"
78 /* configuration */
80 #include <fcntl.h>
81 #include <limits.h>
82 #include <unistd.h>
83 #include <stdlib.h>
84 #include <errno.h>
86 #ifndef NO_DIR
87 # define NO_DIR 0
88 #endif
89 #if !NO_DIR
90 # include <dirent.h>
91 # ifndef _D_EXACT_NAMLEN
92 # define _D_EXACT_NAMLEN(dp) strlen ((dp)->d_name)
93 # endif
94 #endif
96 #ifdef CLOSEDIR_VOID
97 # define CLOSEDIR(d) (closedir(d), 0)
98 #else
99 # define CLOSEDIR(d) closedir(d)
100 #endif
102 #ifndef NO_UTIME
103 # include <utimens.h>
104 #endif
106 #define RW_USER (S_IRUSR | S_IWUSR) /* creation mode for open() */
108 #ifndef MAX_PATH_LEN
109 # define MAX_PATH_LEN 1024 /* max pathname length */
110 #endif
112 #ifndef SEEK_END
113 # define SEEK_END 2
114 #endif
116 #ifndef CHAR_BIT
117 # define CHAR_BIT 8
118 #endif
120 #ifdef off_t
121 off_t lseek OF((int fd, off_t offset, int whence));
122 #endif
/* Extreme values of off_t, assuming a signed two's-complement type
   without padding bits.

   OFF_T_MAX is built from positive quantities only: 2**(N-2) - 1,
   doubled, plus one, which never overflows.  The previous definition
   computed the minimum as ~(off_t) 0 << (N - 1), i.e. it left-shifted
   a negative value, which is undefined behavior in ISO C.  */
#ifndef OFF_T_MAX
# define OFF_T_MAX \
   ((off_t) ((((off_t) 1 << (sizeof (off_t) * CHAR_BIT - 2)) - 1) * 2 + 1))
#endif

#ifndef OFF_T_MIN
# define OFF_T_MIN (-OFF_T_MAX - 1)
#endif
132 /* Use SA_NOCLDSTOP as a proxy for whether the sigaction machinery is
133 present. */
134 #ifndef SA_NOCLDSTOP
135 # define SA_NOCLDSTOP 0
136 # define sigprocmask(how, set, oset) /* empty */
137 # define sigset_t int
138 # if ! HAVE_SIGINTERRUPT
139 # define siginterrupt(sig, flag) /* empty */
140 # endif
141 #endif
143 #ifndef HAVE_WORKING_O_NOFOLLOW
144 # define HAVE_WORKING_O_NOFOLLOW 0
145 #endif
147 #ifndef ELOOP
148 # define ELOOP EINVAL
149 #endif
151 /* Separator for file name parts (see shorten_name()) */
152 #ifdef NO_MULTIPLE_DOTS
153 # define PART_SEP "-"
154 #else
155 # define PART_SEP "."
156 #endif
158 /* global buffers */
160 DECLARE(uch, inbuf, INBUFSIZ +INBUF_EXTRA);
161 DECLARE(uch, outbuf, OUTBUFSIZ+OUTBUF_EXTRA);
162 DECLARE(ush, d_buf, DIST_BUFSIZE);
163 DECLARE(uch, window, 2L*WSIZE);
164 #ifndef MAXSEG_64K
165 DECLARE(ush, tab_prefix, 1L<<BITS);
166 #else
167 DECLARE(ush, tab_prefix0, 1L<<(BITS-1));
168 DECLARE(ush, tab_prefix1, 1L<<(BITS-1));
169 #endif
171 /* local variables */
173 /* If true, pretend that standard input is a tty. This option
174 is deliberately not documented, and only for testing. */
175 static bool presume_input_tty;
177 int ascii = 0; /* convert end-of-lines to local OS conventions */
178 int to_stdout = 0; /* output to stdout (-c) */
179 int decompress = 0; /* decompress (-d) */
180 int force = 0; /* don't ask questions, compress links (-f) */
181 int no_name = -1; /* don't save or restore the original file name */
182 int no_time = -1; /* don't save or restore the original file time */
183 int recursive = 0; /* recurse through directories (-r) */
184 int list = 0; /* list the file contents (-l) */
185 int verbose = 0; /* be verbose (-v) */
186 int quiet = 0; /* be very quiet (-q) */
187 int do_lzw = 0; /* generate output compatible with old compress (-Z) */
188 int test = 0; /* test .gz file integrity */
189 int foreground = 0; /* set if program run in foreground */
190 char *program_name; /* program name */
191 int maxbits = BITS; /* max bits per code for LZW */
192 int method = DEFLATED;/* compression method */
193 int level = 6; /* compression level */
194 int exit_code = OK; /* program exit code */
195 int save_orig_name; /* set if original name must be saved */
196 int last_member; /* set for .zip and .Z files */
197 int part_nb; /* number of parts in .gz file */
198 struct timespec time_stamp; /* original time stamp (modification time) */
199 off_t ifile_size; /* input file size, -1 for devices (debug only) */
200 char *env; /* contents of GZIP env variable */
201 char **args = NULL; /* argv pointer if GZIP env variable defined */
202 char const *z_suffix; /* default suffix (can be set with --suffix) */
203 size_t z_len; /* strlen(z_suffix) */
205 /* The set of signals that are caught. */
206 static sigset_t caught_signals;
208 /* If nonzero then exit with status WARNING, rather than with the usual
209 signal status, on receipt of a signal with this value. This
210 suppresses a "Broken Pipe" message with some shells. */
211 static int volatile exiting_signal;
213 /* If nonnegative, close this file descriptor and unlink ofname on error. */
214 static int volatile remove_ofname_fd = -1;
216 off_t bytes_in; /* number of input bytes */
217 off_t bytes_out; /* number of output bytes */
218 off_t total_in; /* input bytes for all files */
219 off_t total_out; /* output bytes for all files */
220 char ifname[MAX_PATH_LEN]; /* input file name */
221 char ofname[MAX_PATH_LEN]; /* output file name */
222 struct stat istat; /* status for input file */
223 int ifd; /* input file descriptor */
224 int ofd; /* output file descriptor */
225 unsigned insize; /* valid bytes in inbuf */
226 unsigned inptr; /* index of next byte to be processed in inbuf */
227 unsigned outcnt; /* bytes in output buffer */
229 static int handled_sig[] =
231 /* SIGINT must be first, as 'foreground' depends on it. */
232 SIGINT
234 #ifdef SIGHUP
235 , SIGHUP
236 #endif
237 #ifdef SIGPIPE
238 , SIGPIPE
239 #else
240 # define SIGPIPE 0
241 #endif
242 #ifdef SIGTERM
243 , SIGTERM
244 #endif
245 #ifdef SIGXCPU
246 , SIGXCPU
247 #endif
248 #ifdef SIGXFSZ
249 , SIGXFSZ
250 #endif
253 /* For long options that have no equivalent short option, use a
254 non-character as a pseudo short option, starting with CHAR_MAX + 1. */
255 enum
257 PRESUME_INPUT_TTY_OPTION = CHAR_MAX + 1
260 struct option longopts[] =
262 /* { name has_arg *flag val } */
263 {"ascii", 0, 0, 'a'}, /* ascii text mode */
264 {"to-stdout", 0, 0, 'c'}, /* write output on standard output */
265 {"stdout", 0, 0, 'c'}, /* write output on standard output */
266 {"decompress", 0, 0, 'd'}, /* decompress */
267 {"uncompress", 0, 0, 'd'}, /* decompress */
268 /* {"encrypt", 0, 0, 'e'}, encrypt */
269 {"force", 0, 0, 'f'}, /* force overwrite of output file */
270 {"help", 0, 0, 'h'}, /* give help */
271 /* {"pkzip", 0, 0, 'k'}, force output in pkzip format */
272 {"list", 0, 0, 'l'}, /* list .gz file contents */
273 {"license", 0, 0, 'L'}, /* display software license */
274 {"no-name", 0, 0, 'n'}, /* don't save or restore original name & time */
275 {"name", 0, 0, 'N'}, /* save or restore original name & time */
276 {"-presume-input-tty", no_argument, NULL, PRESUME_INPUT_TTY_OPTION},
277 {"quiet", 0, 0, 'q'}, /* quiet mode */
278 {"silent", 0, 0, 'q'}, /* quiet mode */
279 {"recursive", 0, 0, 'r'}, /* recurse through directories */
280 {"suffix", 1, 0, 'S'}, /* use given suffix instead of .gz */
281 {"test", 0, 0, 't'}, /* test compressed file integrity */
282 {"no-time", 0, 0, 'T'}, /* don't save or restore the time stamp */
283 {"verbose", 0, 0, 'v'}, /* verbose mode */
284 {"version", 0, 0, 'V'}, /* display version number */
285 {"fast", 0, 0, '1'}, /* compress faster */
286 {"best", 0, 0, '9'}, /* compress better */
287 {"lzw", 0, 0, 'Z'}, /* make output compatible with old compress */
288 {"bits", 1, 0, 'b'}, /* max number of bits per code (implies -Z) */
290 { 0, 0, 0, 0 }
293 /* local functions */
295 local void try_help OF((void)) ATTRIBUTE_NORETURN;
296 local void help OF((void));
297 local void license OF((void));
298 local void version OF((void));
299 local int input_eof OF((void));
300 local void treat_stdin OF((void));
301 local void treat_file OF((char *iname));
302 local int create_outfile OF((void));
303 local char *get_suffix OF((char *name));
304 local int open_input_file OF((char *iname, struct stat *sbuf));
305 local void discard_input_bytes OF((size_t nbytes, unsigned int flags));
306 local int make_ofname OF((void));
307 local void shorten_name OF((char *name));
308 local int get_method OF((int in));
309 local void do_list OF((int ifd, int method));
310 local int check_ofname OF((void));
311 local void copy_stat OF((struct stat *ifstat));
312 local void install_signal_handlers OF((void));
313 local void remove_output_file OF((void));
314 local RETSIGTYPE abort_gzip_signal OF((int));
315 local void do_exit OF((int exitcode)) ATTRIBUTE_NORETURN;
316 int main OF((int argc, char **argv));
317 int (*work) OF((int infile, int outfile)) = zip; /* function to call */
319 #if ! NO_DIR
320 local void treat_dir OF((int fd, char *dir));
321 #endif
323 #define strequ(s1, s2) (strcmp((s1),(s2)) == 0)
325 static void
326 try_help ()
328 fprintf (stderr, "Try `%s --help' for more information.\n",
329 program_name);
330 do_exit (ERROR);
333 /* ======================================================================== */
/* Print the usage synopsis followed by every entry of help_msg, one
   entry per line, on standard output.
   NOTE(review): the integers at the start of each line are line numbers
   from the web listing this copy came from.  The numbering skips
   338, 340, 372 and 374-376, which suggests that punctuation-only lines
   (probably empty "" entries and the table's terminating 0 that the
   `while (*p)' loop below depends on) were dropped, and the column
   padding inside the literals appears collapsed.  Confirm against a
   pristine gzip.c.  */
334 local void help()
336 static char const* const help_msg[] = {
337 "Compress or uncompress FILEs (by default, compress FILES in-place).",
339 "Mandatory arguments to long options are mandatory for short options too.",
/* --ascii is only advertised when O_BINARY is nonzero.  */
341 #if O_BINARY
342 " -a, --ascii ascii text; convert end-of-line using local conventions",
343 #endif
344 " -c, --stdout write on standard output, keep original files unchanged",
345 " -d, --decompress decompress",
346 /* -e, --encrypt encrypt */
347 " -f, --force force overwrite of output file and compress links",
348 " -h, --help give this help",
349 /* -k, --pkzip force output in pkzip format */
350 " -l, --list list compressed file contents",
351 " -L, --license display software license",
/* -m and -M are listed only in builds that define UNDOCUMENTED.  */
352 #ifdef UNDOCUMENTED
353 " -m, --no-time do not save or restore the original modification time",
354 " -M, --time save or restore the original modification time",
355 #endif
356 " -n, --no-name do not save or restore the original name and time stamp",
357 " -N, --name save or restore the original name and time stamp",
358 " -q, --quiet suppress all warnings",
/* -r is listed only when NO_DIR is zero.  */
359 #if ! NO_DIR
360 " -r, --recursive operate recursively on directories",
361 #endif
362 " -S, --suffix=SUF use suffix SUF on compressed files",
363 " -t, --test test compressed file integrity",
364 " -v, --verbose verbose mode",
365 " -V, --version display version number",
366 " -1, --fast compress faster",
367 " -9, --best compress better",
/* -Z and -b are listed only in builds that define LZW.  */
368 #ifdef LZW
369 " -Z, --lzw produce output compatible with old compress",
370 " -b, --bits=BITS max number of bits per code (implies -Z)",
371 #endif
373 "With no FILE, or when FILE is -, read standard input.",
375 "Report bugs to <bug-gzip@gnu.org>.",
/* Walk the table until a null entry is reached.  */
377 char const *const *p = help_msg;
379 printf ("Usage: %s [OPTION]... [FILE]...\n", program_name);
380 while (*p) printf ("%s\n", *p++);
383 /* ======================================================================== */
384 local void license()
386 char const *const *p = license_msg;
388 printf ("%s %s\n", program_name, Version);
389 while (*p) printf ("%s\n", *p++);
392 /* ======================================================================== */
393 local void version()
395 license ();
396 printf ("\n");
397 printf ("Written by Jean-loup Gailly.\n");
400 local void progerror (char const *string)
402 int e = errno;
403 fprintf (stderr, "%s: ", program_name);
404 errno = e;
405 perror(string);
406 exit_code = ERROR;
409 /* ======================================================================== */
410 int main (int argc, char **argv)
412 int file_count; /* number of files to process */
413 size_t proglen; /* length of program_name */
414 int optc; /* current option */
416 EXPAND(argc, argv); /* wild card expansion if necessary */
418 program_name = gzip_base_name (argv[0]);
419 proglen = strlen (program_name);
421 atexit (close_stdin);
423 /* Suppress .exe for MSDOS, OS/2 and VMS: */
424 if (4 < proglen && strequ (program_name + proglen - 4, ".exe"))
425 program_name[proglen - 4] = '\0';
427 /* Add options in GZIP environment variable if there is one */
428 env = add_envopt(&argc, &argv, OPTIONS_VAR);
429 if (env != NULL) args = argv;
431 #ifndef GNU_STANDARD
432 # define GNU_STANDARD 1
433 #endif
434 #if !GNU_STANDARD
435 /* For compatibility with old compress, use program name as an option.
436 * Unless you compile with -DGNU_STANDARD=0, this program will behave as
437 * gzip even if it is invoked under the name gunzip or zcat.
439 * Systems which do not support links can still use -d or -dc.
440 * Ignore an .exe extension for MSDOS, OS/2 and VMS.
442 if (strncmp (program_name, "un", 2) == 0 /* ungzip, uncompress */
443 || strncmp (program_name, "gun", 3) == 0) /* gunzip */
444 decompress = 1;
445 else if (strequ (program_name + 1, "cat") /* zcat, pcat, gcat */
446 || strequ (program_name, "gzcat")) /* gzcat */
447 decompress = to_stdout = 1;
448 #endif
450 z_suffix = Z_SUFFIX;
451 z_len = strlen(z_suffix);
453 while ((optc = getopt_long (argc, argv, "ab:cdfhH?lLmMnNqrS:tvVZ123456789",
454 longopts, (int *)0)) != -1) {
455 switch (optc) {
456 case 'a':
457 ascii = 1; break;
458 case 'b':
459 maxbits = atoi(optarg);
460 for (; *optarg; optarg++)
461 if (! ('0' <= *optarg && *optarg <= '9'))
463 fprintf (stderr, "%s: -b operand is not an integer\n",
464 program_name);
465 try_help ();
467 break;
468 case 'c':
469 to_stdout = 1; break;
470 case 'd':
471 decompress = 1; break;
472 case 'f':
473 force++; break;
474 case 'h': case 'H':
475 help(); do_exit(OK); break;
476 case 'l':
477 list = decompress = to_stdout = 1; break;
478 case 'L':
479 license(); do_exit(OK); break;
480 case 'm': /* undocumented, may change later */
481 no_time = 1; break;
482 case 'M': /* undocumented, may change later */
483 no_time = 0; break;
484 case 'n':
485 no_name = no_time = 1; break;
486 case 'N':
487 no_name = no_time = 0; break;
488 case PRESUME_INPUT_TTY_OPTION:
489 presume_input_tty = true; break;
490 case 'q':
491 quiet = 1; verbose = 0; break;
492 case 'r':
493 #if NO_DIR
494 fprintf (stderr, "%s: -r not supported on this system\n",
495 program_name);
496 try_help ();
497 #else
498 recursive = 1;
499 #endif
500 break;
501 case 'S':
502 #ifdef NO_MULTIPLE_DOTS
503 if (*optarg == '.') optarg++;
504 #endif
505 z_len = strlen(optarg);
506 z_suffix = optarg;
507 break;
508 case 't':
509 test = decompress = to_stdout = 1;
510 break;
511 case 'v':
512 verbose++; quiet = 0; break;
513 case 'V':
514 version(); do_exit(OK); break;
515 case 'Z':
516 #ifdef LZW
517 do_lzw = 1; break;
518 #else
519 fprintf(stderr, "%s: -Z not supported in this version\n",
520 program_name);
521 try_help ();
522 break;
523 #endif
524 case '1': case '2': case '3': case '4':
525 case '5': case '6': case '7': case '8': case '9':
526 level = optc - '0';
527 break;
528 default:
529 /* Error message already emitted by getopt_long. */
530 try_help ();
532 } /* loop on all arguments */
534 /* By default, save name and timestamp on compression but do not
535 * restore them on decompression.
537 if (no_time < 0) no_time = decompress;
538 if (no_name < 0) no_name = decompress;
540 file_count = argc - optind;
542 #if O_BINARY
543 #else
544 if (ascii && !quiet) {
545 fprintf(stderr, "%s: option --ascii ignored on this system\n",
546 program_name);
548 #endif
549 if (z_len == 0 || z_len > MAX_SUFFIX) {
550 fprintf(stderr, "%s: invalid suffix '%s'\n", program_name, z_suffix);
551 do_exit(ERROR);
554 if (do_lzw && !decompress) work = lzw;
556 /* Allocate all global buffers (for DYN_ALLOC option) */
557 ALLOC(uch, inbuf, INBUFSIZ +INBUF_EXTRA);
558 ALLOC(uch, outbuf, OUTBUFSIZ+OUTBUF_EXTRA);
559 ALLOC(ush, d_buf, DIST_BUFSIZE);
560 ALLOC(uch, window, 2L*WSIZE);
561 #ifndef MAXSEG_64K
562 ALLOC(ush, tab_prefix, 1L<<BITS);
563 #else
564 ALLOC(ush, tab_prefix0, 1L<<(BITS-1));
565 ALLOC(ush, tab_prefix1, 1L<<(BITS-1));
566 #endif
568 exiting_signal = quiet ? SIGPIPE : 0;
569 install_signal_handlers ();
571 /* And get to work */
572 if (file_count != 0) {
573 if (to_stdout && !test && !list && (!decompress || !ascii)) {
574 SET_BINARY_MODE(fileno(stdout));
576 while (optind < argc) {
577 treat_file(argv[optind++]);
579 } else { /* Standard input */
580 treat_stdin();
582 if (list && !quiet && file_count > 1) {
583 do_list(-1, -1); /* print totals */
585 do_exit(exit_code);
586 return exit_code; /* just to avoid lint warning */
589 /* Return nonzero when at end of file on input. */
590 local int
591 input_eof ()
593 if (!decompress || last_member)
594 return 1;
596 if (inptr == insize)
598 if (insize != INBUFSIZ || fill_inbuf (1) == EOF)
599 return 1;
601 /* Unget the char that fill_inbuf got. */
602 inptr = 0;
605 return 0;
608 /* ========================================================================
609 * Compress or decompress stdin
611 local void treat_stdin()
613 if (!force && !list
614 && (presume_input_tty
615 || isatty(fileno((FILE *)(decompress ? stdin : stdout))))) {
616 /* Do not send compressed data to the terminal or read it from
617 * the terminal. We get here when user invoked the program
618 * without parameters, so be helpful. According to the GNU standards:
620 * If there is one behavior you think is most useful when the output
621 * is to a terminal, and another that you think is most useful when
622 * the output is a file or a pipe, then it is usually best to make
623 * the default behavior the one that is useful with output to a
624 * terminal, and have an option for the other behavior.
626 * Here we use the --force option to get the other behavior.
628 fprintf(stderr,
629 "%s: compressed data not %s a terminal. Use -f to force %scompression.\n",
630 program_name, decompress ? "read from" : "written to",
631 decompress ? "de" : "");
632 fprintf (stderr, "For help, type: %s -h\n", program_name);
633 do_exit(ERROR);
636 if (decompress || !ascii) {
637 SET_BINARY_MODE(fileno(stdin));
639 if (!test && !list && (!decompress || !ascii)) {
640 SET_BINARY_MODE(fileno(stdout));
642 strcpy(ifname, "stdin");
643 strcpy(ofname, "stdout");
645 /* Get the file's time stamp and size. */
646 if (fstat (fileno (stdin), &istat) != 0)
648 progerror ("standard input");
649 do_exit (ERROR);
651 ifile_size = S_ISREG (istat.st_mode) ? istat.st_size : -1;
652 time_stamp.tv_nsec = -1;
653 if (!no_time || list)
655 if (S_ISREG (istat.st_mode))
656 time_stamp = get_stat_mtime (&istat);
657 else
658 gettime (&time_stamp);
661 clear_bufs(); /* clear input and output buffers */
662 to_stdout = 1;
663 part_nb = 0;
664 ifd = fileno(stdin);
666 if (decompress) {
667 method = get_method(ifd);
668 if (method < 0) {
669 do_exit(exit_code); /* error message already emitted */
672 if (list) {
673 do_list(ifd, method);
674 return;
677 /* Actually do the compression/decompression. Loop over zipped members.
679 for (;;) {
680 if ((*work)(fileno(stdin), fileno(stdout)) != OK) return;
682 if (input_eof ())
683 break;
685 method = get_method(ifd);
686 if (method < 0) return; /* error message already emitted */
687 bytes_out = 0; /* required for length check */
690 if (verbose) {
691 if (test) {
692 fprintf(stderr, " OK\n");
694 } else if (!decompress) {
695 display_ratio(bytes_in-(bytes_out-header_bytes), bytes_in, stderr);
696 fprintf(stderr, "\n");
697 #ifdef DISPLAY_STDIN_RATIO
698 } else {
699 display_ratio(bytes_out-(bytes_in-header_bytes), bytes_out,stderr);
700 fprintf(stderr, "\n");
701 #endif
706 /* ========================================================================
707 * Compress or decompress the given file
709 local void treat_file(iname)
710 char *iname;
712 /* Accept "-" as synonym for stdin */
713 if (strequ(iname, "-")) {
714 int cflag = to_stdout;
715 treat_stdin();
716 to_stdout = cflag;
717 return;
720 /* Check if the input file is present, set ifname and istat: */
721 ifd = open_input_file (iname, &istat);
722 if (ifd < 0)
723 return;
725 /* If the input name is that of a directory, recurse or ignore: */
726 if (S_ISDIR(istat.st_mode)) {
727 #if ! NO_DIR
728 if (recursive) {
729 treat_dir (ifd, iname);
730 /* Warning: ifname is now garbage */
731 return;
733 #endif
734 close (ifd);
735 WARN ((stderr, "%s: %s is a directory -- ignored\n",
736 program_name, ifname));
737 return;
740 if (! to_stdout)
742 if (! S_ISREG (istat.st_mode))
744 WARN ((stderr,
745 "%s: %s is not a directory or a regular file - ignored\n",
746 program_name, ifname));
747 close (ifd);
748 return;
750 if (istat.st_mode & S_ISUID)
752 WARN ((stderr, "%s: %s is set-user-ID on execution - ignored\n",
753 program_name, ifname));
754 close (ifd);
755 return;
757 if (istat.st_mode & S_ISGID)
759 WARN ((stderr, "%s: %s is set-group-ID on execution - ignored\n",
760 program_name, ifname));
761 close (ifd);
762 return;
765 if (! force)
767 if (istat.st_mode & S_ISVTX)
769 WARN ((stderr,
770 "%s: %s has the sticky bit set - file ignored\n",
771 program_name, ifname));
772 close (ifd);
773 return;
775 if (2 <= istat.st_nlink)
777 WARN ((stderr, "%s: %s has %lu other link%c -- unchanged\n",
778 program_name, ifname,
779 (unsigned long int) istat.st_nlink - 1,
780 istat.st_nlink == 2 ? ' ' : 's'));
781 close (ifd);
782 return;
787 ifile_size = S_ISREG (istat.st_mode) ? istat.st_size : -1;
788 time_stamp.tv_nsec = -1;
789 if (!no_time || list)
790 time_stamp = get_stat_mtime (&istat);
792 /* Generate output file name. For -r and (-t or -l), skip files
793 * without a valid gzip suffix (check done in make_ofname).
795 if (to_stdout && !list && !test) {
796 strcpy(ofname, "stdout");
798 } else if (make_ofname() != OK) {
799 close (ifd);
800 return;
803 clear_bufs(); /* clear input and output buffers */
804 part_nb = 0;
806 if (decompress) {
807 method = get_method(ifd); /* updates ofname if original given */
808 if (method < 0) {
809 close(ifd);
810 return; /* error message already emitted */
813 if (list) {
814 do_list(ifd, method);
815 if (close (ifd) != 0)
816 read_error ();
817 return;
820 /* If compressing to a file, check if ofname is not ambiguous
821 * because the operating system truncates names. Otherwise, generate
822 * a new ofname and save the original name in the compressed file.
824 if (to_stdout) {
825 ofd = fileno(stdout);
826 /* Keep remove_ofname_fd negative. */
827 } else {
828 if (create_outfile() != OK) return;
830 if (!decompress && save_orig_name && !verbose && !quiet) {
831 fprintf(stderr, "%s: %s compressed to %s\n",
832 program_name, ifname, ofname);
835 /* Keep the name even if not truncated except with --no-name: */
836 if (!save_orig_name) save_orig_name = !no_name;
838 if (verbose) {
839 fprintf(stderr, "%s:\t", ifname);
842 /* Actually do the compression/decompression. Loop over zipped members.
844 for (;;) {
845 if ((*work)(ifd, ofd) != OK) {
846 method = -1; /* force cleanup */
847 break;
850 if (input_eof ())
851 break;
853 method = get_method(ifd);
854 if (method < 0) break; /* error message already emitted */
855 bytes_out = 0; /* required for length check */
858 if (close (ifd) != 0)
859 read_error ();
861 if (!to_stdout)
863 sigset_t oldset;
864 int unlink_errno;
866 copy_stat (&istat);
867 if (close (ofd) != 0)
868 write_error ();
870 sigprocmask (SIG_BLOCK, &caught_signals, &oldset);
871 remove_ofname_fd = -1;
872 unlink_errno = xunlink (ifname) == 0 ? 0 : errno;
873 sigprocmask (SIG_SETMASK, &oldset, NULL);
875 if (unlink_errno)
877 WARN ((stderr, "%s: ", program_name));
878 if (!quiet)
880 errno = unlink_errno;
881 perror (ifname);
886 if (method == -1) {
887 if (!to_stdout)
888 remove_output_file ();
889 return;
892 /* Display statistics */
893 if(verbose) {
894 if (test) {
895 fprintf(stderr, " OK");
896 } else if (decompress) {
897 display_ratio(bytes_out-(bytes_in-header_bytes), bytes_out,stderr);
898 } else {
899 display_ratio(bytes_in-(bytes_out-header_bytes), bytes_in, stderr);
901 if (!test && !to_stdout) {
902 fprintf(stderr, " -- replaced with %s", ofname);
904 fprintf(stderr, "\n");
908 /* ========================================================================
909 * Create the output file. Return OK or ERROR.
910 * Try several times if necessary to avoid truncating the z_suffix. For
911 * example, do not create a compressed file of name "1234567890123."
912 * Sets save_orig_name to true if the file name has been truncated.
913 * IN assertions: the input file has already been open (ifd is set) and
914 * ofname has already been updated if there was an original name.
915 * OUT assertions: ifd and ofd are closed in case of error.
917 local int create_outfile()
919 int name_shortened = 0;
920 int flags = (O_WRONLY | O_CREAT | O_EXCL
921 | (ascii && decompress ? 0 : O_BINARY));
923 for (;;)
925 int open_errno;
926 sigset_t oldset;
928 sigprocmask (SIG_BLOCK, &caught_signals, &oldset);
929 remove_ofname_fd = ofd = OPEN (ofname, flags, RW_USER);
930 open_errno = errno;
931 sigprocmask (SIG_SETMASK, &oldset, NULL);
933 if (0 <= ofd)
934 break;
936 switch (open_errno)
938 #ifdef ENAMETOOLONG
939 case ENAMETOOLONG:
940 shorten_name (ofname);
941 name_shortened = 1;
942 break;
943 #endif
945 case EEXIST:
946 if (check_ofname () != OK)
948 close (ifd);
949 return ERROR;
951 break;
953 default:
954 progerror (ofname);
955 close (ifd);
956 return ERROR;
960 if (name_shortened && decompress)
962 /* name might be too long if an original name was saved */
963 WARN ((stderr, "%s: %s: warning, name truncated\n",
964 program_name, ofname));
967 return OK;
970 /* ========================================================================
971 * Return a pointer to the 'z' suffix of a file name, or NULL. For all
972 * systems, ".gz", ".z", ".Z", ".taz", ".tgz", "-gz", "-z" and "_z" are
973 * accepted suffixes, in addition to the value of the --suffix option.
974 * ".tgz" is a useful convention for tar.z files on systems limited
975 * to 3 characters extensions. On such systems, ".?z" and ".??z" are
976 * also accepted suffixes. For Unix, we do not want to accept any
977 * .??z suffix as indicating a compressed file; some people use .xyz
978 * to denote volume data.
979 * On systems allowing multiple versions of the same file (such as VMS),
980 * this function removes any version suffix in the given name.
982 local char *get_suffix(name)
983 char *name;
985 int nlen, slen;
986 char suffix[MAX_SUFFIX+3]; /* last chars of name, forced to lower case */
987 static char const *known_suffixes[] =
988 {NULL, ".gz", ".z", ".taz", ".tgz", "-gz", "-z", "_z",
989 #ifdef MAX_EXT_CHARS
990 "z",
991 #endif
992 NULL};
993 char const **suf = known_suffixes;
995 *suf = z_suffix;
996 if (strequ(z_suffix, "z")) suf++; /* check long suffixes first */
998 #ifdef SUFFIX_SEP
999 /* strip a version number from the file name */
1001 char *v = strrchr(name, SUFFIX_SEP);
1002 if (v != NULL) *v = '\0';
1004 #endif
1005 nlen = strlen(name);
1006 if (nlen <= MAX_SUFFIX+2) {
1007 strcpy(suffix, name);
1008 } else {
1009 strcpy(suffix, name+nlen-MAX_SUFFIX-2);
1011 strlwr(suffix);
1012 slen = strlen(suffix);
1013 do {
1014 int s = strlen(*suf);
1015 if (slen > s && suffix[slen-s-1] != PATH_SEP
1016 && strequ(suffix + slen - s, *suf)) {
1017 return name+nlen-s;
1019 } while (*++suf != NULL);
1021 return NULL;
1025 /* Open file NAME with the given flags and mode and store its status
1026 into *ST. Return a file descriptor to the newly opened file, or -1
1027 (setting errno) on failure. */
1028 static int
1029 open_and_stat (char *name, int flags, mode_t mode, struct stat *st)
1031 int fd;
1033 /* Refuse to follow symbolic links unless -c or -f. */
1034 if (!to_stdout && !force)
1036 if (HAVE_WORKING_O_NOFOLLOW)
1037 flags |= O_NOFOLLOW;
1038 else
1040 #if HAVE_LSTAT || defined lstat
1041 if (lstat (name, st) != 0)
1042 return -1;
1043 else if (S_ISLNK (st->st_mode))
1045 errno = ELOOP;
1046 return -1;
1048 #endif
1052 fd = OPEN (name, flags, mode);
1053 if (0 <= fd && fstat (fd, st) != 0)
1055 int e = errno;
1056 close (fd);
1057 errno = e;
1058 return -1;
1060 return fd;
1064 /* ========================================================================
1065 * Set ifname to the input file name (with a suffix appended if necessary)
1066 * and istat to its stats. For decompression, if no file exists with the
1067 * original name, try adding successively z_suffix, .gz, .z, -z and .Z.
1068 * For MSDOS, we try only z_suffix and z.
1069 * Return an open file descriptor or -1.
1071 static int
1072 open_input_file (iname, sbuf)
1073 char *iname;
1074 struct stat *sbuf;
1076 int ilen; /* strlen(ifname) */
1077 int z_suffix_errno = 0;
1078 static char const *suffixes[] = {NULL, ".gz", ".z", "-z", ".Z", NULL};
1079 char const **suf = suffixes;
1080 char const *s;
1081 #ifdef NO_MULTIPLE_DOTS
1082 char *dot; /* pointer to ifname extension, or NULL */
1083 #endif
1084 int fd;
1085 int open_flags = (O_RDONLY | O_NONBLOCK | O_NOCTTY
1086 | (ascii && !decompress ? 0 : O_BINARY));
1088 *suf = z_suffix;
1090 if (sizeof ifname - 1 <= strlen (iname))
1091 goto name_too_long;
1093 strcpy(ifname, iname);
1095 /* If input file exists, return OK. */
1096 fd = open_and_stat (ifname, open_flags, RW_USER, sbuf);
1097 if (0 <= fd)
1098 return fd;
1100 if (!decompress || errno != ENOENT) {
1101 progerror(ifname);
1102 return -1;
1104 /* file.ext doesn't exist, try adding a suffix (after removing any
1105 * version number for VMS).
1107 s = get_suffix(ifname);
1108 if (s != NULL) {
1109 progerror(ifname); /* ifname already has z suffix and does not exist */
1110 return -1;
1112 #ifdef NO_MULTIPLE_DOTS
1113 dot = strrchr(ifname, '.');
1114 if (dot == NULL) {
1115 strcat(ifname, ".");
1116 dot = strrchr(ifname, '.');
1118 #endif
1119 ilen = strlen(ifname);
1120 if (strequ(z_suffix, ".gz")) suf++;
1122 /* Search for all suffixes */
1123 do {
1124 char const *s0 = s = *suf;
1125 strcpy (ifname, iname);
1126 #ifdef NO_MULTIPLE_DOTS
1127 if (*s == '.') s++;
1128 if (*dot == '\0') strcpy (dot, ".");
1129 #endif
1130 #ifdef MAX_EXT_CHARS
1131 if (MAX_EXT_CHARS < strlen (s) + strlen (dot + 1))
1132 dot[MAX_EXT_CHARS + 1 - strlen (s)] = '\0';
1133 #endif
1134 if (sizeof ifname <= ilen + strlen (s))
1135 goto name_too_long;
1136 strcat(ifname, s);
1137 fd = open_and_stat (ifname, open_flags, RW_USER, sbuf);
1138 if (0 <= fd)
1139 return fd;
1140 if (errno != ENOENT)
1142 progerror (ifname);
1143 return -1;
1145 if (strequ (s0, z_suffix))
1146 z_suffix_errno = errno;
1147 } while (*++suf != NULL);
1149 /* No suffix found, complain using z_suffix: */
1150 strcpy(ifname, iname);
1151 #ifdef NO_MULTIPLE_DOTS
1152 if (*dot == '\0') strcpy(dot, ".");
1153 #endif
1154 #ifdef MAX_EXT_CHARS
1155 if (MAX_EXT_CHARS < z_len + strlen (dot + 1))
1156 dot[MAX_EXT_CHARS + 1 - z_len] = '\0';
1157 #endif
1158 strcat(ifname, z_suffix);
1159 errno = z_suffix_errno;
1160 progerror(ifname);
1161 return -1;
1163 name_too_long:
1164 fprintf (stderr, "%s: %s: file name too long\n", program_name, iname);
1165 exit_code = ERROR;
1166 return -1;
1169 /* ========================================================================
1170 * Generate ofname given ifname. Return OK, or WARNING if file must be skipped.
1171 * Sets save_orig_name to true if the file name has been truncated.
1173 local int make_ofname()
1175 char *suff; /* ofname z suffix */
1177 strcpy(ofname, ifname);
1178 /* strip a version number if any and get the gzip suffix if present: */
1179 suff = get_suffix(ofname);
1181 if (decompress) {
1182 if (suff == NULL) {
1183 /* With -t or -l, try all files (even without .gz suffix)
1184 * except with -r (behave as with just -dr).
1186 if (!recursive && (list || test)) return OK;
1188 /* Avoid annoying messages with -r */
1189 if (verbose || (!recursive && !quiet)) {
1190 WARN((stderr,"%s: %s: unknown suffix -- ignored\n",
1191 program_name, ifname));
1193 return WARNING;
1195 /* Make a special case for .tgz and .taz: */
1196 strlwr(suff);
1197 if (strequ(suff, ".tgz") || strequ(suff, ".taz")) {
1198 strcpy(suff, ".tar");
1199 } else {
1200 *suff = '\0'; /* strip the z suffix */
1202 /* ofname might be changed later if infile contains an original name */
1204 } else if (suff && ! force) {
1205 /* Avoid annoying messages with -r (see treat_dir()) */
1206 if (verbose || (!recursive && !quiet)) {
1207 /* Don't use WARN, as it affects exit status. */
1208 fprintf (stderr, "%s: %s already has %s suffix -- unchanged\n",
1209 program_name, ifname, suff);
1211 return WARNING;
1212 } else {
1213 save_orig_name = 0;
1215 #ifdef NO_MULTIPLE_DOTS
1216 suff = strrchr(ofname, '.');
1217 if (suff == NULL) {
1218 if (sizeof ofname <= strlen (ofname) + 1)
1219 goto name_too_long;
1220 strcat(ofname, ".");
1221 # ifdef MAX_EXT_CHARS
1222 if (strequ(z_suffix, "z")) {
1223 if (sizeof ofname <= strlen (ofname) + 2)
1224 goto name_too_long;
1225 strcat(ofname, "gz"); /* enough room */
1226 return OK;
1228 /* On the Atari and some versions of MSDOS,
1229 * ENAMETOOLONG does not work correctly. So we
1230 * must truncate here.
1232 } else if (strlen(suff)-1 + z_len > MAX_SUFFIX) {
1233 suff[MAX_SUFFIX+1-z_len] = '\0';
1234 save_orig_name = 1;
1235 # endif
1237 #endif /* NO_MULTIPLE_DOTS */
1238 if (sizeof ofname <= strlen (ofname) + z_len)
1239 goto name_too_long;
1240 strcat(ofname, z_suffix);
1242 } /* decompress ? */
1243 return OK;
1245 name_too_long:
1246 WARN ((stderr, "%s: %s: file name too long\n", program_name, ifname));
1247 return WARNING;
1250 /* Discard NBYTES input bytes from the input, or up through the next
1251 zero byte if NBYTES == (size_t) -1. If FLAGS say that the header
1252 CRC should be computed, update the CRC accordingly. */
1253 static void
1254 discard_input_bytes (nbytes, flags)
1255 size_t nbytes;
1256 unsigned int flags;
1258 while (nbytes != 0)
1260 uch c = get_byte ();
1261 if (flags & HEADER_CRC)
1262 updcrc (&c, 1);
1263 if (nbytes != (size_t) -1)
1264 nbytes--;
1265 else if (! c)
1266 break;
1270 /* ========================================================================
1271 * Check the magic number of the input file and update ofname if an
1272 * original name was given and to_stdout is not set.
1273 * Return the compression method, -1 for error, -2 for warning.
1274 * Set inptr to the offset of the next byte to be processed.
1275 * Updates time_stamp if there is one and --no-time is not used.
1276 * This function may be called repeatedly for an input file consisting
1277 * of several contiguous gzip'ed members.
1278 * IN assertions: there is at least one remaining compressed member.
1279 * If the member is a zip file, it must be the only one.
1281 local int get_method(in)
1282 int in; /* input file descriptor */
1284 uch flags; /* compression flags */
1285 uch magic[10]; /* magic header */
1286 int imagic0; /* first magic byte or EOF */
1287 int imagic1; /* like magic[1], but can represent EOF */
1288 ulg stamp; /* time stamp */
1290 /* If --force and --stdout, zcat == cat, so do not complain about
1291 * premature end of file: use try_byte instead of get_byte.
1293 if (force && to_stdout) {
1294 imagic0 = try_byte();
1295 magic[0] = imagic0;
1296 imagic1 = try_byte ();
1297 magic[1] = imagic1;
1298 /* If try_byte returned EOF, magic[1] == (char) EOF. */
1299 } else {
1300 magic[0] = get_byte ();
1301 imagic0 = 0;
1302 if (magic[0]) {
1303 magic[1] = get_byte ();
1304 imagic1 = 0; /* avoid lint warning */
1305 } else {
1306 imagic1 = try_byte ();
1307 magic[1] = imagic1;
1310 method = -1; /* unknown yet */
1311 part_nb++; /* number of parts in gzip file */
1312 header_bytes = 0;
1313 last_member = RECORD_IO;
1314 /* assume multiple members in gzip file except for record oriented I/O */
1316 if (memcmp(magic, GZIP_MAGIC, 2) == 0
1317 || memcmp(magic, OLD_GZIP_MAGIC, 2) == 0) {
1319 method = (int)get_byte();
1320 if (method != DEFLATED) {
1321 fprintf(stderr,
1322 "%s: %s: unknown method %d -- not supported\n",
1323 program_name, ifname, method);
1324 exit_code = ERROR;
1325 return -1;
1327 work = unzip;
1328 flags = (uch)get_byte();
1330 if ((flags & ENCRYPTED) != 0) {
1331 fprintf(stderr,
1332 "%s: %s is encrypted -- not supported\n",
1333 program_name, ifname);
1334 exit_code = ERROR;
1335 return -1;
1337 if ((flags & RESERVED) != 0) {
1338 fprintf(stderr,
1339 "%s: %s has flags 0x%x -- not supported\n",
1340 program_name, ifname, flags);
1341 exit_code = ERROR;
1342 if (force <= 1) return -1;
1344 stamp = (ulg)get_byte();
1345 stamp |= ((ulg)get_byte()) << 8;
1346 stamp |= ((ulg)get_byte()) << 16;
1347 stamp |= ((ulg)get_byte()) << 24;
1348 if (stamp != 0 && !no_time)
1350 time_stamp.tv_sec = stamp;
1351 time_stamp.tv_nsec = 0;
1354 magic[8] = get_byte (); /* Ignore extra flags. */
1355 magic[9] = get_byte (); /* Ignore OS type. */
1357 if (flags & HEADER_CRC)
1359 magic[2] = DEFLATED;
1360 magic[3] = flags;
1361 magic[4] = stamp & 0xff;
1362 magic[5] = (stamp >> 8) & 0xff;
1363 magic[6] = (stamp >> 16) & 0xff;
1364 magic[7] = stamp >> 24;
1365 updcrc (NULL, 0);
1366 updcrc (magic, 10);
1369 if ((flags & EXTRA_FIELD) != 0) {
1370 uch lenbuf[2];
1371 unsigned int len = lenbuf[0] = get_byte ();
1372 len |= (lenbuf[1] = get_byte ()) << 8;
1373 if (verbose) {
1374 fprintf(stderr,"%s: %s: extra field of %u bytes ignored\n",
1375 program_name, ifname, len);
1377 if (flags & HEADER_CRC)
1378 updcrc (lenbuf, 2);
1379 discard_input_bytes (len, flags);
1382 /* Get original file name if it was truncated */
1383 if ((flags & ORIG_NAME) != 0) {
1384 if (no_name || (to_stdout && !list) || part_nb > 1) {
1385 /* Discard the old name */
1386 discard_input_bytes (-1, flags);
1387 } else {
1388 /* Copy the base name. Keep a directory prefix intact. */
1389 char *p = gzip_base_name (ofname);
1390 char *base = p;
1391 for (;;) {
1392 *p = (char) get_byte ();
1393 if (*p++ == '\0') break;
1394 if (p >= ofname+sizeof(ofname)) {
1395 gzip_error ("corrupted input -- file name too large");
1398 if (flags & HEADER_CRC)
1399 updcrc ((uch *) base, p - base);
1400 p = gzip_base_name (base);
1401 memmove (base, p, strlen (p) + 1);
1402 /* If necessary, adapt the name to local OS conventions: */
1403 if (!list) {
1404 MAKE_LEGAL_NAME(base);
1405 if (base) list=0; /* avoid warning about unused variable */
1407 } /* no_name || to_stdout */
1408 } /* ORIG_NAME */
1410 /* Discard file comment if any */
1411 if ((flags & COMMENT) != 0) {
1412 discard_input_bytes (-1, flags);
1415 if (flags & HEADER_CRC)
1417 unsigned int crc16 = updcrc (magic, 0) & 0xffff;
1418 unsigned int header16 = get_byte ();
1419 header16 |= ((unsigned int) get_byte ()) << 8;
1420 if (header16 != crc16)
1422 fprintf (stderr,
1423 "%s: %s: header checksum 0x%04x != computed checksum 0x%04x\n",
1424 program_name, ifname, header16, crc16);
1425 exit_code = ERROR;
1426 if (force <= 1)
1427 return -1;
1431 if (part_nb == 1) {
1432 header_bytes = inptr + 2*4; /* include crc and size */
1435 } else if (memcmp(magic, PKZIP_MAGIC, 2) == 0 && inptr == 2
1436 && memcmp((char*)inbuf, PKZIP_MAGIC, 4) == 0) {
1437 /* To simplify the code, we support a zip file when alone only.
1438 * We are thus guaranteed that the entire local header fits in inbuf.
1440 inptr = 0;
1441 work = unzip;
1442 if (check_zipfile(in) != OK) return -1;
1443 /* check_zipfile may get ofname from the local header */
1444 last_member = 1;
1446 } else if (memcmp(magic, PACK_MAGIC, 2) == 0) {
1447 work = unpack;
1448 method = PACKED;
1450 } else if (memcmp(magic, LZW_MAGIC, 2) == 0) {
1451 work = unlzw;
1452 method = COMPRESSED;
1453 last_member = 1;
1455 } else if (memcmp(magic, LZH_MAGIC, 2) == 0) {
1456 work = unlzh;
1457 method = LZHED;
1458 last_member = 1;
1460 } else if (force && to_stdout && !list) { /* pass input unchanged */
1461 method = STORED;
1462 work = copy;
1463 if (imagic1 != EOF)
1464 inptr--;
1465 last_member = 1;
1466 if (imagic0 != EOF) {
1467 write_buf(fileno(stdout), magic, 1);
1468 bytes_out++;
1471 if (method >= 0) return method;
1473 if (part_nb == 1) {
1474 fprintf (stderr, "\n%s: %s: not in gzip format\n",
1475 program_name, ifname);
1476 exit_code = ERROR;
1477 return -1;
1478 } else {
1479 if (magic[0] == 0)
1481 int inbyte;
1482 for (inbyte = imagic1; inbyte == 0; inbyte = try_byte ())
1483 continue;
1484 if (inbyte == EOF)
1486 if (verbose)
1487 WARN ((stderr, "\n%s: %s: decompression OK, trailing zero bytes ignored\n",
1488 program_name, ifname));
1489 return -3;
1493 WARN((stderr, "\n%s: %s: decompression OK, trailing garbage ignored\n",
1494 program_name, ifname));
1495 return -2;
1499 /* ========================================================================
1500 * Display the characteristics of the compressed file.
1501 * If the given method is < 0, display the accumulated totals.
1502 * IN assertions: time_stamp, header_bytes and ifile_size are initialized.
1504 local void do_list(ifd, method)
1505 int ifd; /* input file descriptor */
1506 int method; /* compression method */
1508 ulg crc; /* original crc */
1509 static int first_time = 1;
1510 static char const *const methods[MAX_METHODS] = {
1511 "store", /* 0 */
1512 "compr", /* 1 */
1513 "pack ", /* 2 */
1514 "lzh ", /* 3 */
1515 "", "", "", "", /* 4 to 7 reserved */
1516 "defla"}; /* 8 */
1517 int positive_off_t_width = 1;
1518 off_t o;
1520 for (o = OFF_T_MAX; 9 < o; o /= 10) {
1521 positive_off_t_width++;
1524 if (first_time && method >= 0) {
1525 first_time = 0;
1526 if (verbose) {
1527 printf("method crc date time ");
1529 if (!quiet) {
1530 printf("%*.*s %*.*s ratio uncompressed_name\n",
1531 positive_off_t_width, positive_off_t_width, "compressed",
1532 positive_off_t_width, positive_off_t_width, "uncompressed");
1534 } else if (method < 0) {
1535 if (total_in <= 0 || total_out <= 0) return;
1536 if (verbose) {
1537 printf(" ");
1539 if (verbose || !quiet) {
1540 fprint_off(stdout, total_in, positive_off_t_width);
1541 printf(" ");
1542 fprint_off(stdout, total_out, positive_off_t_width);
1543 printf(" ");
1545 display_ratio(total_out-(total_in-header_bytes), total_out, stdout);
1546 /* header_bytes is not meaningful but used to ensure the same
1547 * ratio if there is a single file.
1549 printf(" (totals)\n");
1550 return;
1552 crc = (ulg)~0; /* unknown */
1553 bytes_out = -1L;
1554 bytes_in = ifile_size;
1556 #if RECORD_IO == 0
1557 if (method == DEFLATED && !last_member) {
1558 /* Get the crc and uncompressed size for gzip'ed (not zip'ed) files.
1559 * If the lseek fails, we could use read() to get to the end, but
1560 * --list is used to get quick results.
1561 * Use "gunzip < foo.gz | wc -c" to get the uncompressed size if
1562 * you are not concerned about speed.
1564 bytes_in = lseek(ifd, (off_t)(-8), SEEK_END);
1565 if (bytes_in != -1L) {
1566 uch buf[8];
1567 bytes_in += 8L;
1568 if (read(ifd, (char*)buf, sizeof(buf)) != sizeof(buf)) {
1569 read_error();
1571 crc = LG(buf);
1572 bytes_out = LG(buf+4);
1575 #endif /* RECORD_IO */
1576 if (verbose)
1578 struct tm *tm = localtime (&time_stamp.tv_sec);
1579 printf ("%5s %08lx ", methods[method], crc);
1580 if (tm)
1581 printf ("%s%3d %02d:%02d ",
1582 ("Jan\0Feb\0Mar\0Apr\0May\0Jun\0Jul\0Aug\0Sep\0Oct\0Nov\0Dec"
1583 + 4 * tm->tm_mon),
1584 tm->tm_mday, tm->tm_hour, tm->tm_min);
1585 else
1586 printf ("??? ?? ??:?? ");
1588 fprint_off(stdout, bytes_in, positive_off_t_width);
1589 printf(" ");
1590 fprint_off(stdout, bytes_out, positive_off_t_width);
1591 printf(" ");
1592 if (bytes_in == -1L) {
1593 total_in = -1L;
1594 bytes_in = bytes_out = header_bytes = 0;
1595 } else if (total_in >= 0) {
1596 total_in += bytes_in;
1598 if (bytes_out == -1L) {
1599 total_out = -1L;
1600 bytes_in = bytes_out = header_bytes = 0;
1601 } else if (total_out >= 0) {
1602 total_out += bytes_out;
1604 display_ratio(bytes_out-(bytes_in-header_bytes), bytes_out, stdout);
1605 printf(" %s\n", ofname);
1608 /* ========================================================================
1609 * Shorten the given name by one character, or replace a .tar extension
1610 * with .tgz. Truncate the last part of the name which is longer than
1611 * MIN_PART characters: 1234.678.012.gz -> 123.678.012.gz. If the name
1612 * has only parts shorter than MIN_PART truncate the longest part.
1613 * For decompression, just remove the last character of the name.
1615 * IN assertion: for compression, the suffix of the given name is z_suffix.
1617 local void shorten_name(name)
1618 char *name;
1620 int len; /* length of name without z_suffix */
1621 char *trunc = NULL; /* character to be truncated */
1622 int plen; /* current part length */
1623 int min_part = MIN_PART; /* current minimum part length */
1624 char *p;
1626 len = strlen(name);
1627 if (decompress) {
1628 if (len <= 1)
1629 gzip_error ("name too short");
1630 name[len-1] = '\0';
1631 return;
1633 p = get_suffix(name);
1634 if (! p)
1635 gzip_error ("can't recover suffix\n");
1636 *p = '\0';
1637 save_orig_name = 1;
1639 /* compress 1234567890.tar to 1234567890.tgz */
1640 if (len > 4 && strequ(p-4, ".tar")) {
1641 strcpy(p-4, ".tgz");
1642 return;
1644 /* Try keeping short extensions intact:
1645 * 1234.678.012.gz -> 123.678.012.gz
1647 do {
1648 p = strrchr(name, PATH_SEP);
1649 p = p ? p+1 : name;
1650 while (*p) {
1651 plen = strcspn(p, PART_SEP);
1652 p += plen;
1653 if (plen > min_part) trunc = p-1;
1654 if (*p) p++;
1656 } while (trunc == NULL && --min_part != 0);
1658 if (trunc != NULL) {
1659 do {
1660 trunc[0] = trunc[1];
1661 } while (*trunc++);
1662 trunc--;
1663 } else {
1664 trunc = strrchr(name, PART_SEP[0]);
1665 if (!trunc)
1666 gzip_error ("internal error in shorten_name");
1667 if (trunc[1] == '\0') trunc--; /* force truncation */
1669 strcpy(trunc, z_suffix);
1672 /* ========================================================================
1673 * The compressed file already exists, so ask for confirmation.
1674 * Return ERROR if the file must be skipped.
1676 local int check_ofname()
1678 /* Ask permission to overwrite the existing file */
1679 if (!force) {
1680 int ok = 0;
1681 fprintf (stderr, "%s: %s already exists;", program_name, ofname);
1682 if (foreground && (presume_input_tty || isatty(fileno(stdin)))) {
1683 fprintf(stderr, " do you wish to overwrite (y or n)? ");
1684 fflush(stderr);
1685 ok = yesno();
1687 if (!ok) {
1688 fprintf(stderr, "\tnot overwritten\n");
1689 if (exit_code == OK) exit_code = WARNING;
1690 return ERROR;
1693 if (xunlink (ofname)) {
1694 progerror(ofname);
1695 return ERROR;
1697 return OK;
1701 /* ========================================================================
1702 * Copy modes, times, ownership from input file to output file.
1703 * IN assertion: to_stdout is false.
1705 local void copy_stat(ifstat)
1706 struct stat *ifstat;
1708 mode_t mode = ifstat->st_mode & S_IRWXUGO;
1709 int r;
1711 #ifndef NO_UTIME
1712 struct timespec timespec[2];
1713 timespec[0] = get_stat_atime (ifstat);
1714 timespec[1] = get_stat_mtime (ifstat);
1716 if (decompress && 0 <= time_stamp.tv_nsec
1717 && ! (timespec[1].tv_sec == time_stamp.tv_sec
1718 && timespec[1].tv_nsec == time_stamp.tv_nsec))
1720 timespec[1] = time_stamp;
1721 if (verbose > 1) {
1722 fprintf(stderr, "%s: time stamp restored\n", ofname);
1726 if (gl_futimens (ofd, ofname, timespec) != 0)
1728 int e = errno;
1729 WARN ((stderr, "%s: ", program_name));
1730 if (!quiet)
1732 errno = e;
1733 perror (ofname);
1736 #endif
1738 #ifndef NO_CHOWN
1739 /* Copy ownership */
1740 # if HAVE_FCHOWN
1741 ignore_value (fchown (ofd, ifstat->st_uid, ifstat->st_gid));
1742 # elif HAVE_CHOWN
1743 ignore_value (chown (ofname, ifstat->st_uid, ifstat->st_gid));
1744 # endif
1745 #endif
1747 /* Copy the protection modes */
1748 #if HAVE_FCHMOD
1749 r = fchmod (ofd, mode);
1750 #else
1751 r = chmod (ofname, mode);
1752 #endif
1753 if (r != 0) {
1754 int e = errno;
1755 WARN ((stderr, "%s: ", program_name));
1756 if (!quiet) {
1757 errno = e;
1758 perror(ofname);
1763 #if ! NO_DIR
1765 /* ========================================================================
1766 * Recurse through the given directory. This code is taken from ncompress.
1768 local void treat_dir (fd, dir)
1769 int fd;
1770 char *dir;
1772 struct dirent *dp;
1773 DIR *dirp;
1774 char nbuf[MAX_PATH_LEN];
1775 int len;
1777 dirp = fdopendir (fd);
1779 if (dirp == NULL) {
1780 progerror(dir);
1781 close (fd);
1782 return ;
1785 ** WARNING: the following algorithm could occasionally cause
1786 ** compress to produce error warnings of the form "<filename>.gz
1787 ** already has .gz suffix - ignored". This occurs when the
1788 ** .gz output file is inserted into the directory below
1789 ** readdir's current pointer.
1790 ** These warnings are harmless but annoying, so they are suppressed
1791 ** with option -r (except when -v is on). An alternative
1792 ** to allowing this would be to store the entire directory
1793 ** list in memory, then compress the entries in the stored
1794 ** list. Given the depth-first recursive algorithm used here,
1795 ** this could use up a tremendous amount of memory. I don't
1796 ** think it's worth it. -- Dave Mack
1797 ** (An other alternative might be two passes to avoid depth-first.)
1800 while ((errno = 0, dp = readdir(dirp)) != NULL) {
1802 if (strequ(dp->d_name,".") || strequ(dp->d_name,"..")) {
1803 continue;
1805 len = strlen(dir);
1806 if (len + _D_EXACT_NAMLEN (dp) + 1 < MAX_PATH_LEN - 1) {
1807 strcpy(nbuf,dir);
1808 if (len != 0 /* dir = "" means current dir on Amiga */
1809 #ifdef PATH_SEP2
1810 && dir[len-1] != PATH_SEP2
1811 #endif
1812 #ifdef PATH_SEP3
1813 && dir[len-1] != PATH_SEP3
1814 #endif
1816 nbuf[len++] = PATH_SEP;
1818 strcpy(nbuf+len, dp->d_name);
1819 treat_file(nbuf);
1820 } else {
1821 fprintf(stderr,"%s: %s/%s: pathname too long\n",
1822 program_name, dir, dp->d_name);
1823 exit_code = ERROR;
1826 if (errno != 0)
1827 progerror(dir);
1828 if (CLOSEDIR(dirp) != 0)
1829 progerror(dir);
1831 #endif /* ! NO_DIR */
1833 /* Make sure signals get handled properly. */
1835 static void
1836 install_signal_handlers ()
1838 int nsigs = sizeof handled_sig / sizeof handled_sig[0];
1839 int i;
1841 #if SA_NOCLDSTOP
1842 struct sigaction act;
1844 sigemptyset (&caught_signals);
1845 for (i = 0; i < nsigs; i++)
1847 sigaction (handled_sig[i], NULL, &act);
1848 if (act.sa_handler != SIG_IGN)
1849 sigaddset (&caught_signals, handled_sig[i]);
1852 act.sa_handler = abort_gzip_signal;
1853 act.sa_mask = caught_signals;
1854 act.sa_flags = 0;
1856 for (i = 0; i < nsigs; i++)
1857 if (sigismember (&caught_signals, handled_sig[i]))
1859 if (i == 0)
1860 foreground = 1;
1861 sigaction (handled_sig[i], &act, NULL);
1863 #else
1864 for (i = 0; i < nsigs; i++)
1865 if (signal (handled_sig[i], SIG_IGN) != SIG_IGN)
1867 if (i == 0)
1868 foreground = 1;
1869 signal (handled_sig[i], abort_gzip_signal);
1870 siginterrupt (handled_sig[i], 1);
1872 #endif
1875 /* ========================================================================
1876 * Free all dynamically allocated variables and exit with the given code.
1878 local void do_exit(exitcode)
1879 int exitcode;
1881 static int in_exit = 0;
1883 if (in_exit) exit(exitcode);
1884 in_exit = 1;
1885 free(env);
1886 env = NULL;
1887 free(args);
1888 args = NULL;
1889 FREE(inbuf);
1890 FREE(outbuf);
1891 FREE(d_buf);
1892 FREE(window);
1893 #ifndef MAXSEG_64K
1894 FREE(tab_prefix);
1895 #else
1896 FREE(tab_prefix0);
1897 FREE(tab_prefix1);
1898 #endif
1899 exit(exitcode);
1902 /* ========================================================================
1903 * Close and unlink the output file.
1905 static void
1906 remove_output_file ()
1908 int fd;
1909 sigset_t oldset;
1911 sigprocmask (SIG_BLOCK, &caught_signals, &oldset);
1912 fd = remove_ofname_fd;
1913 if (0 <= fd)
1915 remove_ofname_fd = -1;
1916 close (fd);
1917 xunlink (ofname);
1919 sigprocmask (SIG_SETMASK, &oldset, NULL);
1922 /* ========================================================================
1923 * Error handler.
1925 void
1926 abort_gzip ()
1928 remove_output_file ();
1929 do_exit(ERROR);
1932 /* ========================================================================
1933 * Signal handler.
1935 static RETSIGTYPE
1936 abort_gzip_signal (sig)
1937 int sig;
1939 if (! SA_NOCLDSTOP)
1940 signal (sig, SIG_IGN);
1941 remove_output_file ();
1942 if (sig == exiting_signal)
1943 _exit (WARNING);
1944 signal (sig, SIG_DFL);
1945 raise (sig);