1 /* gzip (GNU zip) -- compress files with zip algorithm and 'compress' interface
3 Copyright (C) 1999, 2001-2002, 2006-2007, 2009-2013 Free Software
5 Copyright (C) 1992-1993 Jean-loup Gailly
7 This program is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 3, or (at your option)
12 This program is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with this program; if not, write to the Free Software Foundation,
19 Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. */
22 * The unzip code was written and put in the public domain by Mark Adler.
23 * Portions of the lzw code are derived from the public domain 'compress'
24 * written by Spencer Thomas, Joe Orost, James Woods, Jim McKie, Steve Davies,
25 * Ken Turkowski, Dave Mack and Peter Jannesen.
27 * See the license_msg below and the file COPYING for the software license.
28 * See the file algorithm.doc for the compression algorithms and file formats.
31 static char const *const license_msg[] = {
32 "Copyright (C) 2007, 2010, 2011 Free Software Foundation, Inc.",
33 "Copyright (C) 1993 Jean-loup Gailly.",
34 "This is free software. You may redistribute copies of it under the terms of",
35 "the GNU General Public License <http://www.gnu.org/licenses/gpl.html>.",
36 "There is NO WARRANTY, to the extent permitted by law.",
39 /* Compress files with zip algorithm and 'compress' interface.
40 * See help() function below for all options.
42 * file.gz: compressed file with same mode, owner, and utimes
43 * or stdout with -c option or if stdin used as input.
44 * If the output file name had to be truncated, the original name is kept
45 * in the compressed file.
46 * On MSDOS, file.tmp -> file.tmz. On VMS, file.tmp -> file.tmp-gz.
48 * Using gz on MSDOS would create too many file name conflicts. For
49 * example, foo.txt -> foo.tgz (.tgz must be reserved as shorthand for
50 * tar.gz). Similarly, foo.dir and foo.doc would both be mapped to foo.dgz.
51 * I also considered 12345678.txt -> 12345txt.gz but this truncates the name
52 * too heavily. There is no ideal solution given the MSDOS 8+3 limitation.
54 * For the meaning of all compilation flags, see comments in Makefile.in.
59 #include <sys/types.h>
72 #include "fcntl-safer.h"
74 #include "ignore-value.h"
75 #include "stat-time.h"
99 #define RW_USER (S_IRUSR | S_IWUSR) /* creation mode for open() */
102 # define MAX_PATH_LEN 1024 /* max pathname length */
114 off_t lseek (int fd, off_t offset, int whence);
118 #define OFF_T_MIN (~ (off_t) 0 << (sizeof (off_t) * CHAR_BIT - 1))
122 #define OFF_T_MAX (~ (off_t) 0 - OFF_T_MIN)
125 /* Use SA_NOCLDSTOP as a proxy for whether the sigaction machinery is
128 # define SA_NOCLDSTOP 0
129 # define sigprocmask(how, set, oset) /* empty */
130 # define sigset_t int
131 # if ! HAVE_SIGINTERRUPT
132 # define siginterrupt(sig, flag) /* empty */
136 #ifndef HAVE_WORKING_O_NOFOLLOW
137 # define HAVE_WORKING_O_NOFOLLOW 0
140 /* Separator for file name parts (see shorten_name()) */
141 #ifdef NO_MULTIPLE_DOTS
142 # define PART_SEP "-"
144 # define PART_SEP "."
149 DECLARE(uch, inbuf, INBUFSIZ +INBUF_EXTRA);
150 DECLARE(uch, outbuf, OUTBUFSIZ+OUTBUF_EXTRA);
151 DECLARE(ush, d_buf, DIST_BUFSIZE);
152 DECLARE(uch, window, 2L*WSIZE);
154 DECLARE(ush, tab_prefix, 1L<<BITS);
156 DECLARE(ush, tab_prefix0, 1L<<(BITS-1));
157 DECLARE(ush, tab_prefix1, 1L<<(BITS-1));
160 /* local variables */
162 /* If true, pretend that standard input is a tty. This option
163 is deliberately not documented, and only for testing. */
164 static bool presume_input_tty;
166 static int ascii = 0; /* convert end-of-lines to local OS conventions */
167 int to_stdout = 0; /* output to stdout (-c) */
168 static int decompress = 0; /* decompress (-d) */
169 static int force = 0; /* don't ask questions, compress links (-f) */
170 static int keep = 0; /* keep (don't delete) input files */
171 static int no_name = -1; /* don't save or restore the original file name */
172 static int no_time = -1; /* don't save or restore the original file time */
173 static int recursive = 0; /* recurse through directories (-r) */
174 static int list = 0; /* list the file contents (-l) */
175 int verbose = 0; /* be verbose (-v) */
176 int quiet = 0; /* be very quiet (-q) */
177 static int do_lzw = 0; /* generate output compatible with old compress (-Z) */
178 int test = 0; /* test .gz file integrity */
179 static int foreground = 0; /* set if program run in foreground */
180 char *program_name; /* program name */
181 int maxbits = BITS; /* max bits per code for LZW */
182 int method = DEFLATED;/* compression method */
183 int level = 6; /* compression level */
184 int exit_code = OK; /* program exit code */
185 int save_orig_name; /* set if original name must be saved */
186 static int last_member; /* set for .zip and .Z files */
187 static int part_nb; /* number of parts in .gz file */
188 struct timespec time_stamp; /* original time stamp (modification time) */
189 off_t ifile_size; /* input file size, -1 for devices (debug only) */
190 static char *env; /* contents of GZIP env variable */
191 static char **args = NULL; /* argv pointer if GZIP env variable defined */
192 static char const *z_suffix; /* default suffix (can be set with --suffix) */
193 static size_t z_len; /* strlen(z_suffix) */
195 /* The set of signals that are caught. */
196 static sigset_t caught_signals;
198 /* If nonzero then exit with status WARNING, rather than with the usual
199 signal status, on receipt of a signal with this value. This
200 suppresses a "Broken Pipe" message with some shells. */
201 static int volatile exiting_signal;
203 /* If nonnegative, close this file descriptor and unlink ofname on error. */
204 static int volatile remove_ofname_fd = -1;
206 off_t bytes_in; /* number of input bytes */
207 off_t bytes_out; /* number of output bytes */
208 static off_t total_in; /* input bytes for all files */
209 static off_t total_out; /* output bytes for all files */
210 char ifname[MAX_PATH_LEN]; /* input file name */
211 char ofname[MAX_PATH_LEN]; /* output file name */
212 static struct stat istat; /* status for input file */
213 int ifd; /* input file descriptor */
214 int ofd; /* output file descriptor */
215 unsigned insize; /* valid bytes in inbuf */
216 unsigned inptr; /* index of next byte to be processed in inbuf */
217 unsigned outcnt; /* bytes in output buffer */
218 int rsync = 0; /* make rsyncable chunks */
220 static int handled_sig[] =
222 /* SIGINT must be first, as 'foreground' depends on it. */
242 /* For long options that have no equivalent short option, use a
243 non-character as a pseudo short option, starting with CHAR_MAX + 1. */
246 PRESUME_INPUT_TTY_OPTION = CHAR_MAX + 1
249 static const struct option longopts[] =
251 /* { name has_arg *flag val } */
252 {"ascii", 0, 0, 'a'}, /* ascii text mode */
253 {"to-stdout", 0, 0, 'c'}, /* write output on standard output */
254 {"stdout", 0, 0, 'c'}, /* write output on standard output */
255 {"decompress", 0, 0, 'd'}, /* decompress */
256 {"uncompress", 0, 0, 'd'}, /* decompress */
257 /* {"encrypt", 0, 0, 'e'}, encrypt */
258 {"force", 0, 0, 'f'}, /* force overwrite of output file */
259 {"help", 0, 0, 'h'}, /* give help */
260 /* {"pkzip", 0, 0, 'k'}, force output in pkzip format */
261 {"keep", 0, 0, 'k'}, /* keep (don't delete) input files */
262 {"list", 0, 0, 'l'}, /* list .gz file contents */
263 {"license", 0, 0, 'L'}, /* display software license */
264 {"no-name", 0, 0, 'n'}, /* don't save or restore original name & time */
265 {"name", 0, 0, 'N'}, /* save or restore original name & time */
266 {"-presume-input-tty", no_argument, NULL, PRESUME_INPUT_TTY_OPTION},
267 {"quiet", 0, 0, 'q'}, /* quiet mode */
268 {"silent", 0, 0, 'q'}, /* quiet mode */
269 {"recursive", 0, 0, 'r'}, /* recurse through directories */
270 {"suffix", 1, 0, 'S'}, /* use given suffix instead of .gz */
271 {"test", 0, 0, 't'}, /* test compressed file integrity */
272 {"no-time", 0, 0, 'T'}, /* don't save or restore the time stamp */
273 {"verbose", 0, 0, 'v'}, /* verbose mode */
274 {"version", 0, 0, 'V'}, /* display version number */
275 {"fast", 0, 0, '1'}, /* compress faster */
276 {"best", 0, 0, '9'}, /* compress better */
277 {"lzw", 0, 0, 'Z'}, /* make output compatible with old compress */
278 {"bits", 1, 0, 'b'}, /* max number of bits per code (implies -Z) */
279 {"rsyncable", 0, 0, 'R'}, /* make rsync-friendly archive */
283 /* local functions */
285 local void try_help (void) ATTRIBUTE_NORETURN;
286 local void help (void);
287 local void license (void);
288 local void version (void);
289 local int input_eof (void);
290 local void treat_stdin (void);
291 local void treat_file (char *iname);
292 local int create_outfile (void);
293 local char *get_suffix (char *name);
294 local int open_input_file (char *iname, struct stat *sbuf);
295 local void discard_input_bytes (size_t nbytes, unsigned int flags);
296 local int make_ofname (void);
297 local void shorten_name (char *name);
298 local int get_method (int in);
299 local void do_list (int ifd, int method);
300 local int check_ofname (void);
301 local void copy_stat (struct stat *ifstat);
302 local void install_signal_handlers (void);
303 local void remove_output_file (void);
304 local RETSIGTYPE abort_gzip_signal (int);
305 local void do_exit (int exitcode) ATTRIBUTE_NORETURN;
306 int main (int argc, char **argv);
307 static int (*work) (int infile, int outfile) = zip; /* function to call */
310 local void treat_dir (int fd, char *dir);
313 #define strequ(s1, s2) (strcmp((s1),(s2)) == 0)
318 fprintf (stderr, "Try `%s --help' for more information.\n",
323 /* ======================================================================== */
326 static char const* const help_msg[] = {
327 "Compress or uncompress FILEs (by default, compress FILES in-place).",
329 "Mandatory arguments to long options are mandatory for short options too.",
332 " -a, --ascii ascii text; convert end-of-line using local conventions",
334 " -c, --stdout write on standard output, keep original files unchanged",
335 " -d, --decompress decompress",
336 /* -e, --encrypt encrypt */
337 " -f, --force force overwrite of output file and compress links",
338 " -h, --help give this help",
339 /* -k, --pkzip force output in pkzip format */
340 " -k, --keep keep (don't delete) input files",
341 " -l, --list list compressed file contents",
342 " -L, --license display software license",
344 " -m, --no-time do not save or restore the original modification time",
345 " -M, --time save or restore the original modification time",
347 " -n, --no-name do not save or restore the original name and time stamp",
348 " -N, --name save or restore the original name and time stamp",
349 " -q, --quiet suppress all warnings",
351 " -r, --recursive operate recursively on directories",
353 " -S, --suffix=SUF use suffix SUF on compressed files",
354 " -t, --test test compressed file integrity",
355 " -v, --verbose verbose mode",
356 " -V, --version display version number",
357 " -1, --fast compress faster",
358 " -9, --best compress better",
360 " -Z, --lzw produce output compatible with old compress",
361 " -b, --bits=BITS max number of bits per code (implies -Z)",
363 " --rsyncable Make rsync-friendly archive",
365 "With no FILE, or when FILE is -, read standard input.",
367 "Report bugs to <bug-gzip@gnu.org>.",
369 char const *const *p = help_msg;
371 printf ("Usage: %s [OPTION]... [FILE]...\n", program_name);
372 while (*p) printf ("%s\n", *p++);
375 /* ======================================================================== */
378 char const *const *p = license_msg;
380 printf ("%s %s\n", program_name, Version);
381 while (*p) printf ("%s\n", *p++);
384 /* ======================================================================== */
389 printf ("Written by Jean-loup Gailly.\n");
392 local void progerror (char const *string)
395 fprintf (stderr, "%s: ", program_name);
401 /* ======================================================================== */
402 int main (int argc, char **argv)
404 int file_count; /* number of files to process */
405 size_t proglen; /* length of program_name */
406 int optc; /* current option */
408 EXPAND(argc, argv); /* wild card expansion if necessary */
410 program_name = gzip_base_name (argv[0]);
411 proglen = strlen (program_name);
413 atexit (close_stdin);
415 /* Suppress .exe for MSDOS, OS/2 and VMS: */
416 if (4 < proglen && strequ (program_name + proglen - 4, ".exe"))
417 program_name[proglen - 4] = '\0';
419 /* Add options in GZIP environment variable if there is one */
420 env = add_envopt(&argc, &argv, OPTIONS_VAR);
421 if (env != NULL) args = argv;
424 # define GNU_STANDARD 1
427 /* For compatibility with old compress, use program name as an option.
428 * Unless you compile with -DGNU_STANDARD=0, this program will behave as
429 * gzip even if it is invoked under the name gunzip or zcat.
431 * Systems which do not support links can still use -d or -dc.
432 * Ignore an .exe extension for MSDOS, OS/2 and VMS.
434 if (strncmp (program_name, "un", 2) == 0 /* ungzip, uncompress */
435 || strncmp (program_name, "gun", 3) == 0) /* gunzip */
437 else if (strequ (program_name + 1, "cat") /* zcat, pcat, gcat */
438 || strequ (program_name, "gzcat")) /* gzcat */
439 decompress = to_stdout = 1;
443 z_len = strlen(z_suffix);
445 while ((optc = getopt_long (argc, argv, "ab:cdfhH?klLmMnNqrS:tvVZ123456789",
446 longopts, (int *)0)) != -1) {
451 maxbits = atoi(optarg);
452 for (; *optarg; optarg++)
453 if (! ('0' <= *optarg && *optarg <= '9'))
455 fprintf (stderr, "%s: -b operand is not an integer\n",
461 to_stdout = 1; break;
463 decompress = 1; break;
467 help(); do_exit(OK); break;
471 list = decompress = to_stdout = 1; break;
473 license(); do_exit(OK); break;
474 case 'm': /* undocumented, may change later */
476 case 'M': /* undocumented, may change later */
479 no_name = no_time = 1; break;
481 no_name = no_time = 0; break;
482 case PRESUME_INPUT_TTY_OPTION:
483 presume_input_tty = true; break;
485 quiet = 1; verbose = 0; break;
488 fprintf (stderr, "%s: -r not supported on this system\n",
499 #ifdef NO_MULTIPLE_DOTS
500 if (*optarg == '.') optarg++;
502 z_len = strlen(optarg);
506 test = decompress = to_stdout = 1;
509 verbose++; quiet = 0; break;
511 version(); do_exit(OK); break;
516 fprintf(stderr, "%s: -Z not supported in this version\n",
521 case '1': case '2': case '3': case '4':
522 case '5': case '6': case '7': case '8': case '9':
526 /* Error message already emitted by getopt_long. */
529 } /* loop on all arguments */
531 /* By default, save name and timestamp on compression but do not
532 * restore them on decompression.
534 if (no_time < 0) no_time = decompress;
535 if (no_name < 0) no_name = decompress;
537 file_count = argc - optind;
541 if (ascii && !quiet) {
542 fprintf(stderr, "%s: option --ascii ignored on this system\n",
546 if (z_len == 0 || z_len > MAX_SUFFIX) {
547 fprintf(stderr, "%s: invalid suffix '%s'\n", program_name, z_suffix);
551 if (do_lzw && !decompress) work = lzw;
553 /* Allocate all global buffers (for DYN_ALLOC option) */
554 ALLOC(uch, inbuf, INBUFSIZ +INBUF_EXTRA);
555 ALLOC(uch, outbuf, OUTBUFSIZ+OUTBUF_EXTRA);
556 ALLOC(ush, d_buf, DIST_BUFSIZE);
557 ALLOC(uch, window, 2L*WSIZE);
559 ALLOC(ush, tab_prefix, 1L<<BITS);
561 ALLOC(ush, tab_prefix0, 1L<<(BITS-1));
562 ALLOC(ush, tab_prefix1, 1L<<(BITS-1));
566 exiting_signal = quiet ? SIGPIPE : 0;
570 install_signal_handlers ();
572 /* And get to work */
573 if (file_count != 0) {
574 if (to_stdout && !test && !list && (!decompress || !ascii)) {
575 SET_BINARY_MODE(fileno(stdout));
577 while (optind < argc) {
578 treat_file(argv[optind++]);
580 } else { /* Standard input */
583 if (list && !quiet && file_count > 1) {
584 do_list(-1, -1); /* print totals */
587 return exit_code; /* just to avoid lint warning */
590 /* Return nonzero when at end of file on input. */
594 if (!decompress || last_member)
599 if (insize != INBUFSIZ || fill_inbuf (1) == EOF)
602 /* Unget the char that fill_inbuf got. */
609 /* ========================================================================
610 * Compress or decompress stdin
612 local void treat_stdin()
615 && (presume_input_tty
616 || isatty(fileno((FILE *)(decompress ? stdin : stdout))))) {
617 /* Do not send compressed data to the terminal or read it from
618 * the terminal. We get here when user invoked the program
619 * without parameters, so be helpful. According to the GNU standards:
621 * If there is one behavior you think is most useful when the output
622 * is to a terminal, and another that you think is most useful when
623 * the output is a file or a pipe, then it is usually best to make
624 * the default behavior the one that is useful with output to a
625 * terminal, and have an option for the other behavior.
627 * Here we use the --force option to get the other behavior.
631 ("%s: compressed data not %s a terminal."
632 " Use -f to force %scompression.\n"
633 "For help, type: %s -h\n"),
635 decompress ? "read from" : "written to",
636 decompress ? "de" : "",
641 if (decompress || !ascii) {
642 SET_BINARY_MODE(fileno(stdin));
644 if (!test && !list && (!decompress || !ascii)) {
645 SET_BINARY_MODE(fileno(stdout));
647 strcpy(ifname, "stdin");
648 strcpy(ofname, "stdout");
650 /* Get the file's time stamp and size. */
651 if (fstat (fileno (stdin), &istat) != 0)
653 progerror ("standard input");
656 ifile_size = S_ISREG (istat.st_mode) ? istat.st_size : -1;
657 time_stamp.tv_nsec = -1;
658 if (!no_time || list)
660 if (S_ISREG (istat.st_mode))
661 time_stamp = get_stat_mtime (&istat);
663 gettime (&time_stamp);
666 clear_bufs(); /* clear input and output buffers */
672 method = get_method(ifd);
674 do_exit(exit_code); /* error message already emitted */
678 do_list(ifd, method);
682 /* Actually do the compression/decompression. Loop over zipped members.
685 if ((*work)(fileno(stdin), fileno(stdout)) != OK) return;
690 method = get_method(ifd);
691 if (method < 0) return; /* error message already emitted */
692 bytes_out = 0; /* required for length check */
697 fprintf(stderr, " OK\n");
699 } else if (!decompress) {
700 display_ratio(bytes_in-(bytes_out-header_bytes), bytes_in, stderr);
701 fprintf(stderr, "\n");
702 #ifdef DISPLAY_STDIN_RATIO
704 display_ratio(bytes_out-(bytes_in-header_bytes), bytes_out,stderr);
705 fprintf(stderr, "\n");
711 /* ========================================================================
712 * Compress or decompress the given file
714 local void treat_file(iname)
717 /* Accept "-" as synonym for stdin */
718 if (strequ(iname, "-")) {
719 int cflag = to_stdout;
725 /* Check if the input file is present, set ifname and istat: */
726 ifd = open_input_file (iname, &istat);
730 /* If the input name is that of a directory, recurse or ignore: */
731 if (S_ISDIR(istat.st_mode)) {
734 treat_dir (ifd, iname);
735 /* Warning: ifname is now garbage */
740 WARN ((stderr, "%s: %s is a directory -- ignored\n",
741 program_name, ifname));
747 if (! S_ISREG (istat.st_mode))
750 "%s: %s is not a directory or a regular file - ignored\n",
751 program_name, ifname));
755 if (istat.st_mode & S_ISUID)
757 WARN ((stderr, "%s: %s is set-user-ID on execution - ignored\n",
758 program_name, ifname));
762 if (istat.st_mode & S_ISGID)
764 WARN ((stderr, "%s: %s is set-group-ID on execution - ignored\n",
765 program_name, ifname));
772 if (istat.st_mode & S_ISVTX)
775 "%s: %s has the sticky bit set - file ignored\n",
776 program_name, ifname));
780 if (2 <= istat.st_nlink)
782 WARN ((stderr, "%s: %s has %lu other link%c -- unchanged\n",
783 program_name, ifname,
784 (unsigned long int) istat.st_nlink - 1,
785 istat.st_nlink == 2 ? ' ' : 's'));
792 ifile_size = S_ISREG (istat.st_mode) ? istat.st_size : -1;
793 time_stamp.tv_nsec = -1;
794 if (!no_time || list)
795 time_stamp = get_stat_mtime (&istat);
797 /* Generate output file name. For -r and (-t or -l), skip files
798 * without a valid gzip suffix (check done in make_ofname).
800 if (to_stdout && !list && !test) {
801 strcpy(ofname, "stdout");
803 } else if (make_ofname() != OK) {
808 clear_bufs(); /* clear input and output buffers */
812 method = get_method(ifd); /* updates ofname if original given */
815 return; /* error message already emitted */
819 do_list(ifd, method);
820 if (close (ifd) != 0)
825 /* If compressing to a file, check if ofname is not ambiguous
826 * because the operating system truncates names. Otherwise, generate
827 * a new ofname and save the original name in the compressed file.
830 ofd = fileno(stdout);
831 /* Keep remove_ofname_fd negative. */
833 if (create_outfile() != OK) return;
835 if (!decompress && save_orig_name && !verbose && !quiet) {
836 fprintf(stderr, "%s: %s compressed to %s\n",
837 program_name, ifname, ofname);
840 /* Keep the name even if not truncated except with --no-name: */
841 if (!save_orig_name) save_orig_name = !no_name;
844 fprintf(stderr, "%s:\t", ifname);
847 /* Actually do the compression/decompression. Loop over zipped members.
850 if ((*work)(ifd, ofd) != OK) {
851 method = -1; /* force cleanup */
858 method = get_method(ifd);
859 if (method < 0) break; /* error message already emitted */
860 bytes_out = 0; /* required for length check */
863 if (close (ifd) != 0)
870 if (close (ofd) != 0)
878 sigprocmask (SIG_BLOCK, &caught_signals, &oldset);
879 remove_ofname_fd = -1;
880 unlink_errno = xunlink (ifname) == 0 ? 0 : errno;
881 sigprocmask (SIG_SETMASK, &oldset, NULL);
885 WARN ((stderr, "%s: ", program_name));
888 errno = unlink_errno;
897 remove_output_file ();
901 /* Display statistics */
904 fprintf(stderr, " OK");
905 } else if (decompress) {
906 display_ratio(bytes_out-(bytes_in-header_bytes), bytes_out,stderr);
908 display_ratio(bytes_in-(bytes_out-header_bytes), bytes_in, stderr);
910 if (!test && !to_stdout) {
911 fprintf(stderr, " -- replaced with %s", ofname);
913 fprintf(stderr, "\n");
917 /* ========================================================================
918 * Create the output file. Return OK or ERROR.
919 * Try several times if necessary to avoid truncating the z_suffix. For
920 * example, do not create a compressed file of name "1234567890123."
921 * Sets save_orig_name to true if the file name has been truncated.
922 * IN assertions: the input file has already been opened (ifd is set) and
923 * ofname has already been updated if there was an original name.
924 * OUT assertions: ifd and ofd are closed in case of error.
926 local int create_outfile()
928 int name_shortened = 0;
929 int flags = (O_WRONLY | O_CREAT | O_EXCL
930 | (ascii && decompress ? 0 : O_BINARY));
937 sigprocmask (SIG_BLOCK, &caught_signals, &oldset);
938 remove_ofname_fd = ofd = OPEN (ofname, flags, RW_USER);
940 sigprocmask (SIG_SETMASK, &oldset, NULL);
949 shorten_name (ofname);
955 if (check_ofname () != OK)
969 if (name_shortened && decompress)
971 /* name might be too long if an original name was saved */
972 WARN ((stderr, "%s: %s: warning, name truncated\n",
973 program_name, ofname));
979 /* ========================================================================
980 * Return a pointer to the 'z' suffix of a file name, or NULL. For all
981 * systems, ".gz", ".z", ".Z", ".taz", ".tgz", "-gz", "-z" and "_z" are
982 * accepted suffixes, in addition to the value of the --suffix option.
983 * ".tgz" is a useful convention for tar.z files on systems limited
984 * to 3-character extensions. On such systems, ".?z" and ".??z" are
985 * also accepted suffixes. For Unix, we do not want to accept any
986 * .??z suffix as indicating a compressed file; some people use .xyz
987 * to denote volume data.
988 * On systems allowing multiple versions of the same file (such as VMS),
989 * this function removes any version suffix in the given name.
991 local char *get_suffix(name)
995 char suffix[MAX_SUFFIX+3]; /* last chars of name, forced to lower case */
996 static char const *known_suffixes[] =
997 {NULL, ".gz", ".z", ".taz", ".tgz", "-gz", "-z", "_z",
1002 char const **suf = known_suffixes;
1005 if (strequ(z_suffix, "z")) suf++; /* check long suffixes first */
1008 /* strip a version number from the file name */
1010 char *v = strrchr(name, SUFFIX_SEP);
1011 if (v != NULL) *v = '\0';
1014 nlen = strlen(name);
1015 if (nlen <= MAX_SUFFIX+2) {
1016 strcpy(suffix, name);
1018 strcpy(suffix, name+nlen-MAX_SUFFIX-2);
1021 slen = strlen(suffix);
1023 int s = strlen(*suf);
1024 if (slen > s && suffix[slen-s-1] != PATH_SEP
1025 && strequ(suffix + slen - s, *suf)) {
1028 } while (*++suf != NULL);
1034 /* Open file NAME with the given flags and mode and store its status
1035 into *ST. Return a file descriptor to the newly opened file, or -1
1036 (setting errno) on failure. */
1038 open_and_stat (char *name, int flags, mode_t mode, struct stat *st)
1042 /* Refuse to follow symbolic links unless -c or -f. */
1043 if (!to_stdout && !force)
1045 if (HAVE_WORKING_O_NOFOLLOW)
1046 flags |= O_NOFOLLOW;
1049 #if HAVE_LSTAT || defined lstat
1050 if (lstat (name, st) != 0)
1052 else if (S_ISLNK (st->st_mode))
1061 fd = OPEN (name, flags, mode);
1062 if (0 <= fd && fstat (fd, st) != 0)
1073 /* ========================================================================
1074 * Set ifname to the input file name (with a suffix appended if necessary)
1075 * and istat to its stats. For decompression, if no file exists with the
1076 * original name, try adding successively z_suffix, .gz, .z, -z and .Z.
1077 * For MSDOS, we try only z_suffix and z.
1078 * Return an open file descriptor or -1.
1081 open_input_file (iname, sbuf)
1085 int ilen; /* strlen(ifname) */
1086 int z_suffix_errno = 0;
1087 static char const *suffixes[] = {NULL, ".gz", ".z", "-z", ".Z", NULL};
1088 char const **suf = suffixes;
1090 #ifdef NO_MULTIPLE_DOTS
1091 char *dot; /* pointer to ifname extension, or NULL */
1094 int open_flags = (O_RDONLY | O_NONBLOCK | O_NOCTTY
1095 | (ascii && !decompress ? 0 : O_BINARY));
1099 if (sizeof ifname - 1 <= strlen (iname))
1102 strcpy(ifname, iname);
1104 /* If input file exists, return OK. */
1105 fd = open_and_stat (ifname, open_flags, RW_USER, sbuf);
1109 if (!decompress || errno != ENOENT) {
1113 /* file.ext doesn't exist, try adding a suffix (after removing any
1114 * version number for VMS).
1116 s = get_suffix(ifname);
1118 progerror(ifname); /* ifname already has z suffix and does not exist */
1121 #ifdef NO_MULTIPLE_DOTS
1122 dot = strrchr(ifname, '.');
1124 strcat(ifname, ".");
1125 dot = strrchr(ifname, '.');
1128 ilen = strlen(ifname);
1129 if (strequ(z_suffix, ".gz")) suf++;
1131 /* Search for all suffixes */
1133 char const *s0 = s = *suf;
1134 strcpy (ifname, iname);
1135 #ifdef NO_MULTIPLE_DOTS
1137 if (*dot == '\0') strcpy (dot, ".");
1139 #ifdef MAX_EXT_CHARS
1140 if (MAX_EXT_CHARS < strlen (s) + strlen (dot + 1))
1141 dot[MAX_EXT_CHARS + 1 - strlen (s)] = '\0';
1143 if (sizeof ifname <= ilen + strlen (s))
1146 fd = open_and_stat (ifname, open_flags, RW_USER, sbuf);
1149 if (errno != ENOENT)
1154 if (strequ (s0, z_suffix))
1155 z_suffix_errno = errno;
1156 } while (*++suf != NULL);
1158 /* No suffix found, complain using z_suffix: */
1159 strcpy(ifname, iname);
1160 #ifdef NO_MULTIPLE_DOTS
1161 if (*dot == '\0') strcpy(dot, ".");
1163 #ifdef MAX_EXT_CHARS
1164 if (MAX_EXT_CHARS < z_len + strlen (dot + 1))
1165 dot[MAX_EXT_CHARS + 1 - z_len] = '\0';
1167 strcat(ifname, z_suffix);
1168 errno = z_suffix_errno;
1173 fprintf (stderr, "%s: %s: file name too long\n", program_name, iname);
1178 /* ========================================================================
1179 * Generate ofname given ifname. Return OK, or WARNING if file must be skipped.
1180 * Sets save_orig_name to true if the file name has been truncated.
1182 local int make_ofname()
1184 char *suff; /* ofname z suffix */
1186 strcpy(ofname, ifname);
1187 /* strip a version number if any and get the gzip suffix if present: */
1188 suff = get_suffix(ofname);
1192 /* With -t or -l, try all files (even without .gz suffix)
1193 * except with -r (behave as with just -dr).
1195 if (!recursive && (list || test)) return OK;
1197 /* Avoid annoying messages with -r */
1198 if (verbose || (!recursive && !quiet)) {
1199 WARN((stderr,"%s: %s: unknown suffix -- ignored\n",
1200 program_name, ifname));
1204 /* Make a special case for .tgz and .taz: */
1206 if (strequ(suff, ".tgz") || strequ(suff, ".taz")) {
1207 strcpy(suff, ".tar");
1209 *suff = '\0'; /* strip the z suffix */
1211 /* ofname might be changed later if infile contains an original name */
1213 } else if (suff && ! force) {
1214 /* Avoid annoying messages with -r (see treat_dir()) */
1215 if (verbose || (!recursive && !quiet)) {
1216 /* Don't use WARN, as it affects exit status. */
1217 fprintf (stderr, "%s: %s already has %s suffix -- unchanged\n",
1218 program_name, ifname, suff);
1224 #ifdef NO_MULTIPLE_DOTS
1225 suff = strrchr(ofname, '.');
1227 if (sizeof ofname <= strlen (ofname) + 1)
1229 strcat(ofname, ".");
1230 # ifdef MAX_EXT_CHARS
1231 if (strequ(z_suffix, "z")) {
1232 if (sizeof ofname <= strlen (ofname) + 2)
1234 strcat(ofname, "gz"); /* enough room */
1237 /* On the Atari and some versions of MSDOS,
1238 * ENAMETOOLONG does not work correctly. So we
1239 * must truncate here.
1241 } else if (strlen(suff)-1 + z_len > MAX_SUFFIX) {
1242 suff[MAX_SUFFIX+1-z_len] = '\0';
1246 #endif /* NO_MULTIPLE_DOTS */
1247 if (sizeof ofname <= strlen (ofname) + z_len)
1249 strcat(ofname, z_suffix);
1251 } /* decompress ? */
1255 WARN ((stderr, "%s: %s: file name too long\n", program_name, ifname));
1259 /* Discard NBYTES input bytes from the input, or up through the next
1260 zero byte if NBYTES == (size_t) -1. If FLAGS say that the header
1261 CRC should be computed, update the CRC accordingly. */
1263 discard_input_bytes (nbytes, flags)
1269 uch c = get_byte ();
1270 if (flags & HEADER_CRC)
1272 if (nbytes != (size_t) -1)
1279 /* ========================================================================
1280 * Check the magic number of the input file and update ofname if an
1281 * original name was given and to_stdout is not set.
1282 * Return the compression method, -1 for error, -2 for warning.
1283 * Set inptr to the offset of the next byte to be processed.
1284 * Updates time_stamp if there is one and --no-time is not used.
1285 * This function may be called repeatedly for an input file consisting
1286 * of several contiguous gzip'ed members.
1287 * IN assertions: there is at least one remaining compressed member.
1288 * If the member is a zip file, it must be the only one.
/* Identify the format of the input from its first two (magic) bytes and,
   for a gzip member, parse the member header: method byte, flag byte,
   time stamp, and the optional extra field, original name, comment and
   header CRC.  The recognized magics are compared in this order: gzip and
   old gzip, PKZIP, pack, LZW, LZH.  IN is passed on to check_zipfile for
   the PKZIP case. */
1290 local int get_method(in)
1291 int in; /* input file descriptor */
1293 uch flags; /* compression flags */
1294 uch magic[10]; /* magic header */
1295 int imagic0; /* first magic byte or EOF */
1296 int imagic1; /* like magic[1], but can represent EOF */
1297 ulg stamp; /* time stamp */
1299 /* If --force and --stdout, zcat == cat, so do not complain about
1300 * premature end of file: use try_byte instead of get_byte.
1302 if (force && to_stdout) {
1303 imagic0 = try_byte();
1305 imagic1 = try_byte ();
1307 /* If try_byte returned EOF, magic[1] == (char) EOF. */
/* Magic bytes read with get_byte; NOTE(review): presumably the branch
   taken when the force-and-stdout case does not apply -- confirm. */
1309 magic[0] = get_byte ();
1312 magic[1] = get_byte ();
1313 imagic1 = 0; /* avoid lint warning */
1315 imagic1 = try_byte ();
1319 method = -1; /* unknown yet */
1320 part_nb++; /* number of parts in gzip file */
1322 last_member = RECORD_IO;
1323 /* assume multiple members in gzip file except for record oriented I/O */
/* gzip member: both the current and the old gzip magic are accepted. */
1325 if (memcmp(magic, GZIP_MAGIC, 2) == 0
1326 || memcmp(magic, OLD_GZIP_MAGIC, 2) == 0) {
1328 method = (int)get_byte();
/* DEFLATED is the only method byte accepted for a gzip member. */
1329 if (method != DEFLATED) {
1331 "%s: %s: unknown method %d -- not supported\n",
1332 program_name, ifname, method);
1337 flags = (uch)get_byte();
1339 if ((flags & ENCRYPTED) != 0) {
1341 "%s: %s is encrypted -- not supported\n",
1342 program_name, ifname);
1346 if ((flags & RESERVED) != 0) {
1348 "%s: %s has flags 0x%x -- not supported\n",
1349 program_name, ifname, flags);
/* Reserved flag bits are fatal unless force is greater than 1. */
1351 if (force <= 1) return -1;
/* The 32-bit time stamp is assembled least significant byte first. */
1353 stamp = (ulg)get_byte();
1354 stamp |= ((ulg)get_byte()) << 8;
1355 stamp |= ((ulg)get_byte()) << 16;
1356 stamp |= ((ulg)get_byte()) << 24;
/* The header stamp is recorded (whole seconds, zero nanoseconds) when it
   is nonzero and no_time is clear. */
1357 if (stamp != 0 && !no_time)
1359 time_stamp.tv_sec = stamp;
1360 time_stamp.tv_nsec = 0;
1363 magic[8] = get_byte (); /* Ignore extra flags. */
1364 magic[9] = get_byte (); /* Ignore OS type. */
/* With HEADER_CRC set, the header fields already consumed are stored back
   into magic[]; NOTE(review): presumably so that the header CRC can be
   computed over the ten fixed header bytes -- confirm against the call
   that follows in the full source. */
1366 if (flags & HEADER_CRC)
1368 magic[2] = DEFLATED;
1370 magic[4] = stamp & 0xff;
1371 magic[5] = (stamp >> 8) & 0xff;
1372 magic[6] = (stamp >> 16) & 0xff;
1373 magic[7] = stamp >> 24;
1378 if ((flags & EXTRA_FIELD) != 0) {
/* The extra-field length is a 16-bit value, low byte first; both bytes
   are also kept in lenbuf. */
1380 unsigned int len = lenbuf[0] = get_byte ();
1381 len |= (lenbuf[1] = get_byte ()) << 8;
1383 fprintf(stderr,"%s: %s: extra field of %u bytes ignored\n",
1384 program_name, ifname, len);
1386 if (flags & HEADER_CRC)
/* Skip the LEN bytes of the extra field itself. */
1388 discard_input_bytes (len, flags);
1391 /* Get original file name if it was truncated */
1392 if ((flags & ORIG_NAME) != 0) {
1393 if (no_name || (to_stdout && !list) || part_nb > 1) {
1394 /* Discard the old name */
1395 discard_input_bytes (-1, flags);
1397 /* Copy the base name. Keep a directory prefix intact. */
1398 char *p = gzip_base_name (ofname);
1401 *p = (char) get_byte ();
1402 if (*p++ == '\0') break;
/* A stored name that would run past the end of ofname is rejected as
   corrupted input. */
1403 if (p >= ofname+sizeof(ofname)) {
1404 gzip_error ("corrupted input -- file name too large");
1407 if (flags & HEADER_CRC)
1408 updcrc ((uch *) base, p - base);
/* Move the result of gzip_base_name on the stored name down to BASE;
   NOTE(review): presumably this drops directory components embedded in
   the stored name -- confirm against gzip_base_name. */
1409 p = gzip_base_name (base);
1410 memmove (base, p, strlen (p) + 1);
1411 /* If necessary, adapt the name to local OS conventions: */
1413 MAKE_LEGAL_NAME(base);
1414 if (base) list=0; /* avoid warning about unused variable */
1416 } /* no_name || to_stdout */
1419 /* Discard file comment if any */
1420 if ((flags & COMMENT) != 0) {
1421 discard_input_bytes (-1, flags);
1424 if (flags & HEADER_CRC)
/* The stored header CRC is 16 bits, low byte first; it is compared with
   the low 16 bits of the value returned by updcrc. */
1426 unsigned int crc16 = updcrc (magic, 0) & 0xffff;
1427 unsigned int header16 = get_byte ();
1428 header16 |= ((unsigned int) get_byte ()) << 8;
1429 if (header16 != crc16)
1432 "%s: %s: header checksum 0x%04x != computed checksum 0x%04x\n",
1433 program_name, ifname, header16, crc16);
1441 header_bytes = inptr + 2*4; /* include crc and size */
/* PKZIP is recognized only when the two magic bytes are the first bytes
   consumed (inptr == 2) and inbuf starts with the 4-byte PKZIP magic. */
1444 } else if (memcmp(magic, PKZIP_MAGIC, 2) == 0 && inptr == 2
1445 && memcmp((char*)inbuf, PKZIP_MAGIC, 4) == 0) {
1446 /* To simplify the code, we support a zip file when alone only.
1447 * We are thus guaranteed that the entire local header fits in inbuf.
1451 if (check_zipfile(in) != OK) return -1;
1452 /* check_zipfile may get ofname from the local header */
/* Remaining recognized magics: pack, LZW and LZH. */
1455 } else if (memcmp(magic, PACK_MAGIC, 2) == 0) {
1459 } else if (memcmp(magic, LZW_MAGIC, 2) == 0) {
1461 method = COMPRESSED;
1464 } else if (memcmp(magic, LZH_MAGIC, 2) == 0) {
1469 } else if (force && to_stdout && !list) { /* pass input unchanged */
1475 if (imagic0 != EOF) {
1476 write_buf(fileno(stdout), magic, 1);
/* A non-negative method means a format was recognized: return it. */
1480 if (method >= 0) return method;
1483 fprintf (stderr, "\n%s: %s: not in gzip format\n",
1484 program_name, ifname);
/* Skip over a run of zero bytes, starting with the second magic byte. */
1491 for (inbyte = imagic1; inbyte == 0; inbyte = try_byte ())
1496 WARN ((stderr, "\n%s: %s: decompression OK, trailing zero bytes ignored\n",
1497 program_name, ifname));
1502 WARN((stderr, "\n%s: %s: decompression OK, trailing garbage ignored\n",
1503 program_name, ifname));
1508 /* ========================================================================
1509 * Display the characteristics of the compressed file.
1510 * If the given method is < 0, display the accumulated totals.
1511 * IN assertions: time_stamp, header_bytes and ifile_size are initialized.
/* Print one listing row for the input file, or the totals row when METHOD
   is negative.  The column headings are printed the first time a
   non-negative METHOD is seen.  Sizes are printed with fprint_off in a
   column as wide as OFF_T_MAX in decimal, and ratios with display_ratio.
   For a DEFLATED file the last 8 bytes of IFD are read; the uncompressed
   size is taken from the final 4 of them.  A byte count of -1 zeroes the
   per-file counters used for the ratio; otherwise the count is added to
   its running total while that total is non-negative. */
1513 local void do_list(ifd, method)
1514 int ifd; /* input file descriptor */
1515 int method; /* compression method */
1517 ulg crc; /* original crc */
1518 static int first_time = 1;
1519 static char const *const methods[MAX_METHODS] = {
1524 "", "", "", "", /* 4 to 7 reserved */
/* Width of the size columns: the number of decimal digits in OFF_T_MAX. */
1526 int positive_off_t_width = 1;
1529 for (o = OFF_T_MAX; 9 < o; o /= 10) {
1530 positive_off_t_width++;
1533 if (first_time && method >= 0) {
1536 printf("method crc date time ");
1539 printf("%*.*s %*.*s ratio uncompressed_name\n",
1540 positive_off_t_width, positive_off_t_width, "compressed",
1541 positive_off_t_width, positive_off_t_width, "uncompressed");
1543 } else if (method < 0) {
/* No totals row unless both running totals are positive. */
1544 if (total_in <= 0 || total_out <= 0) return;
1548 if (verbose || !quiet) {
1549 fprint_off(stdout, total_in, positive_off_t_width);
1551 fprint_off(stdout, total_out, positive_off_t_width);
1554 display_ratio(total_out-(total_in-header_bytes), total_out, stdout);
1555 /* header_bytes is not meaningful but used to ensure the same
1556 * ratio if there is a single file.
1558 printf(" (totals)\n");
1561 crc = (ulg)~0; /* unknown */
1563 bytes_in = ifile_size;
/* The trailer is consulted only for DEFLATED input, without RECORD_IO,
   and when last_member is clear. */
1565 if (!RECORD_IO && method == DEFLATED && !last_member) {
1566 /* Get the crc and uncompressed size for gzip'ed (not zip'ed) files.
1567 * If the lseek fails, we could use read() to get to the end, but
1568 * --list is used to get quick results.
1569 * Use "gunzip < foo.gz | wc -c" to get the uncompressed size if
1570 * you are not concerned about speed.
1572 bytes_in = lseek(ifd, (off_t)(-8), SEEK_END);
1573 if (bytes_in != -1L) {
1576 if (read(ifd, (char*)buf, sizeof(buf)) != sizeof(buf)) {
1580 bytes_out = LG(buf+4);
1586 struct tm *tm = localtime (&time_stamp.tv_sec);
1587 printf ("%5s %08lx ", methods[method], crc);
1589 printf ("%s%3d %02d:%02d ",
1590 ("Jan\0Feb\0Mar\0Apr\0May\0Jun\0Jul\0Aug\0Sep\0Oct\0Nov\0Dec"
1592 tm->tm_mday, tm->tm_hour, tm->tm_min);
1594 printf ("??? ?? ??:?? ");
1596 fprint_off(stdout, bytes_in, positive_off_t_width);
1598 fprint_off(stdout, bytes_out, positive_off_t_width);
1600 if (bytes_in == -1L) {
1602 bytes_in = bytes_out = header_bytes = 0;
1603 } else if (total_in >= 0) {
1604 total_in += bytes_in;
1606 if (bytes_out == -1L) {
1608 bytes_in = bytes_out = header_bytes = 0;
1609 } else if (total_out >= 0) {
1610 total_out += bytes_out;
1612 display_ratio(bytes_out-(bytes_in-header_bytes), bytes_out, stdout);
1613 printf(" %s\n", ofname);
1616 /* ========================================================================
1617 * Shorten the given name by one character, or replace a .tar extension
1618 * with .tgz. Truncate the last part of the name which is longer than
1619 * MIN_PART characters: 1234.678.012.gz -> 123.678.012.gz. If the name
1620 * has only parts shorter than MIN_PART truncate the longest part.
1621 * For decompression, just remove the last character of the name.
1623 * IN assertion: for compression, the suffix of the given name is z_suffix.
/* Shorten NAME in place.  Three strategies are visible, in this order:
   rewrite a trailing .tar as .tgz; pick a name part longer than min_part
   (lowering min_part until one qualifies) and shorten it; otherwise cut
   at the last PART_SEP[0] separator.  In the last two cases z_suffix is
   copied back onto the end of the shortened name. */
1625 local void shorten_name(name)
1628 int len; /* length of name without z_suffix */
1629 char *trunc = NULL; /* character to be truncated */
1630 int plen; /* current part length */
1631 int min_part = MIN_PART; /* current minimum part length */
1637 gzip_error ("name too short");
/* P is set from get_suffix; NOTE(review): presumably it points at the
   start of the suffix inside NAME -- confirm against get_suffix. */
1641 p = get_suffix(name);
1643 gzip_error ("can't recover suffix\n");
1647 /* compress 1234567890.tar to 1234567890.tgz */
1648 if (len > 4 && strequ(p-4, ".tar")) {
1649 strcpy(p-4, ".tgz");
1652 /* Try keeping short extensions intact:
1653 * 1234.678.012.gz -> 123.678.012.gz
1656 p = strrchr(name, PATH_SEP);
1659 plen = strcspn(p, PART_SEP);
1661 if (plen > min_part) trunc = p-1;
1664 } while (trunc == NULL && --min_part != 0);
1666 if (trunc != NULL) {
1668 trunc[0] = trunc[1];
1672 trunc = strrchr(name, PART_SEP[0]);
1674 gzip_error ("internal error in shorten_name");
1675 if (trunc[1] == '\0') trunc--; /* force truncation */
/* Put the compression suffix back at the truncation point. */
1677 strcpy(trunc, z_suffix);
1680 /* ========================================================================
1681 * The compressed file already exists, so ask for confirmation.
1682 * Return ERROR if the file must be skipped.
/* Deal with an output file OFNAME that already exists: report it on
   stderr, ask the user whether to overwrite it when interaction is
   possible, and remove the existing file with xunlink. */
1684 local int check_ofname()
1686 /* Ask permission to overwrite the existing file */
1689 fprintf (stderr, "%s: %s already exists;", program_name, ofname);
/* Prompt only when running in the foreground and stdin is a terminal,
   or presume_input_tty is set. */
1690 if (foreground && (presume_input_tty || isatty(fileno(stdin)))) {
1691 fprintf(stderr, " do you wish to overwrite (y or n)? ");
1696 fprintf(stderr, "\tnot overwritten\n");
/* An OK exit status becomes WARNING; any other status is kept. */
1697 if (exit_code == OK) exit_code = WARNING;
/* A nonzero result from xunlink enters the failure branch. */
1701 if (xunlink (ofname)) {
1709 /* ========================================================================
1710 * Copy modes, times, ownership from input file to output file.
1711 * IN assertion: to_stdout is false.
/* Apply attributes of the input file, taken from IFSTAT, to the output
   file: access and modification times first, then ownership, then the
   permission bits.  Both a descriptor-based call (on ofd) and a
   name-based call (on ofname) are visible for ownership and mode; the
   condition selecting between them is not visible here. */
1713 local void copy_stat(ifstat)
1714 struct stat *ifstat;
/* Keep only the mode bits selected by S_IRWXUGO. */
1716 mode_t mode = ifstat->st_mode & S_IRWXUGO;
1720 struct timespec timespec[2];
1721 timespec[0] = get_stat_atime (ifstat);
1722 timespec[1] = get_stat_mtime (ifstat);
/* When decompressing, time_stamp replaces the input file's modification
   time if its tv_nsec is non-negative and it differs from that time.
   NOTE(review): a negative tv_nsec presumably marks an unset stamp --
   confirm where time_stamp is initialized. */
1724 if (decompress && 0 <= time_stamp.tv_nsec
1725 && ! (timespec[1].tv_sec == time_stamp.tv_sec
1726 && timespec[1].tv_nsec == time_stamp.tv_nsec))
1728 timespec[1] = time_stamp;
1730 fprintf(stderr, "%s: time stamp restored\n", ofname);
/* A nonzero result from fdutimens is treated as a failure to set times. */
1734 if (fdutimens (ofd, ofname, timespec) != 0)
1737 WARN ((stderr, "%s: ", program_name));
1747 /* Copy ownership */
/* Best effort: the result of the ownership change is explicitly ignored
   via ignore_value. */
1749 ignore_value (fchown (ofd, ifstat->st_uid, ifstat->st_gid));
1751 ignore_value (chown (ofname, ifstat->st_uid, ifstat->st_gid));
1755 /* Copy the protection modes */
1757 r = fchmod (ofd, mode);
1759 r = chmod (ofname, mode);
1763 WARN ((stderr, "%s: ", program_name));
1773 /* ========================================================================
1774 * Recurse through the given directory.
/* Process the directory DIR, which is already open on descriptor FD.
   The entry names are obtained through fdopendir and streamsavedir, and
   for every entry other than the dot and dot-dot entries the path
   DIR + separator + entry is assembled in nbuf.  Paths that do not fit
   in nbuf are reported on stderr as too long. */
1776 local void treat_dir (fd, dir)
1781 char nbuf[MAX_PATH_LEN];
1786 dirp = fdopendir (fd);
1794 entries = streamsavedir (dirp);
1797 if (closedir (dirp) != 0)
/* ENTRIES is walked as consecutive NUL-terminated names; the walk stops
   at an empty name. */
1802 for (entry = entries; *entry; entry += entrylen + 1) {
1803 size_t len = strlen (dir);
1804 entrylen = strlen (entry);
1805 if (strequ (entry, ".") || strequ (entry, ".."))
/* NOTE(review): the margin of 2 presumably leaves room for one separator
   and the terminating NUL -- confirm. */
1807 if (len + entrylen < MAX_PATH_LEN - 2) {
/* A separator is appended unless DIR is empty or already ends with one. */
1809 if (len != 0 /* dir = "" means current dir on Amiga */
1811 && dir[len-1] != PATH_SEP2
1814 && dir[len-1] != PATH_SEP3
1817 nbuf[len++] = PATH_SEP;
1819 strcpy (nbuf + len, entry);
1822 fprintf(stderr,"%s: %s/%s: pathname too long\n",
1823 program_name, dir, entry);
1829 #endif /* ! NO_DIR */
1831 /* Make sure signals get handled properly. */
/* Install abort_gzip_signal as the handler for every signal listed in
   handled_sig that is not currently ignored.  Two variants are visible,
   one built on sigaction and one on signal plus siginterrupt; the
   condition selecting between them is not visible here. */
1834 install_signal_handlers ()
1836 int nsigs = sizeof handled_sig / sizeof handled_sig[0];
1840 struct sigaction act;
1842 sigemptyset (&caught_signals);
1843 for (i = 0; i < nsigs; i++)
/* With a null new action, sigaction only reports the current disposition;
   signals not set to SIG_IGN are collected in caught_signals. */
1845 sigaction (handled_sig[i], NULL, &act);
1846 if (act.sa_handler != SIG_IGN)
1847 sigaddset (&caught_signals, handled_sig[i]);
1850 act.sa_handler = abort_gzip_signal;
/* All caught signals are blocked while the handler runs. */
1851 act.sa_mask = caught_signals;
1854 for (i = 0; i < nsigs; i++)
1855 if (sigismember (&caught_signals, handled_sig[i]))
1859 sigaction (handled_sig[i], &act, NULL);
/* signal-based variant: signal returns the previous disposition, so the
   handler is installed only for signals that were not being ignored. */
1862 for (i = 0; i < nsigs; i++)
1863 if (signal (handled_sig[i], SIG_IGN) != SIG_IGN)
1867 signal (handled_sig[i], abort_gzip_signal);
/* Let the signal interrupt system calls instead of restarting them. */
1868 siginterrupt (handled_sig[i], 1);
1873 /* ========================================================================
1874 * Free all dynamically allocated variables and exit with the given code.
/* Leave the program with status EXITCODE. */
1876 local void do_exit(exitcode)
/* Static, so the flag persists across calls. */
1879 static int in_exit = 0;
/* Re-entry guard: when the flag is already set, exit immediately. */
1881 if (in_exit) exit(exitcode);
1900 /* ========================================================================
1901 * Close and unlink the output file.
/* Take over the descriptor stored in remove_ofname_fd and reset that
   variable to -1, with the signals in caught_signals blocked for the
   duration.  NOTE(review): blocking presumably keeps a signal handler
   from acting on the same descriptor at the same time -- confirm. */
1904 remove_output_file ()
/* Block the caught signals, saving the previous mask in OLDSET. */
1909 sigprocmask (SIG_BLOCK, &caught_signals, &oldset);
1910 fd = remove_ofname_fd;
1913 remove_ofname_fd = -1;
/* Restore the signal mask that was in effect on entry. */
1917 sigprocmask (SIG_SETMASK, &oldset, NULL);
1920 /* ========================================================================
1926 remove_output_file ();
1930 /* ========================================================================
/* Handler that install_signal_handlers installs for the handled signals;
   SIG is the signal being delivered.  Visible steps: ignore SIG, remove
   the output file, compare SIG with exiting_signal, then reset SIG to its
   default disposition. */
1934 abort_gzip_signal (sig)
/* Ignore SIG from here on; any condition guarding this call is not
   visible here. */
1938 signal (sig, SIG_IGN);
1939 remove_output_file ();
1940 if (sig == exiting_signal)
/* Restore the default disposition for SIG. */
1942 signal (sig, SIG_DFL);