1
/* gzip (GNU zip) -- compress files with zip algorithm and 'compress' interface
3
Copyright (C) 1999, 2001-2002, 2006-2007, 2009-2012 Free Software
5
Copyright (C) 1992-1993 Jean-loup Gailly
7
This program is free software; you can redistribute it and/or modify
8
it under the terms of the GNU General Public License as published by
9
the Free Software Foundation; either version 3, or (at your option)
12
This program is distributed in the hope that it will be useful,
13
but WITHOUT ANY WARRANTY; without even the implied warranty of
14
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15
GNU General Public License for more details.
17
You should have received a copy of the GNU General Public License
18
along with this program; if not, write to the Free Software Foundation,
19
Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. */
22
* The unzip code was written and put in the public domain by Mark Adler.
23
* Portions of the lzw code are derived from the public domain 'compress'
24
* written by Spencer Thomas, Joe Orost, James Woods, Jim McKie, Steve Davies,
25
* Ken Turkowski, Dave Mack and Peter Jannesen.
27
* See the license_msg below and the file COPYING for the software license.
28
* See the file algorithm.doc for the compression algorithms and file formats.
31
static char const *const license_msg[] = {
32
"Copyright (C) 2007, 2010, 2011 Free Software Foundation, Inc.",
33
"Copyright (C) 1993 Jean-loup Gailly.",
34
"This is free software. You may redistribute copies of it under the terms of",
35
"the GNU General Public License <http://www.gnu.org/licenses/gpl.html>.",
36
"There is NO WARRANTY, to the extent permitted by law.",
39
/* Compress files with zip algorithm and 'compress' interface.
40
* See help() function below for all options.
42
* file.gz: compressed file with same mode, owner, and utimes
43
* or stdout with -c option or if stdin used as input.
44
* If the output file name had to be truncated, the original name is kept
45
* in the compressed file.
46
* On MSDOS, file.tmp -> file.tmz. On VMS, file.tmp -> file.tmp-gz.
48
* Using gz on MSDOS would create too many file name conflicts. For
49
* example, foo.txt -> foo.tgz (.tgz must be reserved as shorthand for
50
* tar.gz). Similarly, foo.dir and foo.doc would both be mapped to foo.dgz.
51
* I also considered 12345678.txt -> 12345txt.gz but this truncates the name
52
* too heavily. There is no ideal solution given the MSDOS 8+3 limitation.
54
* For the meaning of all compilation flags, see comments in Makefile.in.
59
#include <sys/types.h>
72
#include "fcntl-safer.h"
74
#include "ignore-value.h"
75
#include "stat-time.h"
98
#define RW_USER (S_IRUSR | S_IWUSR) /* creation mode for open() */
101
# define MAX_PATH_LEN 1024 /* max pathname length */
113
off_t lseek (int fd, off_t offset, int whence);
117
/* Minimum value of off_t, assuming a two's-complement representation with
   no padding bits (the same assumption the shift-based form made).
   It is computed as -1 - (2**(bits-1) - 1) with the power of two formed in
   an unsigned type, because left-shifting the negative value ~(off_t) 0
   is undefined behavior in ISO C.  */
#define OFF_T_MIN \
  (-(off_t) 1 - (off_t) ((1ULL << (sizeof (off_t) * CHAR_BIT - 1)) - 1))
121
#define OFF_T_MAX (~ (off_t) 0 - OFF_T_MIN)
124
/* Use SA_NOCLDSTOP as a proxy for whether the sigaction machinery is
127
# define SA_NOCLDSTOP 0
128
# define sigprocmask(how, set, oset) /* empty */
129
# define sigset_t int
130
# if ! HAVE_SIGINTERRUPT
131
# define siginterrupt(sig, flag) /* empty */
135
#ifndef HAVE_WORKING_O_NOFOLLOW
136
# define HAVE_WORKING_O_NOFOLLOW 0
139
/* Separator for file name parts (see shorten_name()) */
140
#ifdef NO_MULTIPLE_DOTS
141
# define PART_SEP "-"
143
# define PART_SEP "."
148
DECLARE(uch, inbuf, INBUFSIZ +INBUF_EXTRA);
149
DECLARE(uch, outbuf, OUTBUFSIZ+OUTBUF_EXTRA);
150
DECLARE(ush, d_buf, DIST_BUFSIZE);
151
DECLARE(uch, window, 2L*WSIZE);
153
DECLARE(ush, tab_prefix, 1L<<BITS);
155
DECLARE(ush, tab_prefix0, 1L<<(BITS-1));
156
DECLARE(ush, tab_prefix1, 1L<<(BITS-1));
159
/* local variables */
161
/* If true, pretend that standard input is a tty. This option
162
is deliberately not documented, and only for testing. */
163
static bool presume_input_tty;
165
static int ascii = 0; /* convert end-of-lines to local OS conventions */
166
int to_stdout = 0; /* output to stdout (-c) */
167
static int decompress = 0; /* decompress (-d) */
168
static int force = 0; /* don't ask questions, compress links (-f) */
169
/* Starts at -1 ("not set by any option"); main() replaces a negative
   value with the value of 'decompress' once option parsing is done. */
static int no_name = -1; /* don't save or restore the original file name */
170
/* Starts at -1 ("not set by any option"); main() replaces a negative
   value with the value of 'decompress' once option parsing is done. */
static int no_time = -1; /* don't save or restore the original file time */
171
static int recursive = 0; /* recurse through directories (-r) */
172
static int list = 0; /* list the file contents (-l) */
173
int verbose = 0; /* be verbose (-v) */
174
int quiet = 0; /* be very quiet (-q) */
175
static int do_lzw = 0; /* generate output compatible with old compress (-Z) */
176
int test = 0; /* test .gz file integrity */
177
static int foreground = 0; /* set if program run in foreground */
178
char *program_name; /* program name */
179
int maxbits = BITS; /* max bits per code for LZW */
180
int method = DEFLATED;/* compression method */
181
int level = 6; /* compression level */
182
int exit_code = OK; /* program exit code */
183
int save_orig_name; /* set if original name must be saved */
184
static int last_member; /* set for .zip and .Z files */
185
static int part_nb; /* number of parts in .gz file */
186
struct timespec time_stamp; /* original time stamp (modification time) */
187
off_t ifile_size; /* input file size, -1 for devices (debug only) */
188
static char *env; /* contents of GZIP env variable */
189
static char **args = NULL; /* argv pointer if GZIP env variable defined */
190
static char const *z_suffix; /* default suffix (can be set with --suffix) */
191
static size_t z_len; /* strlen(z_suffix) */
193
/* The set of signals that are caught. */
194
static sigset_t caught_signals;
196
/* If nonzero then exit with status WARNING, rather than with the usual
197
signal status, on receipt of a signal with this value. This
198
suppresses a "Broken Pipe" message with some shells. */
199
static int volatile exiting_signal;
201
/* If nonnegative, close this file descriptor and unlink ofname on error. */
202
static int volatile remove_ofname_fd = -1;
204
off_t bytes_in; /* number of input bytes */
205
off_t bytes_out; /* number of output bytes */
206
static off_t total_in; /* input bytes for all files */
207
static off_t total_out; /* output bytes for all files */
208
char ifname[MAX_PATH_LEN]; /* input file name */
209
char ofname[MAX_PATH_LEN]; /* output file name */
210
static struct stat istat; /* status for input file */
211
int ifd; /* input file descriptor */
212
int ofd; /* output file descriptor */
213
unsigned insize; /* valid bytes in inbuf */
214
unsigned inptr; /* index of next byte to be processed in inbuf */
215
unsigned outcnt; /* bytes in output buffer */
216
int rsync = 0; /* make rsyncable chunks */
218
static int handled_sig[] =
220
/* SIGINT must be first, as 'foreground' depends on it. */
238
/* For long options that have no equivalent short option, use a
239
non-character as a pseudo short option, starting with CHAR_MAX + 1. */
242
PRESUME_INPUT_TTY_OPTION = CHAR_MAX + 1
245
static const struct option longopts[] =
247
/* { name has_arg *flag val } */
248
{"ascii", 0, 0, 'a'}, /* ascii text mode */
249
{"to-stdout", 0, 0, 'c'}, /* write output on standard output */
250
{"stdout", 0, 0, 'c'}, /* write output on standard output */
251
{"decompress", 0, 0, 'd'}, /* decompress */
252
{"uncompress", 0, 0, 'd'}, /* decompress */
253
/* {"encrypt", 0, 0, 'e'}, encrypt */
254
{"force", 0, 0, 'f'}, /* force overwrite of output file */
255
{"help", 0, 0, 'h'}, /* give help */
256
/* {"pkzip", 0, 0, 'k'}, force output in pkzip format */
257
{"list", 0, 0, 'l'}, /* list .gz file contents */
258
{"license", 0, 0, 'L'}, /* display software license */
259
{"no-name", 0, 0, 'n'}, /* don't save or restore original name & time */
260
{"name", 0, 0, 'N'}, /* save or restore original name & time */
261
{"-presume-input-tty", no_argument, NULL, PRESUME_INPUT_TTY_OPTION},
262
{"quiet", 0, 0, 'q'}, /* quiet mode */
263
{"silent", 0, 0, 'q'}, /* quiet mode */
264
{"recursive", 0, 0, 'r'}, /* recurse through directories */
265
{"suffix", 1, 0, 'S'}, /* use given suffix instead of .gz */
266
{"test", 0, 0, 't'}, /* test compressed file integrity */
267
{"no-time", 0, 0, 'T'}, /* don't save or restore the time stamp */
268
{"verbose", 0, 0, 'v'}, /* verbose mode */
269
{"version", 0, 0, 'V'}, /* display version number */
270
{"fast", 0, 0, '1'}, /* compress faster */
271
{"best", 0, 0, '9'}, /* compress better */
272
{"lzw", 0, 0, 'Z'}, /* make output compatible with old compress */
273
{"bits", 1, 0, 'b'}, /* max number of bits per code (implies -Z) */
274
{"rsyncable", 0, 0, 'R'}, /* make rsync-friendly archive */
278
/* local functions */
280
local void try_help (void) ATTRIBUTE_NORETURN;
281
local void help (void);
282
local void license (void);
283
local void version (void);
284
local int input_eof (void);
285
local void treat_stdin (void);
286
local void treat_file (char *iname);
287
local int create_outfile (void);
288
local char *get_suffix (char *name);
289
local int open_input_file (char *iname, struct stat *sbuf);
290
local void discard_input_bytes (size_t nbytes, unsigned int flags);
291
local int make_ofname (void);
292
local void shorten_name (char *name);
293
local int get_method (int in);
294
local void do_list (int ifd, int method);
295
local int check_ofname (void);
296
local void copy_stat (struct stat *ifstat);
297
local void install_signal_handlers (void);
298
local void remove_output_file (void);
299
local RETSIGTYPE abort_gzip_signal (int);
300
local void do_exit (int exitcode) ATTRIBUTE_NORETURN;
301
int main (int argc, char **argv);
302
static int (*work) (int infile, int outfile) = zip; /* function to call */
305
local void treat_dir (int fd, char *dir);
308
/* Evaluates to 1 when the NUL-terminated strings S1 and S2 have identical
   contents, and to 0 otherwise. */
#define strequ(s1, s2) (!strcmp ((s1), (s2)))
313
fprintf (stderr, "Try `%s --help' for more information.\n",
318
/* ======================================================================== */
321
static char const* const help_msg[] = {
322
"Compress or uncompress FILEs (by default, compress FILES in-place).",
324
"Mandatory arguments to long options are mandatory for short options too.",
327
" -a, --ascii ascii text; convert end-of-line using local conventions",
329
" -c, --stdout write on standard output, keep original files unchanged",
330
" -d, --decompress decompress",
331
/* -e, --encrypt encrypt */
332
" -f, --force force overwrite of output file and compress links",
333
" -h, --help give this help",
334
/* -k, --pkzip force output in pkzip format */
335
" -l, --list list compressed file contents",
336
" -L, --license display software license",
338
" -m, --no-time do not save or restore the original modification time",
339
" -M, --time save or restore the original modification time",
341
" -n, --no-name do not save or restore the original name and time stamp",
342
" -N, --name save or restore the original name and time stamp",
343
" -q, --quiet suppress all warnings",
345
" -r, --recursive operate recursively on directories",
347
" -S, --suffix=SUF use suffix SUF on compressed files",
348
" -t, --test test compressed file integrity",
349
" -v, --verbose verbose mode",
350
" -V, --version display version number",
351
" -1, --fast compress faster",
352
" -9, --best compress better",
354
" -Z, --lzw produce output compatible with old compress",
355
" -b, --bits=BITS max number of bits per code (implies -Z)",
357
" --rsyncable Make rsync-friendly archive",
359
"With no FILE, or when FILE is -, read standard input.",
361
"Report bugs to <bug-gzip@gnu.org>.",
363
char const *const *p = help_msg;
365
printf ("Usage: %s [OPTION]... [FILE]...\n", program_name);
366
while (*p) printf ("%s\n", *p++);
369
/* ======================================================================== */
372
char const *const *p = license_msg;
374
printf ("%s %s\n", program_name, Version);
375
while (*p) printf ("%s\n", *p++);
378
/* ======================================================================== */
383
printf ("Written by Jean-loup Gailly.\n");
386
local void progerror (char const *string)
389
fprintf (stderr, "%s: ", program_name);
395
/* ======================================================================== */
396
int main (int argc, char **argv)
398
int file_count; /* number of files to process */
399
size_t proglen; /* length of program_name */
400
int optc; /* current option */
402
EXPAND(argc, argv); /* wild card expansion if necessary */
404
program_name = gzip_base_name (argv[0]);
405
proglen = strlen (program_name);
407
atexit (close_stdin);
409
/* Suppress .exe for MSDOS, OS/2 and VMS: */
410
if (4 < proglen && strequ (program_name + proglen - 4, ".exe"))
411
program_name[proglen - 4] = '\0';
413
/* Add options in GZIP environment variable if there is one */
414
env = add_envopt(&argc, &argv, OPTIONS_VAR);
415
if (env != NULL) args = argv;
418
# define GNU_STANDARD 1
421
/* For compatibility with old compress, use program name as an option.
422
* Unless you compile with -DGNU_STANDARD=0, this program will behave as
423
* gzip even if it is invoked under the name gunzip or zcat.
425
* Systems which do not support links can still use -d or -dc.
426
* Ignore an .exe extension for MSDOS, OS/2 and VMS.
428
if (strncmp (program_name, "un", 2) == 0 /* ungzip, uncompress */
429
|| strncmp (program_name, "gun", 3) == 0) /* gunzip */
431
else if (strequ (program_name + 1, "cat") /* zcat, pcat, gcat */
432
|| strequ (program_name, "gzcat")) /* gzcat */
433
decompress = to_stdout = 1;
437
z_len = strlen(z_suffix);
439
while ((optc = getopt_long (argc, argv, "ab:cdfhH?lLmMnNqrS:tvVZ123456789",
440
longopts, (int *)0)) != -1) {
445
maxbits = atoi(optarg);
446
for (; *optarg; optarg++)
447
if (! ('0' <= *optarg && *optarg <= '9'))
449
fprintf (stderr, "%s: -b operand is not an integer\n",
455
to_stdout = 1; break;
457
decompress = 1; break;
461
help(); do_exit(OK); break;
463
list = decompress = to_stdout = 1; break;
465
license(); do_exit(OK); break;
466
case 'm': /* undocumented, may change later */
468
case 'M': /* undocumented, may change later */
471
no_name = no_time = 1; break;
473
no_name = no_time = 0; break;
474
case PRESUME_INPUT_TTY_OPTION:
475
presume_input_tty = true; break;
477
quiet = 1; verbose = 0; break;
480
fprintf (stderr, "%s: -r not supported on this system\n",
491
#ifdef NO_MULTIPLE_DOTS
492
if (*optarg == '.') optarg++;
494
z_len = strlen(optarg);
498
test = decompress = to_stdout = 1;
501
verbose++; quiet = 0; break;
503
version(); do_exit(OK); break;
508
fprintf(stderr, "%s: -Z not supported in this version\n",
513
case '1': case '2': case '3': case '4':
514
case '5': case '6': case '7': case '8': case '9':
518
/* Error message already emitted by getopt_long. */
521
} /* loop on all arguments */
523
/* By default, save name and timestamp on compression but do not
524
* restore them on decompression.
526
if (no_time < 0) no_time = decompress;
527
if (no_name < 0) no_name = decompress;
529
file_count = argc - optind;
533
if (ascii && !quiet) {
534
fprintf(stderr, "%s: option --ascii ignored on this system\n",
538
if (z_len == 0 || z_len > MAX_SUFFIX) {
539
fprintf(stderr, "%s: invalid suffix '%s'\n", program_name, z_suffix);
543
if (do_lzw && !decompress) work = lzw;
545
/* Allocate all global buffers (for DYN_ALLOC option) */
546
ALLOC(uch, inbuf, INBUFSIZ +INBUF_EXTRA);
547
ALLOC(uch, outbuf, OUTBUFSIZ+OUTBUF_EXTRA);
548
ALLOC(ush, d_buf, DIST_BUFSIZE);
549
ALLOC(uch, window, 2L*WSIZE);
551
ALLOC(ush, tab_prefix, 1L<<BITS);
553
ALLOC(ush, tab_prefix0, 1L<<(BITS-1));
554
ALLOC(ush, tab_prefix1, 1L<<(BITS-1));
557
exiting_signal = quiet ? SIGPIPE : 0;
558
install_signal_handlers ();
560
/* And get to work */
561
if (file_count != 0) {
562
if (to_stdout && !test && !list && (!decompress || !ascii)) {
563
SET_BINARY_MODE(fileno(stdout));
565
while (optind < argc) {
566
treat_file(argv[optind++]);
568
} else { /* Standard input */
571
if (list && !quiet && file_count > 1) {
572
do_list(-1, -1); /* print totals */
575
return exit_code; /* just to avoid lint warning */
578
/* Return nonzero when at end of file on input. */
582
if (!decompress || last_member)
587
if (insize != INBUFSIZ || fill_inbuf (1) == EOF)
590
/* Unget the char that fill_inbuf got. */
597
/* ========================================================================
598
* Compress or decompress stdin
600
local void treat_stdin()
603
&& (presume_input_tty
604
|| isatty(fileno((FILE *)(decompress ? stdin : stdout))))) {
605
/* Do not send compressed data to the terminal or read it from
606
* the terminal. We get here when user invoked the program
607
* without parameters, so be helpful. According to the GNU standards:
609
* If there is one behavior you think is most useful when the output
610
* is to a terminal, and another that you think is most useful when
611
* the output is a file or a pipe, then it is usually best to make
612
* the default behavior the one that is useful with output to a
613
* terminal, and have an option for the other behavior.
615
* Here we use the --force option to get the other behavior.
619
("%s: compressed data not %s a terminal."
620
" Use -f to force %scompression.\n"
621
"For help, type: %s -h\n"),
623
decompress ? "read from" : "written to",
624
decompress ? "de" : "",
629
if (decompress || !ascii) {
630
SET_BINARY_MODE(fileno(stdin));
632
if (!test && !list && (!decompress || !ascii)) {
633
SET_BINARY_MODE(fileno(stdout));
635
strcpy(ifname, "stdin");
636
strcpy(ofname, "stdout");
638
/* Get the file's time stamp and size. */
639
if (fstat (fileno (stdin), &istat) != 0)
641
progerror ("standard input");
644
ifile_size = S_ISREG (istat.st_mode) ? istat.st_size : -1;
645
time_stamp.tv_nsec = -1;
646
if (!no_time || list)
648
if (S_ISREG (istat.st_mode))
649
time_stamp = get_stat_mtime (&istat);
651
gettime (&time_stamp);
654
clear_bufs(); /* clear input and output buffers */
660
method = get_method(ifd);
662
do_exit(exit_code); /* error message already emitted */
666
do_list(ifd, method);
670
/* Actually do the compression/decompression. Loop over zipped members.
673
if ((*work)(fileno(stdin), fileno(stdout)) != OK) return;
678
method = get_method(ifd);
679
if (method < 0) return; /* error message already emitted */
680
bytes_out = 0; /* required for length check */
685
fprintf(stderr, " OK\n");
687
} else if (!decompress) {
688
display_ratio(bytes_in-(bytes_out-header_bytes), bytes_in, stderr);
689
fprintf(stderr, "\n");
690
#ifdef DISPLAY_STDIN_RATIO
692
display_ratio(bytes_out-(bytes_in-header_bytes), bytes_out,stderr);
693
fprintf(stderr, "\n");
699
/* ========================================================================
700
* Compress or decompress the given file
702
local void treat_file(iname)
705
/* Accept "-" as synonym for stdin */
706
if (strequ(iname, "-")) {
707
int cflag = to_stdout;
713
/* Check if the input file is present, set ifname and istat: */
714
ifd = open_input_file (iname, &istat);
718
/* If the input name is that of a directory, recurse or ignore: */
719
if (S_ISDIR(istat.st_mode)) {
722
treat_dir (ifd, iname);
723
/* Warning: ifname is now garbage */
728
WARN ((stderr, "%s: %s is a directory -- ignored\n",
729
program_name, ifname));
735
if (! S_ISREG (istat.st_mode))
738
"%s: %s is not a directory or a regular file - ignored\n",
739
program_name, ifname));
743
if (istat.st_mode & S_ISUID)
745
WARN ((stderr, "%s: %s is set-user-ID on execution - ignored\n",
746
program_name, ifname));
750
if (istat.st_mode & S_ISGID)
752
WARN ((stderr, "%s: %s is set-group-ID on execution - ignored\n",
753
program_name, ifname));
760
if (istat.st_mode & S_ISVTX)
763
"%s: %s has the sticky bit set - file ignored\n",
764
program_name, ifname));
768
if (2 <= istat.st_nlink)
770
WARN ((stderr, "%s: %s has %lu other link%c -- unchanged\n",
771
program_name, ifname,
772
(unsigned long int) istat.st_nlink - 1,
773
istat.st_nlink == 2 ? ' ' : 's'));
780
ifile_size = S_ISREG (istat.st_mode) ? istat.st_size : -1;
781
time_stamp.tv_nsec = -1;
782
if (!no_time || list)
783
time_stamp = get_stat_mtime (&istat);
785
/* Generate output file name. For -r and (-t or -l), skip files
786
* without a valid gzip suffix (check done in make_ofname).
788
if (to_stdout && !list && !test) {
789
strcpy(ofname, "stdout");
791
} else if (make_ofname() != OK) {
796
clear_bufs(); /* clear input and output buffers */
800
method = get_method(ifd); /* updates ofname if original given */
803
return; /* error message already emitted */
807
do_list(ifd, method);
808
if (close (ifd) != 0)
813
/* If compressing to a file, check if ofname is not ambiguous
814
* because the operating system truncates names. Otherwise, generate
815
* a new ofname and save the original name in the compressed file.
818
ofd = fileno(stdout);
819
/* Keep remove_ofname_fd negative. */
821
if (create_outfile() != OK) return;
823
if (!decompress && save_orig_name && !verbose && !quiet) {
824
fprintf(stderr, "%s: %s compressed to %s\n",
825
program_name, ifname, ofname);
828
/* Keep the name even if not truncated except with --no-name: */
829
if (!save_orig_name) save_orig_name = !no_name;
832
fprintf(stderr, "%s:\t", ifname);
835
/* Actually do the compression/decompression. Loop over zipped members.
838
if ((*work)(ifd, ofd) != OK) {
839
method = -1; /* force cleanup */
846
method = get_method(ifd);
847
if (method < 0) break; /* error message already emitted */
848
bytes_out = 0; /* required for length check */
851
if (close (ifd) != 0)
860
if (close (ofd) != 0)
863
sigprocmask (SIG_BLOCK, &caught_signals, &oldset);
864
remove_ofname_fd = -1;
865
unlink_errno = xunlink (ifname) == 0 ? 0 : errno;
866
sigprocmask (SIG_SETMASK, &oldset, NULL);
870
WARN ((stderr, "%s: ", program_name));
873
errno = unlink_errno;
881
remove_output_file ();
885
/* Display statistics */
888
fprintf(stderr, " OK");
889
} else if (decompress) {
890
display_ratio(bytes_out-(bytes_in-header_bytes), bytes_out,stderr);
892
display_ratio(bytes_in-(bytes_out-header_bytes), bytes_in, stderr);
894
if (!test && !to_stdout) {
895
fprintf(stderr, " -- replaced with %s", ofname);
897
fprintf(stderr, "\n");
901
/* ========================================================================
902
* Create the output file. Return OK or ERROR.
903
* Try several times if necessary to avoid truncating the z_suffix. For
904
* example, do not create a compressed file of name "1234567890123."
905
* Sets save_orig_name to true if the file name has been truncated.
906
* IN assertions: the input file has already been open (ifd is set) and
907
* ofname has already been updated if there was an original name.
908
* OUT assertions: ifd and ofd are closed in case of error.
910
local int create_outfile()
912
int name_shortened = 0;
913
int flags = (O_WRONLY | O_CREAT | O_EXCL
914
| (ascii && decompress ? 0 : O_BINARY));
921
sigprocmask (SIG_BLOCK, &caught_signals, &oldset);
922
remove_ofname_fd = ofd = OPEN (ofname, flags, RW_USER);
924
sigprocmask (SIG_SETMASK, &oldset, NULL);
933
shorten_name (ofname);
939
if (check_ofname () != OK)
953
if (name_shortened && decompress)
955
/* name might be too long if an original name was saved */
956
WARN ((stderr, "%s: %s: warning, name truncated\n",
957
program_name, ofname));
963
/* ========================================================================
964
* Return a pointer to the 'z' suffix of a file name, or NULL. For all
965
* systems, ".gz", ".z", ".Z", ".taz", ".tgz", "-gz", "-z" and "_z" are
966
* accepted suffixes, in addition to the value of the --suffix option.
967
* ".tgz" is a useful convention for tar.z files on systems limited
968
* to 3-character extensions. On such systems, ".?z" and ".??z" are
969
* also accepted suffixes. For Unix, we do not want to accept any
970
* .??z suffix as indicating a compressed file; some people use .xyz
971
* to denote volume data.
972
* On systems allowing multiple versions of the same file (such as VMS),
973
* this function removes any version suffix in the given name.
975
local char *get_suffix(name)
979
char suffix[MAX_SUFFIX+3]; /* last chars of name, forced to lower case */
980
static char const *known_suffixes[] =
981
{NULL, ".gz", ".z", ".taz", ".tgz", "-gz", "-z", "_z",
986
char const **suf = known_suffixes;
989
if (strequ(z_suffix, "z")) suf++; /* check long suffixes first */
992
/* strip a version number from the file name */
994
char *v = strrchr(name, SUFFIX_SEP);
995
if (v != NULL) *v = '\0';
999
if (nlen <= MAX_SUFFIX+2) {
1000
strcpy(suffix, name);
1002
strcpy(suffix, name+nlen-MAX_SUFFIX-2);
1005
slen = strlen(suffix);
1007
int s = strlen(*suf);
1008
if (slen > s && suffix[slen-s-1] != PATH_SEP
1009
&& strequ(suffix + slen - s, *suf)) {
1012
} while (*++suf != NULL);
1018
/* Open file NAME with the given flags and mode and store its status
1019
into *ST. Return a file descriptor to the newly opened file, or -1
1020
(setting errno) on failure. */
1022
open_and_stat (char *name, int flags, mode_t mode, struct stat *st)
1026
/* Refuse to follow symbolic links unless -c or -f. */
1027
if (!to_stdout && !force)
1029
if (HAVE_WORKING_O_NOFOLLOW)
1030
flags |= O_NOFOLLOW;
1033
#if HAVE_LSTAT || defined lstat
1034
if (lstat (name, st) != 0)
1036
else if (S_ISLNK (st->st_mode))
1045
fd = OPEN (name, flags, mode);
1046
if (0 <= fd && fstat (fd, st) != 0)
1057
/* ========================================================================
1058
* Set ifname to the input file name (with a suffix appended if necessary)
1059
* and istat to its stats. For decompression, if no file exists with the
1060
* original name, try adding successively z_suffix, .gz, .z, -z and .Z.
1061
* For MSDOS, we try only z_suffix and z.
1062
* Return an open file descriptor or -1.
1065
open_input_file (iname, sbuf)
1069
int ilen; /* strlen(ifname) */
1070
int z_suffix_errno = 0;
1071
static char const *suffixes[] = {NULL, ".gz", ".z", "-z", ".Z", NULL};
1072
char const **suf = suffixes;
1074
#ifdef NO_MULTIPLE_DOTS
1075
char *dot; /* pointer to ifname extension, or NULL */
1078
int open_flags = (O_RDONLY | O_NONBLOCK | O_NOCTTY
1079
| (ascii && !decompress ? 0 : O_BINARY));
1083
if (sizeof ifname - 1 <= strlen (iname))
1086
strcpy(ifname, iname);
1088
/* If input file exists, return OK. */
1089
fd = open_and_stat (ifname, open_flags, RW_USER, sbuf);
1093
if (!decompress || errno != ENOENT) {
1097
/* file.ext doesn't exist, try adding a suffix (after removing any
1098
* version number for VMS).
1100
s = get_suffix(ifname);
1102
progerror(ifname); /* ifname already has z suffix and does not exist */
1105
#ifdef NO_MULTIPLE_DOTS
1106
dot = strrchr(ifname, '.');
1108
strcat(ifname, ".");
1109
dot = strrchr(ifname, '.');
1112
ilen = strlen(ifname);
1113
if (strequ(z_suffix, ".gz")) suf++;
1115
/* Search for all suffixes */
1117
char const *s0 = s = *suf;
1118
strcpy (ifname, iname);
1119
#ifdef NO_MULTIPLE_DOTS
1121
if (*dot == '\0') strcpy (dot, ".");
1123
#ifdef MAX_EXT_CHARS
1124
if (MAX_EXT_CHARS < strlen (s) + strlen (dot + 1))
1125
dot[MAX_EXT_CHARS + 1 - strlen (s)] = '\0';
1127
if (sizeof ifname <= ilen + strlen (s))
1130
fd = open_and_stat (ifname, open_flags, RW_USER, sbuf);
1133
if (errno != ENOENT)
1138
if (strequ (s0, z_suffix))
1139
z_suffix_errno = errno;
1140
} while (*++suf != NULL);
1142
/* No suffix found, complain using z_suffix: */
1143
strcpy(ifname, iname);
1144
#ifdef NO_MULTIPLE_DOTS
1145
if (*dot == '\0') strcpy(dot, ".");
1147
#ifdef MAX_EXT_CHARS
1148
if (MAX_EXT_CHARS < z_len + strlen (dot + 1))
1149
dot[MAX_EXT_CHARS + 1 - z_len] = '\0';
1151
strcat(ifname, z_suffix);
1152
errno = z_suffix_errno;
1157
fprintf (stderr, "%s: %s: file name too long\n", program_name, iname);
1162
/* ========================================================================
1163
* Generate ofname given ifname. Return OK, or WARNING if file must be skipped.
1164
* Sets save_orig_name to true if the file name has been truncated.
1166
local int make_ofname()
1168
char *suff; /* ofname z suffix */
1170
strcpy(ofname, ifname);
1171
/* strip a version number if any and get the gzip suffix if present: */
1172
suff = get_suffix(ofname);
1176
/* With -t or -l, try all files (even without .gz suffix)
1177
* except with -r (behave as with just -dr).
1179
if (!recursive && (list || test)) return OK;
1181
/* Avoid annoying messages with -r */
1182
if (verbose || (!recursive && !quiet)) {
1183
WARN((stderr,"%s: %s: unknown suffix -- ignored\n",
1184
program_name, ifname));
1188
/* Make a special case for .tgz and .taz: */
1190
if (strequ(suff, ".tgz") || strequ(suff, ".taz")) {
1191
strcpy(suff, ".tar");
1193
*suff = '\0'; /* strip the z suffix */
1195
/* ofname might be changed later if infile contains an original name */
1197
} else if (suff && ! force) {
1198
/* Avoid annoying messages with -r (see treat_dir()) */
1199
if (verbose || (!recursive && !quiet)) {
1200
/* Don't use WARN, as it affects exit status. */
1201
fprintf (stderr, "%s: %s already has %s suffix -- unchanged\n",
1202
program_name, ifname, suff);
1208
#ifdef NO_MULTIPLE_DOTS
1209
suff = strrchr(ofname, '.');
1211
if (sizeof ofname <= strlen (ofname) + 1)
1213
strcat(ofname, ".");
1214
# ifdef MAX_EXT_CHARS
1215
if (strequ(z_suffix, "z")) {
1216
if (sizeof ofname <= strlen (ofname) + 2)
1218
strcat(ofname, "gz"); /* enough room */
1221
/* On the Atari and some versions of MSDOS,
1222
* ENAMETOOLONG does not work correctly. So we
1223
* must truncate here.
1225
} else if (strlen(suff)-1 + z_len > MAX_SUFFIX) {
1226
suff[MAX_SUFFIX+1-z_len] = '\0';
1230
#endif /* NO_MULTIPLE_DOTS */
1231
if (sizeof ofname <= strlen (ofname) + z_len)
1233
strcat(ofname, z_suffix);
1235
} /* decompress ? */
1239
WARN ((stderr, "%s: %s: file name too long\n", program_name, ifname));
1243
/* Discard NBYTES input bytes from the input, or up through the next
1244
zero byte if NBYTES == (size_t) -1. If FLAGS say that the header
1245
CRC should be computed, update the CRC accordingly. */
1247
discard_input_bytes (nbytes, flags)
1253
uch c = get_byte ();
1254
if (flags & HEADER_CRC)
1256
if (nbytes != (size_t) -1)
1263
/* ========================================================================
1264
* Check the magic number of the input file and update ofname if an
1265
* original name was given and to_stdout is not set.
1266
* Return the compression method, -1 for error, -2 for warning.
1267
* Set inptr to the offset of the next byte to be processed.
1268
* Updates time_stamp if there is one and --no-time is not used.
1269
* This function may be called repeatedly for an input file consisting
1270
* of several contiguous gzip'ed members.
1271
* IN assertions: there is at least one remaining compressed member.
1272
* If the member is a zip file, it must be the only one.
1274
/* get_method: read the header of the next input member and work out which
 * decompression method applies.
 *
 * in: input file descriptor; in the visible lines it is only handed to
 *     check_zipfile().
 *
 * What the visible lines do:
 *   - read the two magic bytes, with try_byte() when force && to_stdout and
 *     with get_byte() otherwise;
 *   - set method to -1, increment part_nb and set last_member = RECORD_IO;
 *   - on GZIP_MAGIC or OLD_GZIP_MAGIC: read the method byte (anything other
 *     than DEFLATED is reported as unsupported), the flags byte (ENCRYPTED and
 *     RESERVED bits are reported as unsupported), the time stamp and two more
 *     header bytes, then handle the extra field, original name, comment and
 *     header checksum according to the flag bits;
 *   - otherwise compare against PKZIP_MAGIC, PACK_MAGIC, LZW_MAGIC and
 *     LZH_MAGIC, with a pass-through branch for force && to_stdout && !list.
 *
 * Returns method when it is >= 0; the visible failure paths return -1.
 *
 * NOTE(review): this listing carries bare line-number lines between the
 * statements, and the numbering skips, so braces, else-branches and some
 * statements are absent.  Check the block against the upstream file before
 * relying on it or compiling it.
 */
local int get_method(in)
1275
int in; /* input file descriptor */
1277
uch flags; /* compression flags */
1278
uch magic[10]; /* magic header */
1279
int imagic0; /* first magic byte or EOF */
1280
int imagic1; /* like magic[1], but can represent EOF */
1281
ulg stamp; /* time stamp */
1283
/* If --force and --stdout, zcat == cat, so do not complain about
1284
* premature end of file: use try_byte instead of get_byte.
1286
if (force && to_stdout) {
1287
imagic0 = try_byte();
1289
imagic1 = try_byte ();
1291
/* If try_byte returned EOF, magic[1] == (char) EOF. */
1293
magic[0] = get_byte ();
1296
magic[1] = get_byte ();
1297
imagic1 = 0; /* avoid lint warning */
1299
imagic1 = try_byte ();
1303
method = -1; /* unknown yet */
1304
part_nb++; /* number of parts in gzip file */
1306
last_member = RECORD_IO;
1307
/* assume multiple members in gzip file except for record oriented I/O */
1309
if (memcmp(magic, GZIP_MAGIC, 2) == 0
1310
|| memcmp(magic, OLD_GZIP_MAGIC, 2) == 0) {
1312
method = (int)get_byte();
1313
if (method != DEFLATED) {
1315
"%s: %s: unknown method %d -- not supported\n",
1316
program_name, ifname, method);
1321
flags = (uch)get_byte();
1323
if ((flags & ENCRYPTED) != 0) {
1325
"%s: %s is encrypted -- not supported\n",
1326
program_name, ifname);
1330
if ((flags & RESERVED) != 0) {
1332
"%s: %s has flags 0x%x -- not supported\n",
1333
program_name, ifname, flags);
1335
if (force <= 1) return -1;
1337
/* The time stamp is read as four bytes, least significant byte first. */
stamp = (ulg)get_byte();
1338
stamp |= ((ulg)get_byte()) << 8;
1339
stamp |= ((ulg)get_byte()) << 16;
1340
stamp |= ((ulg)get_byte()) << 24;
1341
/* Only a non-zero stamp is recorded, and only when no_time is off. */
if (stamp != 0 && !no_time)
1343
time_stamp.tv_sec = stamp;
1344
time_stamp.tv_nsec = 0;
1347
magic[8] = get_byte (); /* Ignore extra flags. */
1348
magic[9] = get_byte (); /* Ignore OS type. */
1350
/* With HEADER_CRC set, header values already consumed are stored back into
 * magic[] (presumably so they can be checksummed; that call is not visible
 * in this listing -- confirm against upstream). */
if (flags & HEADER_CRC)
1352
magic[2] = DEFLATED;
1354
magic[4] = stamp & 0xff;
1355
magic[5] = (stamp >> 8) & 0xff;
1356
magic[6] = (stamp >> 16) & 0xff;
1357
magic[7] = stamp >> 24;
1362
if ((flags & EXTRA_FIELD) != 0) {
1364
/* Extra field length: 16 bits, low byte first. */
unsigned int len = lenbuf[0] = get_byte ();
1365
len |= (lenbuf[1] = get_byte ()) << 8;
1367
fprintf(stderr,"%s: %s: extra field of %u bytes ignored\n",
1368
program_name, ifname, len);
1370
if (flags & HEADER_CRC)
1372
discard_input_bytes (len, flags);
1375
/* Get original file name if it was truncated */
1376
if ((flags & ORIG_NAME) != 0) {
1377
if (no_name || (to_stdout && !list) || part_nb > 1) {
1378
/* Discard the old name */
1379
/* NOTE(review): -1 presumably means "skip up to the terminating NUL";
 * confirm in discard_input_bytes. */
discard_input_bytes (-1, flags);
1381
/* Copy the base name. Keep a directory prefix intact. */
1382
char *p = gzip_base_name (ofname);
1385
/* Name bytes are stored one at a time up to and including the NUL; running
 * past the end of ofname is reported as corrupted input. */
*p = (char) get_byte ();
1386
if (*p++ == '\0') break;
1387
if (p >= ofname+sizeof(ofname)) {
1388
gzip_error ("corrupted input -- file name too large");
1391
if (flags & HEADER_CRC)
1392
updcrc ((uch *) base, p - base);
1393
p = gzip_base_name (base);
1394
memmove (base, p, strlen (p) + 1);
1395
/* If necessary, adapt the name to local OS conventions: */
1397
MAKE_LEGAL_NAME(base);
1398
if (base) list=0; /* avoid warning about unused variable */
1400
} /* no_name || to_stdout */
1403
/* Discard file comment if any */
1404
if ((flags & COMMENT) != 0) {
1405
discard_input_bytes (-1, flags);
1408
if (flags & HEADER_CRC)
1410
/* The low 16 bits of the value returned by updcrc (magic, 0) are compared
 * with the stored 16-bit checksum, which is read low byte first. */
unsigned int crc16 = updcrc (magic, 0) & 0xffff;
1411
unsigned int header16 = get_byte ();
1412
header16 |= ((unsigned int) get_byte ()) << 8;
1413
if (header16 != crc16)
1416
"%s: %s: header checksum 0x%04x != computed checksum 0x%04x\n",
1417
program_name, ifname, header16, crc16);
1425
header_bytes = inptr + 2*4; /* include crc and size */
1428
} else if (memcmp(magic, PKZIP_MAGIC, 2) == 0 && inptr == 2
1429
&& memcmp((char*)inbuf, PKZIP_MAGIC, 4) == 0) {
1430
/* To simplify the code, we support a zip file when alone only.
1431
* We are thus guaranteed that the entire local header fits in inbuf.
1435
if (check_zipfile(in) != OK) return -1;
1436
/* check_zipfile may get ofname from the local header */
1439
} else if (memcmp(magic, PACK_MAGIC, 2) == 0) {
1443
} else if (memcmp(magic, LZW_MAGIC, 2) == 0) {
1445
method = COMPRESSED;
1448
} else if (memcmp(magic, LZH_MAGIC, 2) == 0) {
1453
} else if (force && to_stdout && !list) { /* pass input unchanged */
1459
if (imagic0 != EOF) {
1460
write_buf(fileno(stdout), magic, 1);
1464
if (method >= 0) return method;
1467
fprintf (stderr, "\n%s: %s: not in gzip format\n",
1468
program_name, ifname);
1475
/* Consume zero bytes, starting from the second magic byte already read. */
for (inbyte = imagic1; inbyte == 0; inbyte = try_byte ())
1480
WARN ((stderr, "\n%s: %s: decompression OK, trailing zero bytes ignored\n",
1481
program_name, ifname));
1486
WARN((stderr, "\n%s: %s: decompression OK, trailing garbage ignored\n",
1487
program_name, ifname));
1492
/* ========================================================================
1493
* Display the characteristics of the compressed file.
1494
* If the given method is < 0, display the accumulated totals.
1495
* IN assertions: time_stamp, header_bytes and ifile_size are initialized.
1497
/* do_list: print the listing line for one compressed file, or the totals
 * line when method < 0.
 *
 * ifd:    input file descriptor; used to seek to 8 bytes before the end of
 *         the file and to read from there.
 * method: compression method, used as an index into methods[]; a negative
 *         value selects the totals line.
 *
 * Adds bytes_in and bytes_out to the running totals total_in and total_out,
 * and prints through printf, fprint_off and display_ratio on stdout.
 *
 * NOTE(review): this listing carries bare line-number lines between the
 * statements, and the numbering skips, so braces, comment terminators and
 * some statements are absent.  Check the block against the upstream file
 * before relying on it or compiling it.
 */
local void do_list(ifd, method)
1498
int ifd; /* input file descriptor */
1499
int method; /* compression method */
1501
ulg crc; /* original crc */
1502
static int first_time = 1;
1503
static char const *const methods[MAX_METHODS] = {
1508
"", "", "", "", /* 4 to 7 reserved */
1510
int positive_off_t_width = 1;
1513
/* Count the decimal digits of OFF_T_MAX; the result is the column width
 * used for the size columns below. */
for (o = OFF_T_MAX; 9 < o; o /= 10) {
1514
positive_off_t_width++;
1517
/* Column headings are printed when first_time is set and a real method
 * (>= 0) is given. */
if (first_time && method >= 0) {
1520
printf("method crc date time ");
1523
printf("%*.*s %*.*s ratio uncompressed_name\n",
1524
positive_off_t_width, positive_off_t_width, "compressed",
1525
positive_off_t_width, positive_off_t_width, "uncompressed");
1527
} else if (method < 0) {
1528
if (total_in <= 0 || total_out <= 0) return;
1532
if (verbose || !quiet) {
1533
fprint_off(stdout, total_in, positive_off_t_width);
1535
fprint_off(stdout, total_out, positive_off_t_width);
1538
display_ratio(total_out-(total_in-header_bytes), total_out, stdout);
1539
/* header_bytes is not meaningful but used to ensure the same
1540
* ratio if there is a single file.
1542
printf(" (totals)\n");
1545
crc = (ulg)~0; /* unknown */
1547
bytes_in = ifile_size;
1549
/* The lines below seek to 8 bytes before the end of the file, read from
 * there into buf, and take bytes_out from LG(buf+4). */
if (!RECORD_IO && method == DEFLATED && !last_member) {
1550
/* Get the crc and uncompressed size for gzip'ed (not zip'ed) files.
1551
* If the lseek fails, we could use read() to get to the end, but
1552
* --list is used to get quick results.
1553
* Use "gunzip < foo.gz | wc -c" to get the uncompressed size if
1554
* you are not concerned about speed.
1556
bytes_in = lseek(ifd, (off_t)(-8), SEEK_END);
1557
if (bytes_in != -1L) {
1560
if (read(ifd, (char*)buf, sizeof(buf)) != sizeof(buf)) {
1564
bytes_out = LG(buf+4);
1570
struct tm *tm = localtime (&time_stamp.tv_sec);
1571
printf ("%5s %08lx ", methods[method], crc);
1573
printf ("%s%3d %02d:%02d ",
1574
("Jan\0Feb\0Mar\0Apr\0May\0Jun\0Jul\0Aug\0Sep\0Oct\0Nov\0Dec"
1576
tm->tm_mday, tm->tm_hour, tm->tm_min);
1578
printf ("??? ?? ??:?? ");
1580
fprint_off(stdout, bytes_in, positive_off_t_width);
1582
fprint_off(stdout, bytes_out, positive_off_t_width);
1584
if (bytes_in == -1L) {
1586
bytes_in = bytes_out = header_bytes = 0;
1587
} else if (total_in >= 0) {
1588
total_in += bytes_in;
1590
if (bytes_out == -1L) {
1592
bytes_in = bytes_out = header_bytes = 0;
1593
} else if (total_out >= 0) {
1594
total_out += bytes_out;
1596
display_ratio(bytes_out-(bytes_in-header_bytes), bytes_out, stdout);
1597
printf(" %s\n", ofname);
1600
/* ========================================================================
1601
* Shorten the given name by one character, or replace a .tar extension
1602
* with .tgz. Truncate the last part of the name which is longer than
1603
* MIN_PART characters: 1234.678.012.gz -> 123.678.012.gz. If the name
1604
* has only parts shorter than MIN_PART truncate the longest part.
1605
* For decompression, just remove the last character of the name.
1607
* IN assertion: for compression, the suffix of the given name is z_suffix.
1609
/* shorten_name: make NAME shorter, in place.
 *
 * name: the file name to shorten; it is modified through strcpy and through
 *       direct character stores.
 *
 * What the visible lines do:
 *   - two gzip_error calls ("name too short", "can't recover suffix") guard
 *     the start; their conditions are not visible in this listing;
 *   - p is set to get_suffix(name);
 *   - when len > 4 and the four characters before p are ".tar", they are
 *     overwritten with ".tgz";
 *   - otherwise the name parts are measured with strcspn(p, PART_SEP),
 *     starting from strrchr(name, PATH_SEP), looking for a part longer than
 *     min_part; min_part is decremented until a candidate is found or it
 *     reaches zero;
 *   - finally z_suffix is copied to the position held in trunc.
 *
 * NOTE(review): this listing carries bare line-number lines between the
 * statements, and the numbering skips, so braces, loop headers and some
 * statements are absent.  Check the block against the upstream file before
 * relying on it or compiling it.
 */
local void shorten_name(name)
1612
int len; /* length of name without z_suffix */
1613
char *trunc = NULL; /* character to be truncated */
1614
int plen; /* current part length */
1615
int min_part = MIN_PART; /* current minimum part length */
1621
gzip_error ("name too short");
1625
p = get_suffix(name);
1627
gzip_error ("can't recover suffix\n");
1631
/* compress 1234567890.tar to 1234567890.tgz */
1632
if (len > 4 && strequ(p-4, ".tar")) {
1633
strcpy(p-4, ".tgz");
1636
/* Try keeping short extensions intact:
1637
* 1234.678.012.gz -> 123.678.012.gz
1640
p = strrchr(name, PATH_SEP);
1643
plen = strcspn(p, PART_SEP);
1645
if (plen > min_part) trunc = p-1;
1648
} while (trunc == NULL && --min_part != 0);
1650
if (trunc != NULL) {
1652
trunc[0] = trunc[1];
1656
trunc = strrchr(name, PART_SEP[0]);
1658
gzip_error ("internal error in shorten_name");
1659
if (trunc[1] == '\0') trunc--; /* force truncation */
1661
/* Write the suffix at the truncation point. */
strcpy(trunc, z_suffix);
1664
/* ========================================================================
1665
* The compressed file already exists, so ask for confirmation.
1666
* Return ERROR if the file must be skipped.
1668
/* check_ofname: deal with an output file name (ofname) that is already in
 * use.
 *
 * What the visible lines do:
 *   - print "<program_name>: <ofname> already exists;" on stderr;
 *   - when foreground is set and stdin is a terminal (or presume_input_tty is
 *     set), prompt " do you wish to overwrite (y or n)? ";
 *   - on the refusal path print "\tnot overwritten\n" and raise exit_code
 *     from OK to WARNING;
 *   - call xunlink (ofname) and test its result.
 *
 * NOTE(review): the return statements, the code that reads the answer and
 * all braces are absent from this listing (it carries bare line-number lines
 * and the numbering skips).  Check against the upstream file for the return
 * contract.
 */
local int check_ofname()
1670
/* Ask permission to overwrite the existing file */
1673
fprintf (stderr, "%s: %s already exists;", program_name, ofname);
1674
if (foreground && (presume_input_tty || isatty(fileno(stdin)))) {
1675
fprintf(stderr, " do you wish to overwrite (y or n)? ");
1680
fprintf(stderr, "\tnot overwritten\n");
1681
/* Never downgrade an exit code that is already worse than OK. */
if (exit_code == OK) exit_code = WARNING;
1685
if (xunlink (ofname)) {
1693
/* ========================================================================
1694
* Copy modes, times, ownership from input file to output file.
1695
* IN assertion: to_stdout is false.
1697
/* copy_stat: apply attributes taken from the input file's stat record to the
 * output file (ofd / ofname).
 *
 * ifstat: stat record of the input file; st_mode, st_uid, st_gid and the
 *         access/modification times are read from it.
 *
 * What the visible lines do:
 *   - mode is st_mode masked with S_IRWXUGO;
 *   - timespec[0] / timespec[1] start as the input's atime / mtime; when
 *     decompressing with time_stamp.tv_nsec >= 0 and time_stamp different
 *     from that mtime, timespec[1] becomes time_stamp and
 *     "<ofname>: time stamp restored" is printed;
 *   - the times are applied with fdutimens, with a WARN on failure;
 *   - ownership is applied with fchown / chown, results deliberately ignored;
 *   - the mode is applied with fchmod / chmod, with a WARN on failure.
 *
 * NOTE(review): this listing carries bare line-number lines between the
 * statements, and the numbering skips, so braces, conditionals and some
 * statements are absent.  Check the block against the upstream file before
 * relying on it or compiling it.
 */
local void copy_stat(ifstat)
1698
struct stat *ifstat;
1700
mode_t mode = ifstat->st_mode & S_IRWXUGO;
1704
struct timespec timespec[2];
1705
timespec[0] = get_stat_atime (ifstat);
1706
timespec[1] = get_stat_mtime (ifstat);
1708
/* Prefer time_stamp over the input file's mtime when the two differ.
 * NOTE(review): a negative tv_nsec presumably marks "no stamp available";
 * confirm where time_stamp is set. */
if (decompress && 0 <= time_stamp.tv_nsec
1709
&& ! (timespec[1].tv_sec == time_stamp.tv_sec
1710
&& timespec[1].tv_nsec == time_stamp.tv_nsec))
1712
timespec[1] = time_stamp;
1714
fprintf(stderr, "%s: time stamp restored\n", ofname);
1718
if (fdutimens (ofd, ofname, timespec) != 0)
1721
WARN ((stderr, "%s: ", program_name));
1731
/* Copy ownership */
1733
/* NOTE(review): both the descriptor-based and the name-based call appear
 * here and again for the mode below; presumably a preprocessor conditional,
 * not visible in this listing, selects one of each pair. */
ignore_value (fchown (ofd, ifstat->st_uid, ifstat->st_gid));
1735
ignore_value (chown (ofname, ifstat->st_uid, ifstat->st_gid));
1739
/* Copy the protection modes */
1741
r = fchmod (ofd, mode);
1743
r = chmod (ofname, mode);
1747
WARN ((stderr, "%s: ", program_name));
1757
/* ========================================================================
1758
* Recurse through the given directory.
1760
/* treat_dir: walk the entries of directory DIR.
 *
 * fd:  descriptor for the directory; handed to fdopendir.
 * dir: directory name; used as the prefix of each path built in nbuf and in
 *      the "pathname too long" message.
 *
 * What the visible lines do:
 *   - open the directory stream with fdopendir and collect its entries with
 *     streamsavedir, then closedir the stream;
 *   - walk entries as consecutive NUL-terminated names, stopping at an empty
 *     one; "." and ".." are tested for explicitly;
 *   - when len + entrylen < MAX_PATH_LEN - 2, build the path in nbuf (a
 *     PATH_SEP is appended unless dir is empty or already ends in a
 *     separator), otherwise report "pathname too long".
 *
 * NOTE(review): what is done with nbuf afterwards, the error handling and
 * all braces are absent from this listing (it carries bare line-number lines
 * and the numbering skips).  Check against the upstream file.
 */
local void treat_dir (fd, dir)
1765
char nbuf[MAX_PATH_LEN];
1770
dirp = fdopendir (fd);
1778
entries = streamsavedir (dirp);
1781
if (closedir (dirp) != 0)
1786
/* Each name is followed by its NUL; an empty name ends the sequence. */
for (entry = entries; *entry; entry += entrylen + 1) {
1787
size_t len = strlen (dir);
1788
entrylen = strlen (entry);
1789
if (strequ (entry, ".") || strequ (entry, ".."))
1791
/* NOTE(review): the "- 2" presumably leaves room for one separator and the
 * terminating NUL -- confirm. */
if (len + entrylen < MAX_PATH_LEN - 2) {
1793
if (len != 0 /* dir = "" means current dir on Amiga */
1795
&& dir[len-1] != PATH_SEP2
1798
&& dir[len-1] != PATH_SEP3
1801
nbuf[len++] = PATH_SEP;
1803
strcpy (nbuf + len, entry);
1806
fprintf(stderr,"%s: %s/%s: pathname too long\n",
1807
program_name, dir, entry);
1813
#endif /* ! NO_DIR */
1815
/* Make sure signals get handled properly. */
1818
/* install_signal_handlers: make abort_gzip_signal the handler for the
 * signals listed in handled_sig, leaving alone those that are currently
 * ignored.
 *
 * Two variants are visible: one built on sigaction/sigemptyset/sigaddset
 * that records the affected signals in caught_signals, and one built on
 * signal()/siginterrupt().
 *
 * NOTE(review): the conditionals that select between the two variants, the
 * return type and all braces are absent from this listing (it carries bare
 * line-number lines and the numbering skips).  Check against the upstream
 * file before relying on it or compiling it.
 */
install_signal_handlers ()
1820
int nsigs = sizeof handled_sig / sizeof handled_sig[0];
1824
struct sigaction act;
1826
sigemptyset (&caught_signals);
1827
/* Pass 1: query each signal's current action and remember in
 * caught_signals those whose handler is not SIG_IGN. */
for (i = 0; i < nsigs; i++)
1829
sigaction (handled_sig[i], NULL, &act);
1830
if (act.sa_handler != SIG_IGN)
1831
sigaddset (&caught_signals, handled_sig[i]);
1834
act.sa_handler = abort_gzip_signal;
1835
/* sa_mask: the whole caught set is blocked while the handler runs. */
act.sa_mask = caught_signals;
1838
/* Pass 2: install the handler for exactly the signals remembered above. */
for (i = 0; i < nsigs; i++)
1839
if (sigismember (&caught_signals, handled_sig[i]))
1843
sigaction (handled_sig[i], &act, NULL);
1846
/* signal()-based variant: a signal that was not ignored gets the handler. */
for (i = 0; i < nsigs; i++)
1847
if (signal (handled_sig[i], SIG_IGN) != SIG_IGN)
1851
signal (handled_sig[i], abort_gzip_signal);
1852
siginterrupt (handled_sig[i], 1);
1857
/* ========================================================================
1858
* Free all dynamically allocated variables and exit with the given code.
1860
/* do_exit: terminate the program with EXITCODE.
 *
 * exitcode: status handed to exit().
 *
 * in_exit is a function-local static flag; when it is already set the
 * function exits at once.
 *
 * NOTE(review): the statement that sets in_exit, the cleanup that follows
 * and all braces are absent from this listing (it carries bare line-number
 * lines and the numbering skips); presumably the flag guards against
 * re-entry -- check against the upstream file.
 */
local void do_exit(exitcode)
1863
static int in_exit = 0;
1865
if (in_exit) exit(exitcode);
1884
/* ========================================================================
1885
* Close and unlink the output file.
1888
/* remove_output_file: take over remove_ofname_fd with the caught signals
 * blocked.
 *
 * The visible lines block caught_signals (saving the previous mask in
 * oldset), copy remove_ofname_fd into fd, reset remove_ofname_fd to -1 and
 * then restore the previous mask.
 *
 * NOTE(review): the statements that use fd afterwards, the declarations, the
 * return type and all braces are absent from this listing (it carries bare
 * line-number lines and the numbering skips).  Check against the upstream
 * file before relying on it or compiling it.
 */
remove_output_file ()
1893
sigprocmask (SIG_BLOCK, &caught_signals, &oldset);
1894
fd = remove_ofname_fd;
1897
/* Reset the global while the signals are still blocked. */
remove_ofname_fd = -1;
1901
sigprocmask (SIG_SETMASK, &oldset, NULL);
1904
/* ========================================================================
1910
remove_output_file ();
1914
/* ========================================================================
1918
abort_gzip_signal (sig)
1922
signal (sig, SIG_IGN);
1923
remove_output_file ();
1924
if (sig == exiting_signal)
1926
signal (sig, SIG_DFL);