gzip.c revision 1.12 1 1.12 mrg /* $NetBSD: gzip.c,v 1.12 2004/01/01 05:28:44 mrg Exp $ */
2 1.1 mrg
3 1.1 mrg /*
4 1.1 mrg * Copyright (c) 1997, 1998, 2003 Matthew R. Green
5 1.1 mrg * All rights reserved.
6 1.1 mrg *
7 1.1 mrg * Redistribution and use in source and binary forms, with or without
8 1.1 mrg * modification, are permitted provided that the following conditions
9 1.1 mrg * are met:
10 1.1 mrg * 1. Redistributions of source code must retain the above copyright
11 1.1 mrg * notice, this list of conditions and the following disclaimer.
12 1.1 mrg * 2. Redistributions in binary form must reproduce the above copyright
13 1.1 mrg * notice, this list of conditions and the following disclaimer in the
14 1.1 mrg * documentation and/or other materials provided with the distribution.
15 1.1 mrg * 3. The name of the author may not be used to endorse or promote products
16 1.1 mrg * derived from this software without specific prior written permission.
17 1.1 mrg *
18 1.1 mrg * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
19 1.1 mrg * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
20 1.1 mrg * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
21 1.1 mrg * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
22 1.1 mrg * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
23 1.1 mrg * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
24 1.1 mrg * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
25 1.1 mrg * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
26 1.1 mrg * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
27 1.1 mrg * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
28 1.1 mrg * SUCH DAMAGE.
29 1.1 mrg */
30 1.1 mrg
31 1.4 mrg #include <sys/cdefs.h>
32 1.4 mrg #ifndef lint
33 1.4 mrg __COPYRIGHT("@(#) Copyright (c) 1997, 1998, 2003 Matthew R. Green\n\
34 1.4 mrg All rights reserved.\n");
35 1.12 mrg __RCSID("$NetBSD: gzip.c,v 1.12 2004/01/01 05:28:44 mrg Exp $");
36 1.4 mrg #endif /* not lint */
37 1.4 mrg
38 1.1 mrg /*
39 1.1 mrg * gzip.c -- GPL free gzip using zlib.
40 1.1 mrg *
41 1.6 mrg * very minor portions of this code are (very loosely) derived from
42 1.1 mrg * the minigzip.c in the zlib distribution.
43 1.6 mrg *
44 1.6 mrg * TODO:
45 1.6 mrg * - handle .taz/.tgz files?
46 1.10 mrg * - use mmap where possible
47 1.1 mrg */
48 1.1 mrg
49 1.1 mrg #include <sys/param.h>
50 1.1 mrg #include <sys/stat.h>
51 1.1 mrg #include <sys/time.h>
52 1.1 mrg
53 1.1 mrg #include <unistd.h>
54 1.1 mrg #include <stdio.h>
55 1.1 mrg #include <string.h>
56 1.1 mrg #include <stdlib.h>
57 1.1 mrg #include <err.h>
58 1.1 mrg #include <errno.h>
59 1.1 mrg #include <fcntl.h>
60 1.1 mrg #include <zlib.h>
61 1.1 mrg #include <fts.h>
62 1.1 mrg #include <libgen.h>
63 1.1 mrg #include <stdarg.h>
64 1.1 mrg #include <getopt.h>
65 1.1 mrg
/*
 * Kind of compressed input, as determined from the magic bytes at the
 * start of a file.
 */
enum filetype {
	FT_GZIP = 0,	/* gzip magic found */
	FT_BZIP2,	/* bzip2 magic found */
	FT_LAST,	/* not referenced in this file; presumably a count marker */
	FT_UNKNOWN	/* no known magic found */
};
73 1.10 mrg
74 1.10 mrg #define BZ_NO_STDIO
75 1.10 mrg #include <bzlib.h>
76 1.10 mrg
/* file name suffixes for the two supported formats */
#define BZ2_SUFFIX	".bz2"
#define GZ_SUFFIX	".gz"

/* first three bytes of a bzip2 stream: 'B' 'Z' 'h' */
#define BZIP2_MAGIC	"BZh"

/* size of the I/O buffers used when (de)compressing */
#define BUFLEN		(32 * 1024)

/* gzip header: first byte, second byte, and the old-style second byte */
#define GZIP_MAGIC0	0x1F
#define GZIP_MAGIC1	0x8B
#define GZIP_OMAGIC1	0x9E

/* gzip header flag bit: an original file name follows the header */
#define ORIG_NAME	0x08

/* Define this if you have the NetBSD gzopenfull(3) extension to zlib(3) */
#define HAVE_ZLIB_GZOPENFULL 0
92 1.1 mrg
static const char gzip_version[] = "NetBSD gzip 2.1";

static char gzipflags[3];	/* zlib mode: `w' or `r', possibly with [1-9] */
static int cflag;		/* stdout mode */
static int dflag;		/* decompress mode */
static int fflag;		/* force mode */
static int lflag;		/* list mode */
static int nflag;		/* don't save name/timestamp */
static int Nflag;		/* use the name stored in the gzip header */
static int qflag;		/* quiet mode */
static int rflag;		/* recursive mode */
static int tflag;		/* test */
static int vflag;		/* verbose mode */
static char *Sflag;		/* argument of -S, or NULL if not given */
static char *suffix;		/* file name suffix currently in effect */

/* length of the current suffix including its terminating NUL */
#define suffix_len	(strlen(suffix) + 1)
static char *newfile;		/* name of newly created file */
static char *infile;		/* name of file coming in */
113 1.1 mrg static void maybe_err(int rv, const char *fmt, ...);
114 1.9 mrg static void maybe_errx(int rv, const char *fmt, ...);
115 1.1 mrg static void maybe_warn(const char *fmt, ...);
116 1.1 mrg static void maybe_warnx(const char *fmt, ...);
117 1.1 mrg static void gz_compress(FILE *, gzFile);
118 1.1 mrg static off_t gz_uncompress(gzFile, FILE *);
119 1.1 mrg static void copymodes(const char *, struct stat *);
120 1.1 mrg static ssize_t file_compress(char *);
121 1.1 mrg static ssize_t file_uncompress(char *);
122 1.1 mrg static void handle_pathname(char *);
123 1.1 mrg static void handle_file(char *, struct stat *);
124 1.1 mrg static void handle_dir(char *, struct stat *);
125 1.1 mrg static void handle_stdin(void);
126 1.1 mrg static void handle_stdout(void);
127 1.6 mrg static void print_ratio(off_t, off_t, FILE *);
128 1.1 mrg static void print_verbage(char *, char *, ssize_t, ssize_t);
129 1.1 mrg static void print_test(char *, int);
130 1.7 mrg static void print_list(int fd, off_t, const char *, time_t);
131 1.10 mrg static void usage(void);
132 1.10 mrg static void display_version(void);
133 1.10 mrg static off_t unbzip2(int, int);
134 1.1 mrg
135 1.1 mrg int main(int, char *p[]);
136 1.1 mrg
#ifdef SMALL
/* SMALL builds have no long options: fall back to plain getopt(3) */
#define getopt_long(a,b,c,d,e) getopt(a,b,c)
#else
/*
 * Long option names and the short option letter each one maps to.
 * GNU gzip additionally implements --ascii (-a) and --license (-L);
 * --ascii isn't useful on NetBSD, and --license is deliberately left
 * out.
 */
static const struct option longopts[] = {
	{ "stdout",	no_argument,		NULL,	'c' },
	{ "to-stdout",	no_argument,		NULL,	'c' },
	{ "decompress",	no_argument,		NULL,	'd' },
	{ "uncompress",	no_argument,		NULL,	'd' },
	{ "force",	no_argument,		NULL,	'f' },
	{ "help",	no_argument,		NULL,	'h' },
	{ "list",	no_argument,		NULL,	'l' },
	{ "no-name",	no_argument,		NULL,	'n' },
	{ "name",	no_argument,		NULL,	'N' },
	{ "quiet",	no_argument,		NULL,	'q' },
	{ "recursive",	no_argument,		NULL,	'r' },
	{ "suffix",	required_argument,	NULL,	'S' },
	{ "test",	no_argument,		NULL,	't' },
	{ "verbose",	no_argument,		NULL,	'v' },
	{ "version",	no_argument,		NULL,	'V' },
	{ "fast",	no_argument,		NULL,	'1' },
	{ "best",	no_argument,		NULL,	'9' },
	{ NULL,		no_argument,		NULL,	0 },
};
#endif
169 1.1 mrg
170 1.1 mrg int
171 1.1 mrg main(int argc, char **argv)
172 1.1 mrg {
173 1.1 mrg const char *progname = getprogname();
174 1.1 mrg int ch;
175 1.1 mrg
176 1.1 mrg gzipflags[0] = 'w';
177 1.1 mrg gzipflags[1] = '\0';
178 1.1 mrg
179 1.10 mrg suffix = GZ_SUFFIX;;
180 1.10 mrg
181 1.1 mrg /*
182 1.1 mrg * XXX
183 1.1 mrg * handle being called `gunzip', `zcat' and `gzcat'
184 1.1 mrg */
185 1.1 mrg if (strcmp(progname, "gunzip") == 0)
186 1.1 mrg dflag = 1;
187 1.1 mrg else if (strcmp(progname, "zcat") == 0 ||
188 1.1 mrg strcmp(progname, "gzcat") == 0)
189 1.1 mrg dflag = cflag = 1;
190 1.1 mrg
191 1.1 mrg while ((ch = getopt_long(argc, argv, "cdfhHlnNqrS:tvV123456789",
192 1.1 mrg longopts, NULL)) != -1)
193 1.1 mrg switch (ch) {
194 1.1 mrg case 'c':
195 1.1 mrg cflag = 1;
196 1.1 mrg break;
197 1.1 mrg case 'd':
198 1.1 mrg dflag = 1;
199 1.1 mrg break;
200 1.1 mrg case 'f':
201 1.1 mrg fflag = 1;
202 1.1 mrg break;
203 1.5 mrg case 'l':
204 1.5 mrg lflag = 1;
205 1.5 mrg tflag = 1;
206 1.5 mrg dflag = 1;
207 1.5 mrg break;
208 1.1 mrg case 'n':
209 1.1 mrg nflag = 1;
210 1.1 mrg Nflag = 0;
211 1.1 mrg break;
212 1.1 mrg case 'N':
213 1.1 mrg nflag = 0;
214 1.1 mrg Nflag = 1;
215 1.1 mrg break;
216 1.1 mrg case 'q':
217 1.1 mrg qflag = 1;
218 1.1 mrg break;
219 1.1 mrg case 'r':
220 1.1 mrg rflag = 1;
221 1.1 mrg break;
222 1.1 mrg case 'S':
223 1.1 mrg Sflag = optarg;
224 1.1 mrg break;
225 1.1 mrg case 't':
226 1.1 mrg cflag = 1;
227 1.1 mrg tflag = 1;
228 1.1 mrg dflag = 1;
229 1.1 mrg break;
230 1.1 mrg case 'v':
231 1.1 mrg vflag = 1;
232 1.1 mrg break;
233 1.1 mrg case 'V':
234 1.1 mrg display_version();
235 1.1 mrg /* NOTREACHED */
236 1.1 mrg case '1': case '2': case '3':
237 1.1 mrg case '4': case '5': case '6':
238 1.1 mrg case '7': case '8': case '9':
239 1.1 mrg gzipflags[1] = (char)ch;
240 1.1 mrg gzipflags[2] = '\0';
241 1.1 mrg break;
242 1.12 mrg default:
243 1.12 mrg usage();
244 1.12 mrg /* NOTREACHED */
245 1.1 mrg }
246 1.1 mrg argv += optind;
247 1.1 mrg argc -= optind;
248 1.1 mrg if (dflag)
249 1.1 mrg gzipflags[0] = 'r';
250 1.1 mrg
251 1.1 mrg if (argc == 0) {
252 1.1 mrg if (dflag) /* stdin mode */
253 1.1 mrg handle_stdin();
254 1.1 mrg else /* stdout mode */
255 1.1 mrg handle_stdout();
256 1.1 mrg } else {
257 1.1 mrg do {
258 1.1 mrg handle_pathname(argv[0]);
259 1.5 mrg } while (*++argv);
260 1.1 mrg }
261 1.6 mrg if (qflag == 0 && lflag && argc > 1)
262 1.7 mrg print_list(-1, 0, "(totals)", 0);
263 1.1 mrg exit(0);
264 1.1 mrg }
265 1.1 mrg
266 1.1 mrg /* maybe print a warning */
267 1.1 mrg void
268 1.1 mrg maybe_warn(const char *fmt, ...)
269 1.1 mrg {
270 1.1 mrg va_list ap;
271 1.1 mrg
272 1.1 mrg if (qflag == 0) {
273 1.1 mrg va_start(ap, fmt);
274 1.1 mrg vwarn(fmt, ap);
275 1.1 mrg va_end(ap);
276 1.1 mrg }
277 1.1 mrg }
278 1.1 mrg
279 1.1 mrg void
280 1.1 mrg maybe_warnx(const char *fmt, ...)
281 1.1 mrg {
282 1.1 mrg va_list ap;
283 1.1 mrg
284 1.1 mrg if (qflag == 0) {
285 1.1 mrg va_start(ap, fmt);
286 1.1 mrg vwarnx(fmt, ap);
287 1.1 mrg va_end(ap);
288 1.1 mrg }
289 1.1 mrg }
290 1.1 mrg
291 1.1 mrg /* maybe print a warning */
292 1.1 mrg void
293 1.1 mrg maybe_err(int rv, const char *fmt, ...)
294 1.1 mrg {
295 1.1 mrg va_list ap;
296 1.1 mrg
297 1.1 mrg if (qflag == 0) {
298 1.1 mrg va_start(ap, fmt);
299 1.1 mrg vwarn(fmt, ap);
300 1.1 mrg va_end(ap);
301 1.1 mrg }
302 1.1 mrg exit(rv);
303 1.1 mrg }
304 1.1 mrg
305 1.9 mrg /* maybe print a warning */
306 1.9 mrg void
307 1.9 mrg maybe_errx(int rv, const char *fmt, ...)
308 1.9 mrg {
309 1.9 mrg va_list ap;
310 1.9 mrg
311 1.9 mrg if (qflag == 0) {
312 1.9 mrg va_start(ap, fmt);
313 1.9 mrg vwarnx(fmt, ap);
314 1.9 mrg va_end(ap);
315 1.9 mrg }
316 1.9 mrg exit(rv);
317 1.9 mrg }
318 1.9 mrg
319 1.1 mrg /* compress input to output then close both files */
320 1.1 mrg static void
321 1.1 mrg gz_compress(FILE *in, gzFile out)
322 1.1 mrg {
323 1.1 mrg char buf[BUFLEN];
324 1.1 mrg ssize_t len;
325 1.1 mrg int i;
326 1.1 mrg
327 1.1 mrg for (;;) {
328 1.1 mrg len = fread(buf, 1, sizeof(buf), in);
329 1.1 mrg if (ferror(in))
330 1.1 mrg maybe_err(1, "fread");
331 1.1 mrg if (len == 0)
332 1.1 mrg break;
333 1.1 mrg
334 1.1 mrg if ((ssize_t)gzwrite(out, buf, len) != len)
335 1.1 mrg maybe_err(1, gzerror(out, &i));
336 1.1 mrg }
337 1.1 mrg if (fclose(in) < 0)
338 1.1 mrg maybe_err(1, "failed fclose");
339 1.1 mrg if (gzclose(out) != Z_OK)
340 1.1 mrg maybe_err(1, "failed gzclose");
341 1.1 mrg }
342 1.1 mrg
343 1.1 mrg /* uncompress input to output then close the input */
344 1.1 mrg static off_t
345 1.1 mrg gz_uncompress(gzFile in, FILE *out)
346 1.1 mrg {
347 1.1 mrg char buf[BUFLEN];
348 1.1 mrg off_t size;
349 1.1 mrg ssize_t len;
350 1.1 mrg int i;
351 1.1 mrg
352 1.1 mrg for (size = 0;;) {
353 1.1 mrg len = gzread(in, buf, sizeof(buf));
354 1.1 mrg
355 1.1 mrg if (len < 0) {
356 1.1 mrg if (tflag) {
357 1.1 mrg print_test(infile, 0);
358 1.1 mrg return (0);
359 1.1 mrg } else
360 1.10 mrg maybe_errx(1, gzerror(in, &i));
361 1.1 mrg } else if (len == 0) {
362 1.1 mrg if (tflag)
363 1.1 mrg print_test(infile, 1);
364 1.1 mrg break;
365 1.1 mrg }
366 1.1 mrg
367 1.1 mrg size += len;
368 1.1 mrg
369 1.1 mrg /* don't write anything with -t */
370 1.1 mrg if (tflag)
371 1.1 mrg continue;
372 1.1 mrg
373 1.1 mrg if (fwrite(buf, 1, (unsigned)len, out) != (ssize_t)len)
374 1.1 mrg maybe_err(1, "failed fwrite");
375 1.1 mrg }
376 1.1 mrg if (gzclose(in) != Z_OK)
377 1.10 mrg maybe_errx(1, "failed gzclose");
378 1.1 mrg
379 1.1 mrg return (size);
380 1.1 mrg }
381 1.1 mrg
382 1.1 mrg /*
383 1.1 mrg * set the owner, mode, flags & utimes for a file
384 1.1 mrg */
385 1.1 mrg static void
386 1.1 mrg copymodes(const char *file, struct stat *sbp)
387 1.1 mrg {
388 1.1 mrg struct timeval times[2];
389 1.1 mrg
390 1.1 mrg /*
391 1.1 mrg * If we have no info on the input, give this file some
392 1.1 mrg * default values and return..
393 1.1 mrg */
394 1.1 mrg if (sbp == NULL) {
395 1.1 mrg mode_t mask = umask(022);
396 1.1 mrg
397 1.1 mrg (void)chmod(file, DEFFILEMODE & ~mask);
398 1.1 mrg (void)umask(mask);
399 1.1 mrg return;
400 1.1 mrg }
401 1.1 mrg
402 1.1 mrg /* if the chown fails, remove set-id bits as-per compress(1) */
403 1.1 mrg if (chown(file, sbp->st_uid, sbp->st_gid) < 0) {
404 1.1 mrg if (errno != EPERM)
405 1.1 mrg maybe_warn("couldn't chown: %s", file);
406 1.1 mrg sbp->st_mode &= ~(S_ISUID|S_ISGID);
407 1.1 mrg }
408 1.1 mrg
409 1.1 mrg /* we only allow set-id and the 9 normal permission bits */
410 1.1 mrg sbp->st_mode &= S_ISUID|S_ISGID|S_IRWXU|S_IRWXG|S_IRWXO;
411 1.1 mrg if (chmod(file, sbp->st_mode) < 0)
412 1.1 mrg maybe_warn("couldn't chmod: %s", file);
413 1.1 mrg
414 1.1 mrg /* only try flags if they exist already */
415 1.1 mrg if (sbp->st_flags != 0 && chflags(file, sbp->st_flags) < 0)
416 1.1 mrg maybe_warn("couldn't chflags: %s", file);
417 1.1 mrg
418 1.1 mrg TIMESPEC_TO_TIMEVAL(×[0], &sbp->st_atimespec);
419 1.1 mrg TIMESPEC_TO_TIMEVAL(×[1], &sbp->st_mtimespec);
420 1.1 mrg if (utimes(file, times) < 0)
421 1.1 mrg maybe_warn("couldn't utimes: %s", file);
422 1.1 mrg }
423 1.1 mrg
424 1.1 mrg /*
425 1.1 mrg * compress the given file: create a corresponding .gz file and remove the
426 1.1 mrg * original.
427 1.1 mrg */
428 1.1 mrg static ssize_t
429 1.1 mrg file_compress(char *file)
430 1.1 mrg {
431 1.1 mrg FILE *in;
432 1.1 mrg gzFile out;
433 1.1 mrg struct stat isb, osb;
434 1.5 mrg char outfile[MAXPATHLEN];
435 1.1 mrg ssize_t size;
436 1.1 mrg u_int32_t mtime = 0;
437 1.1 mrg
438 1.1 mrg if (cflag == 0) {
439 1.1 mrg (void)strncpy(outfile, file, MAXPATHLEN - suffix_len);
440 1.1 mrg outfile[MAXPATHLEN - suffix_len] = '\0';
441 1.10 mrg (void)strlcat(outfile, suffix, sizeof(outfile));
442 1.1 mrg
443 1.1 mrg if (fflag == 0) {
444 1.1 mrg if (stat(outfile, &osb) == 0) {
445 1.1 mrg maybe_warnx("%s already exists -- skipping",
446 1.1 mrg outfile);
447 1.1 mrg goto lose;
448 1.1 mrg }
449 1.1 mrg }
450 1.1 mrg if (stat(file, &isb) == 0) {
451 1.1 mrg if (isb.st_nlink > 1) {
452 1.1 mrg maybe_warnx("%s has %d other link%s -- "
453 1.1 mrg "skipping", file, isb.st_nlink-1,
454 1.1 mrg isb.st_nlink == 1 ? "" : "s");
455 1.1 mrg goto lose;
456 1.1 mrg }
457 1.1 mrg if (nflag == 0)
458 1.1 mrg mtime = (u_int32_t)isb.st_mtime;
459 1.1 mrg }
460 1.1 mrg }
461 1.1 mrg in = fopen(file, "r");
462 1.1 mrg if (in == 0)
463 1.1 mrg maybe_err(1, "can't fopen %s", file);
464 1.1 mrg
465 1.1 mrg if (cflag == 0) {
466 1.1 mrg #if HAVE_ZLIB_GZOPENFULL
467 1.1 mrg char *savename;
468 1.1 mrg
469 1.1 mrg if (nflag == 0)
470 1.1 mrg savename = basename(file);
471 1.1 mrg else
472 1.1 mrg savename = NULL;
473 1.1 mrg out = gzopenfull(outfile, gzipflags, savename, mtime);
474 1.1 mrg #else
475 1.1 mrg out = gzopen(outfile, gzipflags);
476 1.1 mrg #endif
477 1.1 mrg } else
478 1.1 mrg out = gzdopen(STDOUT_FILENO, gzipflags);
479 1.1 mrg
480 1.1 mrg if (out == 0)
481 1.1 mrg maybe_err(1, "can't gz%sopen %s",
482 1.1 mrg cflag ? "d" : "",
483 1.1 mrg cflag ? "stdout" : outfile);
484 1.1 mrg
485 1.1 mrg gz_compress(in, out);
486 1.1 mrg
487 1.1 mrg /*
488 1.1 mrg * if we compressed to stdout, we don't know the size and
489 1.1 mrg * we don't know the new file name, punt. if we can't stat
490 1.1 mrg * the file, whine, otherwise set the size from the stat
491 1.1 mrg * buffer. we only blow away the file if we can stat the
492 1.1 mrg * output, just in case.
493 1.1 mrg */
494 1.1 mrg if (cflag == 0) {
495 1.1 mrg if (stat(outfile, &osb) < 0) {
496 1.1 mrg maybe_warn("couldn't stat: %s", outfile);
497 1.1 mrg maybe_warnx("leaving original %s", file);
498 1.1 mrg size = 0;
499 1.1 mrg } else {
500 1.1 mrg unlink(file);
501 1.1 mrg size = osb.st_size;
502 1.1 mrg }
503 1.1 mrg newfile = outfile;
504 1.1 mrg copymodes(outfile, &isb);
505 1.1 mrg } else {
506 1.1 mrg lose:
507 1.1 mrg size = 0;
508 1.1 mrg newfile = 0;
509 1.1 mrg }
510 1.1 mrg
511 1.1 mrg return (size);
512 1.1 mrg }
513 1.1 mrg
514 1.1 mrg /* uncompress the given file and remove the original */
515 1.1 mrg static ssize_t
516 1.1 mrg file_uncompress(char *file)
517 1.1 mrg {
518 1.1 mrg struct stat isb, osb;
519 1.5 mrg char buf[PATH_MAX];
520 1.1 mrg char *outfile = buf, *s;
521 1.1 mrg FILE *out;
522 1.1 mrg gzFile in;
523 1.1 mrg off_t size;
524 1.1 mrg ssize_t len = strlen(file);
525 1.9 mrg int fd;
526 1.9 mrg unsigned char header1[10], name[PATH_MAX + 1];
527 1.10 mrg enum filetype method;
528 1.9 mrg
529 1.9 mrg /* gather the old name info */
530 1.1 mrg
531 1.9 mrg fd = open(file, O_RDONLY);
532 1.9 mrg if (fd < 0)
533 1.9 mrg maybe_err(1, "can't open %s", file);
534 1.10 mrg if (read(fd, header1, 10) != 10) {
535 1.10 mrg /* we don't want to fail here. */
536 1.10 mrg if (fflag)
537 1.10 mrg goto close_it;
538 1.9 mrg maybe_err(1, "can't read %s", file);
539 1.10 mrg }
540 1.10 mrg
541 1.10 mrg if (header1[0] == GZIP_MAGIC0 &&
542 1.10 mrg (header1[1] == GZIP_MAGIC1 || header1[1] == GZIP_OMAGIC1))
543 1.10 mrg method = FT_GZIP;
544 1.10 mrg else if (memcmp(header1, BZIP2_MAGIC, 3) == 0 &&
545 1.10 mrg header1[3] >= '0' && header1[3] <= '9') {
546 1.10 mrg if (Sflag == NULL)
547 1.10 mrg suffix = BZ2_SUFFIX;
548 1.10 mrg method = FT_BZIP2;
549 1.10 mrg } else
550 1.10 mrg method = FT_UNKNOWN;
551 1.9 mrg
552 1.10 mrg if (fflag == 0 && method == FT_UNKNOWN)
553 1.9 mrg maybe_errx(1, "%s: not in gzip format", file);
554 1.9 mrg
555 1.10 mrg if (cflag == 0 || lflag) {
556 1.10 mrg s = &file[len - suffix_len + 1];
557 1.10 mrg if (strncmp(s, suffix, suffix_len) == 0) {
558 1.10 mrg (void)strncpy(outfile, file, len - suffix_len + 1);
559 1.10 mrg outfile[len - suffix_len + 1] = '\0';
560 1.10 mrg } else if (lflag == 0)
561 1.10 mrg maybe_errx(1, "unknown suffix %s", s);
562 1.10 mrg }
563 1.10 mrg
564 1.10 mrg if (method == FT_GZIP && (Nflag || lflag)) {
565 1.9 mrg if (header1[3] & ORIG_NAME) {
566 1.9 mrg size_t rbytes;
567 1.9 mrg int i;
568 1.9 mrg
569 1.9 mrg rbytes = read(fd, name, PATH_MAX + 1);
570 1.9 mrg if (rbytes < 0)
571 1.1 mrg maybe_err(1, "can't read %s", file);
572 1.9 mrg for (i = 0; i < rbytes && name[i]; i++)
573 1.9 mrg ;
574 1.9 mrg if (i < rbytes) {
575 1.9 mrg name[i] = 0;
576 1.9 mrg /* now maybe merge old dirname */
577 1.9 mrg if (strchr(outfile, '/') == 0)
578 1.9 mrg outfile = name;
579 1.9 mrg else {
580 1.9 mrg char *dir = dirname(outfile);
581 1.9 mrg if (asprintf(&outfile, "%s/%s", dir,
582 1.9 mrg name) == -1)
583 1.9 mrg maybe_err(1, "malloc");
584 1.1 mrg }
585 1.1 mrg }
586 1.1 mrg }
587 1.9 mrg }
588 1.10 mrg close_it:
589 1.9 mrg close(fd);
590 1.1 mrg
591 1.9 mrg if ((cflag == 0 || lflag) && fflag == 0) {
592 1.9 mrg if (lflag == 0 && stat(outfile, &osb) == 0) {
593 1.9 mrg maybe_warnx("%s already exists -- skipping", outfile);
594 1.9 mrg goto lose;
595 1.9 mrg }
596 1.9 mrg if (stat(file, &isb) == 0) {
597 1.9 mrg if (isb.st_nlink > 1 && lflag == 0) {
598 1.9 mrg maybe_warnx("%s has %d other links -- skipping",
599 1.9 mrg file, isb.st_nlink - 1);
600 1.1 mrg goto lose;
601 1.1 mrg }
602 1.9 mrg } else
603 1.9 mrg goto lose;
604 1.1 mrg }
605 1.5 mrg
606 1.10 mrg if (method == FT_BZIP2) {
607 1.10 mrg int in, out;
608 1.5 mrg
609 1.10 mrg if ((in = open(file, O_RDONLY)) == -1)
610 1.10 mrg maybe_err(1, "open for read: %s", file);
611 1.10 mrg if (cflag == 1)
612 1.10 mrg out = STDOUT_FILENO;
613 1.10 mrg else
614 1.10 mrg out = open(outfile, O_WRONLY|O_CREAT|O_EXCL, 0600);
615 1.10 mrg if (out == -1)
616 1.10 mrg maybe_err(1, "open for write: %s", outfile);
617 1.5 mrg
618 1.10 mrg if ((size = unbzip2(in, out)) == 0) {
619 1.10 mrg unlink(outfile);
620 1.10 mrg goto lose;
621 1.10 mrg }
622 1.10 mrg } else {
623 1.10 mrg if (lflag) {
624 1.10 mrg int fd;
625 1.1 mrg
626 1.10 mrg if ((fd = open(file, O_RDONLY)) == -1)
627 1.10 mrg maybe_err(1, "open");
628 1.10 mrg print_list(fd, isb.st_size, outfile, isb.st_mtime);
629 1.10 mrg return 0; /* XXX */
630 1.10 mrg }
631 1.10 mrg
632 1.10 mrg in = gzopen(file, gzipflags);
633 1.10 mrg if (in == NULL)
634 1.10 mrg maybe_err(1, "can't gzopen %s", file);
635 1.10 mrg
636 1.10 mrg if (cflag == 0) {
637 1.10 mrg int fd;
638 1.10 mrg
639 1.10 mrg /* Use open(2) directly to get a safe file. */
640 1.10 mrg fd = open(outfile, O_WRONLY|O_CREAT|O_EXCL, 0600);
641 1.10 mrg if (fd < 0)
642 1.10 mrg maybe_err(1, "can't open %s", outfile);
643 1.10 mrg out = fdopen(fd, "w");
644 1.10 mrg if (out == NULL)
645 1.10 mrg maybe_err(1, "can't fdopen %s", outfile);
646 1.10 mrg } else
647 1.10 mrg out = stdout;
648 1.1 mrg
649 1.10 mrg if ((size = gz_uncompress(in, out)) == 0) {
650 1.10 mrg unlink(outfile);
651 1.10 mrg goto lose;
652 1.10 mrg }
653 1.1 mrg
654 1.10 mrg /* close the file */
655 1.10 mrg if (fclose(out))
656 1.10 mrg maybe_err(1, "failed fclose");
657 1.10 mrg }
658 1.1 mrg
659 1.1 mrg /* if testing, or we uncompressed to stdout, this is all we need */
660 1.1 mrg if (tflag || cflag)
661 1.1 mrg return (size);
662 1.1 mrg
663 1.1 mrg /*
664 1.1 mrg * if we create a file...
665 1.1 mrg */
666 1.1 mrg if (cflag == 0) {
667 1.1 mrg /*
668 1.1 mrg * if we can't stat the file, or we are uncompressing to
669 1.1 mrg * stdin, don't remove the file.
670 1.1 mrg */
671 1.1 mrg if (stat(outfile, &osb) < 0) {
672 1.1 mrg maybe_warn("couldn't stat (leaving original): %s",
673 1.1 mrg outfile);
674 1.1 mrg goto lose;
675 1.1 mrg }
676 1.1 mrg if (osb.st_size != size) {
677 1.1 mrg maybe_warn("stat gave different size: %llu != %llu "
678 1.1 mrg "(leaving original)",
679 1.1 mrg (unsigned long long)size,
680 1.1 mrg (unsigned long long)osb.st_size);
681 1.1 mrg goto lose;
682 1.1 mrg }
683 1.1 mrg newfile = outfile;
684 1.1 mrg unlink(file);
685 1.1 mrg size = osb.st_size;
686 1.1 mrg copymodes(outfile, &isb);
687 1.1 mrg }
688 1.1 mrg return (size);
689 1.1 mrg
690 1.1 mrg lose:
691 1.1 mrg newfile = 0;
692 1.1 mrg return (0);
693 1.1 mrg }
694 1.1 mrg
695 1.1 mrg static void
696 1.1 mrg handle_stdin(void)
697 1.1 mrg {
698 1.1 mrg gzFile *file;
699 1.1 mrg
700 1.5 mrg if (fflag == 0 && lflag == 0 && isatty(STDIN_FILENO)) {
701 1.1 mrg maybe_warnx("standard input is a terminal -- ignoring");
702 1.1 mrg return;
703 1.1 mrg }
704 1.5 mrg
705 1.5 mrg if (lflag) {
706 1.5 mrg struct stat isb;
707 1.5 mrg
708 1.5 mrg if (fstat(STDIN_FILENO, &isb) < 0)
709 1.5 mrg maybe_err(1, "fstat");
710 1.7 mrg print_list(STDIN_FILENO, isb.st_size, "stdout", isb.st_mtime);
711 1.5 mrg return;
712 1.5 mrg }
713 1.5 mrg
714 1.1 mrg file = gzdopen(STDIN_FILENO, gzipflags);
715 1.1 mrg if (file == NULL)
716 1.1 mrg maybe_err(1, "can't gzdopen stdin");
717 1.1 mrg gz_uncompress(file, stdout);
718 1.1 mrg }
719 1.1 mrg
720 1.1 mrg static void
721 1.1 mrg handle_stdout(void)
722 1.1 mrg {
723 1.1 mrg gzFile *file;
724 1.1 mrg
725 1.1 mrg if (fflag == 0 && isatty(STDOUT_FILENO)) {
726 1.1 mrg maybe_warnx("standard output is a terminal -- ignoring");
727 1.1 mrg return;
728 1.1 mrg }
729 1.1 mrg file = gzdopen(STDOUT_FILENO, gzipflags);
730 1.1 mrg if (file == NULL)
731 1.1 mrg maybe_err(1, "can't gzdopen stdout");
732 1.1 mrg gz_compress(stdin, file);
733 1.1 mrg }
734 1.1 mrg
735 1.1 mrg /* do what is asked for, for the path name */
736 1.1 mrg static void
737 1.1 mrg handle_pathname(char *path)
738 1.1 mrg {
739 1.1 mrg char *opath = path, *s = 0;
740 1.1 mrg ssize_t len;
741 1.1 mrg struct stat sb;
742 1.1 mrg
743 1.1 mrg /* check for stdout/stdin */
744 1.1 mrg if (path[0] == '-' && path[1] == '\0') {
745 1.1 mrg if (dflag)
746 1.1 mrg handle_stdin();
747 1.1 mrg else
748 1.1 mrg handle_stdout();
749 1.1 mrg }
750 1.1 mrg
751 1.1 mrg retry:
752 1.1 mrg if (stat(path, &sb) < 0) {
753 1.1 mrg /* lets try <path>.gz if we're decompressing */
754 1.1 mrg if (dflag && s == 0 && errno == ENOENT) {
755 1.1 mrg len = strlen(path);
756 1.1 mrg s = malloc(len + suffix_len);
757 1.1 mrg if (s == 0)
758 1.1 mrg maybe_err(1, "malloc");
759 1.1 mrg memmove(s, path, len);
760 1.10 mrg memmove(&s[len], suffix, suffix_len);
761 1.1 mrg path = s;
762 1.1 mrg goto retry;
763 1.1 mrg }
764 1.1 mrg maybe_warn("can't stat: %s", opath);
765 1.1 mrg goto out;
766 1.1 mrg }
767 1.1 mrg
768 1.1 mrg if (S_ISDIR(sb.st_mode)) {
769 1.1 mrg if (rflag)
770 1.1 mrg handle_dir(path, &sb);
771 1.1 mrg else
772 1.1 mrg maybe_warn("%s is a directory", path);
773 1.1 mrg goto out;
774 1.1 mrg }
775 1.1 mrg
776 1.1 mrg if (S_ISREG(sb.st_mode))
777 1.1 mrg handle_file(path, &sb);
778 1.1 mrg
779 1.1 mrg out:
780 1.1 mrg if (s)
781 1.1 mrg free(s);
782 1.1 mrg return;
783 1.1 mrg }
784 1.1 mrg
785 1.1 mrg /* compress/decompress a file */
786 1.1 mrg static void
787 1.1 mrg handle_file(char *file, struct stat *sbp)
788 1.1 mrg {
789 1.1 mrg ssize_t usize, gsize;
790 1.1 mrg
791 1.1 mrg infile = file;
792 1.1 mrg if (dflag) {
793 1.1 mrg usize = file_uncompress(file);
794 1.1 mrg if (usize == 0)
795 1.1 mrg return;
796 1.1 mrg gsize = sbp->st_size;
797 1.1 mrg } else {
798 1.1 mrg gsize = file_compress(file);
799 1.1 mrg if (gsize == 0)
800 1.1 mrg return;
801 1.1 mrg usize = sbp->st_size;
802 1.1 mrg }
803 1.1 mrg
804 1.1 mrg if (vflag && !tflag)
805 1.1 mrg print_verbage(file, cflag == 0 ? newfile : 0, usize, gsize);
806 1.1 mrg }
807 1.1 mrg
808 1.1 mrg /* this is used with -r to recursively decend directories */
809 1.1 mrg static void
810 1.1 mrg handle_dir(char *dir, struct stat *sbp)
811 1.1 mrg {
812 1.1 mrg char *path_argv[2];
813 1.1 mrg FTS *fts;
814 1.1 mrg FTSENT *entry;
815 1.1 mrg
816 1.1 mrg path_argv[0] = dir;
817 1.1 mrg path_argv[1] = 0;
818 1.1 mrg fts = fts_open(path_argv, FTS_PHYSICAL, NULL);
819 1.1 mrg if (fts == NULL) {
820 1.1 mrg warn("couldn't fts_open %s", dir);
821 1.1 mrg return;
822 1.1 mrg }
823 1.1 mrg
824 1.1 mrg while ((entry = fts_read(fts))) {
825 1.1 mrg switch(entry->fts_info) {
826 1.1 mrg case FTS_D:
827 1.1 mrg case FTS_DP:
828 1.1 mrg continue;
829 1.1 mrg
830 1.1 mrg case FTS_DNR:
831 1.1 mrg case FTS_ERR:
832 1.1 mrg case FTS_NS:
833 1.1 mrg maybe_warn("%s", entry->fts_path);
834 1.1 mrg continue;
835 1.1 mrg case FTS_F:
836 1.1 mrg handle_file(entry->fts_name, entry->fts_statp);
837 1.1 mrg }
838 1.1 mrg }
839 1.1 mrg (void)fts_close(fts);
840 1.1 mrg }
841 1.1 mrg
/*
 * Print the space saved by compression as a percentage with one
 * decimal place, e.g. " 75.0%".
 *
 * `in' is the uncompressed size and `out' the compressed size.  A zero
 * size on either side prints as 0.0% (this also avoids dividing by
 * zero); if the output is larger than the input the ratio is printed
 * as a negative number.
 */
static void
print_ratio(off_t in, off_t out, FILE *where)
{
	long long permille;	/* 10 * percent */

	if (out == 0 || in == 0)
		permille = 0;
	else
		permille = 1000 - ((1000 * (long long)out) / (long long)in);

	if (permille < 0)
		fprintf(where, "-%2lld.%1lld%%", -permille / 10,
		    -permille % 10);
	else
		fprintf(where, "%3lld.%1lld%%", permille / 10,
		    permille % 10);
}
855 1.6 mrg
/*
 * Print the -v statistics line for one file on stderr: the file name,
 * the compression ratio and, when `nfile' is not NULL, the name of the
 * file that replaced it.
 */
static void
print_verbage(char *file, char *nfile, ssize_t usize, ssize_t gsize)
{
	const char *pad;

	/* short names get a second tab */
	if (strlen(file) < 7)
		pad = "\t\t";
	else
		pad = "\t";

	fprintf(stderr, "%s:%s ", file, pad);
	print_ratio(usize, gsize, stderr);
	if (nfile != NULL)
		fprintf(stderr, " -- replaced with %s", nfile);
	fprintf(stderr, "\n");
	fflush(stderr);
}
868 1.1 mrg
/*
 * Print the -t result for `file' on stderr: "OK" when `ok' is non-zero,
 * "NOT OK" otherwise.
 */
static void
print_test(char *file, int ok)
{
	const char *pad, *verdict;

	/* short names get a second tab */
	if (strlen(file) < 7)
		pad = "\t\t";
	else
		pad = "\t";

	if (ok)
		verdict = "OK";
	else
		verdict = "NOT OK";

	fprintf(stderr, "%s:%s %s\n", file, pad, verdict);
	fflush(stderr);
}
878 1.1 mrg
879 1.5 mrg /* print a file's info ala --list */
880 1.5 mrg /* eg:
881 1.5 mrg compressed uncompressed ratio uncompressed_name
882 1.5 mrg 354841 1679360 78.8% /usr/pkgsrc/distfiles/libglade-2.0.1.tar
883 1.5 mrg */
884 1.5 mrg static void
885 1.7 mrg print_list(int fd, off_t in, const char *outfile, time_t ts)
886 1.5 mrg {
887 1.5 mrg static int first = 1;
888 1.6 mrg static off_t in_tot, out_tot;
889 1.6 mrg off_t out;
890 1.7 mrg u_int32_t crc;
891 1.5 mrg int rv;
892 1.5 mrg
893 1.7 mrg if (first) {
894 1.7 mrg if (vflag)
895 1.7 mrg printf("method crc date time ");
896 1.7 mrg if (qflag == 0)
897 1.7 mrg printf(" compressed uncompressed "
898 1.7 mrg "ratio uncompressed_name\n");
899 1.7 mrg }
900 1.5 mrg first = 0;
901 1.5 mrg
902 1.6 mrg /* print totals? */
903 1.6 mrg if (fd == -1) {
904 1.6 mrg in = in_tot;
905 1.6 mrg out = out_tot;
906 1.6 mrg } else {
907 1.6 mrg /* read the last 4 bytes - this is the uncompressed size */
908 1.7 mrg rv = lseek(fd, (off_t)(-8), SEEK_END);
909 1.6 mrg if (rv != -1) {
910 1.7 mrg unsigned char buf[8];
911 1.6 mrg u_int32_t usize;
912 1.6 mrg
913 1.6 mrg if (read(fd, (char *)buf, sizeof(buf)) != sizeof(buf))
914 1.6 mrg maybe_err(1, "read of uncompressed size");
915 1.7 mrg crc = buf[0] | buf[1] << 8 | buf[2] << 16 | buf[3] << 24;
916 1.7 mrg usize = buf[4] | buf[5] << 8 | buf[6] << 16 | buf[7] << 24;
917 1.6 mrg out = (off_t)usize;
918 1.6 mrg }
919 1.6 mrg }
920 1.5 mrg
921 1.7 mrg if (vflag && fd == -1)
922 1.7 mrg printf(" ");
923 1.7 mrg else if (vflag) {
924 1.7 mrg char *date = ctime(&ts);
925 1.7 mrg
926 1.7 mrg /* skip the day, 1/100th second, and year */
927 1.7 mrg date += 4;
928 1.7 mrg date[12] = 0;
929 1.7 mrg printf("%5s %08x %11s ", "defla"/*XXX*/, crc, date);
930 1.7 mrg }
931 1.6 mrg printf("%12llu %12llu ", (unsigned long long)in, (unsigned long long)out);
932 1.6 mrg print_ratio(in, out, stdout);
933 1.6 mrg printf(" %s\n", outfile);
934 1.6 mrg in_tot += in;
935 1.6 mrg out_tot += out;
936 1.5 mrg }
937 1.5 mrg
938 1.1 mrg /* display the usage of NetBSD gzip */
939 1.1 mrg static void
940 1.1 mrg usage(void)
941 1.1 mrg {
942 1.1 mrg
943 1.1 mrg fprintf(stderr, "%s\n", gzip_version);
944 1.1 mrg fprintf(stderr,
945 1.1 mrg "Usage: %s [-cdfhnNqrStvV123456789] [<file> [<file> ...]]\n"
946 1.11 mrg #ifndef SMALL
947 1.1 mrg " -c --stdout write to stdout, keep original files\n"
948 1.1 mrg " --to-stdout\n"
949 1.1 mrg " -d --decompress uncompress files\n"
950 1.1 mrg " --uncompress\n"
951 1.1 mrg " -f --force force overwriting & compress links\n"
952 1.1 mrg " -h --help display this help\n"
953 1.1 mrg " -n --no-name don't save original file name or time stamp\n"
954 1.1 mrg " -N --name save or restore original file name and time stamp\n"
955 1.1 mrg " -q --quiet output no warnings\n"
956 1.1 mrg " -r --recursive recursively compress files in directories\n"
957 1.1 mrg " -S .suf use suffix .suf instead of .gz\n"
958 1.1 mrg " --suffix .suf\n"
959 1.1 mrg " -t --test test compressed file\n"
960 1.1 mrg " -v --verbose print extra statistics\n"
961 1.1 mrg " -V --version display program version\n"
962 1.1 mrg " -1 --fast fastest (worst) compression\n"
963 1.1 mrg " -2 .. -8 set compression level\n"
964 1.1 mrg " -9 --best best (slowest) compression\n",
965 1.11 mrg #else
966 1.11 mrg ,
967 1.11 mrg #endif
968 1.1 mrg getprogname());
969 1.1 mrg fflush(stderr);
970 1.1 mrg exit(0);
971 1.1 mrg }
972 1.1 mrg
973 1.1 mrg /* display the version of NetBSD gzip */
974 1.1 mrg static void
975 1.1 mrg display_version(void)
976 1.1 mrg {
977 1.1 mrg
978 1.1 mrg fprintf(stderr, "%s\n", gzip_version);
979 1.1 mrg fflush(stderr);
980 1.1 mrg exit(0);
981 1.1 mrg }
982 1.10 mrg
983 1.10 mrg #include "unbzip2.c"
984