/*	$NetBSD: gzip.c,v 1.13 2004/01/02 01:34:01 mrg Exp $	*/

/*
 * Copyright (c) 1997, 1998, 2003 Matthew R. Green
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. The name of the author may not be used to endorse or promote products
 *    derived from this software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
 * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
 * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */
30 1.1 mrg
31 1.4 mrg #include <sys/cdefs.h>
32 1.4 mrg #ifndef lint
33 1.4 mrg __COPYRIGHT("@(#) Copyright (c) 1997, 1998, 2003 Matthew R. Green\n\
34 1.4 mrg All rights reserved.\n");
35 1.13 mrg __RCSID("$NetBSD: gzip.c,v 1.13 2004/01/02 01:34:01 mrg Exp $");
36 1.4 mrg #endif /* not lint */
37 1.4 mrg
/*
 * gzip.c -- GPL free gzip using zlib.
 *
 * very minor portions of this code are (very loosely) derived from
 * the minigzip.c in the zlib distribution.
 *
 * TODO:
 *	- handle .taz/.tgz files?
 *	- use mmap where possible
 */
48 1.1 mrg
49 1.1 mrg #include <sys/param.h>
50 1.1 mrg #include <sys/stat.h>
51 1.1 mrg #include <sys/time.h>
52 1.1 mrg
53 1.1 mrg #include <unistd.h>
54 1.1 mrg #include <stdio.h>
55 1.1 mrg #include <string.h>
56 1.1 mrg #include <stdlib.h>
57 1.1 mrg #include <err.h>
58 1.1 mrg #include <errno.h>
59 1.1 mrg #include <fcntl.h>
60 1.1 mrg #include <zlib.h>
61 1.1 mrg #include <fts.h>
62 1.1 mrg #include <libgen.h>
63 1.1 mrg #include <stdarg.h>
64 1.1 mrg #include <getopt.h>
65 1.1 mrg
66 1.10 mrg /* what type of file are we dealing with */
67 1.10 mrg enum filetype {
68 1.10 mrg FT_GZIP,
69 1.10 mrg FT_BZIP2,
70 1.10 mrg FT_LAST,
71 1.10 mrg FT_UNKNOWN
72 1.10 mrg };
73 1.10 mrg
74 1.10 mrg #define BZ_NO_STDIO
75 1.10 mrg #include <bzlib.h>
76 1.10 mrg
77 1.10 mrg #define BZ2_SUFFIX ".bz2"
78 1.10 mrg #define BZIP2_MAGIC "\102\132\150"
79 1.10 mrg
80 1.10 mrg #define GZ_SUFFIX ".gz"
81 1.1 mrg
82 1.10 mrg #define BUFLEN (32 * 1024)
83 1.1 mrg
84 1.9 mrg #define GZIP_MAGIC0 0x1F
85 1.10 mrg #define GZIP_MAGIC1 0x8B
86 1.10 mrg #define GZIP_OMAGIC1 0x9E
87 1.9 mrg
88 1.9 mrg #define ORIG_NAME 0x08
89 1.1 mrg
90 1.1 mrg /* Define this if you have the NetBSD gzopenfull(3) extension to zlib(3) */
91 1.13 mrg #ifndef HAVE_ZLIB_GZOPENFULL
92 1.1 mrg #define HAVE_ZLIB_GZOPENFULL 0
93 1.13 mrg #endif
94 1.1 mrg
static const char gzip_version[] = "NetBSD gzip 2.1";

static char gzipflags[3];	/* `w' or `r', possible with [1-9] */
static int cflag;		/* stdout mode */
static int dflag;		/* decompress mode */
static int fflag;		/* force mode */
static int lflag;		/* list mode */
static int nflag;		/* don't save name/timestamp */
static int Nflag;		/* save/restore original name/timestamp */
static int qflag;		/* quiet mode */
static int rflag;		/* recursive mode */
static int tflag;		/* test */
static int vflag;		/* verbose mode */
static char *Sflag;		/* argument of -S, NULL when not given */
static char *suffix;		/* suffix currently in effect */

/* bytes needed to hold `suffix' including its terminating NUL */
#define suffix_len	(strlen(suffix) + 1)	/* len + nul */
static char *newfile;		/* name of newly created file */
static char *infile;		/* name of file coming in */
114 1.1 mrg
115 1.1 mrg static void maybe_err(int rv, const char *fmt, ...);
116 1.9 mrg static void maybe_errx(int rv, const char *fmt, ...);
117 1.1 mrg static void maybe_warn(const char *fmt, ...);
118 1.1 mrg static void maybe_warnx(const char *fmt, ...);
119 1.1 mrg static void gz_compress(FILE *, gzFile);
120 1.1 mrg static off_t gz_uncompress(gzFile, FILE *);
121 1.1 mrg static void copymodes(const char *, struct stat *);
122 1.1 mrg static ssize_t file_compress(char *);
123 1.1 mrg static ssize_t file_uncompress(char *);
124 1.1 mrg static void handle_pathname(char *);
125 1.1 mrg static void handle_file(char *, struct stat *);
126 1.1 mrg static void handle_dir(char *, struct stat *);
127 1.1 mrg static void handle_stdin(void);
128 1.1 mrg static void handle_stdout(void);
129 1.6 mrg static void print_ratio(off_t, off_t, FILE *);
130 1.1 mrg static void print_verbage(char *, char *, ssize_t, ssize_t);
131 1.1 mrg static void print_test(char *, int);
132 1.7 mrg static void print_list(int fd, off_t, const char *, time_t);
133 1.10 mrg static void usage(void);
134 1.10 mrg static void display_version(void);
135 1.10 mrg static off_t unbzip2(int, int);
136 1.1 mrg
137 1.1 mrg int main(int, char *p[]);
138 1.1 mrg
/*
 * Long option table.  A SMALL build has no long options: getopt_long()
 * is mapped onto plain getopt() and the table is not compiled in.
 */
#ifdef SMALL
#define getopt_long(a,b,c,d,e) getopt(a,b,c)
#else
static const struct option longopts[] = {
	{ "stdout",		no_argument,		NULL,	'c' },
	{ "to-stdout",		no_argument,		NULL,	'c' },
	{ "decompress",		no_argument,		NULL,	'd' },
	{ "uncompress",		no_argument,		NULL,	'd' },
	{ "force",		no_argument,		NULL,	'f' },
	{ "help",		no_argument,		NULL,	'h' },
	{ "list",		no_argument,		NULL,	'l' },
	{ "no-name",		no_argument,		NULL,	'n' },
	{ "name",		no_argument,		NULL,	'N' },
	{ "quiet",		no_argument,		NULL,	'q' },
	{ "recursive",		no_argument,		NULL,	'r' },
	{ "suffix",		required_argument,	NULL,	'S' },
	{ "test",		no_argument,		NULL,	't' },
	{ "verbose",		no_argument,		NULL,	'v' },
	{ "version",		no_argument,		NULL,	'V' },
	{ "fast",		no_argument,		NULL,	'1' },
	{ "best",		no_argument,		NULL,	'9' },
#if 0
	/*
	 * This is what else GNU gzip implements.  --ascii isn't useful
	 * on NetBSD, and I don't care to have a --license.
	 */
	{ "ascii",		no_argument,		NULL,	'a' },
	{ "license",		no_argument,		NULL,	'L' },
#endif
	{ NULL,			no_argument,		NULL,	0 },
};
#endif
171 1.1 mrg
172 1.1 mrg int
173 1.1 mrg main(int argc, char **argv)
174 1.1 mrg {
175 1.1 mrg const char *progname = getprogname();
176 1.1 mrg int ch;
177 1.1 mrg
178 1.1 mrg gzipflags[0] = 'w';
179 1.1 mrg gzipflags[1] = '\0';
180 1.1 mrg
181 1.10 mrg suffix = GZ_SUFFIX;;
182 1.10 mrg
183 1.1 mrg /*
184 1.1 mrg * XXX
185 1.1 mrg * handle being called `gunzip', `zcat' and `gzcat'
186 1.1 mrg */
187 1.1 mrg if (strcmp(progname, "gunzip") == 0)
188 1.1 mrg dflag = 1;
189 1.1 mrg else if (strcmp(progname, "zcat") == 0 ||
190 1.1 mrg strcmp(progname, "gzcat") == 0)
191 1.1 mrg dflag = cflag = 1;
192 1.1 mrg
193 1.1 mrg while ((ch = getopt_long(argc, argv, "cdfhHlnNqrS:tvV123456789",
194 1.1 mrg longopts, NULL)) != -1)
195 1.1 mrg switch (ch) {
196 1.1 mrg case 'c':
197 1.1 mrg cflag = 1;
198 1.1 mrg break;
199 1.1 mrg case 'd':
200 1.1 mrg dflag = 1;
201 1.1 mrg break;
202 1.1 mrg case 'f':
203 1.1 mrg fflag = 1;
204 1.1 mrg break;
205 1.5 mrg case 'l':
206 1.5 mrg lflag = 1;
207 1.5 mrg tflag = 1;
208 1.5 mrg dflag = 1;
209 1.5 mrg break;
210 1.1 mrg case 'n':
211 1.1 mrg nflag = 1;
212 1.1 mrg Nflag = 0;
213 1.1 mrg break;
214 1.1 mrg case 'N':
215 1.1 mrg nflag = 0;
216 1.1 mrg Nflag = 1;
217 1.1 mrg break;
218 1.1 mrg case 'q':
219 1.1 mrg qflag = 1;
220 1.1 mrg break;
221 1.1 mrg case 'r':
222 1.1 mrg rflag = 1;
223 1.1 mrg break;
224 1.1 mrg case 'S':
225 1.1 mrg Sflag = optarg;
226 1.1 mrg break;
227 1.1 mrg case 't':
228 1.1 mrg cflag = 1;
229 1.1 mrg tflag = 1;
230 1.1 mrg dflag = 1;
231 1.1 mrg break;
232 1.1 mrg case 'v':
233 1.1 mrg vflag = 1;
234 1.1 mrg break;
235 1.1 mrg case 'V':
236 1.1 mrg display_version();
237 1.1 mrg /* NOTREACHED */
238 1.1 mrg case '1': case '2': case '3':
239 1.1 mrg case '4': case '5': case '6':
240 1.1 mrg case '7': case '8': case '9':
241 1.1 mrg gzipflags[1] = (char)ch;
242 1.1 mrg gzipflags[2] = '\0';
243 1.1 mrg break;
244 1.12 mrg default:
245 1.12 mrg usage();
246 1.12 mrg /* NOTREACHED */
247 1.1 mrg }
248 1.1 mrg argv += optind;
249 1.1 mrg argc -= optind;
250 1.1 mrg if (dflag)
251 1.1 mrg gzipflags[0] = 'r';
252 1.1 mrg
253 1.1 mrg if (argc == 0) {
254 1.1 mrg if (dflag) /* stdin mode */
255 1.1 mrg handle_stdin();
256 1.1 mrg else /* stdout mode */
257 1.1 mrg handle_stdout();
258 1.1 mrg } else {
259 1.1 mrg do {
260 1.1 mrg handle_pathname(argv[0]);
261 1.5 mrg } while (*++argv);
262 1.1 mrg }
263 1.6 mrg if (qflag == 0 && lflag && argc > 1)
264 1.7 mrg print_list(-1, 0, "(totals)", 0);
265 1.1 mrg exit(0);
266 1.1 mrg }
267 1.1 mrg
268 1.1 mrg /* maybe print a warning */
269 1.1 mrg void
270 1.1 mrg maybe_warn(const char *fmt, ...)
271 1.1 mrg {
272 1.1 mrg va_list ap;
273 1.1 mrg
274 1.1 mrg if (qflag == 0) {
275 1.1 mrg va_start(ap, fmt);
276 1.1 mrg vwarn(fmt, ap);
277 1.1 mrg va_end(ap);
278 1.1 mrg }
279 1.1 mrg }
280 1.1 mrg
281 1.1 mrg void
282 1.1 mrg maybe_warnx(const char *fmt, ...)
283 1.1 mrg {
284 1.1 mrg va_list ap;
285 1.1 mrg
286 1.1 mrg if (qflag == 0) {
287 1.1 mrg va_start(ap, fmt);
288 1.1 mrg vwarnx(fmt, ap);
289 1.1 mrg va_end(ap);
290 1.1 mrg }
291 1.1 mrg }
292 1.1 mrg
293 1.1 mrg /* maybe print a warning */
294 1.1 mrg void
295 1.1 mrg maybe_err(int rv, const char *fmt, ...)
296 1.1 mrg {
297 1.1 mrg va_list ap;
298 1.1 mrg
299 1.1 mrg if (qflag == 0) {
300 1.1 mrg va_start(ap, fmt);
301 1.1 mrg vwarn(fmt, ap);
302 1.1 mrg va_end(ap);
303 1.1 mrg }
304 1.1 mrg exit(rv);
305 1.1 mrg }
306 1.1 mrg
307 1.9 mrg /* maybe print a warning */
308 1.9 mrg void
309 1.9 mrg maybe_errx(int rv, const char *fmt, ...)
310 1.9 mrg {
311 1.9 mrg va_list ap;
312 1.9 mrg
313 1.9 mrg if (qflag == 0) {
314 1.9 mrg va_start(ap, fmt);
315 1.9 mrg vwarnx(fmt, ap);
316 1.9 mrg va_end(ap);
317 1.9 mrg }
318 1.9 mrg exit(rv);
319 1.9 mrg }
320 1.9 mrg
321 1.1 mrg /* compress input to output then close both files */
322 1.1 mrg static void
323 1.1 mrg gz_compress(FILE *in, gzFile out)
324 1.1 mrg {
325 1.1 mrg char buf[BUFLEN];
326 1.1 mrg ssize_t len;
327 1.1 mrg int i;
328 1.1 mrg
329 1.1 mrg for (;;) {
330 1.1 mrg len = fread(buf, 1, sizeof(buf), in);
331 1.1 mrg if (ferror(in))
332 1.1 mrg maybe_err(1, "fread");
333 1.1 mrg if (len == 0)
334 1.1 mrg break;
335 1.1 mrg
336 1.1 mrg if ((ssize_t)gzwrite(out, buf, len) != len)
337 1.1 mrg maybe_err(1, gzerror(out, &i));
338 1.1 mrg }
339 1.1 mrg if (fclose(in) < 0)
340 1.1 mrg maybe_err(1, "failed fclose");
341 1.1 mrg if (gzclose(out) != Z_OK)
342 1.1 mrg maybe_err(1, "failed gzclose");
343 1.1 mrg }
344 1.1 mrg
345 1.1 mrg /* uncompress input to output then close the input */
346 1.1 mrg static off_t
347 1.1 mrg gz_uncompress(gzFile in, FILE *out)
348 1.1 mrg {
349 1.1 mrg char buf[BUFLEN];
350 1.1 mrg off_t size;
351 1.1 mrg ssize_t len;
352 1.1 mrg int i;
353 1.1 mrg
354 1.1 mrg for (size = 0;;) {
355 1.1 mrg len = gzread(in, buf, sizeof(buf));
356 1.1 mrg
357 1.1 mrg if (len < 0) {
358 1.1 mrg if (tflag) {
359 1.1 mrg print_test(infile, 0);
360 1.1 mrg return (0);
361 1.1 mrg } else
362 1.10 mrg maybe_errx(1, gzerror(in, &i));
363 1.1 mrg } else if (len == 0) {
364 1.1 mrg if (tflag)
365 1.1 mrg print_test(infile, 1);
366 1.1 mrg break;
367 1.1 mrg }
368 1.1 mrg
369 1.1 mrg size += len;
370 1.1 mrg
371 1.1 mrg /* don't write anything with -t */
372 1.1 mrg if (tflag)
373 1.1 mrg continue;
374 1.1 mrg
375 1.1 mrg if (fwrite(buf, 1, (unsigned)len, out) != (ssize_t)len)
376 1.1 mrg maybe_err(1, "failed fwrite");
377 1.1 mrg }
378 1.1 mrg if (gzclose(in) != Z_OK)
379 1.10 mrg maybe_errx(1, "failed gzclose");
380 1.1 mrg
381 1.1 mrg return (size);
382 1.1 mrg }
383 1.1 mrg
384 1.1 mrg /*
385 1.1 mrg * set the owner, mode, flags & utimes for a file
386 1.1 mrg */
387 1.1 mrg static void
388 1.1 mrg copymodes(const char *file, struct stat *sbp)
389 1.1 mrg {
390 1.1 mrg struct timeval times[2];
391 1.1 mrg
392 1.1 mrg /*
393 1.1 mrg * If we have no info on the input, give this file some
394 1.1 mrg * default values and return..
395 1.1 mrg */
396 1.1 mrg if (sbp == NULL) {
397 1.1 mrg mode_t mask = umask(022);
398 1.1 mrg
399 1.1 mrg (void)chmod(file, DEFFILEMODE & ~mask);
400 1.1 mrg (void)umask(mask);
401 1.1 mrg return;
402 1.1 mrg }
403 1.1 mrg
404 1.1 mrg /* if the chown fails, remove set-id bits as-per compress(1) */
405 1.1 mrg if (chown(file, sbp->st_uid, sbp->st_gid) < 0) {
406 1.1 mrg if (errno != EPERM)
407 1.1 mrg maybe_warn("couldn't chown: %s", file);
408 1.1 mrg sbp->st_mode &= ~(S_ISUID|S_ISGID);
409 1.1 mrg }
410 1.1 mrg
411 1.1 mrg /* we only allow set-id and the 9 normal permission bits */
412 1.1 mrg sbp->st_mode &= S_ISUID|S_ISGID|S_IRWXU|S_IRWXG|S_IRWXO;
413 1.1 mrg if (chmod(file, sbp->st_mode) < 0)
414 1.1 mrg maybe_warn("couldn't chmod: %s", file);
415 1.1 mrg
416 1.1 mrg /* only try flags if they exist already */
417 1.1 mrg if (sbp->st_flags != 0 && chflags(file, sbp->st_flags) < 0)
418 1.1 mrg maybe_warn("couldn't chflags: %s", file);
419 1.1 mrg
420 1.1 mrg TIMESPEC_TO_TIMEVAL(×[0], &sbp->st_atimespec);
421 1.1 mrg TIMESPEC_TO_TIMEVAL(×[1], &sbp->st_mtimespec);
422 1.1 mrg if (utimes(file, times) < 0)
423 1.1 mrg maybe_warn("couldn't utimes: %s", file);
424 1.1 mrg }
425 1.1 mrg
426 1.1 mrg /*
427 1.1 mrg * compress the given file: create a corresponding .gz file and remove the
428 1.1 mrg * original.
429 1.1 mrg */
430 1.1 mrg static ssize_t
431 1.1 mrg file_compress(char *file)
432 1.1 mrg {
433 1.1 mrg FILE *in;
434 1.1 mrg gzFile out;
435 1.1 mrg struct stat isb, osb;
436 1.5 mrg char outfile[MAXPATHLEN];
437 1.1 mrg ssize_t size;
438 1.1 mrg u_int32_t mtime = 0;
439 1.1 mrg
440 1.1 mrg if (cflag == 0) {
441 1.1 mrg (void)strncpy(outfile, file, MAXPATHLEN - suffix_len);
442 1.1 mrg outfile[MAXPATHLEN - suffix_len] = '\0';
443 1.10 mrg (void)strlcat(outfile, suffix, sizeof(outfile));
444 1.1 mrg
445 1.1 mrg if (fflag == 0) {
446 1.1 mrg if (stat(outfile, &osb) == 0) {
447 1.1 mrg maybe_warnx("%s already exists -- skipping",
448 1.1 mrg outfile);
449 1.1 mrg goto lose;
450 1.1 mrg }
451 1.1 mrg }
452 1.1 mrg if (stat(file, &isb) == 0) {
453 1.1 mrg if (isb.st_nlink > 1) {
454 1.1 mrg maybe_warnx("%s has %d other link%s -- "
455 1.1 mrg "skipping", file, isb.st_nlink-1,
456 1.1 mrg isb.st_nlink == 1 ? "" : "s");
457 1.1 mrg goto lose;
458 1.1 mrg }
459 1.1 mrg if (nflag == 0)
460 1.1 mrg mtime = (u_int32_t)isb.st_mtime;
461 1.1 mrg }
462 1.1 mrg }
463 1.1 mrg in = fopen(file, "r");
464 1.1 mrg if (in == 0)
465 1.1 mrg maybe_err(1, "can't fopen %s", file);
466 1.1 mrg
467 1.1 mrg if (cflag == 0) {
468 1.1 mrg #if HAVE_ZLIB_GZOPENFULL
469 1.1 mrg char *savename;
470 1.1 mrg
471 1.1 mrg if (nflag == 0)
472 1.1 mrg savename = basename(file);
473 1.1 mrg else
474 1.1 mrg savename = NULL;
475 1.1 mrg out = gzopenfull(outfile, gzipflags, savename, mtime);
476 1.1 mrg #else
477 1.1 mrg out = gzopen(outfile, gzipflags);
478 1.1 mrg #endif
479 1.1 mrg } else
480 1.1 mrg out = gzdopen(STDOUT_FILENO, gzipflags);
481 1.1 mrg
482 1.1 mrg if (out == 0)
483 1.1 mrg maybe_err(1, "can't gz%sopen %s",
484 1.1 mrg cflag ? "d" : "",
485 1.1 mrg cflag ? "stdout" : outfile);
486 1.1 mrg
487 1.1 mrg gz_compress(in, out);
488 1.1 mrg
489 1.1 mrg /*
490 1.1 mrg * if we compressed to stdout, we don't know the size and
491 1.1 mrg * we don't know the new file name, punt. if we can't stat
492 1.1 mrg * the file, whine, otherwise set the size from the stat
493 1.1 mrg * buffer. we only blow away the file if we can stat the
494 1.1 mrg * output, just in case.
495 1.1 mrg */
496 1.1 mrg if (cflag == 0) {
497 1.1 mrg if (stat(outfile, &osb) < 0) {
498 1.1 mrg maybe_warn("couldn't stat: %s", outfile);
499 1.1 mrg maybe_warnx("leaving original %s", file);
500 1.1 mrg size = 0;
501 1.1 mrg } else {
502 1.1 mrg unlink(file);
503 1.1 mrg size = osb.st_size;
504 1.1 mrg }
505 1.1 mrg newfile = outfile;
506 1.1 mrg copymodes(outfile, &isb);
507 1.1 mrg } else {
508 1.1 mrg lose:
509 1.1 mrg size = 0;
510 1.1 mrg newfile = 0;
511 1.1 mrg }
512 1.1 mrg
513 1.1 mrg return (size);
514 1.1 mrg }
515 1.1 mrg
516 1.1 mrg /* uncompress the given file and remove the original */
517 1.1 mrg static ssize_t
518 1.1 mrg file_uncompress(char *file)
519 1.1 mrg {
520 1.1 mrg struct stat isb, osb;
521 1.5 mrg char buf[PATH_MAX];
522 1.1 mrg char *outfile = buf, *s;
523 1.1 mrg FILE *out;
524 1.1 mrg gzFile in;
525 1.1 mrg off_t size;
526 1.1 mrg ssize_t len = strlen(file);
527 1.9 mrg int fd;
528 1.9 mrg unsigned char header1[10], name[PATH_MAX + 1];
529 1.10 mrg enum filetype method;
530 1.9 mrg
531 1.9 mrg /* gather the old name info */
532 1.1 mrg
533 1.9 mrg fd = open(file, O_RDONLY);
534 1.9 mrg if (fd < 0)
535 1.9 mrg maybe_err(1, "can't open %s", file);
536 1.10 mrg if (read(fd, header1, 10) != 10) {
537 1.10 mrg /* we don't want to fail here. */
538 1.10 mrg if (fflag)
539 1.10 mrg goto close_it;
540 1.9 mrg maybe_err(1, "can't read %s", file);
541 1.10 mrg }
542 1.10 mrg
543 1.10 mrg if (header1[0] == GZIP_MAGIC0 &&
544 1.10 mrg (header1[1] == GZIP_MAGIC1 || header1[1] == GZIP_OMAGIC1))
545 1.10 mrg method = FT_GZIP;
546 1.10 mrg else if (memcmp(header1, BZIP2_MAGIC, 3) == 0 &&
547 1.10 mrg header1[3] >= '0' && header1[3] <= '9') {
548 1.10 mrg if (Sflag == NULL)
549 1.10 mrg suffix = BZ2_SUFFIX;
550 1.10 mrg method = FT_BZIP2;
551 1.10 mrg } else
552 1.10 mrg method = FT_UNKNOWN;
553 1.9 mrg
554 1.10 mrg if (fflag == 0 && method == FT_UNKNOWN)
555 1.9 mrg maybe_errx(1, "%s: not in gzip format", file);
556 1.9 mrg
557 1.10 mrg if (cflag == 0 || lflag) {
558 1.10 mrg s = &file[len - suffix_len + 1];
559 1.10 mrg if (strncmp(s, suffix, suffix_len) == 0) {
560 1.10 mrg (void)strncpy(outfile, file, len - suffix_len + 1);
561 1.10 mrg outfile[len - suffix_len + 1] = '\0';
562 1.10 mrg } else if (lflag == 0)
563 1.10 mrg maybe_errx(1, "unknown suffix %s", s);
564 1.10 mrg }
565 1.10 mrg
566 1.10 mrg if (method == FT_GZIP && (Nflag || lflag)) {
567 1.9 mrg if (header1[3] & ORIG_NAME) {
568 1.9 mrg size_t rbytes;
569 1.9 mrg int i;
570 1.9 mrg
571 1.9 mrg rbytes = read(fd, name, PATH_MAX + 1);
572 1.9 mrg if (rbytes < 0)
573 1.1 mrg maybe_err(1, "can't read %s", file);
574 1.9 mrg for (i = 0; i < rbytes && name[i]; i++)
575 1.9 mrg ;
576 1.9 mrg if (i < rbytes) {
577 1.9 mrg name[i] = 0;
578 1.9 mrg /* now maybe merge old dirname */
579 1.9 mrg if (strchr(outfile, '/') == 0)
580 1.9 mrg outfile = name;
581 1.9 mrg else {
582 1.9 mrg char *dir = dirname(outfile);
583 1.9 mrg if (asprintf(&outfile, "%s/%s", dir,
584 1.9 mrg name) == -1)
585 1.9 mrg maybe_err(1, "malloc");
586 1.1 mrg }
587 1.1 mrg }
588 1.1 mrg }
589 1.9 mrg }
590 1.10 mrg close_it:
591 1.9 mrg close(fd);
592 1.1 mrg
593 1.9 mrg if ((cflag == 0 || lflag) && fflag == 0) {
594 1.9 mrg if (lflag == 0 && stat(outfile, &osb) == 0) {
595 1.9 mrg maybe_warnx("%s already exists -- skipping", outfile);
596 1.9 mrg goto lose;
597 1.9 mrg }
598 1.9 mrg if (stat(file, &isb) == 0) {
599 1.9 mrg if (isb.st_nlink > 1 && lflag == 0) {
600 1.9 mrg maybe_warnx("%s has %d other links -- skipping",
601 1.9 mrg file, isb.st_nlink - 1);
602 1.1 mrg goto lose;
603 1.1 mrg }
604 1.9 mrg } else
605 1.9 mrg goto lose;
606 1.1 mrg }
607 1.5 mrg
608 1.10 mrg if (method == FT_BZIP2) {
609 1.10 mrg int in, out;
610 1.5 mrg
611 1.10 mrg if ((in = open(file, O_RDONLY)) == -1)
612 1.10 mrg maybe_err(1, "open for read: %s", file);
613 1.10 mrg if (cflag == 1)
614 1.10 mrg out = STDOUT_FILENO;
615 1.10 mrg else
616 1.10 mrg out = open(outfile, O_WRONLY|O_CREAT|O_EXCL, 0600);
617 1.10 mrg if (out == -1)
618 1.10 mrg maybe_err(1, "open for write: %s", outfile);
619 1.5 mrg
620 1.10 mrg if ((size = unbzip2(in, out)) == 0) {
621 1.10 mrg unlink(outfile);
622 1.10 mrg goto lose;
623 1.10 mrg }
624 1.10 mrg } else {
625 1.10 mrg if (lflag) {
626 1.10 mrg int fd;
627 1.1 mrg
628 1.10 mrg if ((fd = open(file, O_RDONLY)) == -1)
629 1.10 mrg maybe_err(1, "open");
630 1.10 mrg print_list(fd, isb.st_size, outfile, isb.st_mtime);
631 1.10 mrg return 0; /* XXX */
632 1.10 mrg }
633 1.10 mrg
634 1.10 mrg in = gzopen(file, gzipflags);
635 1.10 mrg if (in == NULL)
636 1.10 mrg maybe_err(1, "can't gzopen %s", file);
637 1.10 mrg
638 1.10 mrg if (cflag == 0) {
639 1.10 mrg int fd;
640 1.10 mrg
641 1.10 mrg /* Use open(2) directly to get a safe file. */
642 1.10 mrg fd = open(outfile, O_WRONLY|O_CREAT|O_EXCL, 0600);
643 1.10 mrg if (fd < 0)
644 1.10 mrg maybe_err(1, "can't open %s", outfile);
645 1.10 mrg out = fdopen(fd, "w");
646 1.10 mrg if (out == NULL)
647 1.10 mrg maybe_err(1, "can't fdopen %s", outfile);
648 1.10 mrg } else
649 1.10 mrg out = stdout;
650 1.1 mrg
651 1.10 mrg if ((size = gz_uncompress(in, out)) == 0) {
652 1.10 mrg unlink(outfile);
653 1.10 mrg goto lose;
654 1.10 mrg }
655 1.1 mrg
656 1.10 mrg /* close the file */
657 1.10 mrg if (fclose(out))
658 1.10 mrg maybe_err(1, "failed fclose");
659 1.10 mrg }
660 1.1 mrg
661 1.1 mrg /* if testing, or we uncompressed to stdout, this is all we need */
662 1.1 mrg if (tflag || cflag)
663 1.1 mrg return (size);
664 1.1 mrg
665 1.1 mrg /*
666 1.1 mrg * if we create a file...
667 1.1 mrg */
668 1.1 mrg if (cflag == 0) {
669 1.1 mrg /*
670 1.1 mrg * if we can't stat the file, or we are uncompressing to
671 1.1 mrg * stdin, don't remove the file.
672 1.1 mrg */
673 1.1 mrg if (stat(outfile, &osb) < 0) {
674 1.1 mrg maybe_warn("couldn't stat (leaving original): %s",
675 1.1 mrg outfile);
676 1.1 mrg goto lose;
677 1.1 mrg }
678 1.1 mrg if (osb.st_size != size) {
679 1.1 mrg maybe_warn("stat gave different size: %llu != %llu "
680 1.1 mrg "(leaving original)",
681 1.1 mrg (unsigned long long)size,
682 1.1 mrg (unsigned long long)osb.st_size);
683 1.1 mrg goto lose;
684 1.1 mrg }
685 1.1 mrg newfile = outfile;
686 1.1 mrg unlink(file);
687 1.1 mrg size = osb.st_size;
688 1.1 mrg copymodes(outfile, &isb);
689 1.1 mrg }
690 1.1 mrg return (size);
691 1.1 mrg
692 1.1 mrg lose:
693 1.1 mrg newfile = 0;
694 1.1 mrg return (0);
695 1.1 mrg }
696 1.1 mrg
697 1.1 mrg static void
698 1.1 mrg handle_stdin(void)
699 1.1 mrg {
700 1.1 mrg gzFile *file;
701 1.1 mrg
702 1.5 mrg if (fflag == 0 && lflag == 0 && isatty(STDIN_FILENO)) {
703 1.1 mrg maybe_warnx("standard input is a terminal -- ignoring");
704 1.1 mrg return;
705 1.1 mrg }
706 1.5 mrg
707 1.5 mrg if (lflag) {
708 1.5 mrg struct stat isb;
709 1.5 mrg
710 1.5 mrg if (fstat(STDIN_FILENO, &isb) < 0)
711 1.5 mrg maybe_err(1, "fstat");
712 1.7 mrg print_list(STDIN_FILENO, isb.st_size, "stdout", isb.st_mtime);
713 1.5 mrg return;
714 1.5 mrg }
715 1.5 mrg
716 1.1 mrg file = gzdopen(STDIN_FILENO, gzipflags);
717 1.1 mrg if (file == NULL)
718 1.1 mrg maybe_err(1, "can't gzdopen stdin");
719 1.1 mrg gz_uncompress(file, stdout);
720 1.1 mrg }
721 1.1 mrg
722 1.1 mrg static void
723 1.1 mrg handle_stdout(void)
724 1.1 mrg {
725 1.1 mrg gzFile *file;
726 1.1 mrg
727 1.1 mrg if (fflag == 0 && isatty(STDOUT_FILENO)) {
728 1.1 mrg maybe_warnx("standard output is a terminal -- ignoring");
729 1.1 mrg return;
730 1.1 mrg }
731 1.1 mrg file = gzdopen(STDOUT_FILENO, gzipflags);
732 1.1 mrg if (file == NULL)
733 1.1 mrg maybe_err(1, "can't gzdopen stdout");
734 1.1 mrg gz_compress(stdin, file);
735 1.1 mrg }
736 1.1 mrg
737 1.1 mrg /* do what is asked for, for the path name */
738 1.1 mrg static void
739 1.1 mrg handle_pathname(char *path)
740 1.1 mrg {
741 1.1 mrg char *opath = path, *s = 0;
742 1.1 mrg ssize_t len;
743 1.1 mrg struct stat sb;
744 1.1 mrg
745 1.1 mrg /* check for stdout/stdin */
746 1.1 mrg if (path[0] == '-' && path[1] == '\0') {
747 1.1 mrg if (dflag)
748 1.1 mrg handle_stdin();
749 1.1 mrg else
750 1.1 mrg handle_stdout();
751 1.1 mrg }
752 1.1 mrg
753 1.1 mrg retry:
754 1.1 mrg if (stat(path, &sb) < 0) {
755 1.1 mrg /* lets try <path>.gz if we're decompressing */
756 1.1 mrg if (dflag && s == 0 && errno == ENOENT) {
757 1.1 mrg len = strlen(path);
758 1.1 mrg s = malloc(len + suffix_len);
759 1.1 mrg if (s == 0)
760 1.1 mrg maybe_err(1, "malloc");
761 1.1 mrg memmove(s, path, len);
762 1.10 mrg memmove(&s[len], suffix, suffix_len);
763 1.1 mrg path = s;
764 1.1 mrg goto retry;
765 1.1 mrg }
766 1.1 mrg maybe_warn("can't stat: %s", opath);
767 1.1 mrg goto out;
768 1.1 mrg }
769 1.1 mrg
770 1.1 mrg if (S_ISDIR(sb.st_mode)) {
771 1.1 mrg if (rflag)
772 1.1 mrg handle_dir(path, &sb);
773 1.1 mrg else
774 1.1 mrg maybe_warn("%s is a directory", path);
775 1.1 mrg goto out;
776 1.1 mrg }
777 1.1 mrg
778 1.1 mrg if (S_ISREG(sb.st_mode))
779 1.1 mrg handle_file(path, &sb);
780 1.1 mrg
781 1.1 mrg out:
782 1.1 mrg if (s)
783 1.1 mrg free(s);
784 1.1 mrg return;
785 1.1 mrg }
786 1.1 mrg
787 1.1 mrg /* compress/decompress a file */
788 1.1 mrg static void
789 1.1 mrg handle_file(char *file, struct stat *sbp)
790 1.1 mrg {
791 1.1 mrg ssize_t usize, gsize;
792 1.1 mrg
793 1.1 mrg infile = file;
794 1.1 mrg if (dflag) {
795 1.1 mrg usize = file_uncompress(file);
796 1.1 mrg if (usize == 0)
797 1.1 mrg return;
798 1.1 mrg gsize = sbp->st_size;
799 1.1 mrg } else {
800 1.1 mrg gsize = file_compress(file);
801 1.1 mrg if (gsize == 0)
802 1.1 mrg return;
803 1.1 mrg usize = sbp->st_size;
804 1.1 mrg }
805 1.1 mrg
806 1.1 mrg if (vflag && !tflag)
807 1.1 mrg print_verbage(file, cflag == 0 ? newfile : 0, usize, gsize);
808 1.1 mrg }
809 1.1 mrg
810 1.1 mrg /* this is used with -r to recursively decend directories */
811 1.1 mrg static void
812 1.1 mrg handle_dir(char *dir, struct stat *sbp)
813 1.1 mrg {
814 1.1 mrg char *path_argv[2];
815 1.1 mrg FTS *fts;
816 1.1 mrg FTSENT *entry;
817 1.1 mrg
818 1.1 mrg path_argv[0] = dir;
819 1.1 mrg path_argv[1] = 0;
820 1.1 mrg fts = fts_open(path_argv, FTS_PHYSICAL, NULL);
821 1.1 mrg if (fts == NULL) {
822 1.1 mrg warn("couldn't fts_open %s", dir);
823 1.1 mrg return;
824 1.1 mrg }
825 1.1 mrg
826 1.1 mrg while ((entry = fts_read(fts))) {
827 1.1 mrg switch(entry->fts_info) {
828 1.1 mrg case FTS_D:
829 1.1 mrg case FTS_DP:
830 1.1 mrg continue;
831 1.1 mrg
832 1.1 mrg case FTS_DNR:
833 1.1 mrg case FTS_ERR:
834 1.1 mrg case FTS_NS:
835 1.1 mrg maybe_warn("%s", entry->fts_path);
836 1.1 mrg continue;
837 1.1 mrg case FTS_F:
838 1.1 mrg handle_file(entry->fts_name, entry->fts_statp);
839 1.1 mrg }
840 1.1 mrg }
841 1.1 mrg (void)fts_close(fts);
842 1.1 mrg }
843 1.1 mrg
/*
 * print a ratio
 *
 * Writes "NN.N%" to `where': the saving of `out' relative to `in', in
 * tenths of a percent (1000 - 1000 * out / in).  Prints 0.0% when either
 * size is zero, and a leading `-' when `out' is larger than `in'.
 */
static void
print_ratio(off_t in, off_t out, FILE *where)
{
	long long permille = 0;
	unsigned long long mag;
	int negative;

	/* in == 0 would divide by zero (e.g. an empty input file) */
	if (out != 0 && in != 0)
		permille = 1000 - ((1000 * (long long)out) / (long long)in);

	negative = permille < 0;
	mag = negative ? (unsigned long long)-permille :
	    (unsigned long long)permille;

	/* keep the field six characters wide when there is a sign */
	fprintf(where, "%s%*llu.%1llu%%", negative ? "-" : "",
	    negative ? 2 : 3, mag / 10, mag % 10);
}
857 1.6 mrg
/*
 * print compression statistics, and the new name (if there is one!)
 *
 * Writes one line to stderr: the file name, the ratio computed from
 * `usize' (uncompressed) and `gsize' (compressed), and, when `nfile'
 * is not NULL, the name of the file that replaced it.
 */
static void
print_verbage(char *file, char *nfile, ssize_t usize, ssize_t gsize)
{
	/* short names get a second tab so the ratios line up */
	const char *pad = strlen(file) < 7 ? "\t\t" : "\t";

	fprintf(stderr, "%s:%s ", file, pad);
	print_ratio(usize, gsize, stderr);
	if (nfile != NULL)
		fprintf(stderr, " -- replaced with %s", nfile);
	fprintf(stderr, "\n");
	fflush(stderr);
}
870 1.1 mrg
/*
 * print test results
 *
 * Writes "<file>: OK" or "<file>: NOT OK" to stderr, depending on
 * whether `ok' is non-zero.
 */
static void
print_test(char *file, int ok)
{
	/* short names get a second tab so the verdicts line up */
	const char *pad = strlen(file) < 7 ? "\t\t" : "\t";
	const char *verdict = ok ? "OK" : "NOT OK";

	fprintf(stderr, "%s:%s %s\n", file, pad, verdict);
	fflush(stderr);
}
880 1.1 mrg
881 1.5 mrg /* print a file's info ala --list */
882 1.5 mrg /* eg:
883 1.5 mrg compressed uncompressed ratio uncompressed_name
884 1.5 mrg 354841 1679360 78.8% /usr/pkgsrc/distfiles/libglade-2.0.1.tar
885 1.5 mrg */
886 1.5 mrg static void
887 1.7 mrg print_list(int fd, off_t in, const char *outfile, time_t ts)
888 1.5 mrg {
889 1.5 mrg static int first = 1;
890 1.6 mrg static off_t in_tot, out_tot;
891 1.6 mrg off_t out;
892 1.7 mrg u_int32_t crc;
893 1.5 mrg int rv;
894 1.5 mrg
895 1.7 mrg if (first) {
896 1.7 mrg if (vflag)
897 1.7 mrg printf("method crc date time ");
898 1.7 mrg if (qflag == 0)
899 1.7 mrg printf(" compressed uncompressed "
900 1.7 mrg "ratio uncompressed_name\n");
901 1.7 mrg }
902 1.5 mrg first = 0;
903 1.5 mrg
904 1.6 mrg /* print totals? */
905 1.6 mrg if (fd == -1) {
906 1.6 mrg in = in_tot;
907 1.6 mrg out = out_tot;
908 1.6 mrg } else {
909 1.6 mrg /* read the last 4 bytes - this is the uncompressed size */
910 1.7 mrg rv = lseek(fd, (off_t)(-8), SEEK_END);
911 1.6 mrg if (rv != -1) {
912 1.7 mrg unsigned char buf[8];
913 1.6 mrg u_int32_t usize;
914 1.6 mrg
915 1.6 mrg if (read(fd, (char *)buf, sizeof(buf)) != sizeof(buf))
916 1.6 mrg maybe_err(1, "read of uncompressed size");
917 1.7 mrg crc = buf[0] | buf[1] << 8 | buf[2] << 16 | buf[3] << 24;
918 1.7 mrg usize = buf[4] | buf[5] << 8 | buf[6] << 16 | buf[7] << 24;
919 1.6 mrg out = (off_t)usize;
920 1.6 mrg }
921 1.6 mrg }
922 1.5 mrg
923 1.7 mrg if (vflag && fd == -1)
924 1.7 mrg printf(" ");
925 1.7 mrg else if (vflag) {
926 1.7 mrg char *date = ctime(&ts);
927 1.7 mrg
928 1.7 mrg /* skip the day, 1/100th second, and year */
929 1.7 mrg date += 4;
930 1.7 mrg date[12] = 0;
931 1.7 mrg printf("%5s %08x %11s ", "defla"/*XXX*/, crc, date);
932 1.7 mrg }
933 1.6 mrg printf("%12llu %12llu ", (unsigned long long)in, (unsigned long long)out);
934 1.6 mrg print_ratio(in, out, stdout);
935 1.6 mrg printf(" %s\n", outfile);
936 1.6 mrg in_tot += in;
937 1.6 mrg out_tot += out;
938 1.5 mrg }
939 1.5 mrg
940 1.1 mrg /* display the usage of NetBSD gzip */
941 1.1 mrg static void
942 1.1 mrg usage(void)
943 1.1 mrg {
944 1.1 mrg
945 1.1 mrg fprintf(stderr, "%s\n", gzip_version);
946 1.1 mrg fprintf(stderr,
947 1.1 mrg "Usage: %s [-cdfhnNqrStvV123456789] [<file> [<file> ...]]\n"
948 1.11 mrg #ifndef SMALL
949 1.1 mrg " -c --stdout write to stdout, keep original files\n"
950 1.1 mrg " --to-stdout\n"
951 1.1 mrg " -d --decompress uncompress files\n"
952 1.1 mrg " --uncompress\n"
953 1.1 mrg " -f --force force overwriting & compress links\n"
954 1.1 mrg " -h --help display this help\n"
955 1.1 mrg " -n --no-name don't save original file name or time stamp\n"
956 1.1 mrg " -N --name save or restore original file name and time stamp\n"
957 1.1 mrg " -q --quiet output no warnings\n"
958 1.1 mrg " -r --recursive recursively compress files in directories\n"
959 1.1 mrg " -S .suf use suffix .suf instead of .gz\n"
960 1.1 mrg " --suffix .suf\n"
961 1.1 mrg " -t --test test compressed file\n"
962 1.1 mrg " -v --verbose print extra statistics\n"
963 1.1 mrg " -V --version display program version\n"
964 1.1 mrg " -1 --fast fastest (worst) compression\n"
965 1.1 mrg " -2 .. -8 set compression level\n"
966 1.1 mrg " -9 --best best (slowest) compression\n",
967 1.11 mrg #else
968 1.11 mrg ,
969 1.11 mrg #endif
970 1.1 mrg getprogname());
971 1.1 mrg fflush(stderr);
972 1.1 mrg exit(0);
973 1.1 mrg }
974 1.1 mrg
975 1.1 mrg /* display the version of NetBSD gzip */
976 1.1 mrg static void
977 1.1 mrg display_version(void)
978 1.1 mrg {
979 1.1 mrg
980 1.1 mrg fprintf(stderr, "%s\n", gzip_version);
981 1.1 mrg fflush(stderr);
982 1.1 mrg exit(0);
983 1.1 mrg }
984 1.10 mrg
985 1.10 mrg #include "unbzip2.c"
986