file.c revision 1.1.1.2 1 1.1.1.2 cjep /* $NetBSD: file.c,v 1.1.1.2 2004/01/02 15:00:27 cjep Exp $ */
2 1.1.1.2 cjep
3 1.1 cjep /*-
4 1.1 cjep * Copyright (c) 1999 James Howard and Dag-Erling Codan Smrgrav
5 1.1 cjep * All rights reserved.
6 1.1 cjep *
7 1.1 cjep * Redistribution and use in source and binary forms, with or without
8 1.1 cjep * modification, are permitted provided that the following conditions
9 1.1 cjep * are met:
10 1.1 cjep * 1. Redistributions of source code must retain the above copyright
11 1.1 cjep * notice, this list of conditions and the following disclaimer.
12 1.1 cjep * 2. Redistributions in binary form must reproduce the above copyright
13 1.1 cjep * notice, this list of conditions and the following disclaimer in the
14 1.1 cjep * documentation and/or other materials provided with the distribution.
15 1.1 cjep *
16 1.1 cjep * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
17 1.1 cjep * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18 1.1 cjep * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19 1.1 cjep * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
20 1.1 cjep * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
21 1.1 cjep * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
22 1.1 cjep * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
23 1.1 cjep * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
24 1.1 cjep * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
25 1.1 cjep * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26 1.1 cjep * SUCH DAMAGE.
27 1.1 cjep *
28 1.1 cjep */
29 1.1 cjep
30 1.1.1.2 cjep #include <sys/cdefs.h>
31 1.1.1.2 cjep #ifndef lint
32 1.1.1.2 cjep __RCSID("$NetBSD: file.c,v 1.1.1.2 2004/01/02 15:00:27 cjep Exp $");
33 1.1.1.2 cjep #endif /* not lint */
34 1.1.1.2 cjep
35 1.1 cjep #include <sys/param.h>
36 1.1 cjep
37 1.1 cjep #include <err.h>
38 1.1 cjep #include <stdio.h>
39 1.1 cjep #include <stdlib.h>
40 1.1 cjep #include <zlib.h>
41 1.1 cjep
42 1.1 cjep #include "grep.h"
43 1.1 cjep
44 1.1.1.2 cjep static char fname[MAXPATHLEN];
45 1.1.1.2 cjep static char *lnbuf;
46 1.1.1.2 cjep static int lnbuflen;
47 1.1 cjep
48 1.1 cjep #define FILE_STDIO 0
49 1.1 cjep #define FILE_MMAP 1
50 1.1 cjep #define FILE_GZIP 2
51 1.1 cjep
52 1.1 cjep struct file {
53 1.1.1.2 cjep int type;
54 1.1.1.2 cjep FILE *f;
55 1.1.1.2 cjep mmf_t *mmf;
56 1.1.1.2 cjep gzFile *gzf;
57 1.1 cjep };
58 1.1 cjep
59 1.1 cjep static char *
60 1.1.1.2 cjep grepfgetln(FILE *f, size_t *len)
61 1.1.1.2 cjep {
62 1.1.1.2 cjep size_t n;
63 1.1.1.2 cjep int c;
64 1.1.1.2 cjep
65 1.1.1.2 cjep for (n = 0; ; ++n) {
66 1.1.1.2 cjep c = getc(f);
67 1.1.1.2 cjep if (c == EOF) {
68 1.1.1.2 cjep if (feof(f))
69 1.1.1.2 cjep break;
70 1.1.1.2 cjep err(2, "%s", fname);
71 1.1.1.2 cjep /* ERROR */
72 1.1.1.2 cjep
73 1.1.1.2 cjep }
74 1.1.1.2 cjep if (c == line_endchar)
75 1.1.1.2 cjep break;
76 1.1.1.2 cjep if (n >= lnbuflen) {
77 1.1.1.2 cjep lnbuflen *= 2;
78 1.1.1.2 cjep lnbuf = grep_realloc(lnbuf, ++lnbuflen);
79 1.1.1.2 cjep }
80 1.1.1.2 cjep lnbuf[n] = c;
81 1.1.1.2 cjep }
82 1.1.1.2 cjep if (feof(f) && n == 0)
83 1.1.1.2 cjep return NULL;
84 1.1.1.2 cjep *len = n;
85 1.1.1.2 cjep return lnbuf;
86 1.1.1.2 cjep }
87 1.1.1.2 cjep
88 1.1.1.2 cjep static char *
89 1.1 cjep gzfgetln(gzFile *f, size_t *len)
90 1.1 cjep {
91 1.1.1.2 cjep size_t n;
92 1.1.1.2 cjep int c;
93 1.1 cjep
94 1.1 cjep for (n = 0; ; ++n) {
95 1.1 cjep c = gzgetc(f);
96 1.1 cjep if (c == -1) {
97 1.1 cjep const char *gzerrstr;
98 1.1 cjep int gzerr;
99 1.1 cjep
100 1.1 cjep if (gzeof(f))
101 1.1 cjep break;
102 1.1.1.2 cjep
103 1.1 cjep gzerrstr = gzerror(f, &gzerr);
104 1.1 cjep if (gzerr == Z_ERRNO)
105 1.1.1.2 cjep err(2, "%s", fname);
106 1.1 cjep else
107 1.1.1.2 cjep errx(2, "%s: %s", fname, gzerrstr);
108 1.1 cjep }
109 1.1.1.2 cjep if (c == line_endchar)
110 1.1 cjep break;
111 1.1 cjep if (n >= lnbuflen) {
112 1.1 cjep lnbuflen *= 2;
113 1.1 cjep lnbuf = grep_realloc(lnbuf, ++lnbuflen);
114 1.1 cjep }
115 1.1 cjep lnbuf[n] = c;
116 1.1 cjep }
117 1.1 cjep
118 1.1 cjep if (gzeof(f) && n == 0)
119 1.1 cjep return NULL;
120 1.1 cjep *len = n;
121 1.1 cjep return lnbuf;
122 1.1 cjep }
123 1.1 cjep
124 1.1 cjep file_t *
125 1.1 cjep grep_fdopen(int fd, char *mode)
126 1.1 cjep {
127 1.1 cjep file_t *f;
128 1.1 cjep
129 1.1 cjep if (fd == 0)
130 1.1 cjep sprintf(fname, "(standard input)");
131 1.1 cjep else
132 1.1 cjep sprintf(fname, "(fd %d)", fd);
133 1.1.1.2 cjep
134 1.1 cjep f = grep_malloc(sizeof *f);
135 1.1.1.2 cjep
136 1.1.1.2 cjep if (zgrep) {
137 1.1 cjep f->type = FILE_GZIP;
138 1.1 cjep if ((f->gzf = gzdopen(fd, mode)) != NULL)
139 1.1 cjep return f;
140 1.1 cjep } else {
141 1.1 cjep f->type = FILE_STDIO;
142 1.1 cjep if ((f->f = fdopen(fd, mode)) != NULL)
143 1.1 cjep return f;
144 1.1 cjep }
145 1.1.1.2 cjep
146 1.1 cjep free(f);
147 1.1 cjep return NULL;
148 1.1 cjep }
149 1.1 cjep
150 1.1 cjep file_t *
151 1.1 cjep grep_open(char *path, char *mode)
152 1.1 cjep {
153 1.1 cjep file_t *f;
154 1.1 cjep
155 1.1 cjep snprintf(fname, MAXPATHLEN, "%s", path);
156 1.1.1.2 cjep
157 1.1 cjep f = grep_malloc(sizeof *f);
158 1.1.1.2 cjep
159 1.1.1.2 cjep if (zgrep) {
160 1.1 cjep f->type = FILE_GZIP;
161 1.1 cjep if ((f->gzf = gzopen(fname, mode)) != NULL)
162 1.1 cjep return f;
163 1.1 cjep } else {
164 1.1 cjep /* try mmap first; if it fails, try stdio */
165 1.1 cjep if ((f->mmf = mmopen(fname, mode)) != NULL) {
166 1.1 cjep f->type = FILE_MMAP;
167 1.1 cjep return f;
168 1.1 cjep }
169 1.1 cjep f->type = FILE_STDIO;
170 1.1 cjep if ((f->f = fopen(path, mode)) != NULL)
171 1.1 cjep return f;
172 1.1 cjep }
173 1.1.1.2 cjep
174 1.1 cjep free(f);
175 1.1 cjep return NULL;
176 1.1 cjep }
177 1.1 cjep
178 1.1 cjep int
179 1.1 cjep grep_bin_file(file_t *f)
180 1.1 cjep {
181 1.1 cjep switch (f->type) {
182 1.1 cjep case FILE_STDIO:
183 1.1 cjep return bin_file(f->f);
184 1.1 cjep case FILE_MMAP:
185 1.1.1.2 cjep return mmbin_file(f->mmf);
186 1.1 cjep case FILE_GZIP:
187 1.1 cjep return gzbin_file(f->gzf);
188 1.1 cjep default:
189 1.1 cjep /* can't happen */
190 1.1.1.2 cjep errx(2, "invalid file type");
191 1.1 cjep }
192 1.1 cjep }
193 1.1 cjep
194 1.1 cjep char *
195 1.1 cjep grep_fgetln(file_t *f, size_t *l)
196 1.1 cjep {
197 1.1 cjep switch (f->type) {
198 1.1 cjep case FILE_STDIO:
199 1.1.1.2 cjep if (line_endchar == '\n')
200 1.1.1.2 cjep return fgetln(f->f, l);
201 1.1.1.2 cjep else
202 1.1.1.2 cjep return grepfgetln(f->f, l);
203 1.1 cjep case FILE_MMAP:
204 1.1 cjep return mmfgetln(f->mmf, l);
205 1.1 cjep case FILE_GZIP:
206 1.1 cjep return gzfgetln(f->gzf, l);
207 1.1 cjep default:
208 1.1 cjep /* can't happen */
209 1.1.1.2 cjep errx(2, "invalid file type");
210 1.1 cjep }
211 1.1 cjep }
212 1.1 cjep
213 1.1 cjep void
214 1.1 cjep grep_close(file_t *f)
215 1.1 cjep {
216 1.1 cjep switch (f->type) {
217 1.1 cjep case FILE_STDIO:
218 1.1 cjep fclose(f->f);
219 1.1 cjep break;
220 1.1 cjep case FILE_MMAP:
221 1.1 cjep mmclose(f->mmf);
222 1.1 cjep break;
223 1.1 cjep case FILE_GZIP:
224 1.1 cjep gzclose(f->gzf);
225 1.1 cjep break;
226 1.1 cjep default:
227 1.1 cjep /* can't happen */
228 1.1.1.2 cjep errx(2, "invalid file type");
229 1.1 cjep }
230 1.1 cjep }
231