savecore.c revision 1.18 1 /*-
2 * Copyright (c) 1986, 1992, 1993
3 * The Regents of the University of California. All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions
7 * are met:
8 * 1. Redistributions of source code must retain the above copyright
9 * notice, this list of conditions and the following disclaimer.
10 * 2. Redistributions in binary form must reproduce the above copyright
11 * notice, this list of conditions and the following disclaimer in the
12 * documentation and/or other materials provided with the distribution.
13 * 3. All advertising materials mentioning features or use of this software
14 * must display the following acknowledgement:
15 * This product includes software developed by the University of
16 * California, Berkeley and its contributors.
17 * 4. Neither the name of the University nor the names of its contributors
18 * may be used to endorse or promote products derived from this software
19 * without specific prior written permission.
20 *
21 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
22 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
23 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
24 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
25 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
26 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
27 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
28 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
29 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
30 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
31 * SUCH DAMAGE.
32 */
33
34 #ifndef lint
35 static char copyright[] =
36 "@(#) Copyright (c) 1986, 1992, 1993\n\
37 The Regents of the University of California. All rights reserved.\n";
38 #endif /* not lint */
39
40 #ifndef lint
41 /*static char sccsid[] = "from: @(#)savecore.c 8.3 (Berkeley) 1/2/94";*/
42 static char *rcsid = "$Id: savecore.c,v 1.18 1994/10/31 04:37:32 cgd Exp $";
43 #endif /* not lint */
44
45 #include <sys/param.h>
46 #include <sys/stat.h>
47 #include <sys/mount.h>
48 #include <sys/syslog.h>
49 #include <sys/time.h>
50
51 #include <dirent.h>
52 #include <errno.h>
53 #include <fcntl.h>
54 #include <nlist.h>
55 #include <paths.h>
56 #include <stdio.h>
57 #include <stdlib.h>
58 #include <string.h>
59 #include <tzfile.h>
60 #include <unistd.h>
61
62 extern FILE *zopen __P((const char *fname, const char *mode, int bits));
63
64 #define ok(number) ((number) - KERNBASE)
65
66 struct nlist current_nl[] = { /* Namelist for currently running system. */
67 #define X_DUMPDEV 0
68 { "_dumpdev" },
69 #define X_DUMPLO 1
70 { "_dumplo" },
71 #define X_TIME 2
72 { "_time" },
73 #define X_DUMPSIZE 3
74 { "_dumpsize" },
75 #define X_VERSION 4
76 { "_version" },
77 #define X_PANICSTR 5
78 { "_panicstr" },
79 #define X_DUMPMAG 6
80 { "_dumpmag" },
81 { "" },
82 };
83 int cursyms[] = { X_DUMPDEV, X_DUMPLO, X_VERSION, X_DUMPMAG, -1 };
84 int dumpsyms[] = { X_TIME, X_DUMPSIZE, X_VERSION, X_PANICSTR, X_DUMPMAG, -1 };
85
86 struct nlist dump_nl[] = { /* Name list for dumped system. */
87 { "_dumpdev" }, /* Entries MUST be the same as */
88 { "_dumplo" }, /* those in current_nl[]. */
89 { "_time" },
90 { "_dumpsize" },
91 { "_version" },
92 { "_panicstr" },
93 { "_dumpmag" },
94 { "" },
95 };
96
97 /* Types match kernel declarations. */
98 long dumplo; /* where dump starts on dumpdev */
99 int dumpmag; /* magic number in dump */
100 int dumpsize; /* amount of memory dumped */
101
102 char *kernel;
103 char *dirname; /* directory to save dumps in */
104 char *ddname; /* name of dump device */
105 dev_t dumpdev; /* dump device */
106 int dumpfd; /* read/write descriptor on block dev */
107 time_t now; /* current date */
108 char panic_mesg[1024];
109 int panicstr;
110 char vers[1024];
111
112 int clear, compress, force, verbose; /* flags */
113
114 void check_kmem __P((void));
115 int check_space __P((void));
116 void clear_dump __P((void));
117 int Create __P((char *, int));
118 int dump_exists __P((void));
119 char *find_dev __P((dev_t, int));
120 int get_crashtime __P((void));
121 void kmem_setup __P((void));
122 void log __P((int, char *, ...));
123 void Lseek __P((int, off_t, int));
124 int Open __P((char *, int rw));
125 int Read __P((int, void *, int));
126 char *rawname __P((char *s));
127 void save_core __P((void));
128 void usage __P((void));
129 void Write __P((int, void *, int));
130
131 int
132 main(argc, argv)
133 int argc;
134 char *argv[];
135 {
136 int ch;
137
138 openlog("savecore", LOG_PERROR, LOG_DAEMON);
139
140 while ((ch = getopt(argc, argv, "cdfNvz")) != EOF)
141 switch(ch) {
142 case 'c':
143 clear = 1;
144 break;
145 case 'd': /* Not documented. */
146 case 'v':
147 verbose = 1;
148 break;
149 case 'f':
150 force = 1;
151 break;
152 case 'N':
153 kernel = optarg;
154 break;
155 case 'z':
156 compress = 1;
157 break;
158 case '?':
159 default:
160 usage();
161 }
162 argc -= optind;
163 argv += optind;
164
165 if (!clear) {
166 if (argc != 1 && argc != 2)
167 usage();
168 dirname = argv[0];
169 }
170 if (argc == 2)
171 kernel = argv[1];
172
173 (void)time(&now);
174 kmem_setup();
175
176 if (clear) {
177 clear_dump();
178 exit(0);
179 }
180
181 if (!dump_exists() && !force)
182 exit(1);
183
184 check_kmem();
185
186 if (panicstr)
187 syslog(LOG_ALERT, "reboot after panic: %s", panic_mesg);
188 else
189 syslog(LOG_ALERT, "reboot");
190
191 if ((!get_crashtime() || !check_space()) && !force)
192 exit(1);
193
194 save_core();
195
196 clear_dump();
197 exit(0);
198 }
199
200 void
201 kmem_setup()
202 {
203 FILE *fp;
204 int kmem, i;
205 char *dump_sys;
206
207 /*
208 * Some names we need for the currently running system, others for
209 * the system that was running when the dump was made. The values
210 * obtained from the current system are used to look for things in
211 * /dev/kmem that cannot be found in the dump_sys namelist, but are
212 * presumed to be the same (since the disk partitions are probably
213 * the same!)
214 */
215 if ((nlist(_PATH_UNIX, current_nl)) == -1)
216 syslog(LOG_ERR, "%s: nlist: %s", _PATH_UNIX, strerror(errno));
217 for (i = 0; cursyms[i] != -1; i++)
218 if (current_nl[cursyms[i]].n_value == 0) {
219 syslog(LOG_ERR, "%s: %s not in namelist",
220 _PATH_UNIX, current_nl[cursyms[i]].n_name);
221 exit(1);
222 }
223
224 dump_sys = kernel ? kernel : _PATH_UNIX;
225 if ((nlist(dump_sys, dump_nl)) == -1)
226 syslog(LOG_ERR, "%s: nlist: %s", dump_sys, strerror(errno));
227 for (i = 0; dumpsyms[i] != -1; i++)
228 if (dump_nl[dumpsyms[i]].n_value == 0) {
229 syslog(LOG_ERR, "%s: %s not in namelist",
230 dump_sys, dump_nl[dumpsyms[i]].n_name);
231 exit(1);
232 }
233
234 kmem = Open(_PATH_KMEM, O_RDONLY);
235 Lseek(kmem, (off_t)current_nl[X_DUMPDEV].n_value, L_SET);
236 (void)Read(kmem, &dumpdev, sizeof(dumpdev));
237 if (dumpdev == NODEV) {
238 syslog(LOG_WARNING, "no core dump (no dumpdev)");
239 exit(1);
240 }
241 Lseek(kmem, (off_t)current_nl[X_DUMPLO].n_value, L_SET);
242 (void)Read(kmem, &dumplo, sizeof(dumplo));
243 if (verbose)
244 (void)printf("dumplo = %d (%d * %d)\n",
245 dumplo, dumplo/DEV_BSIZE, DEV_BSIZE);
246 Lseek(kmem, (off_t)current_nl[X_DUMPMAG].n_value, L_SET);
247 (void)Read(kmem, &dumpmag, sizeof(dumpmag));
248 dumplo *= DEV_BSIZE;
249 ddname = find_dev(dumpdev, S_IFBLK);
250 dumpfd = Open(ddname, O_RDWR);
251 fp = fdopen(kmem, "r");
252 if (fp == NULL) {
253 syslog(LOG_ERR, "%s: fdopen: %m", _PATH_KMEM);
254 exit(1);
255 }
256 if (kernel)
257 return;
258 (void)fseek(fp, (off_t)current_nl[X_VERSION].n_value, L_SET);
259 (void)fgets(vers, sizeof(vers), fp);
260
261 /* Don't fclose(fp), we use dumpfd later. */
262 }
263
264 void
265 check_kmem()
266 {
267 register char *cp;
268 FILE *fp;
269 char core_vers[1024];
270
271 fp = fdopen(dumpfd, "r");
272 if (fp == NULL) {
273 syslog(LOG_ERR, "%s: fdopen: %m", ddname);
274 exit(1);
275 }
276 fseek(fp, (off_t)(dumplo + ok(dump_nl[X_VERSION].n_value)), L_SET);
277 fgets(core_vers, sizeof(core_vers), fp);
278 if (strcmp(vers, core_vers) && kernel == 0)
279 syslog(LOG_WARNING,
280 "warning: %s version mismatch:\n\t%s\nand\t%s\n",
281 _PATH_UNIX, vers, core_vers);
282 (void)fseek(fp,
283 (off_t)(dumplo + ok(dump_nl[X_PANICSTR].n_value)), L_SET);
284 (void)fread(&panicstr, sizeof(panicstr), 1, fp);
285 if (panicstr) {
286 (void)fseek(fp, dumplo + ok(panicstr), L_SET);
287 cp = panic_mesg;
288 do
289 *cp = getc(fp);
290 while (*cp++ && cp < &panic_mesg[sizeof(panic_mesg)]);
291 }
292 /* Don't fclose(fp), we use dumpfd later. */
293 }
294
295 void
296 clear_dump()
297 {
298 long newdumplo;
299
300 newdumplo = 0;
301 Lseek(dumpfd, (off_t)(dumplo + ok(dump_nl[X_DUMPMAG].n_value)), L_SET);
302 Write(dumpfd, &newdumplo, sizeof(newdumplo));
303 }
304
305 int
306 dump_exists()
307 {
308 int newdumpmag;
309
310 Lseek(dumpfd, (off_t)(dumplo + ok(dump_nl[X_DUMPMAG].n_value)), L_SET);
311 (void)Read(dumpfd, &newdumpmag, sizeof(newdumpmag));
312 if (newdumpmag != dumpmag) {
313 if (verbose)
314 syslog(LOG_WARNING, "magic number mismatch (%x != %x)",
315 newdumpmag, dumpmag);
316 syslog(LOG_WARNING, "no core dump");
317 return (0);
318 }
319 return (1);
320 }
321
322 char buf[1024 * 1024];
323
324 FILE *zopen __P((char *, char *, int));
325
326 void
327 save_core()
328 {
329 register FILE *fp;
330 register int bounds, ifd, nr, nw, ofd;
331 char *rawp, path[MAXPATHLEN];
332
333 /*
334 * Get the current number and update the bounds file. Do the update
335 * now, because may fail later and don't want to overwrite anything.
336 */
337 (void)snprintf(path, sizeof(path), "%s/bounds", dirname);
338 if ((fp = fopen(path, "r")) == NULL)
339 goto err1;
340 if (fgets(buf, sizeof(buf), fp) == NULL) {
341 if (ferror(fp))
342 err1: syslog(LOG_WARNING, "%s: %s", path, strerror(errno));
343 bounds = 0;
344 } else
345 bounds = atoi(buf);
346 if (fp != NULL)
347 (void)fclose(fp);
348 if ((fp = fopen(path, "w")) == NULL)
349 syslog(LOG_ERR, "%s: %m", path);
350 else {
351 (void)fprintf(fp, "%d\n", bounds + 1);
352 (void)fclose(fp);
353 }
354 (void)fclose(fp);
355
356 /* Create the core file. */
357 (void)snprintf(path, sizeof(path), "%s/netbsd.%d%s.core",
358 dirname, bounds, compress ? ".Z" : "");
359 if (compress) {
360 if ((fp = zopen(path, "w", 0)) == NULL) {
361 syslog(LOG_ERR, "%s: %s", path, strerror(errno));
362 exit(1);
363 }
364 } else
365 ofd = Create(path, S_IRUSR | S_IWUSR | S_IRGRP | S_IROTH);
366
367 /* Open the raw device. */
368 rawp = rawname(ddname);
369 if ((ifd = open(rawp, O_RDONLY)) == -1) {
370 syslog(LOG_WARNING, "%s: %m; using block device", rawp);
371 ifd = dumpfd;
372 }
373
374 /* Read the dump size. */
375 Lseek(dumpfd, (off_t)(dumplo + ok(dump_nl[X_DUMPSIZE].n_value)), L_SET);
376 (void)Read(dumpfd, &dumpsize, sizeof(dumpsize));
377
378 /* Seek to the start of the core. */
379 Lseek(ifd, (off_t)dumplo, L_SET);
380
381 /* Copy the core file. */
382 dumpsize *= getpagesize();
383 syslog(LOG_NOTICE, "writing %score to %s",
384 compress ? "compressed " : "", path);
385 for (; dumpsize > 0; dumpsize -= nr) {
386 (void)printf("%6dK\r", dumpsize / 1024);
387 (void)fflush(stdout);
388 nr = read(ifd, buf, MIN(dumpsize, sizeof(buf)));
389 if (nr <= 0) {
390 if (nr == 0)
391 syslog(LOG_WARNING,
392 "WARNING: EOF on dump device");
393 else
394 syslog(LOG_ERR, "%s: %m", rawp);
395 goto err2;
396 }
397 if (compress)
398 nw = fwrite(buf, 1, nr, fp);
399 else
400 nw = write(ofd, buf, nr);
401 if (nw != nr) {
402 syslog(LOG_ERR, "%s: %s",
403 path, strerror(nw == 0 ? EIO : errno));
404 err2: syslog(LOG_WARNING,
405 "WARNING: core may be incomplete");
406 (void)printf("\n");
407 exit(1);
408 }
409 }
410 (void)printf("\n");
411 (void)close(ifd);
412 if (compress)
413 (void)fclose(fp);
414 else
415 (void)close(ofd);
416
417 /* Copy the kernel. */
418 ifd = Open(kernel ? kernel : _PATH_UNIX, O_RDONLY);
419 (void)snprintf(path, sizeof(path), "%s/netbsd.%d%s",
420 dirname, bounds, compress ? ".Z" : "");
421 if (compress) {
422 if ((fp = zopen(path, "w", 0)) == NULL) {
423 syslog(LOG_ERR, "%s: %s", path, strerror(errno));
424 exit(1);
425 }
426 } else
427 ofd = Create(path, S_IRUSR | S_IWUSR | S_IRGRP | S_IROTH);
428 syslog(LOG_NOTICE, "writing %skernel to %s",
429 compress ? "compressed " : "", path);
430 while ((nr = read(ifd, buf, sizeof(buf))) > 0) {
431 if (compress)
432 nw = fwrite(buf, 1, nr, fp);
433 else
434 nw = write(ofd, buf, nr);
435 if (nw != nr) {
436 syslog(LOG_ERR, "%s: %s",
437 path, strerror(nw == 0 ? EIO : errno));
438 syslog(LOG_WARNING,
439 "WARNING: kernel may be incomplete");
440 exit(1);
441 }
442 }
443 if (nr < 0) {
444 syslog(LOG_ERR, "%s: %s",
445 kernel ? kernel : _PATH_UNIX, strerror(errno));
446 syslog(LOG_WARNING,
447 "WARNING: kernel may be incomplete");
448 exit(1);
449 }
450 if (compress)
451 (void)fclose(fp);
452 else
453 (void)close(ofd);
454 }
455
456 char *
457 find_dev(dev, type)
458 register dev_t dev;
459 register int type;
460 {
461 register DIR *dfd;
462 struct dirent *dir;
463 struct stat sb;
464 char *dp, devname[MAXPATHLEN + 1];
465
466 if ((dfd = opendir(_PATH_DEV)) == NULL) {
467 syslog(LOG_ERR, "%s: %s", _PATH_DEV, strerror(errno));
468 exit(1);
469 }
470 (void)strcpy(devname, _PATH_DEV);
471 while ((dir = readdir(dfd))) {
472 (void)strcpy(devname + sizeof(_PATH_DEV) - 1, dir->d_name);
473 if (lstat(devname, &sb)) {
474 syslog(LOG_ERR, "%s: %s", devname, strerror(errno));
475 continue;
476 }
477 if ((sb.st_mode & S_IFMT) != type)
478 continue;
479 if (dev == sb.st_rdev) {
480 closedir(dfd);
481 if ((dp = strdup(devname)) == NULL) {
482 syslog(LOG_ERR, "%s", strerror(errno));
483 exit(1);
484 }
485 return (dp);
486 }
487 }
488 closedir(dfd);
489 syslog(LOG_ERR, "can't find device %d/%d", major(dev), minor(dev));
490 exit(1);
491 }
492
493 char *
494 rawname(s)
495 char *s;
496 {
497 char *sl, name[MAXPATHLEN];
498
499 if ((sl = strrchr(s, '/')) == NULL || sl[1] == '0') {
500 syslog(LOG_ERR,
501 "can't make raw dump device name from %s", s);
502 return (s);
503 }
504 (void)snprintf(name, sizeof(name), "%.*s/r%s", sl - s, s, sl + 1);
505 if ((sl = strdup(name)) == NULL) {
506 syslog(LOG_ERR, "%s", strerror(errno));
507 exit(1);
508 }
509 return (sl);
510 }
511
512 int
513 get_crashtime()
514 {
515 time_t dumptime; /* Time the dump was taken. */
516
517 Lseek(dumpfd, (off_t)(dumplo + ok(dump_nl[X_TIME].n_value)), L_SET);
518 (void)Read(dumpfd, &dumptime, sizeof(dumptime));
519 if (dumptime == 0) {
520 if (verbose)
521 syslog(LOG_ERR, "dump time is zero");
522 return (0);
523 }
524 (void)printf("savecore: system went down at %s", ctime(&dumptime));
525 #define LEEWAY (7 * SECSPERDAY)
526 if (dumptime < now - LEEWAY || dumptime > now + LEEWAY) {
527 (void)printf("dump time is unreasonable\n");
528 return (0);
529 }
530 return (1);
531 }
532
533 int
534 check_space()
535 {
536 register FILE *fp;
537 char *tkernel;
538 off_t minfree, spacefree, kernelsize, needed;
539 struct stat st;
540 struct statfs fsbuf;
541 char buf[100], path[MAXPATHLEN];
542
543 tkernel = kernel ? kernel : _PATH_UNIX;
544 if (stat(tkernel, &st) < 0) {
545 syslog(LOG_ERR, "%s: %m", tkernel);
546 exit(1);
547 }
548 kernelsize = st.st_blocks * S_BLKSIZE;
549 if (statfs(dirname, &fsbuf) < 0) {
550 syslog(LOG_ERR, "%s: %m", dirname);
551 exit(1);
552 }
553 spacefree = (fsbuf.f_bavail * fsbuf.f_bsize) / 1024;
554
555 (void)snprintf(path, sizeof(path), "%s/minfree", dirname);
556 if ((fp = fopen(path, "r")) == NULL)
557 minfree = 0;
558 else {
559 if (fgets(buf, sizeof(buf), fp) == NULL)
560 minfree = 0;
561 else
562 minfree = atoi(buf);
563 (void)fclose(fp);
564 }
565
566 needed = (dumpsize + kernelsize) / 1024;
567 if (minfree > 0 && spacefree - needed < minfree) {
568 syslog(LOG_WARNING,
569 "no dump, not enough free space on device");
570 return (0);
571 }
572 if (spacefree - needed < minfree)
573 syslog(LOG_WARNING,
574 "dump performed, but free space threshold crossed");
575 return (1);
576 }
577
578 int
579 Open(name, rw)
580 char *name;
581 int rw;
582 {
583 int fd;
584
585 if ((fd = open(name, rw, 0)) < 0) {
586 syslog(LOG_ERR, "%s: %m", name);
587 exit(1);
588 }
589 return (fd);
590 }
591
592 int
593 Read(fd, bp, size)
594 int fd, size;
595 void *bp;
596 {
597 int nr;
598
599 nr = read(fd, bp, size);
600 if (nr != size) {
601 syslog(LOG_ERR, "read: %m");
602 exit(1);
603 }
604 return (nr);
605 }
606
607 void
608 Lseek(fd, off, flag)
609 int fd, flag;
610 off_t off;
611 {
612 off_t ret;
613
614 ret = lseek(fd, off, flag);
615 if (ret == -1) {
616 syslog(LOG_ERR, "lseek: %m");
617 exit(1);
618 }
619 }
620
621 int
622 Create(file, mode)
623 char *file;
624 int mode;
625 {
626 register int fd;
627
628 fd = open(file, O_WRONLY | O_CREAT | O_TRUNC, mode);
629 if (fd < 0) {
630 syslog(LOG_ERR, "%s: %m", file);
631 exit(1);
632 }
633 return (fd);
634 }
635
636 void
637 Write(fd, bp, size)
638 int fd, size;
639 void *bp;
640 {
641 int n;
642
643 if ((n = write(fd, bp, size)) < size) {
644 syslog(LOG_ERR, "write: %s", strerror(n == -1 ? errno : EIO));
645 exit(1);
646 }
647 }
648
649 void
650 usage()
651 {
652 (void)syslog(LOG_ERR, "usage: savecore [-cfvz] [-N system] directory");
653 exit(1);
654 }
655