mkindex.c revision 1.4       1  1.4  hubertf /*	$NetBSD: mkindex.c,v 1.4 1998/09/11 13:16:05 hubertf Exp $	*/
      2  1.2      cgd 
      3  1.1      jtc /*-
      4  1.1      jtc  * Copyright (c) 1993
      5  1.1      jtc  *	The Regents of the University of California.  All rights reserved.
      6  1.1      jtc  *
      7  1.1      jtc  * This code is derived from software contributed to Berkeley by
      8  1.1      jtc  * Barry Brachman.
      9  1.1      jtc  *
     10  1.1      jtc  * Redistribution and use in source and binary forms, with or without
     11  1.1      jtc  * modification, are permitted provided that the following conditions
     12  1.1      jtc  * are met:
     13  1.1      jtc  * 1. Redistributions of source code must retain the above copyright
     14  1.1      jtc  *    notice, this list of conditions and the following disclaimer.
     15  1.1      jtc  * 2. Redistributions in binary form must reproduce the above copyright
     16  1.1      jtc  *    notice, this list of conditions and the following disclaimer in the
     17  1.1      jtc  *    documentation and/or other materials provided with the distribution.
     18  1.1      jtc  * 3. All advertising materials mentioning features or use of this software
     19  1.1      jtc  *    must display the following acknowledgement:
     20  1.1      jtc  *	This product includes software developed by the University of
     21  1.1      jtc  *	California, Berkeley and its contributors.
     22  1.1      jtc  * 4. Neither the name of the University nor the names of its contributors
     23  1.1      jtc  *    may be used to endorse or promote products derived from this software
     24  1.1      jtc  *    without specific prior written permission.
     25  1.1      jtc  *
     26  1.1      jtc  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     27  1.1      jtc  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     28  1.1      jtc  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     29  1.1      jtc  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     30  1.1      jtc  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     31  1.1      jtc  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     32  1.1      jtc  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     33  1.1      jtc  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     34  1.1      jtc  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     35  1.1      jtc  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     36  1.1      jtc  * SUCH DAMAGE.
     37  1.1      jtc  */
     38  1.1      jtc 
/*
 * Copyright and version identification strings.  Both are left out
 * entirely when "lint" is defined.
 */
#ifndef lint
static char copyright[] =
	"@(#) Copyright (c) 1993\n"
	"\tThe Regents of the University of California.  All rights reserved.\n";

/* The SCCS identifier is compiled out; only the RCS identifier is built. */
#if 0
static char sccsid[] = "@(#)mkindex.c	8.1 (Berkeley) 6/11/93";
#else
static char rcsid[] = "$NetBSD: mkindex.c,v 1.4 1998/09/11 13:16:05 hubertf Exp $";
#endif
#endif /* not lint */
     52  1.1      jtc 
     53  1.1      jtc #include <stdio.h>
     54  1.1      jtc 
     55  1.1      jtc #include "bog.h"
     56  1.1      jtc 
     57  1.1      jtc char *nextword __P((FILE *, char *, int *, int *));
     58  1.1      jtc 
     59  1.1      jtc int
     60  1.4  hubertf main(void)
     61  1.1      jtc {
     62  1.1      jtc 	int clen, rlen, prev;
     63  1.1      jtc 	long off, start;
     64  1.1      jtc 	char buf[MAXWORDLEN + 1];
     65  1.1      jtc 
     66  1.1      jtc 	prev = '\0';
     67  1.1      jtc 	off = start = 0L;
     68  1.1      jtc 	while (nextword(stdin, buf, &clen, &rlen) != NULL) {
     69  1.1      jtc 		if (*buf != prev) {
     70  1.1      jtc 			if (prev != '\0')
     71  1.1      jtc 				printf("%c %6ld %6ld\n", prev, start, off - 1);
     72  1.1      jtc 			prev = *buf;
     73  1.1      jtc 			start = off;
     74  1.1      jtc 		}
     75  1.1      jtc 		off += clen + 1;
     76  1.1      jtc 	}
     77  1.1      jtc 	printf("%c %6ld %6ld\n", prev, start, off - 1);
     78  1.1      jtc 	exit(0);
     79  1.1      jtc }
     80  1.1      jtc 
     81  1.1      jtc /*
     82  1.1      jtc  * Return the next word in the compressed dictionary in 'buffer' or
     83  1.1      jtc  * NULL on end-of-file
     84  1.1      jtc  * Also set clen to the length of the compressed word (for mkindex) and
     85  1.1      jtc  * rlen to the strlen() of the real word
     86  1.1      jtc  */
     87  1.1      jtc char *
     88  1.1      jtc nextword(fp, buffer, clen, rlen)
     89  1.1      jtc 	FILE *fp;
     90  1.1      jtc 	char *buffer;
     91  1.1      jtc 	int *clen, *rlen;
     92  1.1      jtc {
     93  1.3    lukem 	int ch, pcount;
     94  1.3    lukem 	char *p, *q;
     95  1.1      jtc 	static char buf[MAXWORDLEN + 1];
     96  1.1      jtc 	static int first = 1;
     97  1.1      jtc 	static int lastch = 0;
     98  1.1      jtc 
     99  1.1      jtc    	if (first) {
    100  1.1      jtc 		if ((pcount = getc(fp)) == EOF)
    101  1.1      jtc 			return (NULL);
    102  1.1      jtc 		first = 0;
    103  1.1      jtc 	}
    104  1.1      jtc 	else if ((pcount = lastch) == EOF)
    105  1.1      jtc 		return (NULL);
    106  1.1      jtc 
    107  1.1      jtc 	p = buf + (*clen = pcount);
    108  1.1      jtc 
    109  1.1      jtc 	while ((ch = getc(fp)) != EOF && ch >= 'a')
    110  1.1      jtc 			*p++ = ch;
    111  1.1      jtc 		lastch = ch;
    112  1.1      jtc 	*p = '\0';
    113  1.1      jtc 
    114  1.1      jtc 	*rlen = (int) (p - buf);
    115  1.1      jtc 	*clen = *rlen - *clen;
    116  1.1      jtc 
    117  1.1      jtc 	p = buf;
    118  1.1      jtc 	q = buffer;
    119  1.1      jtc 	while ((*q++ = *p) != '\0') {
    120  1.1      jtc 		if (*p++ == 'q')
    121  1.1      jtc 			*q++ = 'u';
    122  1.1      jtc 	}
    123  1.1      jtc 	return (buffer);
    124  1.1      jtc }
    125