Home | History | Annotate | Line # | Download | only in mkindex
mkindex.c revision 1.1
      1  1.1  jtc /*-
      2  1.1  jtc  * Copyright (c) 1993
      3  1.1  jtc  *	The Regents of the University of California.  All rights reserved.
      4  1.1  jtc  *
      5  1.1  jtc  * This code is derived from software contributed to Berkeley by
      6  1.1  jtc  * Barry Brachman.
      7  1.1  jtc  *
      8  1.1  jtc  * Redistribution and use in source and binary forms, with or without
      9  1.1  jtc  * modification, are permitted provided that the following conditions
     10  1.1  jtc  * are met:
     11  1.1  jtc  * 1. Redistributions of source code must retain the above copyright
     12  1.1  jtc  *    notice, this list of conditions and the following disclaimer.
     13  1.1  jtc  * 2. Redistributions in binary form must reproduce the above copyright
     14  1.1  jtc  *    notice, this list of conditions and the following disclaimer in the
     15  1.1  jtc  *    documentation and/or other materials provided with the distribution.
     16  1.1  jtc  * 3. All advertising materials mentioning features or use of this software
     17  1.1  jtc  *    must display the following acknowledgement:
     18  1.1  jtc  *	This product includes software developed by the University of
     19  1.1  jtc  *	California, Berkeley and its contributors.
     20  1.1  jtc  * 4. Neither the name of the University nor the names of its contributors
     21  1.1  jtc  *    may be used to endorse or promote products derived from this software
     22  1.1  jtc  *    without specific prior written permission.
     23  1.1  jtc  *
     24  1.1  jtc  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     25  1.1  jtc  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     26  1.1  jtc  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     27  1.1  jtc  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     28  1.1  jtc  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     29  1.1  jtc  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     30  1.1  jtc  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     31  1.1  jtc  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     32  1.1  jtc  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     33  1.1  jtc  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     34  1.1  jtc  * SUCH DAMAGE.
     35  1.1  jtc  */
     36  1.1  jtc 
     37  1.1  jtc #ifndef lint
     38  1.1  jtc static char copyright[] =
     39  1.1  jtc "@(#) Copyright (c) 1993\n\
     40  1.1  jtc 	The Regents of the University of California.  All rights reserved.\n";
     41  1.1  jtc #endif /* not lint */
     42  1.1  jtc 
     43  1.1  jtc #ifndef lint
     44  1.1  jtc static char sccsid[] = "@(#)mkindex.c	8.1 (Berkeley) 6/11/93";
     45  1.1  jtc #endif /* not lint */
     46  1.1  jtc 
     47  1.1  jtc #include <stdio.h>
     48  1.1  jtc 
     49  1.1  jtc #include "bog.h"
     50  1.1  jtc 
     51  1.1  jtc char *nextword __P((FILE *, char *, int *, int *));
     52  1.1  jtc 
     53  1.1  jtc int
     54  1.1  jtc main(argc, argv)
     55  1.1  jtc 	int argc;
     56  1.1  jtc 	char *argv[];
     57  1.1  jtc {
     58  1.1  jtc 	int clen, rlen, prev;
     59  1.1  jtc 	long off, start;
     60  1.1  jtc 	char buf[MAXWORDLEN + 1];
     61  1.1  jtc 
     62  1.1  jtc 	prev = '\0';
     63  1.1  jtc 	off = start = 0L;
     64  1.1  jtc 	while (nextword(stdin, buf, &clen, &rlen) != NULL) {
     65  1.1  jtc 		if (*buf != prev) {
     66  1.1  jtc 			if (prev != '\0')
     67  1.1  jtc 				printf("%c %6ld %6ld\n", prev, start, off - 1);
     68  1.1  jtc 			prev = *buf;
     69  1.1  jtc 			start = off;
     70  1.1  jtc 		}
     71  1.1  jtc 		off += clen + 1;
     72  1.1  jtc 	}
     73  1.1  jtc 	printf("%c %6ld %6ld\n", prev, start, off - 1);
     74  1.1  jtc 	exit(0);
     75  1.1  jtc }
     76  1.1  jtc 
/*
 * Return the next word of the compressed dictionary read from 'fp', or
 * NULL on end-of-file.
 *
 * Each entry in the stream is one count byte followed by a run of bytes
 * >= 'a'.  The count says how many leading characters of the previous
 * word are kept; the run is appended to them.  The byte that ends a run
 * is the count byte of the following entry, so it is remembered between
 * calls.
 *
 * The decoded word is copied to 'buffer' with every 'q' expanded to
 * "qu".  At most MAXWORDLEN characters plus the terminating NUL are
 * stored, so 'buffer' must provide at least MAXWORDLEN + 1 bytes.
 *
 * On return *clen holds the number of suffix bytes consumed from the
 * stream for this entry (for mkindex) and *rlen holds the length of the
 * decoded word before the 'q' expansion.
 *
 * State is kept in static storage, so only a single stream can be
 * decoded per process.
 *
 * Malformed input is contained rather than trusted: a count larger than
 * the previous word is reduced to that word's length, and suffix bytes
 * that do not fit in MAXWORDLEN characters are consumed but dropped.
 */
char *
nextword(fp, buffer, clen, rlen)
	FILE *fp;
	char *buffer;
	int *clen, *rlen;
{
	static char word[MAXWORDLEN + 1];	/* previous word, 'q' unexpanded */
	static int wordlen = 0;			/* strlen(word) */
	static int first = 1;
	static int lastch = 0;
	int ch, pcount, nsuffix, outlen;
	char *p, *q;

	if (first) {
		if ((pcount = getc(fp)) == EOF)
			return (NULL);
		first = 0;
	} else if ((pcount = lastch) == EOF)
		return (NULL);

	/* Never keep more of the previous word than actually exists. */
	if (pcount > wordlen)
		pcount = wordlen;

	p = word + pcount;
	nsuffix = 0;
	while ((ch = getc(fp)) != EOF && ch >= 'a') {
		if (p < word + MAXWORDLEN)
			*p++ = ch;
		nsuffix++;	/* counted even when dropped: it was consumed */
	}
	lastch = ch;		/* count byte of the next entry, or EOF */
	*p = '\0';
	wordlen = (int)(p - word);

	*rlen = wordlen;
	*clen = nsuffix;

	/* Copy out, expanding 'q' to "qu" without exceeding MAXWORDLEN. */
	q = buffer;
	outlen = 0;
	for (p = word; *p != '\0' && outlen < MAXWORDLEN; p++) {
		*q++ = *p;
		outlen++;
		if (*p == 'q' && outlen < MAXWORDLEN) {
			*q++ = 'u';
			outlen++;
		}
	}
	*q = '\0';
	return (buffer);
}
    121