Home | History | Annotate | Line # | Download | only in makemandb
apropos.c revision 1.7.2.3
      1  1.7.2.3    tls /*	$NetBSD: apropos.c,v 1.7.2.3 2013/06/23 06:29:05 tls Exp $	*/
      2      1.1  joerg /*-
      3      1.1  joerg  * Copyright (c) 2011 Abhinav Upadhyay <er.abhinav.upadhyay (at) gmail.com>
      4      1.1  joerg  * All rights reserved.
      5      1.1  joerg  *
      6      1.1  joerg  * This code was developed as part of Google's Summer of Code 2011 program.
      7      1.1  joerg  *
      8      1.1  joerg  * Redistribution and use in source and binary forms, with or without
      9      1.1  joerg  * modification, are permitted provided that the following conditions
     10      1.1  joerg  * are met:
     11      1.1  joerg  *
     12      1.1  joerg  * 1. Redistributions of source code must retain the above copyright
     13      1.1  joerg  *    notice, this list of conditions and the following disclaimer.
     14      1.1  joerg  * 2. Redistributions in binary form must reproduce the above copyright
     15      1.1  joerg  *    notice, this list of conditions and the following disclaimer in
     16      1.1  joerg  *    the documentation and/or other materials provided with the
     17      1.1  joerg  *    distribution.
     18      1.1  joerg  *
     19      1.1  joerg  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
     20      1.1  joerg  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
     21      1.1  joerg  * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
     22      1.1  joerg  * FOR A PARTICULAR PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE
     23      1.1  joerg  * COPYRIGHT HOLDERS OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
     24      1.1  joerg  * INCIDENTAL, SPECIAL, EXEMPLARY OR CONSEQUENTIAL DAMAGES (INCLUDING,
     25      1.1  joerg  * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
     26      1.1  joerg  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
     27      1.1  joerg  * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
     28      1.1  joerg  * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
     29      1.1  joerg  * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     30      1.1  joerg  * SUCH DAMAGE.
     31      1.1  joerg  */
     32      1.1  joerg 
     33      1.1  joerg #include <sys/cdefs.h>
     34  1.7.2.3    tls __RCSID("$NetBSD: apropos.c,v 1.7.2.3 2013/06/23 06:29:05 tls Exp $");
     35      1.1  joerg 
#include <err.h>
#include <errno.h>
#include <limits.h>
#include <search.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <unistd.h>
#include <util.h>
     43      1.1  joerg 
     44      1.1  joerg #include "apropos-utils.h"
     45      1.1  joerg #include "sqlite3.h"
     46      1.1  joerg 
     47      1.1  joerg typedef struct apropos_flags {
     48      1.1  joerg 	int sec_nums[SECMAX];
     49      1.1  joerg 	int nresults;
     50      1.1  joerg 	int pager;
     51      1.1  joerg 	int no_context;
     52  1.7.2.3    tls 	query_format format;
     53  1.7.2.3    tls 	int legacy;
     54      1.1  joerg 	const char *machine;
     55      1.1  joerg } apropos_flags;
     56      1.1  joerg 
     57      1.1  joerg typedef struct callback_data {
     58      1.1  joerg 	int count;
     59      1.1  joerg 	FILE *out;
     60      1.1  joerg 	apropos_flags *aflags;
     61      1.1  joerg } callback_data;
     62      1.1  joerg 
     63      1.1  joerg static char *remove_stopwords(const char *);
     64      1.1  joerg static int query_callback(void *, const char * , const char *, const char *,
     65      1.1  joerg 	const char *, size_t);
     66      1.1  joerg __dead static void usage(void);
     67      1.1  joerg 
     68      1.1  joerg #define _PATH_PAGER	"/usr/bin/more -s"
     69      1.1  joerg 
     70  1.7.2.3    tls static void
     71  1.7.2.3    tls parseargs(int argc, char **argv, struct apropos_flags *aflags)
     72      1.1  joerg {
     73  1.7.2.3    tls 	int ch;
     74  1.7.2.3    tls 	while ((ch = getopt(argc, argv, "123456789Cchiln:PprS:s:")) != -1) {
     75      1.1  joerg 		switch (ch) {
     76      1.1  joerg 		case '1':
     77      1.1  joerg 		case '2':
     78      1.1  joerg 		case '3':
     79      1.1  joerg 		case '4':
     80      1.1  joerg 		case '5':
     81      1.1  joerg 		case '6':
     82      1.1  joerg 		case '7':
     83      1.1  joerg 		case '8':
     84      1.1  joerg 		case '9':
     85  1.7.2.3    tls 			aflags->sec_nums[ch - '1'] = 1;
     86      1.1  joerg 			break;
     87      1.1  joerg 		case 'C':
     88  1.7.2.3    tls 			aflags->no_context = 1;
     89      1.1  joerg 			break;
     90      1.1  joerg 		case 'c':
     91  1.7.2.3    tls 			aflags->no_context = 0;
     92  1.7.2.3    tls 			break;
     93  1.7.2.3    tls 		case 'h':
     94  1.7.2.3    tls 			aflags->format = APROPOS_HTML;
     95  1.7.2.3    tls 			break;
     96  1.7.2.3    tls 		case 'i':
     97  1.7.2.3    tls 			aflags->format = APROPOS_TERM;
     98  1.7.2.3    tls 			break;
     99  1.7.2.3    tls 		case 'l':
    100  1.7.2.3    tls 			aflags->legacy = 1;
    101  1.7.2.3    tls 			aflags->no_context = 1;
    102  1.7.2.3    tls 			aflags->format = APROPOS_NONE;
    103      1.1  joerg 			break;
    104      1.1  joerg 		case 'n':
    105  1.7.2.3    tls 			aflags->nresults = atoi(optarg);
    106      1.1  joerg 			break;
    107  1.7.2.3    tls 		case 'p':	// user wants a pager
    108  1.7.2.3    tls 			aflags->pager = 1;
    109  1.7.2.3    tls 			/*FALLTHROUGH*/
    110  1.7.2.3    tls 		case 'P':
    111  1.7.2.3    tls 			aflags->format = APROPOS_PAGER;
    112      1.1  joerg 			break;
    113  1.7.2.2    tls 		case 'r':
    114  1.7.2.3    tls 			aflags->format = APROPOS_NONE;
    115  1.7.2.2    tls 			break;
    116      1.1  joerg 		case 'S':
    117  1.7.2.3    tls 			aflags->machine = optarg;
    118      1.1  joerg 			break;
    119      1.5  joerg 		case 's':
    120  1.7.2.3    tls 			ch = atoi(optarg);
    121  1.7.2.3    tls 			if (ch < 1 || ch > 9)
    122      1.5  joerg 				errx(EXIT_FAILURE, "Invalid section");
    123  1.7.2.3    tls 			aflags->sec_nums[ch - 1] = 1;
    124      1.5  joerg 			break;
    125      1.1  joerg 		case '?':
    126      1.1  joerg 		default:
    127      1.1  joerg 			usage();
    128      1.1  joerg 		}
    129      1.1  joerg 	}
    130  1.7.2.3    tls }
    131  1.7.2.3    tls 
    132  1.7.2.3    tls int
    133  1.7.2.3    tls main(int argc, char *argv[])
    134  1.7.2.3    tls {
    135  1.7.2.3    tls 	query_args args;
    136  1.7.2.3    tls 	char *query = NULL;	// the user query
    137  1.7.2.3    tls 	char *errmsg = NULL;
    138  1.7.2.3    tls 	char *str;
    139  1.7.2.3    tls 	int rc = 0;
    140  1.7.2.3    tls 	int s;
    141  1.7.2.3    tls 	callback_data cbdata;
    142  1.7.2.3    tls 	cbdata.out = stdout;		// the default output stream
    143  1.7.2.3    tls 	cbdata.count = 0;
    144  1.7.2.3    tls 	apropos_flags aflags;
    145  1.7.2.3    tls 	cbdata.aflags = &aflags;
    146  1.7.2.3    tls 	sqlite3 *db;
    147  1.7.2.3    tls 	setprogname(argv[0]);
    148  1.7.2.3    tls 	if (argc < 2)
    149  1.7.2.3    tls 		usage();
    150  1.7.2.3    tls 
    151  1.7.2.3    tls 	memset(&aflags, 0, sizeof(aflags));
    152  1.7.2.3    tls 
    153  1.7.2.3    tls 	if (!isatty(STDOUT_FILENO))
    154  1.7.2.3    tls 		aflags.format = APROPOS_NONE;
    155  1.7.2.3    tls 	else
    156  1.7.2.3    tls 		aflags.format = APROPOS_TERM;
    157  1.7.2.3    tls 
    158  1.7.2.3    tls 	if ((str = getenv("APROPOS")) != NULL) {
    159  1.7.2.3    tls 		char **ptr = emalloc((strlen(str) + 2) * sizeof(*ptr));
    160  1.7.2.3    tls #define WS "\t\n\r "
    161  1.7.2.3    tls 		ptr[0] = __UNCONST(getprogname());
    162  1.7.2.3    tls 		for (s = 1, str = strtok(str, WS); str;
    163  1.7.2.3    tls 		    str = strtok(NULL, WS), s++)
    164  1.7.2.3    tls 			ptr[s] = str;
    165  1.7.2.3    tls 		ptr[s] = NULL;
    166  1.7.2.3    tls 		parseargs(s, ptr, &aflags);
    167  1.7.2.3    tls 		free(ptr);
    168  1.7.2.3    tls 		optreset = 1;
    169  1.7.2.3    tls 		optind = 1;
    170  1.7.2.3    tls 	}
    171  1.7.2.3    tls 
    172  1.7.2.3    tls 	parseargs(argc, argv, &aflags);
    173  1.7.2.3    tls 
    174  1.7.2.3    tls 	/*
    175  1.7.2.3    tls 	 * If the user specifies a section number as an option, the
    176  1.7.2.3    tls 	 * corresponding index element in sec_nums is set to the string
    177  1.7.2.3    tls 	 * representing that section number.
    178  1.7.2.3    tls 	 */
    179  1.7.2.2    tls 
    180      1.1  joerg 	argc -= optind;
    181      1.1  joerg 	argv += optind;
    182  1.7.2.2    tls 
    183      1.1  joerg 	if (!argc)
    184      1.1  joerg 		usage();
    185      1.1  joerg 
    186      1.1  joerg 	str = NULL;
    187      1.1  joerg 	while (argc--)
    188      1.1  joerg 		concat(&str, *argv++);
    189      1.1  joerg 	/* Eliminate any stopwords from the query */
    190      1.1  joerg 	query = remove_stopwords(lower(str));
    191      1.1  joerg 	free(str);
    192      1.1  joerg 
    193      1.1  joerg 	/* if any error occured in remove_stopwords, exit */
    194      1.1  joerg 	if (query == NULL)
    195      1.1  joerg 		errx(EXIT_FAILURE, "Try using more relevant keywords");
    196      1.1  joerg 
    197  1.7.2.1    tls 	if ((db = init_db(MANDB_READONLY, MANCONF)) == NULL)
    198      1.1  joerg 		exit(EXIT_FAILURE);
    199      1.1  joerg 
    200      1.1  joerg 	/* If user wants to page the output, then set some settings */
    201      1.1  joerg 	if (aflags.pager) {
    202      1.1  joerg 		const char *pager = getenv("PAGER");
    203      1.1  joerg 		if (pager == NULL)
    204      1.1  joerg 			pager = _PATH_PAGER;
    205      1.1  joerg 		/* Open a pipe to the pager */
    206      1.1  joerg 		if ((cbdata.out = popen(pager, "w")) == NULL) {
    207      1.1  joerg 			close_db(db);
    208      1.1  joerg 			err(EXIT_FAILURE, "pipe failed");
    209      1.1  joerg 		}
    210      1.1  joerg 	}
    211      1.1  joerg 
    212      1.1  joerg 	args.search_str = query;
    213      1.1  joerg 	args.sec_nums = aflags.sec_nums;
    214  1.7.2.3    tls 	args.legacy = aflags.legacy;
    215  1.7.2.3    tls 	args.nrec = aflags.nresults ? aflags.nresults : -1;
    216      1.1  joerg 	args.offset = 0;
    217      1.1  joerg 	args.machine = aflags.machine;
    218      1.1  joerg 	args.callback = &query_callback;
    219      1.1  joerg 	args.callback_data = &cbdata;
    220      1.1  joerg 	args.errmsg = &errmsg;
    221      1.1  joerg 
    222  1.7.2.3    tls 	if (aflags.format == APROPOS_HTML) {
    223  1.7.2.3    tls 		fprintf(cbdata.out, "<html>\n<header>\n<title>apropos results "
    224  1.7.2.3    tls 		    "for %s</title></header>\n<body>\n<table cellpadding=\"4\""
    225  1.7.2.3    tls 		    "style=\"border: 1px solid #000000; border-collapse:"
    226  1.7.2.3    tls 		    "collapse;\" border=\"1\">\n", query);
    227  1.7.2.3    tls 	}
    228  1.7.2.3    tls 	rc = run_query(db, aflags.format, &args);
    229  1.7.2.3    tls 	if (aflags.format == APROPOS_HTML)
    230  1.7.2.3    tls 		fprintf(cbdata.out, "</table>\n</body>\n</html>\n");
    231      1.1  joerg 
    232      1.1  joerg 	free(query);
    233      1.1  joerg 	close_db(db);
    234      1.1  joerg 	if (errmsg) {
    235      1.1  joerg 		warnx("%s", errmsg);
    236      1.1  joerg 		free(errmsg);
    237      1.1  joerg 		exit(EXIT_FAILURE);
    238      1.1  joerg 	}
    239      1.1  joerg 
    240      1.1  joerg 	if (rc < 0) {
    241      1.1  joerg 		/* Something wrong with the database. Exit */
    242      1.1  joerg 		exit(EXIT_FAILURE);
    243      1.1  joerg 	}
    244  1.7.2.2    tls 
    245      1.1  joerg 	if (cbdata.count == 0) {
    246      1.1  joerg 		warnx("No relevant results obtained.\n"
    247  1.7.2.3    tls 		    "Please make sure that you spelled all the terms correctly "
    248  1.7.2.3    tls 		    "or try using better keywords.");
    249      1.1  joerg 	}
    250      1.1  joerg 	return 0;
    251      1.1  joerg }
    252      1.1  joerg 
    253      1.1  joerg /*
    254      1.1  joerg  * query_callback --
    255      1.1  joerg  *  Callback function for run_query.
    256      1.1  joerg  *  It simply outputs the results from do_query. If the user specified the -p
    257      1.1  joerg  *  option, then the output is sent to a pager, otherwise stdout is the default
    258      1.1  joerg  *  output stream.
    259      1.1  joerg  */
    260      1.1  joerg static int
    261      1.1  joerg query_callback(void *data, const char *section, const char *name,
    262      1.1  joerg 	const char *name_desc, const char *snippet, size_t snippet_length)
    263      1.1  joerg {
    264      1.1  joerg 	callback_data *cbdata = (callback_data *) data;
    265      1.1  joerg 	FILE *out = cbdata->out;
    266      1.1  joerg 	cbdata->count++;
    267  1.7.2.3    tls 	if (cbdata->aflags->format != APROPOS_HTML) {
    268  1.7.2.3    tls 	    fprintf(out, cbdata->aflags->legacy ? "%s(%s) - %s\n" :
    269  1.7.2.3    tls 		"%s (%s)\t%s\n", name, section, name_desc);
    270  1.7.2.3    tls 	    if (cbdata->aflags->no_context == 0)
    271  1.7.2.3    tls 		    fprintf(out, "%s\n\n", snippet);
    272  1.7.2.3    tls 	} else {
    273  1.7.2.3    tls 	    fprintf(out, "<tr><td>%s(%s)</td><td>%s</td></tr>\n", name,
    274  1.7.2.3    tls 		section, name_desc);
    275  1.7.2.3    tls 	    if (cbdata->aflags->no_context == 0)
    276  1.7.2.3    tls 		    fprintf(out, "<tr><td colspan=2>%s</td></tr>\n", snippet);
    277  1.7.2.3    tls 	}
    278      1.1  joerg 
    279      1.1  joerg 	return 0;
    280      1.1  joerg }
    281      1.1  joerg 
    282      1.1  joerg #include "stopwords.c"
    283      1.1  joerg 
    284      1.1  joerg /*
    285      1.1  joerg  * remove_stopwords--
    286      1.1  joerg  *  Scans the query and removes any stop words from it.
    287      1.1  joerg  *  Returns the modified query or NULL, if it contained only stop words.
    288      1.1  joerg  */
    289      1.1  joerg 
    290      1.1  joerg static char *
    291      1.1  joerg remove_stopwords(const char *query)
    292      1.1  joerg {
    293      1.1  joerg 	size_t len, idx;
    294      1.1  joerg 	char *output, *buf;
    295      1.1  joerg 	const char *sep, *next;
    296      1.1  joerg 
    297      1.1  joerg 	output = buf = emalloc(strlen(query) + 1);
    298      1.1  joerg 
    299      1.1  joerg 	for (; query[0] != '\0'; query = next) {
    300      1.1  joerg 		sep = strchr(query, ' ');
    301      1.1  joerg 		if (sep == NULL) {
    302      1.1  joerg 			len = strlen(query);
    303      1.1  joerg 			next = query + len;
    304      1.1  joerg 		} else {
    305      1.1  joerg 			len = sep - query;
    306      1.1  joerg 			next = sep + 1;
    307      1.1  joerg 		}
    308      1.1  joerg 		if (len == 0)
    309      1.1  joerg 			continue;
    310      1.1  joerg 		idx = stopwords_hash(query, len);
    311      1.1  joerg 		if (memcmp(stopwords[idx], query, len) == 0 &&
    312      1.1  joerg 		    stopwords[idx][len] == '\0')
    313      1.1  joerg 			continue;
    314      1.1  joerg 		memcpy(buf, query, len);
    315      1.1  joerg 		buf += len;
    316      1.1  joerg 		*buf++ = ' ';
    317      1.1  joerg 	}
    318      1.1  joerg 
    319      1.1  joerg 	if (output == buf) {
    320      1.1  joerg 		free(output);
    321      1.1  joerg 		return NULL;
    322      1.1  joerg 	}
    323      1.1  joerg 	buf[-1] = '\0';
    324      1.1  joerg 	return output;
    325      1.1  joerg }
    326      1.1  joerg 
/*
 * usage --
 *	Print the usage message to stderr and exit with a failure status.
 *	The option list mirrors the option string parseargs() passes to
 *	getopt(3), including -h and -P.
 */
static void
usage(void)
{
	fprintf(stderr, "Usage: %s [-123456789CchilPpr] [-n results] "
	    "[-S machine] [-s section] query\n",
	    getprogname());
	exit(EXIT_FAILURE);
}
    339