Home | History | Annotate | Line # | Download | only in makemandb
apropos.c revision 1.9
      1  1.9  christos /*	$NetBSD: apropos.c,v 1.9 2013/01/14 18:04:58 christos Exp $	*/
      2  1.1     joerg /*-
      3  1.1     joerg  * Copyright (c) 2011 Abhinav Upadhyay <er.abhinav.upadhyay (at) gmail.com>
      4  1.1     joerg  * All rights reserved.
      5  1.1     joerg  *
      6  1.1     joerg  * This code was developed as part of Google's Summer of Code 2011 program.
      7  1.1     joerg  *
      8  1.1     joerg  * Redistribution and use in source and binary forms, with or without
      9  1.1     joerg  * modification, are permitted provided that the following conditions
     10  1.1     joerg  * are met:
     11  1.1     joerg  *
     12  1.1     joerg  * 1. Redistributions of source code must retain the above copyright
     13  1.1     joerg  *    notice, this list of conditions and the following disclaimer.
     14  1.1     joerg  * 2. Redistributions in binary form must reproduce the above copyright
     15  1.1     joerg  *    notice, this list of conditions and the following disclaimer in
     16  1.1     joerg  *    the documentation and/or other materials provided with the
     17  1.1     joerg  *    distribution.
     18  1.1     joerg  *
     19  1.1     joerg  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
     20  1.1     joerg  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
     21  1.1     joerg  * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
     22  1.1     joerg  * FOR A PARTICULAR PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE
     23  1.1     joerg  * COPYRIGHT HOLDERS OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
     24  1.1     joerg  * INCIDENTAL, SPECIAL, EXEMPLARY OR CONSEQUENTIAL DAMAGES (INCLUDING,
     25  1.1     joerg  * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
     26  1.1     joerg  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
     27  1.1     joerg  * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
     28  1.1     joerg  * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
     29  1.1     joerg  * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     30  1.1     joerg  * SUCH DAMAGE.
     31  1.1     joerg  */
     32  1.1     joerg 
     33  1.1     joerg #include <sys/cdefs.h>
     34  1.9  christos __RCSID("$NetBSD: apropos.c,v 1.9 2013/01/14 18:04:58 christos Exp $");
     35  1.1     joerg 
#include <err.h>
#include <errno.h>
#include <limits.h>
#include <search.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <term.h>
#include <unistd.h>
#include <util.h>
     44  1.1     joerg 
     45  1.1     joerg #include "apropos-utils.h"
     46  1.1     joerg #include "sqlite3.h"
     47  1.1     joerg 
     48  1.1     joerg typedef struct apropos_flags {
     49  1.1     joerg 	int sec_nums[SECMAX];
     50  1.1     joerg 	int nresults;
     51  1.1     joerg 	int pager;
     52  1.1     joerg 	int no_context;
     53  1.1     joerg 	const char *machine;
     54  1.1     joerg } apropos_flags;
     55  1.1     joerg 
     56  1.1     joerg typedef struct callback_data {
     57  1.1     joerg 	int count;
     58  1.1     joerg 	FILE *out;
     59  1.1     joerg 	apropos_flags *aflags;
     60  1.1     joerg } callback_data;
     61  1.1     joerg 
     62  1.1     joerg static char *remove_stopwords(const char *);
     63  1.1     joerg static int query_callback(void *, const char * , const char *, const char *,
     64  1.1     joerg 	const char *, size_t);
     65  1.1     joerg __dead static void usage(void);
     66  1.1     joerg 
     67  1.1     joerg #define _PATH_PAGER	"/usr/bin/more -s"
     68  1.1     joerg 
     69  1.9  christos static int
     70  1.9  christos term_init(int fd, const char *sa[3])
     71  1.9  christos {
     72  1.9  christos 	if (!isatty(fd))
     73  1.9  christos 		return 0;
     74  1.9  christos 
     75  1.9  christos 	TERMINAL *ti;
     76  1.9  christos 	int error;
     77  1.9  christos 	if (ti_setupterm(&ti, NULL, fd, &error) == -1)
     78  1.9  christos 		return 0;
     79  1.9  christos 
     80  1.9  christos 	const char *rmso = ti_getstr(ti, "rmso");
     81  1.9  christos 	if (rmso == NULL)
     82  1.9  christos 		goto out;
     83  1.9  christos 
     84  1.9  christos 	const char *smso = ti_getstr(ti, "smso");
     85  1.9  christos 	if (smso == NULL)
     86  1.9  christos 		goto out;
     87  1.9  christos 
     88  1.9  christos 	sa[0] = estrdup(smso);
     89  1.9  christos 	sa[1] = estrdup(rmso);
     90  1.9  christos 	sa[2] = estrdup("...");
     91  1.9  christos 	del_curterm(ti);
     92  1.9  christos 	return 1;
     93  1.9  christos out:
     94  1.9  christos 	del_curterm(ti);
     95  1.9  christos 	return 0;
     96  1.9  christos 
     97  1.9  christos }
     98  1.9  christos 
     99  1.1     joerg int
    100  1.1     joerg main(int argc, char *argv[])
    101  1.1     joerg {
    102  1.9  christos 	const char *snippet_args[3];
    103  1.1     joerg 	query_args args;
    104  1.1     joerg 	char *query = NULL;	// the user query
    105  1.1     joerg 	char *errmsg = NULL;
    106  1.1     joerg 	char *str;
    107  1.3     joerg 	int ch, rc = 0;
    108  1.5     joerg 	int s;
    109  1.1     joerg 	callback_data cbdata;
    110  1.1     joerg 	cbdata.out = stdout;		// the default output stream
    111  1.1     joerg 	cbdata.count = 0;
    112  1.1     joerg 	apropos_flags aflags;
    113  1.1     joerg 	cbdata.aflags = &aflags;
    114  1.1     joerg 	sqlite3 *db;
    115  1.1     joerg 	setprogname(argv[0]);
    116  1.1     joerg 	if (argc < 2)
    117  1.1     joerg 		usage();
    118  1.1     joerg 
    119  1.1     joerg 	memset(&aflags, 0, sizeof(aflags));
    120  1.1     joerg 
    121  1.1     joerg 	/*If the user specifies a section number as an option, the corresponding
    122  1.1     joerg 	 * index element in sec_nums is set to the string representing that
    123  1.1     joerg 	 * section number.
    124  1.1     joerg 	 */
    125  1.5     joerg 	while ((ch = getopt(argc, argv, "123456789Ccn:pS:s:")) != -1) {
    126  1.1     joerg 		switch (ch) {
    127  1.1     joerg 		case '1':
    128  1.1     joerg 		case '2':
    129  1.1     joerg 		case '3':
    130  1.1     joerg 		case '4':
    131  1.1     joerg 		case '5':
    132  1.1     joerg 		case '6':
    133  1.1     joerg 		case '7':
    134  1.1     joerg 		case '8':
    135  1.1     joerg 		case '9':
    136  1.4     joerg 			aflags.sec_nums[ch - '1'] = 1;
    137  1.1     joerg 			break;
    138  1.1     joerg 		case 'C':
    139  1.1     joerg 			aflags.no_context = 1;
    140  1.1     joerg 			break;
    141  1.1     joerg 		case 'c':
    142  1.1     joerg 			aflags.no_context = 0;
    143  1.1     joerg 			break;
    144  1.1     joerg 		case 'n':
    145  1.1     joerg 			aflags.nresults = atoi(optarg);
    146  1.1     joerg 			break;
    147  1.1     joerg 		case 'p':	//user wants to view more than 10 results and page them
    148  1.1     joerg 			aflags.pager = 1;
    149  1.1     joerg 			aflags.nresults = -1;	// Fetch all records
    150  1.1     joerg 			break;
    151  1.1     joerg 		case 'S':
    152  1.1     joerg 			aflags.machine = optarg;
    153  1.1     joerg 			break;
    154  1.5     joerg 		case 's':
    155  1.5     joerg 			s = atoi(optarg);
    156  1.5     joerg 			if (s < 1 || s > 9)
    157  1.5     joerg 				errx(EXIT_FAILURE, "Invalid section");
    158  1.5     joerg 			aflags.sec_nums[s - 1] = 1;
    159  1.5     joerg 			break;
    160  1.1     joerg 		case '?':
    161  1.1     joerg 		default:
    162  1.1     joerg 			usage();
    163  1.1     joerg 		}
    164  1.1     joerg 	}
    165  1.1     joerg 
    166  1.1     joerg 	argc -= optind;
    167  1.1     joerg 	argv += optind;
    168  1.1     joerg 
    169  1.1     joerg 	if (!argc)
    170  1.1     joerg 		usage();
    171  1.1     joerg 
    172  1.1     joerg 	str = NULL;
    173  1.1     joerg 	while (argc--)
    174  1.1     joerg 		concat(&str, *argv++);
    175  1.1     joerg 	/* Eliminate any stopwords from the query */
    176  1.1     joerg 	query = remove_stopwords(lower(str));
    177  1.1     joerg 	free(str);
    178  1.1     joerg 
    179  1.1     joerg 	/* if any error occured in remove_stopwords, exit */
    180  1.1     joerg 	if (query == NULL)
    181  1.1     joerg 		errx(EXIT_FAILURE, "Try using more relevant keywords");
    182  1.1     joerg 
    183  1.8       wiz 	if ((db = init_db(MANDB_READONLY, MANCONF)) == NULL)
    184  1.1     joerg 		exit(EXIT_FAILURE);
    185  1.1     joerg 
    186  1.1     joerg 	/* If user wants to page the output, then set some settings */
    187  1.1     joerg 	if (aflags.pager) {
    188  1.1     joerg 		const char *pager = getenv("PAGER");
    189  1.1     joerg 		if (pager == NULL)
    190  1.1     joerg 			pager = _PATH_PAGER;
    191  1.1     joerg 		/* Open a pipe to the pager */
    192  1.1     joerg 		if ((cbdata.out = popen(pager, "w")) == NULL) {
    193  1.1     joerg 			close_db(db);
    194  1.1     joerg 			err(EXIT_FAILURE, "pipe failed");
    195  1.1     joerg 		}
    196  1.1     joerg 	}
    197  1.1     joerg 
    198  1.1     joerg 	args.search_str = query;
    199  1.1     joerg 	args.sec_nums = aflags.sec_nums;
    200  1.1     joerg 	args.nrec = aflags.nresults ? aflags.nresults : 10;
    201  1.1     joerg 	args.offset = 0;
    202  1.1     joerg 	args.machine = aflags.machine;
    203  1.1     joerg 	args.callback = &query_callback;
    204  1.1     joerg 	args.callback_data = &cbdata;
    205  1.1     joerg 	args.errmsg = &errmsg;
    206  1.1     joerg 
    207  1.1     joerg 
    208  1.9  christos 	if (term_init(STDOUT_FILENO, snippet_args))
    209  1.9  christos 		rc = run_query(db, snippet_args, &args);
    210  1.9  christos 	else
    211  1.9  christos 		rc = run_query_pager(db, &args);
    212  1.9  christos 
    213  1.1     joerg 	free(query);
    214  1.1     joerg 	close_db(db);
    215  1.1     joerg 	if (errmsg) {
    216  1.1     joerg 		warnx("%s", errmsg);
    217  1.1     joerg 		free(errmsg);
    218  1.1     joerg 		exit(EXIT_FAILURE);
    219  1.1     joerg 	}
    220  1.1     joerg 
    221  1.1     joerg 	if (rc < 0) {
    222  1.1     joerg 		/* Something wrong with the database. Exit */
    223  1.1     joerg 		exit(EXIT_FAILURE);
    224  1.1     joerg 	}
    225  1.1     joerg 
    226  1.1     joerg 	if (cbdata.count == 0) {
    227  1.1     joerg 		warnx("No relevant results obtained.\n"
    228  1.5     joerg 			  "Please make sure that you spelled all the terms correctly "
    229  1.5     joerg 			  "or try using better keywords.");
    230  1.1     joerg 	}
    231  1.1     joerg 	return 0;
    232  1.1     joerg }
    233  1.1     joerg 
    234  1.1     joerg /*
    235  1.1     joerg  * query_callback --
    236  1.1     joerg  *  Callback function for run_query.
    237  1.1     joerg  *  It simply outputs the results from do_query. If the user specified the -p
    238  1.1     joerg  *  option, then the output is sent to a pager, otherwise stdout is the default
    239  1.1     joerg  *  output stream.
    240  1.1     joerg  */
    241  1.1     joerg static int
    242  1.1     joerg query_callback(void *data, const char *section, const char *name,
    243  1.1     joerg 	const char *name_desc, const char *snippet, size_t snippet_length)
    244  1.1     joerg {
    245  1.1     joerg 	callback_data *cbdata = (callback_data *) data;
    246  1.1     joerg 	FILE *out = cbdata->out;
    247  1.1     joerg 	cbdata->count++;
    248  1.6       wiz 	fprintf(out, "%s (%s)\t%s\n", name, section, name_desc);
    249  1.1     joerg 
    250  1.1     joerg 	if (cbdata->aflags->no_context == 0)
    251  1.1     joerg 		fprintf(out, "%s\n\n", snippet);
    252  1.1     joerg 
    253  1.1     joerg 	return 0;
    254  1.1     joerg }
    255  1.1     joerg 
    256  1.1     joerg #include "stopwords.c"
    257  1.1     joerg 
    258  1.1     joerg /*
    259  1.1     joerg  * remove_stopwords--
    260  1.1     joerg  *  Scans the query and removes any stop words from it.
    261  1.1     joerg  *  Returns the modified query or NULL, if it contained only stop words.
    262  1.1     joerg  */
    263  1.1     joerg 
    264  1.1     joerg static char *
    265  1.1     joerg remove_stopwords(const char *query)
    266  1.1     joerg {
    267  1.1     joerg 	size_t len, idx;
    268  1.1     joerg 	char *output, *buf;
    269  1.1     joerg 	const char *sep, *next;
    270  1.1     joerg 
    271  1.1     joerg 	output = buf = emalloc(strlen(query) + 1);
    272  1.1     joerg 
    273  1.1     joerg 	for (; query[0] != '\0'; query = next) {
    274  1.1     joerg 		sep = strchr(query, ' ');
    275  1.1     joerg 		if (sep == NULL) {
    276  1.1     joerg 			len = strlen(query);
    277  1.1     joerg 			next = query + len;
    278  1.1     joerg 		} else {
    279  1.1     joerg 			len = sep - query;
    280  1.1     joerg 			next = sep + 1;
    281  1.1     joerg 		}
    282  1.1     joerg 		if (len == 0)
    283  1.1     joerg 			continue;
    284  1.1     joerg 		idx = stopwords_hash(query, len);
    285  1.1     joerg 		if (memcmp(stopwords[idx], query, len) == 0 &&
    286  1.1     joerg 		    stopwords[idx][len] == '\0')
    287  1.1     joerg 			continue;
    288  1.1     joerg 		memcpy(buf, query, len);
    289  1.1     joerg 		buf += len;
    290  1.1     joerg 		*buf++ = ' ';
    291  1.1     joerg 	}
    292  1.1     joerg 
    293  1.1     joerg 	if (output == buf) {
    294  1.1     joerg 		free(output);
    295  1.1     joerg 		return NULL;
    296  1.1     joerg 	}
    297  1.1     joerg 	buf[-1] = '\0';
    298  1.1     joerg 	return output;
    299  1.1     joerg }
    300  1.1     joerg 
/*
 * usage --
 *	Print the usage message, including every option accepted by the
 *	getopt() call in main(), to stderr and exit with status 1.
 */
static void
usage(void)
{
	fprintf(stderr,
		"Usage: %s [-n Number of records] [-123456789Ccp] [-S machine] "
		"[-s section] query\n",
		getprogname());
	exit(1);
}
    313