keyword-gen.c revision 1.4 1 1.4 christos /* $NetBSD: keyword-gen.c,v 1.4 2013/12/28 03:20:14 christos Exp $ */
2 1.1 kardel
3 1.1 kardel /*
4 1.1 kardel * keyword-gen.c -- generate keyword scanner finite state machine and
5 1.1 kardel * keyword_text array.
6 1.4 christos *
7 1.4 christos * This program is run to generate ntp_keyword.h
8 1.4 christos * After making a change here, two output files should be committed at
9 1.4 christos * the same time as keyword-gen.c:
10 1.4 christos * ntp_keyword.h
11 1.4 christos * keyword-gen-utd
12 1.4 christos *
13 1.4 christos * keyword-gen-utd is a sentinel used by Makefile.am to avoid compiling
14 1.4 christos * keyword_gen.c and generating ntp_keyword.h if the input keyword-gen.c
15 1.4 christos * has not changed. This is not solely an optimization, it also breaks
16 1.4 christos * a dependency chain that otherwise would cause programs to be compiled
17 1.4 christos * when running "make dist" or "make distdir". We want these to package
18 1.4 christos * the existing source without building anything but a tarball. See
19 1.4 christos * [Bug 1470].
20 1.1 kardel */
21 1.1 kardel #include <config.h>
22 1.1 kardel #include <stdio.h>
23 1.1 kardel #include <stdlib.h>
24 1.1 kardel #include <time.h>
25 1.1 kardel
26 1.1 kardel #include <ntp_stdlib.h>
27 1.1 kardel #include <ntp_config.h>
28 1.1 kardel #include <lib_strbuf.h>
29 1.1 kardel #include "ntp_scanner.h"
30 1.1 kardel #include "ntp_parser.h"
31 1.1 kardel
32 1.1 kardel
33 1.1 kardel /* Define a structure to hold a (keyword, token) pair */
34 1.1 kardel struct key_tok {
35 1.1 kardel char * key; /* Keyword */
36 1.4 christos u_short token; /* Associated Token */
37 1.1 kardel follby followedby; /* nonzero indicates the next token(s)
38 1.1 kardel forced to be string(s) */
39 1.1 kardel };
40 1.1 kardel
41 1.1 kardel struct key_tok ntp_keywords[] = {
42 1.3 kardel { "...", T_Ellipsis, FOLLBY_TOKEN },
43 1.4 christos { "allpeers", T_Allpeers, FOLLBY_TOKEN },
44 1.1 kardel { "automax", T_Automax, FOLLBY_TOKEN },
45 1.1 kardel { "broadcast", T_Broadcast, FOLLBY_STRING },
46 1.1 kardel { "broadcastclient", T_Broadcastclient, FOLLBY_TOKEN },
47 1.1 kardel { "broadcastdelay", T_Broadcastdelay, FOLLBY_TOKEN },
48 1.4 christos { "ctl", T_Ctl, FOLLBY_TOKEN },
49 1.1 kardel { "disable", T_Disable, FOLLBY_TOKEN },
50 1.1 kardel { "driftfile", T_Driftfile, FOLLBY_STRING },
51 1.1 kardel { "enable", T_Enable, FOLLBY_TOKEN },
52 1.1 kardel { "end", T_End, FOLLBY_TOKEN },
53 1.1 kardel { "filegen", T_Filegen, FOLLBY_TOKEN },
54 1.1 kardel { "fudge", T_Fudge, FOLLBY_STRING },
55 1.4 christos { "io", T_Io, FOLLBY_TOKEN },
56 1.1 kardel { "includefile", T_Includefile, FOLLBY_STRING },
57 1.1 kardel { "leapfile", T_Leapfile, FOLLBY_STRING },
58 1.1 kardel { "logconfig", T_Logconfig, FOLLBY_STRINGS_TO_EOC },
59 1.1 kardel { "logfile", T_Logfile, FOLLBY_STRING },
60 1.1 kardel { "manycastclient", T_Manycastclient, FOLLBY_STRING },
61 1.1 kardel { "manycastserver", T_Manycastserver, FOLLBY_STRINGS_TO_EOC },
62 1.4 christos { "mem", T_Mem, FOLLBY_TOKEN },
63 1.1 kardel { "multicastclient", T_Multicastclient, FOLLBY_STRINGS_TO_EOC },
64 1.1 kardel { "peer", T_Peer, FOLLBY_STRING },
65 1.1 kardel { "phone", T_Phone, FOLLBY_STRINGS_TO_EOC },
66 1.1 kardel { "pidfile", T_Pidfile, FOLLBY_STRING },
67 1.1 kardel { "pool", T_Pool, FOLLBY_STRING },
68 1.1 kardel { "discard", T_Discard, FOLLBY_TOKEN },
69 1.4 christos { "reset", T_Reset, FOLLBY_TOKEN },
70 1.1 kardel { "restrict", T_Restrict, FOLLBY_TOKEN },
71 1.4 christos { "rlimit", T_Rlimit, FOLLBY_TOKEN },
72 1.1 kardel { "server", T_Server, FOLLBY_STRING },
73 1.1 kardel { "setvar", T_Setvar, FOLLBY_STRING },
74 1.1 kardel { "statistics", T_Statistics, FOLLBY_TOKEN },
75 1.1 kardel { "statsdir", T_Statsdir, FOLLBY_STRING },
76 1.4 christos { "sys", T_Sys, FOLLBY_TOKEN },
77 1.1 kardel { "tick", T_Tick, FOLLBY_TOKEN },
78 1.4 christos { "timer", T_Timer, FOLLBY_TOKEN },
79 1.1 kardel { "tinker", T_Tinker, FOLLBY_TOKEN },
80 1.1 kardel { "tos", T_Tos, FOLLBY_TOKEN },
81 1.1 kardel { "trap", T_Trap, FOLLBY_STRING },
82 1.1 kardel { "unconfig", T_Unconfig, FOLLBY_STRING },
83 1.1 kardel { "unpeer", T_Unpeer, FOLLBY_STRING },
84 1.1 kardel /* authentication_command */
85 1.1 kardel { "controlkey", T_ControlKey, FOLLBY_TOKEN },
86 1.1 kardel { "crypto", T_Crypto, FOLLBY_TOKEN },
87 1.1 kardel { "keys", T_Keys, FOLLBY_STRING },
88 1.1 kardel { "keysdir", T_Keysdir, FOLLBY_STRING },
89 1.1 kardel { "ntpsigndsocket", T_NtpSignDsocket, FOLLBY_STRING },
90 1.1 kardel { "requestkey", T_Requestkey, FOLLBY_TOKEN },
91 1.1 kardel { "revoke", T_Revoke, FOLLBY_TOKEN },
92 1.1 kardel { "trustedkey", T_Trustedkey, FOLLBY_TOKEN },
93 1.1 kardel /* IPv4/IPv6 protocol override flag */
94 1.1 kardel { "-4", T_Ipv4_flag, FOLLBY_TOKEN },
95 1.1 kardel { "-6", T_Ipv6_flag, FOLLBY_TOKEN },
96 1.1 kardel /* option */
97 1.1 kardel { "autokey", T_Autokey, FOLLBY_TOKEN },
98 1.1 kardel { "burst", T_Burst, FOLLBY_TOKEN },
99 1.1 kardel { "iburst", T_Iburst, FOLLBY_TOKEN },
100 1.1 kardel { "key", T_Key, FOLLBY_TOKEN },
101 1.1 kardel { "maxpoll", T_Maxpoll, FOLLBY_TOKEN },
102 1.2 christos { "mdnstries", T_Mdnstries, FOLLBY_TOKEN },
103 1.1 kardel { "minpoll", T_Minpoll, FOLLBY_TOKEN },
104 1.1 kardel { "mode", T_Mode, FOLLBY_TOKEN },
105 1.1 kardel { "noselect", T_Noselect, FOLLBY_TOKEN },
106 1.1 kardel { "preempt", T_Preempt, FOLLBY_TOKEN },
107 1.1 kardel { "true", T_True, FOLLBY_TOKEN },
108 1.1 kardel { "prefer", T_Prefer, FOLLBY_TOKEN },
109 1.1 kardel { "ttl", T_Ttl, FOLLBY_TOKEN },
110 1.1 kardel { "version", T_Version, FOLLBY_TOKEN },
111 1.1 kardel { "xleave", T_Xleave, FOLLBY_TOKEN },
112 1.1 kardel /* crypto_command */
113 1.1 kardel { "host", T_Host, FOLLBY_STRING },
114 1.1 kardel { "ident", T_Ident, FOLLBY_STRING },
115 1.1 kardel { "pw", T_Pw, FOLLBY_STRING },
116 1.1 kardel { "randfile", T_Randfile, FOLLBY_STRING },
117 1.1 kardel { "digest", T_Digest, FOLLBY_STRING },
118 1.1 kardel /*** MONITORING COMMANDS ***/
119 1.1 kardel /* stat */
120 1.1 kardel { "clockstats", T_Clockstats, FOLLBY_TOKEN },
121 1.1 kardel { "cryptostats", T_Cryptostats, FOLLBY_TOKEN },
122 1.1 kardel { "loopstats", T_Loopstats, FOLLBY_TOKEN },
123 1.1 kardel { "peerstats", T_Peerstats, FOLLBY_TOKEN },
124 1.1 kardel { "rawstats", T_Rawstats, FOLLBY_TOKEN },
125 1.1 kardel { "sysstats", T_Sysstats, FOLLBY_TOKEN },
126 1.1 kardel { "protostats", T_Protostats, FOLLBY_TOKEN },
127 1.1 kardel { "timingstats", T_Timingstats, FOLLBY_TOKEN },
128 1.1 kardel /* filegen_option */
129 1.1 kardel { "file", T_File, FOLLBY_STRING },
130 1.1 kardel { "link", T_Link, FOLLBY_TOKEN },
131 1.1 kardel { "nolink", T_Nolink, FOLLBY_TOKEN },
132 1.1 kardel { "type", T_Type, FOLLBY_TOKEN },
133 1.1 kardel /* filegen_type */
134 1.1 kardel { "age", T_Age, FOLLBY_TOKEN },
135 1.1 kardel { "day", T_Day, FOLLBY_TOKEN },
136 1.1 kardel { "month", T_Month, FOLLBY_TOKEN },
137 1.1 kardel { "none", T_None, FOLLBY_TOKEN },
138 1.1 kardel { "pid", T_Pid, FOLLBY_TOKEN },
139 1.1 kardel { "week", T_Week, FOLLBY_TOKEN },
140 1.1 kardel { "year", T_Year, FOLLBY_TOKEN },
141 1.1 kardel /*** ORPHAN MODE COMMANDS ***/
142 1.1 kardel /* tos_option */
143 1.1 kardel { "minclock", T_Minclock, FOLLBY_TOKEN },
144 1.1 kardel { "maxclock", T_Maxclock, FOLLBY_TOKEN },
145 1.1 kardel { "minsane", T_Minsane, FOLLBY_TOKEN },
146 1.1 kardel { "floor", T_Floor, FOLLBY_TOKEN },
147 1.1 kardel { "ceiling", T_Ceiling, FOLLBY_TOKEN },
148 1.1 kardel { "cohort", T_Cohort, FOLLBY_TOKEN },
149 1.1 kardel { "mindist", T_Mindist, FOLLBY_TOKEN },
150 1.1 kardel { "maxdist", T_Maxdist, FOLLBY_TOKEN },
151 1.1 kardel { "beacon", T_Beacon, FOLLBY_TOKEN },
152 1.1 kardel { "orphan", T_Orphan, FOLLBY_TOKEN },
153 1.4 christos { "orphanwait", T_Orphanwait, FOLLBY_TOKEN },
154 1.4 christos { "nonvolatile", T_Nonvolatile, FOLLBY_TOKEN },
155 1.1 kardel /* access_control_flag */
156 1.1 kardel { "default", T_Default, FOLLBY_TOKEN },
157 1.4 christos { "source", T_Source, FOLLBY_TOKEN },
158 1.1 kardel { "flake", T_Flake, FOLLBY_TOKEN },
159 1.1 kardel { "ignore", T_Ignore, FOLLBY_TOKEN },
160 1.1 kardel { "limited", T_Limited, FOLLBY_TOKEN },
161 1.1 kardel { "mssntp", T_Mssntp, FOLLBY_TOKEN },
162 1.1 kardel { "kod", T_Kod, FOLLBY_TOKEN },
163 1.1 kardel { "lowpriotrap", T_Lowpriotrap, FOLLBY_TOKEN },
164 1.1 kardel { "mask", T_Mask, FOLLBY_TOKEN },
165 1.1 kardel { "nomodify", T_Nomodify, FOLLBY_TOKEN },
166 1.4 christos { "nomrulist", T_Nomrulist, FOLLBY_TOKEN },
167 1.1 kardel { "nopeer", T_Nopeer, FOLLBY_TOKEN },
168 1.1 kardel { "noquery", T_Noquery, FOLLBY_TOKEN },
169 1.1 kardel { "noserve", T_Noserve, FOLLBY_TOKEN },
170 1.1 kardel { "notrap", T_Notrap, FOLLBY_TOKEN },
171 1.1 kardel { "notrust", T_Notrust, FOLLBY_TOKEN },
172 1.1 kardel { "ntpport", T_Ntpport, FOLLBY_TOKEN },
173 1.1 kardel /* discard_option */
174 1.1 kardel { "average", T_Average, FOLLBY_TOKEN },
175 1.1 kardel { "minimum", T_Minimum, FOLLBY_TOKEN },
176 1.1 kardel { "monitor", T_Monitor, FOLLBY_TOKEN },
177 1.4 christos /* mru_option */
178 1.4 christos { "incalloc", T_Incalloc, FOLLBY_TOKEN },
179 1.4 christos { "incmem", T_Incmem, FOLLBY_TOKEN },
180 1.4 christos { "initalloc", T_Initalloc, FOLLBY_TOKEN },
181 1.4 christos { "initmem", T_Initmem, FOLLBY_TOKEN },
182 1.4 christos { "mindepth", T_Mindepth, FOLLBY_TOKEN },
183 1.4 christos { "maxage", T_Maxage, FOLLBY_TOKEN },
184 1.4 christos { "maxdepth", T_Maxdepth, FOLLBY_TOKEN },
185 1.4 christos { "maxmem", T_Maxmem, FOLLBY_TOKEN },
186 1.4 christos { "mru", T_Mru, FOLLBY_TOKEN },
187 1.1 kardel /* fudge_factor */
188 1.4 christos { "abbrev", T_Abbrev, FOLLBY_STRING },
189 1.1 kardel { "flag1", T_Flag1, FOLLBY_TOKEN },
190 1.1 kardel { "flag2", T_Flag2, FOLLBY_TOKEN },
191 1.1 kardel { "flag3", T_Flag3, FOLLBY_TOKEN },
192 1.1 kardel { "flag4", T_Flag4, FOLLBY_TOKEN },
193 1.1 kardel { "refid", T_Refid, FOLLBY_STRING },
194 1.1 kardel { "stratum", T_Stratum, FOLLBY_TOKEN },
195 1.1 kardel { "time1", T_Time1, FOLLBY_TOKEN },
196 1.1 kardel { "time2", T_Time2, FOLLBY_TOKEN },
197 1.1 kardel /* system_option */
198 1.1 kardel { "auth", T_Auth, FOLLBY_TOKEN },
199 1.1 kardel { "bclient", T_Bclient, FOLLBY_TOKEN },
200 1.1 kardel { "calibrate", T_Calibrate, FOLLBY_TOKEN },
201 1.1 kardel { "kernel", T_Kernel, FOLLBY_TOKEN },
202 1.1 kardel { "ntp", T_Ntp, FOLLBY_TOKEN },
203 1.4 christos { "mode7", T_Mode7, FOLLBY_TOKEN },
204 1.1 kardel { "stats", T_Stats, FOLLBY_TOKEN },
205 1.4 christos /* rlimit_option */
206 1.4 christos { "memlock", T_Memlock, FOLLBY_TOKEN },
207 1.4 christos { "stacksize", T_Stacksize, FOLLBY_TOKEN },
208 1.4 christos { "filenum", T_Filenum, FOLLBY_TOKEN },
209 1.1 kardel /* tinker_option */
210 1.1 kardel { "step", T_Step, FOLLBY_TOKEN },
211 1.1 kardel { "panic", T_Panic, FOLLBY_TOKEN },
212 1.1 kardel { "dispersion", T_Dispersion, FOLLBY_TOKEN },
213 1.1 kardel { "stepout", T_Stepout, FOLLBY_TOKEN },
214 1.1 kardel { "allan", T_Allan, FOLLBY_TOKEN },
215 1.1 kardel { "huffpuff", T_Huffpuff, FOLLBY_TOKEN },
216 1.1 kardel { "freq", T_Freq, FOLLBY_TOKEN },
217 1.1 kardel /* miscellaneous_command */
218 1.1 kardel { "port", T_Port, FOLLBY_TOKEN },
219 1.1 kardel { "interface", T_Interface, FOLLBY_TOKEN },
220 1.1 kardel { "saveconfigdir", T_Saveconfigdir, FOLLBY_STRING },
221 1.1 kardel /* interface_command (ignore and interface already defined) */
222 1.1 kardel { "nic", T_Nic, FOLLBY_TOKEN },
223 1.1 kardel { "all", T_All, FOLLBY_TOKEN },
224 1.1 kardel { "ipv4", T_Ipv4, FOLLBY_TOKEN },
225 1.1 kardel { "ipv6", T_Ipv6, FOLLBY_TOKEN },
226 1.1 kardel { "wildcard", T_Wildcard, FOLLBY_TOKEN },
227 1.1 kardel { "listen", T_Listen, FOLLBY_TOKEN },
228 1.1 kardel { "drop", T_Drop, FOLLBY_TOKEN },
229 1.1 kardel /* simulator commands */
230 1.1 kardel { "simulate", T_Simulate, FOLLBY_TOKEN },
231 1.1 kardel { "simulation_duration",T_Sim_Duration, FOLLBY_TOKEN },
232 1.1 kardel { "beep_delay", T_Beep_Delay, FOLLBY_TOKEN },
233 1.1 kardel { "duration", T_Duration, FOLLBY_TOKEN },
234 1.1 kardel { "server_offset", T_Server_Offset, FOLLBY_TOKEN },
235 1.1 kardel { "freq_offset", T_Freq_Offset, FOLLBY_TOKEN },
236 1.1 kardel { "wander", T_Wander, FOLLBY_TOKEN },
237 1.1 kardel { "jitter", T_Jitter, FOLLBY_TOKEN },
238 1.1 kardel { "prop_delay", T_Prop_Delay, FOLLBY_TOKEN },
239 1.1 kardel { "proc_delay", T_Proc_Delay, FOLLBY_TOKEN },
240 1.1 kardel };
241 1.1 kardel
242 1.1 kardel typedef struct big_scan_state_tag {
243 1.1 kardel char ch; /* Character this state matches on */
244 1.1 kardel char followedby; /* Forces next token(s) to T_String */
245 1.1 kardel u_short finishes_token; /* nonzero ID if last keyword char */
246 1.1 kardel u_short match_next_s; /* next state to check matching ch */
247 1.1 kardel u_short other_next_s; /* next state to check if not ch */
248 1.1 kardel } big_scan_state;
249 1.1 kardel
250 1.1 kardel /*
251 1.1 kardel * Note: to increase MAXSTATES beyond 2048, be aware it is currently
252 1.1 kardel * crammed into 11 bits in scan_state form. Raising to 4096 would be
253 1.1 kardel * relatively easy by storing the followedby value in a separate
254 1.1 kardel * array with one entry per token, and shrinking the char value to
255 1.1 kardel * 7 bits to free a bit for accepting/non-accepting. More than 4096
256 1.1 kardel * states will require expanding scan_state beyond 32 bits each.
257 1.1 kardel */
258 1.4 christos #define MAXSTATES 2048
259 1.4 christos #define MAX_TOK_LEN 63
260 1.1 kardel
261 1.1 kardel const char * current_keyword;/* for error reporting */
262 1.1 kardel big_scan_state sst[MAXSTATES]; /* scanner FSM state entries */
263 1.4 christos u_short sst_highwater; /* next entry index to consider */
264 1.1 kardel char * symb[1024]; /* map token ID to symbolic name */
265 1.1 kardel
266 1.1 kardel /* for libntp */
267 1.1 kardel const char * progname = "keyword-gen";
268 1.1 kardel
269 1.1 kardel int main (int, char **);
270 1.1 kardel static void generate_preamble (void);
271 1.1 kardel static void generate_fsm (void);
272 1.1 kardel static void generate_token_text (void);
273 1.4 christos static u_short create_keyword_scanner (void);
274 1.4 christos static u_short create_scan_states (char *, u_short, follby, u_short);
275 1.4 christos int compare_key_tok_id (const void *, const void *);
276 1.4 christos int compare_key_tok_text (const void *, const void *);
277 1.1 kardel void populate_symb (char *);
278 1.4 christos const char * symbname (u_short);
279 1.1 kardel
280 1.1 kardel
281 1.1 kardel int main(int argc, char **argv)
282 1.1 kardel {
283 1.1 kardel if (argc < 2) {
284 1.1 kardel fprintf(stderr, "Usage:\n%s t_header.h\n", argv[0]);
285 1.1 kardel exit(1);
286 1.1 kardel }
287 1.4 christos debug = 1;
288 1.4 christos
289 1.1 kardel populate_symb(argv[1]);
290 1.1 kardel
291 1.1 kardel generate_preamble();
292 1.1 kardel generate_token_text();
293 1.1 kardel generate_fsm();
294 1.1 kardel
295 1.1 kardel return 0;
296 1.1 kardel }
297 1.1 kardel
298 1.1 kardel
299 1.1 kardel static void
300 1.1 kardel generate_preamble(void)
301 1.1 kardel {
302 1.1 kardel time_t now;
303 1.1 kardel char timestamp[128];
304 1.1 kardel char preamble[] =
305 1.1 kardel "/*\n"
306 1.1 kardel " * ntp_keyword.h\n"
307 1.1 kardel " * \n"
308 1.1 kardel " * NOTE: edit this file with caution, it is generated by keyword-gen.c\n"
309 1.1 kardel " *\t Generated %s UTC diff_ignore_line\n"
310 1.1 kardel " *\n"
311 1.1 kardel " */\n"
312 1.1 kardel "#include \"ntp_scanner.h\"\n"
313 1.1 kardel "#include \"ntp_parser.h\"\n"
314 1.1 kardel "\n";
315 1.1 kardel
316 1.1 kardel time(&now);
317 1.1 kardel if (!strftime(timestamp, sizeof(timestamp),
318 1.1 kardel "%Y-%m-%d %H:%M:%S", gmtime(&now)))
319 1.1 kardel timestamp[0] = '\0';
320 1.1 kardel
321 1.1 kardel printf(preamble, timestamp);
322 1.1 kardel }
323 1.1 kardel
324 1.1 kardel
325 1.1 kardel static void
326 1.1 kardel generate_fsm(void)
327 1.1 kardel {
328 1.4 christos char rprefix[MAX_TOK_LEN + 1];
329 1.4 christos char prefix[MAX_TOK_LEN + 1];
330 1.4 christos char token_id_comment[16 + MAX_TOK_LEN + 1];
331 1.4 christos size_t prefix_len;
332 1.4 christos char *p;
333 1.4 christos char *r;
334 1.4 christos u_short initial_state;
335 1.4 christos u_short this_state;
336 1.4 christos u_short prev_state;
337 1.4 christos u_short state;
338 1.4 christos u_short i;
339 1.4 christos u_short token;
340 1.1 kardel
341 1.1 kardel /*
342 1.1 kardel * Sort ntp_keywords in alphabetical keyword order. This is
343 1.1 kardel * not necessary, but minimizes nonfunctional changes in the
344 1.1 kardel * generated finite state machine when keywords are modified.
345 1.1 kardel */
346 1.1 kardel qsort(ntp_keywords, COUNTOF(ntp_keywords),
347 1.1 kardel sizeof(ntp_keywords[0]), compare_key_tok_text);
348 1.1 kardel
349 1.1 kardel /*
350 1.1 kardel * To save space, reserve the state array entry matching each
351 1.1 kardel * token number for its terminal state, so the token identifier
352 1.1 kardel * does not need to be stored in each state, but can be
353 1.1 kardel * recovered trivially. To mark the entry reserved,
354 1.1 kardel * finishes_token is nonzero.
355 1.1 kardel */
356 1.1 kardel
357 1.1 kardel for (i = 0; i < COUNTOF(ntp_keywords); i++) {
358 1.1 kardel token = ntp_keywords[i].token;
359 1.1 kardel if (1 > token || token >= COUNTOF(sst)) {
360 1.1 kardel fprintf(stderr,
361 1.1 kardel "keyword-gen sst[%u] too small "
362 1.1 kardel "for keyword '%s' id %d\n",
363 1.2 christos (int)COUNTOF(sst),
364 1.1 kardel ntp_keywords[i].key,
365 1.1 kardel token);
366 1.1 kardel exit(4);
367 1.1 kardel }
368 1.1 kardel sst[token].finishes_token = token;
369 1.1 kardel }
370 1.1 kardel
371 1.1 kardel initial_state = create_keyword_scanner();
372 1.1 kardel
373 1.1 kardel fprintf(stderr,
374 1.1 kardel "%d keywords consumed %d states of %d max.\n",
375 1.1 kardel (int)COUNTOF(ntp_keywords),
376 1.1 kardel sst_highwater - 1,
377 1.1 kardel (int)COUNTOF(sst) - 1);
378 1.1 kardel
379 1.1 kardel printf("#define SCANNER_INIT_S %d\n\n", initial_state);
380 1.1 kardel
381 1.1 kardel printf("const scan_state sst[%d] = {\n"
382 1.1 kardel "/*SS_T( ch,\tf-by, match, other ),\t\t\t\t */\n"
383 1.1 kardel " 0,\t\t\t\t /* %5d %-17s */\n",
384 1.1 kardel sst_highwater,
385 1.1 kardel 0, "");
386 1.1 kardel
387 1.1 kardel for (i = 1; i < sst_highwater; i++) {
388 1.1 kardel
389 1.1 kardel /* verify fields will fit */
390 1.1 kardel if (sst[i].followedby & ~0x3) {
391 1.1 kardel fprintf(stderr,
392 1.1 kardel "keyword-gen internal error "
393 1.1 kardel "sst[%d].followedby %d too big\n",
394 1.1 kardel i, sst[i].followedby);
395 1.1 kardel exit(7);
396 1.1 kardel }
397 1.1 kardel
398 1.1 kardel if (sst_highwater <= sst[i].match_next_s
399 1.1 kardel || sst[i].match_next_s & ~0x7ff) {
400 1.1 kardel fprintf(stderr,
401 1.1 kardel "keyword-gen internal error "
402 1.1 kardel "sst[%d].match_next_s %d too big\n",
403 1.1 kardel i, sst[i].match_next_s);
404 1.1 kardel exit(8);
405 1.1 kardel }
406 1.1 kardel
407 1.1 kardel if (sst_highwater <= sst[i].other_next_s
408 1.1 kardel || sst[i].other_next_s & ~0x7ff) {
409 1.1 kardel fprintf(stderr,
410 1.1 kardel "keyword-gen internal error "
411 1.1 kardel "sst[%d].other_next_s %d too big\n",
412 1.1 kardel i, sst[i].other_next_s);
413 1.1 kardel exit(9);
414 1.1 kardel }
415 1.1 kardel
416 1.4 christos if (sst[i].finishes_token) {
417 1.1 kardel snprintf(token_id_comment,
418 1.1 kardel sizeof(token_id_comment), "%5d %-17s",
419 1.1 kardel i, symbname(sst[i].finishes_token));
420 1.1 kardel if (i != sst[i].finishes_token) {
421 1.1 kardel fprintf(stderr,
422 1.1 kardel "keyword-gen internal error "
423 1.1 kardel "entry %d finishes token %d\n",
424 1.1 kardel i, sst[i].finishes_token);
425 1.1 kardel exit(5);
426 1.1 kardel }
427 1.4 christos } else {
428 1.4 christos /*
429 1.4 christos * Determine the keyword prefix that leads to this
430 1.4 christos * state. This is expensive but keyword-gen is run
431 1.4 christos * only when it changes. Distributing keyword-gen-utd
432 1.4 christos * achieves that, which is why it must be committed
433 1.4 christos * at the same time as keyword-gen.c and ntp_keyword.h.
434 1.4 christos *
435 1.4 christos * Scan the state array iteratively looking for a state
436 1.4 christos * which leads to the current one, collecting matching
437 1.4 christos * characters along the way. There is only one such
438 1.4 christos * path back to the starting state given the way our
439 1.4 christos * scanner state machine is built and the practice of
440 1.4 christos * using the spelling of the keyword as its T_* token
441 1.4 christos * identifier, which results in never having two
442 1.4 christos * spellings result in the same T_* value.
443 1.4 christos */
444 1.4 christos prefix_len = 0;
445 1.4 christos prev_state = 0;
446 1.4 christos this_state = i;
447 1.4 christos do {
448 1.4 christos for (state = 1; state < sst_highwater; state++)
449 1.4 christos if (sst[state].other_next_s == this_state) {
450 1.4 christos this_state = state;
451 1.4 christos break;
452 1.4 christos } else if (sst[state].match_next_s == this_state) {
453 1.4 christos this_state = state;
454 1.4 christos rprefix[prefix_len] = sst[state].ch;
455 1.4 christos prefix_len++;
456 1.4 christos break;
457 1.4 christos }
458 1.4 christos } while (this_state != initial_state);
459 1.4 christos
460 1.4 christos if (prefix_len) {
461 1.4 christos /* reverse rprefix into prefix */
462 1.4 christos p = prefix + prefix_len;
463 1.4 christos r = rprefix;
464 1.4 christos while (r < rprefix + prefix_len)
465 1.4 christos *--p = *r++;
466 1.4 christos }
467 1.4 christos prefix[prefix_len] = '\0';
468 1.4 christos
469 1.4 christos snprintf(token_id_comment,
470 1.4 christos sizeof(token_id_comment), "%5d %-17s",
471 1.4 christos i, (initial_state == i)
472 1.4 christos ? "[initial state]"
473 1.4 christos : prefix);
474 1.1 kardel }
475 1.1 kardel
476 1.1 kardel printf(" S_ST( '%c',\t%d, %5u, %5u )%s /* %s */\n",
477 1.1 kardel sst[i].ch,
478 1.1 kardel sst[i].followedby,
479 1.1 kardel sst[i].match_next_s,
480 1.1 kardel sst[i].other_next_s,
481 1.1 kardel (i + 1 < sst_highwater)
482 1.1 kardel ? ","
483 1.1 kardel : " ",
484 1.1 kardel token_id_comment);
485 1.1 kardel }
486 1.1 kardel
487 1.1 kardel printf("};\n\n");
488 1.1 kardel }
489 1.1 kardel
490 1.1 kardel
491 1.1 kardel /* Define a function to create the states of the scanner. This function
492 1.1 kardel * is used by the create_keyword_scanner function below.
493 1.1 kardel *
494 1.1 kardel * This function takes a suffix of a keyword, the token to be returned on
495 1.1 kardel * recognizing the complete keyword, and any pre-existing state that exists
496 1.1 kardel * for some other keyword that has the same prefix as the current one.
497 1.1 kardel */
498 1.4 christos static u_short
499 1.1 kardel create_scan_states(
500 1.1 kardel char * text,
501 1.4 christos u_short token,
502 1.1 kardel follby followedby,
503 1.4 christos u_short prev_state
504 1.1 kardel )
505 1.1 kardel {
506 1.4 christos u_short my_state;
507 1.4 christos u_short return_state;
508 1.4 christos u_short prev_char_s;
509 1.4 christos u_short curr_char_s;
510 1.1 kardel
511 1.1 kardel return_state = prev_state;
512 1.1 kardel curr_char_s = prev_state;
513 1.1 kardel prev_char_s = 0;
514 1.1 kardel
515 1.1 kardel /* Find the correct position to insert the state.
516 1.1 kardel * All states should be in alphabetical order
517 1.1 kardel */
518 1.1 kardel while (curr_char_s && (text[0] < sst[curr_char_s].ch)) {
519 1.1 kardel prev_char_s = curr_char_s;
520 1.1 kardel curr_char_s = sst[curr_char_s].other_next_s;
521 1.1 kardel }
522 1.1 kardel
523 1.1 kardel /*
524 1.1 kardel * Check if a previously seen keyword has the same prefix as
525 1.1 kardel * the current keyword. If so, simply use the state for that
526 1.1 kardel * keyword as my_state, otherwise, allocate a new state.
527 1.1 kardel */
528 1.1 kardel if (curr_char_s && (text[0] == sst[curr_char_s].ch)) {
529 1.1 kardel my_state = curr_char_s;
530 1.1 kardel if ('\0' == text[1]) {
531 1.1 kardel fprintf(stderr,
532 1.1 kardel "Duplicate entries for keyword '%s' in"
533 1.1 kardel " keyword_gen.c ntp_keywords[].\n",
534 1.1 kardel current_keyword);
535 1.1 kardel exit(2);
536 1.1 kardel }
537 1.1 kardel } else {
538 1.1 kardel do
539 1.1 kardel my_state = sst_highwater++;
540 1.1 kardel while (my_state < COUNTOF(sst)
541 1.1 kardel && sst[my_state].finishes_token);
542 1.1 kardel if (my_state >= COUNTOF(sst)) {
543 1.1 kardel fprintf(stderr,
544 1.1 kardel "fatal, keyword scanner state array "
545 1.1 kardel "sst[%d] is too small, modify\n"
546 1.1 kardel "keyword-gen.c to increase.\n",
547 1.1 kardel (int)COUNTOF(sst));
548 1.1 kardel exit(3);
549 1.1 kardel }
550 1.1 kardel /* Store the next character of the keyword */
551 1.1 kardel sst[my_state].ch = text[0];
552 1.1 kardel sst[my_state].other_next_s = curr_char_s;
553 1.1 kardel sst[my_state].followedby = FOLLBY_NON_ACCEPTING;
554 1.1 kardel
555 1.1 kardel if (prev_char_s)
556 1.1 kardel sst[prev_char_s].other_next_s = my_state;
557 1.1 kardel else
558 1.1 kardel return_state = my_state;
559 1.1 kardel }
560 1.1 kardel
561 1.1 kardel /* Check if the next character is '\0'.
562 1.1 kardel * If yes, we are done with the recognition and this is an accepting
563 1.1 kardel * state.
564 1.1 kardel * If not, we need to continue scanning
565 1.1 kardel */
566 1.1 kardel if ('\0' == text[1]) {
567 1.1 kardel sst[my_state].finishes_token = (u_short)token;
568 1.1 kardel sst[my_state].followedby = (char)followedby;
569 1.1 kardel
570 1.1 kardel if (sst[token].finishes_token != (u_short)token) {
571 1.1 kardel fprintf(stderr,
572 1.1 kardel "fatal, sst[%d] not reserved for %s.\n",
573 1.1 kardel token, symbname(token));
574 1.1 kardel exit(6);
575 1.1 kardel }
576 1.1 kardel /* relocate so token id is sst[] index */
577 1.1 kardel if (my_state != token) {
578 1.1 kardel sst[token] = sst[my_state];
579 1.4 christos ZERO(sst[my_state]);
580 1.1 kardel do
581 1.1 kardel sst_highwater--;
582 1.1 kardel while (sst[sst_highwater].finishes_token);
583 1.1 kardel my_state = token;
584 1.1 kardel if (prev_char_s)
585 1.1 kardel sst[prev_char_s].other_next_s = my_state;
586 1.1 kardel else
587 1.1 kardel return_state = my_state;
588 1.1 kardel }
589 1.1 kardel } else
590 1.1 kardel sst[my_state].match_next_s =
591 1.1 kardel create_scan_states(
592 1.1 kardel &text[1],
593 1.1 kardel token,
594 1.1 kardel followedby,
595 1.1 kardel sst[my_state].match_next_s);
596 1.1 kardel
597 1.1 kardel return return_state;
598 1.1 kardel }
599 1.1 kardel
600 1.1 kardel
601 1.1 kardel /* Define a function that takes a list of (keyword, token) values and
602 1.1 kardel * creates a keywords scanner out of it.
603 1.1 kardel */
604 1.1 kardel
605 1.4 christos static u_short
606 1.1 kardel create_keyword_scanner(void)
607 1.1 kardel {
608 1.4 christos u_short scanner;
609 1.4 christos u_short i;
610 1.1 kardel
611 1.1 kardel sst_highwater = 1; /* index 0 invalid, unused */
612 1.1 kardel scanner = 0;
613 1.1 kardel
614 1.1 kardel for (i = 0; i < COUNTOF(ntp_keywords); i++) {
615 1.1 kardel current_keyword = ntp_keywords[i].key;
616 1.1 kardel scanner =
617 1.1 kardel create_scan_states(
618 1.1 kardel ntp_keywords[i].key,
619 1.1 kardel ntp_keywords[i].token,
620 1.1 kardel ntp_keywords[i].followedby,
621 1.1 kardel scanner);
622 1.1 kardel }
623 1.1 kardel
624 1.1 kardel return scanner;
625 1.1 kardel }
626 1.1 kardel
627 1.1 kardel
628 1.1 kardel static void
629 1.1 kardel generate_token_text(void)
630 1.1 kardel {
631 1.4 christos u_short lowest_id;
632 1.4 christos u_short highest_id;
633 1.4 christos u_short id_count;
634 1.4 christos u_short id;
635 1.4 christos u_short i;
636 1.1 kardel
637 1.1 kardel /* sort ntp_keywords in token ID order */
638 1.1 kardel qsort(ntp_keywords, COUNTOF(ntp_keywords),
639 1.1 kardel sizeof(ntp_keywords[0]), compare_key_tok_id);
640 1.1 kardel
641 1.1 kardel lowest_id = ntp_keywords[0].token;
642 1.1 kardel highest_id = ntp_keywords[COUNTOF(ntp_keywords) - 1].token;
643 1.1 kardel id_count = highest_id - lowest_id + 1;
644 1.1 kardel
645 1.1 kardel printf("#define LOWEST_KEYWORD_ID %d\n\n", lowest_id);
646 1.1 kardel
647 1.1 kardel printf("const char * const keyword_text[%d] = {", id_count);
648 1.1 kardel
649 1.1 kardel id = lowest_id;
650 1.1 kardel i = 0;
651 1.1 kardel while (i < COUNTOF(ntp_keywords)) {
652 1.1 kardel while (id < ntp_keywords[i].token) {
653 1.1 kardel printf(",\n\t/* %-5d %5d %20s */\tNULL",
654 1.1 kardel id - lowest_id, id, symbname(id));
655 1.1 kardel id++;
656 1.1 kardel }
657 1.1 kardel if (i > 0)
658 1.1 kardel printf(",");
659 1.1 kardel printf("\n\t/* %-5d %5d %20s */\t\"%s\"",
660 1.1 kardel id - lowest_id, id, symbname(id),
661 1.1 kardel ntp_keywords[i].key);
662 1.1 kardel i++;
663 1.1 kardel id++;
664 1.1 kardel }
665 1.1 kardel
666 1.1 kardel printf("\n};\n\n");
667 1.1 kardel }
668 1.1 kardel
669 1.1 kardel
670 1.1 kardel int
671 1.1 kardel compare_key_tok_id(
672 1.4 christos const void *a1,
673 1.4 christos const void *a2
674 1.1 kardel )
675 1.1 kardel {
676 1.4 christos const struct key_tok *p1 = a1;
677 1.4 christos const struct key_tok *p2 = a2;
678 1.1 kardel
679 1.1 kardel if (p1->token == p2->token)
680 1.1 kardel return 0;
681 1.1 kardel
682 1.1 kardel if (p1->token < p2->token)
683 1.1 kardel return -1;
684 1.1 kardel else
685 1.1 kardel return 1;
686 1.1 kardel }
687 1.1 kardel
688 1.1 kardel
689 1.1 kardel int
690 1.1 kardel compare_key_tok_text(
691 1.4 christos const void *a1,
692 1.4 christos const void *a2
693 1.1 kardel )
694 1.1 kardel {
695 1.4 christos const struct key_tok *p1 = a1;
696 1.4 christos const struct key_tok *p2 = a2;
697 1.1 kardel
698 1.1 kardel return strcmp(p1->key, p2->key);
699 1.1 kardel }
700 1.1 kardel
701 1.1 kardel
702 1.1 kardel /*
703 1.1 kardel * populate_symb() - populate symb[] lookup array with symbolic token
704 1.1 kardel * names such that symb[T_Age] == "T_Age", etc.
705 1.1 kardel */
706 1.1 kardel void
707 1.1 kardel populate_symb(
708 1.1 kardel char *header_file
709 1.1 kardel )
710 1.1 kardel {
711 1.1 kardel FILE * yh;
712 1.4 christos char line[2 * MAX_TOK_LEN];
713 1.4 christos char name[2 * MAX_TOK_LEN];
714 1.1 kardel int token;
715 1.1 kardel
716 1.1 kardel yh = fopen(header_file, "r");
717 1.1 kardel if (NULL == yh) {
718 1.1 kardel perror("unable to open yacc/bison header file");
719 1.1 kardel exit(4);
720 1.1 kardel }
721 1.1 kardel
722 1.1 kardel while (NULL != fgets(line, sizeof(line), yh))
723 1.1 kardel if (2 == sscanf(line, "#define %s %d", name, &token)
724 1.1 kardel && 'T' == name[0] && '_' == name[1] && token >= 0
725 1.4 christos && token < COUNTOF(symb)) {
726 1.1 kardel
727 1.1 kardel symb[token] = estrdup(name);
728 1.4 christos if (strlen(name) > MAX_TOK_LEN) {
729 1.4 christos fprintf(stderr,
730 1.4 christos "MAX_TOK_LEN %d too small for '%s'\n"
731 1.4 christos "Edit keyword-gen.c to raise.\n",
732 1.4 christos MAX_TOK_LEN, name);
733 1.4 christos exit(10);
734 1.4 christos }
735 1.4 christos }
736 1.1 kardel fclose(yh);
737 1.1 kardel }
738 1.1 kardel
739 1.1 kardel
740 1.1 kardel const char *
741 1.1 kardel symbname(
742 1.4 christos u_short token
743 1.1 kardel )
744 1.1 kardel {
745 1.1 kardel char *name;
746 1.1 kardel
747 1.4 christos if (token < COUNTOF(symb) && symb[token] != NULL) {
748 1.4 christos name = symb[token];
749 1.4 christos } else {
750 1.4 christos LIB_GETBUF(name);
751 1.4 christos snprintf(name, LIB_BUFLENGTH, "%d", token);
752 1.4 christos }
753 1.1 kardel
754 1.1 kardel return name;
755 1.1 kardel }
756