fgen.l revision 1.41 1 %{
2 /* $NetBSD: fgen.l,v 1.41 2024/05/20 20:46:05 wiz Exp $ */
3 /* FLEX input for FORTH input file scanner */
4 /*
5 * Copyright (c) 1998 Eduardo Horvath.
6 * All rights reserved.
7 *
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
10 * are met:
11 * 1. Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in the
15 * documentation and/or other materials provided with the distribution.
16 *
17 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
18 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
19 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
20 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
21 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
22 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
23 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
24 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
25 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
26 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
27 */
28 /*
29 Specifications are as follows:
30
31 The function "yylex()" always returns a pointer to a structure:
32
33 struct tok {
34 int type;
35 char *text;
36 }
37 #define TOKEN struct tok
38 */
39 #include <sys/cdefs.h>
40 #ifdef HAVE_NBTOOL_CONFIG_H
41 #include "nbtool_config.h"
42 #endif
43
44 #if defined(__RCSID) && !defined(lint)
45 __RCSID("$NetBSD: fgen.l,v 1.41 2024/05/20 20:46:05 wiz Exp $");
46 #endif
47
48 %}
49
50 %option yylineno
51
52 hex [0-9A-Fa-f]
53 hexdot [0-9A-Fa-f.]
54 white [ \t\n\r\f]
55 tail {white}
56
57 %{
58 #include <sys/types.h>
59 #include <arpa/inet.h>
60
61 #include <assert.h>
62 #include <err.h>
63 #include <errno.h>
64 #include <fcntl.h>
65 #include <stdarg.h>
66 #include <stdio.h>
67 #include <string.h>
68 #include <unistd.h>
69 #include <util.h>
70
71 #include "fgen.h"
72 static TOKEN ltoken;
73
74 /*
75 * Global variables that control the parse state.
76 */
77
78 static struct fcode *dictionary = NULL;
79 static struct macro *aliases = NULL;
80 static int outf = 1; /* stdout */
81 static int state = 0;
82 static int nextfcode = 0x800;
83 static int numbase = TOK_HEX;
84 static long outpos;
85 static char *outbuf = NULL;
86 static char *outfile, *infile;
87 #define BUFCLICK (1024*1024)
88 static size_t outbufsiz = 0;
89 static int offsetsize = 8;
90 static int defining = 0;
91 static int tokenizer = 0;
92 static int need_end0 = 1;
93
94 #define PSTKSIZ 1024
95 static Cell parse_stack[PSTKSIZ];
96 static int parse_stack_ptr = 0;
97
98 static void token_err(int, const char *, const char *, const char *, ...)
99 __printflike(4, 5) __dead;
100 static YY_DECL;
101
102 static int debug = 0;
103 #define ASSERT if (debug) assert
104 #define STATE(y, x) do { if (debug) printf("%lx State %s: token `%s'\n", outpos, x, y); } while (0)
105 static int mark_fload = 0;
106
107 %}
108
109 %option nounput
110
111 %%
112
113 0 { ltoken.type = TOK_OTHER; ltoken.text = yytext; return <oken; }
114
115 1 { ltoken.type = TOK_OTHER; ltoken.text = yytext; return <oken; }
116
117 2 { ltoken.type = TOK_OTHER; ltoken.text = yytext; return <oken; }
118
119 3 { ltoken.type = TOK_OTHER; ltoken.text = yytext; return <oken; }
120
121 -1 { ltoken.type = TOK_OTHER; ltoken.text = yytext; return <oken; }
122
123 \. { ltoken.type = TOK_OTHER; ltoken.text = yytext; return <oken; }
124
125 {white}* /* whitespace -- keep looping */ ;
126
127 \\[^\n]*\n /* end of line comment -- keep looping */ { STATE(yytext, "EOL comment"); }
128
129 -?{hex}{hexdot}* { ltoken.type = TOK_NUMBER; ltoken.text = yytext;
130 return <oken; }
131
132 \'.\' { ltoken.type = TOK_C_LIT; ltoken.text = yytext; return <oken; }
133
134 \"{white}*(\\\"|[^"])*\" { ltoken.type = TOK_STRING_LIT; ltoken.text = yytext;
135 return <oken; } /* String started by `"' or `."' */
136
137 \.\({white}*(\\\"|[^)])*\) { ltoken.type = TOK_PSTRING; ltoken.text = yytext;
138 return <oken; } /* String of type `.(.....)' */
139
140 \.\"{white}*(\\\"|[^"])*\" { ltoken.type = TOK_PSTRING; ltoken.text = yytext;
141 return <oken; }
142
143 [aA][bB][oO][rR][tT]\"{white}*(\\\"|[^"])*\" { ltoken.type = TOK_ABORT_S;
144 ltoken.text = yytext; return <oken; }
145
146 "(" { ltoken.type = TOK_COMMENT; ltoken.text = yytext;
147 return <oken; }
148
149 ":" { ltoken.type = TOK_COLON; ltoken.text = yytext;
150 return <oken; }
151
152 ";" { ltoken.type = TOK_SEMICOLON; ltoken.text = yytext;
153 return <oken; }
154
155 \' { ltoken.type = TOK_TOKENIZE; ltoken.text = yytext;
156 return <oken; }
157
158 [aA][gG][aA][iI][nN] { ltoken.type = TOK_AGAIN; ltoken.text = yytext;
159 return <oken; }
160
161 [aA][lL][iI][aA][sS] { ltoken.type = TOK_ALIAS; ltoken.text = yytext;
162 return <oken; }
163
164 \[\'\] { ltoken.type = TOK_GETTOKEN; ltoken.text = yytext;
165 return <oken; }
166
167 [aA][sS][cC][iI][iI] { ltoken.type = TOK_ASCII; ltoken.text = yytext;
168 return <oken; }
169
170 [bB][eE][gG][iI][nN] { ltoken.type = TOK_BEGIN; ltoken.text = yytext;
171 return <oken; }
172
173 [bB][uU][fF][fF][eE][rR]: { ltoken.type = TOK_BUFFER; ltoken.text = yytext;
174 return <oken; }
175
176 [cC][aA][sS][eE] { ltoken.type = TOK_CASE; ltoken.text = yytext;
177 return <oken; }
178
179 [cC][oO][nN][sS][tT][aA][nN][tT] { ltoken.type = TOK_CONSTANT; ltoken.text = yytext;
180 return <oken; }
181
182 [cC][oO][nN][tT][rR][oO][lL] { ltoken.type = TOK_CONTROL; ltoken.text = yytext;
183 return <oken; }
184
185 [cC][rR][eE][aA][tT][eE] { ltoken.type = TOK_CREATE; ltoken.text = yytext;
186 return <oken; }
187
188 [dD]# { ltoken.type = TOK_DECIMAL; ltoken.text = yytext;
189 return <oken; }
190
191 [dD][eE][cC][iI][mM][aA][lL] { ltoken.type = TOK_DECIMAL; ltoken.text = yytext;
192 return <oken; }
193
194 [dD][eE][fF][eE][rR] { ltoken.type = TOK_DEFER; ltoken.text = yytext;
195 return <oken; }
196
197 \??[dD][oO] { ltoken.type = TOK_DO; ltoken.text = yytext;
198 return <oken; }
199
200 [eE][lL][sS][eE] { ltoken.type = TOK_ELSE; ltoken.text = yytext;
201 return <oken; }
202
203 [eE][nN][dD]0 { ltoken.type = TOK_END0; ltoken.text = yytext;
204 return <oken; }
205
206 [eE][nN][dD][cC][aA][sS][eE] { ltoken.type = TOK_ENDCASE; ltoken.text = yytext;
207 return <oken; }
208
209 [eE][nN][dD][oO][fF] { ltoken.type = TOK_ENDOF; ltoken.text = yytext;
210 return <oken; }
211
212 [eE][xX][tT][eE][rR][nN][aA][lL] { ltoken.type = TOK_EXTERNAL; ltoken.text = yytext;
213 return <oken; }
214
215 [fF][cC][oO][dD][eE]-[vV][eE][rR][sS][iI][oO][nN]2 {
216 ltoken.type = TOK_FCODE_VERSION2; ltoken.text = yytext;
217 return <oken; }
218
219 [fF][cC][oO][dD][eE]-[eE][nN][dD] { ltoken.type = TOK_FCODE_END; ltoken.text = yytext;
220 return <oken; }
221
222 [fF][iI][eE][lL][dD] { ltoken.type = TOK_FIELD; ltoken.text = yytext;
223 return <oken; }
224
225 [hH]# { ltoken.type = TOK_HEX; ltoken.text = yytext;
226 return <oken; }
227
228 [hH][eE][aA][dD][eE][rR][lL][eE][sS][sS] { ltoken.type = TOK_HEADERLESS; ltoken.text = yytext;
229 return <oken; }
230
231 [hH][eE][aA][dD][eE][rR][sS] { ltoken.type = TOK_HEADERS; ltoken.text = yytext;
232 return <oken; }
233
234 [hH][eE][xX] { ltoken.type = TOK_HEX; ltoken.text = yytext;
235 return <oken; }
236
237 [iI][fF] { ltoken.type = TOK_IF; ltoken.text = yytext;
238 return <oken; }
239
240 \??[lL][eE][aA][vV][eE] { ltoken.type = TOK_LEAVE; ltoken.text = yytext;
241 return <oken; }
242
243 \+?[lL][oO][oO][pP] { ltoken.type = TOK_LOOP; ltoken.text = yytext;
244 return <oken; }
245
246 [oO]# { ltoken.type = TOK_OCTAL; ltoken.text = yytext;
247 return <oken; }
248
249 [oO][cC][tT][aA][lL] { ltoken.type = TOK_OCTAL; ltoken.text = yytext;
250 return <oken; }
251
252 [oO][fF] { ltoken.type = TOK_OF; ltoken.text = yytext;
253 return <oken; }
254
255 [oO][fF][fF][sS][eE][tT]16 { ltoken.type = TOK_OFFSET16; ltoken.text = yytext;
256 return <oken; }
257
258 [rR][eE][pP][eE][aA][tT] { ltoken.type = TOK_REPEAT; ltoken.text = yytext;
259 return <oken; }
260
261 [sS][tT][aA][rR][tT][0124] { ltoken.type = TOK_STARTX; ltoken.text = yytext;
262 return <oken; }
263
264 [tT][hH][eE][nN] { ltoken.type = TOK_THEN; ltoken.text = yytext;
265 return <oken; }
266
267 [tT][oO] { ltoken.type = TOK_TO; ltoken.text = yytext;
268 return <oken; }
269
270 [uU][nN][tT][iI][lL] { ltoken.type = TOK_UNTIL; ltoken.text = yytext;
271 return <oken; }
272
273 [vV][aA][lL][uU][eE] { ltoken.type = TOK_VALUE; ltoken.text = yytext;
274 return <oken; }
275
276 [vV][aA][rR][iI][aA][bB][lL][eE] { ltoken.type = TOK_VARIABLE; ltoken.text = yytext;
277 return <oken; }
278
279 [vV][eE][rR][sS][iI][oO][nN]1 { ltoken.type = TOK_VERSION1; ltoken.text = yytext;
280 return <oken; }
281
282 [wW][hH][iI][lL][eE] { ltoken.type = TOK_WHILE; ltoken.text = yytext;
283 return <oken; }
284
285 tokenizer\[ { ltoken.type = TOK_BEGTOK; ltoken.text = yytext;
286 return <oken; }
287
288 emit-byte { ltoken.type = TOK_EMIT_BYTE; ltoken.text = yytext;
289 return <oken; }
290
291 \]tokenizer { ltoken.type = TOK_ENDTOK; ltoken.text = yytext;
292 return <oken; }
293
294 [fF][lL][oO][aA][dD] { ltoken.type = TOK_FLOAD; ltoken.text = yytext;
295 return <oken; }
296
297
298 [^ \n\t\r\f]+ { ltoken.type = TOK_OTHER; ltoken.text = yytext;
299 return <oken; }
300
301 <<EOF>> { return NULL; }
302 %%
303
304 /* Function definitions */
305 static void push(Cell);
306 static Cell pop(void);
307 static int depth(void);
308 static int fadd(struct fcode *, struct fcode *);
309 static struct fcode *flookup(struct fcode *, const char *);
310 static int aadd(struct macro *, struct macro *);
311 static struct macro *alookup(struct macro *, const char *);
312 static void initdic(void);
313 __dead static void usage(void);
314 static void tokenize(YY_BUFFER_STATE);
315 static int emit(const char *);
316 static int spit(long);
317 static int offspit(long);
318 static void sspit(const char *);
319 static int apply_macros(YY_BUFFER_STATE, const char *);
320 static Cell cvt(const char *, char **, int base);
321
322 /*
323 * Standard FCode names and numbers. Includes standard
324 * tokenizer aliases.
325 */
326 static struct fcode fcodes[] = {
327 { "end0", 0x0000, 0, NULL, NULL },
328 { "b(lit)", 0x0010, 0, NULL, NULL },
329 { "b(')", 0x0011, 0, NULL, NULL },
330 { "b(\")", 0x0012, 0, NULL, NULL },
331 { "bbranch", 0x0013, 0, NULL, NULL },
332 { "b?branch", 0x0014, 0, NULL, NULL },
333 { "b(loop)", 0x0015, 0, NULL, NULL },
334 { "b(+loop)", 0x0016, 0, NULL, NULL },
335 { "b(do)", 0x0017, 0, NULL, NULL },
336 { "b(?do)", 0x0018, 0, NULL, NULL },
337 { "i", 0x0019, 0, NULL, NULL },
338 { "j", 0x001a, 0, NULL, NULL },
339 { "b(leave)", 0x001b, 0, NULL, NULL },
340 { "b(of)", 0x001c, 0, NULL, NULL },
341 { "execute", 0x001d, 0, NULL, NULL },
342 { "+", 0x001e, 0, NULL, NULL },
343 { "-", 0x001f, 0, NULL, NULL },
344 { "*", 0x0020, 0, NULL, NULL },
345 { "/", 0x0021, 0, NULL, NULL },
346 { "mod", 0x0022, 0, NULL, NULL },
347 { "and", 0x0023, 0, NULL, NULL },
348 { "or", 0x0024, 0, NULL, NULL },
349 { "xor", 0x0025, 0, NULL, NULL },
350 { "invert", 0x0026, 0, NULL, NULL },
351 { "lshift", 0x0027, 0, NULL, NULL },
352 { "rshift", 0x0028, 0, NULL, NULL },
353 { ">>a", 0x0029, 0, NULL, NULL },
354 { "/mod", 0x002a, 0, NULL, NULL },
355 { "u/mod", 0x002b, 0, NULL, NULL },
356 { "negate", 0x002c, 0, NULL, NULL },
357 { "abs", 0x002d, 0, NULL, NULL },
358 { "min", 0x002e, 0, NULL, NULL },
359 { "max", 0x002f, 0, NULL, NULL },
360 { ">r", 0x0030, 0, NULL, NULL },
361 { "r>", 0x0031, 0, NULL, NULL },
362 { "r@", 0x0032, 0, NULL, NULL },
363 { "exit", 0x0033, 0, NULL, NULL },
364 { "0=", 0x0034, 0, NULL, NULL },
365 { "0<>", 0x0035, 0, NULL, NULL },
366 { "0<", 0x0036, 0, NULL, NULL },
367 { "0<=", 0x0037, 0, NULL, NULL },
368 { "0>", 0x0038, 0, NULL, NULL },
369 { "0>=", 0x0039, 0, NULL, NULL },
370 { "<", 0x003a, 0, NULL, NULL },
371 { ">", 0x003b, 0, NULL, NULL },
372 { "=", 0x003c, 0, NULL, NULL },
373 { "<>", 0x003d, 0, NULL, NULL },
374 { "u>", 0x003e, 0, NULL, NULL },
375 { "u<=", 0x003f, 0, NULL, NULL },
376 { "u<", 0x0040, 0, NULL, NULL },
377 { "u>=", 0x0041, 0, NULL, NULL },
378 { ">=", 0x0042, 0, NULL, NULL },
379 { "<=", 0x0043, 0, NULL, NULL },
380 { "between", 0x0044, 0, NULL, NULL },
381 { "within", 0x0045, 0, NULL, NULL },
382 { "drop", 0x0046, 0, NULL, NULL },
383 { "dup", 0x0047, 0, NULL, NULL },
384 { "over", 0x0048, 0, NULL, NULL },
385 { "swap", 0x0049, 0, NULL, NULL },
386 { "rot", 0x004a, 0, NULL, NULL },
387 { "-rot", 0x004b, 0, NULL, NULL },
388 { "tuck", 0x004c, 0, NULL, NULL },
389 { "nip", 0x004d, 0, NULL, NULL },
390 { "pick", 0x004e, 0, NULL, NULL },
391 { "roll", 0x004f, 0, NULL, NULL },
392 { "?dup", 0x0050, 0, NULL, NULL },
393 { "depth", 0x0051, 0, NULL, NULL },
394 { "2drop", 0x0052, 0, NULL, NULL },
395 { "2dup", 0x0053, 0, NULL, NULL },
396 { "2over", 0x0054, 0, NULL, NULL },
397 { "2swap", 0x0055, 0, NULL, NULL },
398 { "2rot", 0x0056, 0, NULL, NULL },
399 { "2/", 0x0057, 0, NULL, NULL },
400 { "u2/", 0x0058, 0, NULL, NULL },
401 { "2*", 0x0059, 0, NULL, NULL },
402 { "/c", 0x005a, 0, NULL, NULL },
403 { "/w", 0x005b, 0, NULL, NULL },
404 { "/l", 0x005c, 0, NULL, NULL },
405 { "/n", 0x005d, 0, NULL, NULL },
406 { "ca+", 0x005e, 0, NULL, NULL },
407 { "wa+", 0x005f, 0, NULL, NULL },
408 { "la+", 0x0060, 0, NULL, NULL },
409 { "na+", 0x0061, 0, NULL, NULL },
410 { "char+", 0x0062, 0, NULL, NULL },
411 { "wa1+", 0x0063, 0, NULL, NULL },
412 { "la1+", 0x0064, 0, NULL, NULL },
413 { "cell+", 0x0065, 0, NULL, NULL },
414 { "chars", 0x0066, 0, NULL, NULL },
415 { "/w*", 0x0067, 0, NULL, NULL },
416 { "/l*", 0x0068, 0, NULL, NULL },
417 { "cells", 0x0069, 0, NULL, NULL },
418 { "on", 0x006a, 0, NULL, NULL },
419 { "off", 0x006b, 0, NULL, NULL },
420 { "+!", 0x006c, 0, NULL, NULL },
421 { "@", 0x006d, 0, NULL, NULL },
422 { "l@", 0x006e, 0, NULL, NULL },
423 { "w@", 0x006f, 0, NULL, NULL },
424 { "<w@", 0x0070, 0, NULL, NULL },
425 { "c@", 0x0071, 0, NULL, NULL },
426 { "!", 0x0072, 0, NULL, NULL },
427 { "l!", 0x0073, 0, NULL, NULL },
428 { "w!", 0x0074, 0, NULL, NULL },
429 { "c!", 0x0075, 0, NULL, NULL },
430 { "2@", 0x0076, 0, NULL, NULL },
431 { "2!", 0x0077, 0, NULL, NULL },
432 { "move", 0x0078, 0, NULL, NULL },
433 { "fill", 0x0079, 0, NULL, NULL },
434 { "comp", 0x007a, 0, NULL, NULL },
435 { "noop", 0x007b, 0, NULL, NULL },
436 { "lwsplit", 0x007c, 0, NULL, NULL },
437 { "wjoin", 0x007d, 0, NULL, NULL },
438 { "lbsplit", 0x007e, 0, NULL, NULL },
439 { "bljoin", 0x007f, 0, NULL, NULL },
440 { "wbflip", 0x0080, 0, NULL, NULL },
441 { "upc", 0x0081, 0, NULL, NULL },
442 { "lcc", 0x0082, 0, NULL, NULL },
443 { "pack", 0x0083, 0, NULL, NULL },
444 { "count", 0x0084, 0, NULL, NULL },
445 { "body>", 0x0085, 0, NULL, NULL },
446 { ">body", 0x0086, 0, NULL, NULL },
447 { "fcode-revision", 0x0087, 0, NULL, NULL },
448 { "span", 0x0088, 0, NULL, NULL },
449 { "unloop", 0x0089, 0, NULL, NULL },
450 { "expect", 0x008a, 0, NULL, NULL },
451 { "alloc-mem", 0x008b, 0, NULL, NULL },
452 { "free-mem", 0x008c, 0, NULL, NULL },
453 { "key?", 0x008d, 0, NULL, NULL },
454 { "key", 0x008e, 0, NULL, NULL },
455 { "emit", 0x008f, 0, NULL, NULL },
456 { "type", 0x0090, 0, NULL, NULL },
457 { "(cr", 0x0091, 0, NULL, NULL },
458 { "cr", 0x0092, 0, NULL, NULL },
459 { "#out", 0x0093, 0, NULL, NULL },
460 { "#line", 0x0094, 0, NULL, NULL },
461 { "hold", 0x0095, 0, NULL, NULL },
462 { "<#", 0x0096, 0, NULL, NULL },
463 { "u#>", 0x0097, 0, NULL, NULL },
464 { "sign", 0x0098, 0, NULL, NULL },
465 { "u#", 0x0099, 0, NULL, NULL },
466 { "u#s", 0x009a, 0, NULL, NULL },
467 { "u.", 0x009b, 0, NULL, NULL },
468 { "u.r", 0x009c, 0, NULL, NULL },
469 { ".", 0x009d, 0, NULL, NULL },
470 { ".r", 0x009e, 0, NULL, NULL },
471 { ".s", 0x009f, 0, NULL, NULL },
472 { "base", 0x00a0, 0, NULL, NULL },
473 { "convert", 0x00a1, 0, NULL, NULL },
474 { "$number", 0x00a2, 0, NULL, NULL },
475 { "digit", 0x00a3, 0, NULL, NULL },
476 { "-1", 0x00a4, 0, NULL, NULL },
477 { "true", 0x00a4, 0, NULL, NULL },
478 { "0", 0x00a5, 0, NULL, NULL },
479 { "1", 0x00a6, 0, NULL, NULL },
480 { "2", 0x00a7, 0, NULL, NULL },
481 { "3", 0x00a8, 0, NULL, NULL },
482 { "bl", 0x00a9, 0, NULL, NULL },
483 { "bs", 0x00aa, 0, NULL, NULL },
484 { "bell", 0x00ab, 0, NULL, NULL },
485 { "bounds", 0x00ac, 0, NULL, NULL },
486 { "here", 0x00ad, 0, NULL, NULL },
487 { "aligned", 0x00ae, 0, NULL, NULL },
488 { "wbsplit", 0x00af, 0, NULL, NULL },
489 { "bwjoin", 0x00b0, 0, NULL, NULL },
490 { "b(<mark)", 0x00b1, 0, NULL, NULL },
491 { "b(>resolve)", 0x00b2, 0, NULL, NULL },
492 { "set-token-table", 0x00b3, 0, NULL, NULL },
493 { "set-table", 0x00b4, 0, NULL, NULL },
494 { "new-token", 0x00b5, 0, NULL, NULL },
495 { "named-token", 0x00b6, 0, NULL, NULL },
496 { "b(:)", 0x00b7, 0, NULL, NULL },
497 { "b(value)", 0x00b8, 0, NULL, NULL },
498 { "b(variable)", 0x00b9, 0, NULL, NULL },
499 { "b(constant)", 0x00ba, 0, NULL, NULL },
500 { "b(create)", 0x00bb, 0, NULL, NULL },
501 { "b(defer)", 0x00bc, 0, NULL, NULL },
502 { "b(buffer:)", 0x00bd, 0, NULL, NULL },
503 { "b(field)", 0x00be, 0, NULL, NULL },
504 { "b(code)", 0x00bf, 0, NULL, NULL },
505 { "instance", 0x00c0, 0, NULL, NULL },
506 { "b(;)", 0x00c2, 0, NULL, NULL },
507 { "b(to)", 0x00c3, 0, NULL, NULL },
508 { "b(case)", 0x00c4, 0, NULL, NULL },
509 { "b(endcase)", 0x00c5, 0, NULL, NULL },
510 { "b(endof)", 0x00c6, 0, NULL, NULL },
511 { "#", 0x00c7, 0, NULL, NULL },
512 { "#s", 0x00c8, 0, NULL, NULL },
513 { "#>", 0x00c9, 0, NULL, NULL },
514 { "external-token", 0x00ca, 0, NULL, NULL },
515 { "$find", 0x00cb, 0, NULL, NULL },
516 { "offset16", 0x00cc, 0, NULL, NULL },
517 { "evaluate", 0x00cd, 0, NULL, NULL },
518 { "c,", 0x00d0, 0, NULL, NULL },
519 { "w,", 0x00d1, 0, NULL, NULL },
520 { "l,", 0x00d2, 0, NULL, NULL },
521 { ",", 0x00d3, 0, NULL, NULL },
522 { "um*", 0x00d4, 0, NULL, NULL },
523 { "um/mod", 0x00d5, 0, NULL, NULL },
524 { "d+", 0x00d8, 0, NULL, NULL },
525 { "d-", 0x00d9, 0, NULL, NULL },
526 { "get-token", 0x00da, 0, NULL, NULL },
527 { "set-token", 0x00db, 0, NULL, NULL },
528 { "state", 0x00dc, 0, NULL, NULL },
529 { "compile,", 0x00dd, 0, NULL, NULL },
530 { "behavior", 0x00de, 0, NULL, NULL },
531 { "start0", 0x00f0, 0, NULL, NULL },
532 { "start1", 0x00f1, 0, NULL, NULL },
533 { "start2", 0x00f2, 0, NULL, NULL },
534 { "start4", 0x00f3, 0, NULL, NULL },
535 { "ferror", 0x00fc, 0, NULL, NULL },
536 { "version1", 0x00fd, 0, NULL, NULL },
537 { "4-byte-id", 0x00fe, 0, NULL, NULL },
538 { "end1", 0x00ff, 0, NULL, NULL },
539 { "dma-alloc", 0x0101, 0, NULL, NULL },
540 { "my-address", 0x0102, 0, NULL, NULL },
541 { "my-space", 0x0103, 0, NULL, NULL },
542 { "memmap", 0x0104, 0, NULL, NULL },
543 { "free-virtual", 0x0105, 0, NULL, NULL },
544 { ">physical", 0x0106, 0, NULL, NULL },
545 { "my-params", 0x010f, 0, NULL, NULL },
546 { "property", 0x0110, 0, NULL, NULL },
547 { "encode-int", 0x0111, 0, NULL, NULL },
548 { "encode+", 0x0112, 0, NULL, NULL },
549 { "encode-phys", 0x0113, 0, NULL, NULL },
550 { "encode-string", 0x0114, 0, NULL, NULL },
551 { "encode-bytes", 0x0115, 0, NULL, NULL },
552 { "reg", 0x0116, 0, NULL, NULL },
553 { "intr", 0x0117, 0, NULL, NULL },
554 { "driver", 0x0118, 0, NULL, NULL },
555 { "model", 0x0119, 0, NULL, NULL },
556 { "device-type", 0x011a, 0, NULL, NULL },
557 { "parse-2int", 0x011b, 0, NULL, NULL },
558 { "is-install", 0x011c, 0, NULL, NULL },
559 { "is-remove", 0x011d, 0, NULL, NULL },
560 { "is-selftest", 0x011e, 0, NULL, NULL },
561 { "new-device", 0x011f, 0, NULL, NULL },
562 { "diagnostic-mode?", 0x0120, 0, NULL, NULL },
563 { "display-status", 0x0121, 0, NULL, NULL },
564 { "memory-test-suite", 0x0122, 0, NULL, NULL },
565 { "group-code", 0x0123, 0, NULL, NULL },
566 { "mask", 0x0124, 0, NULL, NULL },
567 { "get-msecs", 0x0125, 0, NULL, NULL },
568 { "ms", 0x0126, 0, NULL, NULL },
569 { "finish-device", 0x0127, 0, NULL, NULL },
570 { "decode-phys", 0x0128, 0, NULL, NULL },
571 { "map-low", 0x0130, 0, NULL, NULL },
572 { "sbus-intr>cpu", 0x0131, 0, NULL, NULL },
573 { "#lines", 0x0150, 0, NULL, NULL },
574 { "#columns", 0x0151, 0, NULL, NULL },
575 { "line#", 0x0152, 0, NULL, NULL },
576 { "column#", 0x0153, 0, NULL, NULL },
577 { "inverse?", 0x0154, 0, NULL, NULL },
578 { "inverse-screen?", 0x0155, 0, NULL, NULL },
579 { "frame-buffer-busy?", 0x0156, 0, NULL, NULL },
580 { "draw-character", 0x0157, 0, NULL, NULL },
581 { "reset-screen", 0x0158, 0, NULL, NULL },
582 { "toggle-cursor", 0x0159, 0, NULL, NULL },
583 { "erase-screen", 0x015a, 0, NULL, NULL },
584 { "blink-screen", 0x015b, 0, NULL, NULL },
585 { "invert-screen", 0x015c, 0, NULL, NULL },
586 { "insert-characters", 0x015d, 0, NULL, NULL },
587 { "delete-characters", 0x015e, 0, NULL, NULL },
588 { "insert-lines", 0x015f, 0, NULL, NULL },
589 { "delete-lines", 0x0160, 0, NULL, NULL },
590 { "draw-logo", 0x0161, 0, NULL, NULL },
591 { "frame-buffer-addr", 0x0162, 0, NULL, NULL },
592 { "screen-height", 0x0163, 0, NULL, NULL },
593 { "screen-width", 0x0164, 0, NULL, NULL },
594 { "window-top", 0x0165, 0, NULL, NULL },
595 { "window-left", 0x0166, 0, NULL, NULL },
596 { "default-font", 0x016a, 0, NULL, NULL },
597 { "set-font", 0x016b, 0, NULL, NULL },
598 { "char-height", 0x016c, 0, NULL, NULL },
599 { "char-width", 0x016d, 0, NULL, NULL },
600 { ">font", 0x016e, 0, NULL, NULL },
601 { "fontbytes", 0x016f, 0, NULL, NULL },
602 { "fb8-draw-character", 0x0180, 0, NULL, NULL },
603 { "fb8-reset-screen", 0x0181, 0, NULL, NULL },
604 { "fb8-toggle-cursor", 0x0182, 0, NULL, NULL },
605 { "fb8-erase-screen", 0x0183, 0, NULL, NULL },
606 { "fb8-blink-screen", 0x0184, 0, NULL, NULL },
607 { "fb8-invert-screen", 0x0185, 0, NULL, NULL },
608 { "fb8-insert-characters", 0x0186, 0, NULL, NULL },
609 { "fb8-delete-characters", 0x0187, 0, NULL, NULL },
610 { "fb8-inisert-lines", 0x0188, 0, NULL, NULL },
611 { "fb8-delete-lines", 0x0189, 0, NULL, NULL },
612 { "fb8-draw-logo", 0x018a, 0, NULL, NULL },
613 { "fb8-install", 0x018b, 0, NULL, NULL },
614 { "return-buffer", 0x01a0, 0, NULL, NULL },
615 { "xmit-packet", 0x01a1, 0, NULL, NULL },
616 { "poll-packet", 0x01a2, 0, NULL, NULL },
617 { "mac-address", 0x01a4, 0, NULL, NULL },
618 { "device-name", 0x0201, 0, NULL, NULL },
619 { "my-args", 0x0202, 0, NULL, NULL },
620 { "my-self", 0x0203, 0, NULL, NULL },
621 { "find-package", 0x0204, 0, NULL, NULL },
622 { "open-package", 0x0205, 0, NULL, NULL },
623 { "close-package", 0x0206, 0, NULL, NULL },
624 { "find-method", 0x0207, 0, NULL, NULL },
625 { "call-package", 0x0208, 0, NULL, NULL },
626 { "$call-parent", 0x0209, 0, NULL, NULL },
627 { "my-parent", 0x020a, 0, NULL, NULL },
628 { "ihandle>phandle", 0x020b, 0, NULL, NULL },
629 { "my-unit", 0x020d, 0, NULL, NULL },
630 { "$call-method", 0x020e, 0, NULL, NULL },
631 { "$open-package", 0x020f, 0, NULL, NULL },
632 { "processor-type", 0x0210, 0, NULL, NULL },
633 { "firmware-version", 0x0211, 0, NULL, NULL },
634 { "fcode-version", 0x0212, 0, NULL, NULL },
635 { "alarm", 0x0213, 0, NULL, NULL },
636 { "(is-user-word)", 0x0214, 0, NULL, NULL },
637 { "suspend-fcode", 0x0215, 0, NULL, NULL },
638 { "abort", 0x0216, 0, NULL, NULL },
639 { "catch", 0x0217, 0, NULL, NULL },
640 { "throw", 0x0218, 0, NULL, NULL },
641 { "user-abort", 0x0219, 0, NULL, NULL },
642 { "get-my-property", 0x021a, 0, NULL, NULL },
643 { "decode-int", 0x021b, 0, NULL, NULL },
644 { "decode-string", 0x021c, 0, NULL, NULL },
645 { "get-inherited-property", 0x021d, 0, NULL, NULL },
646 { "delete-property", 0x021e, 0, NULL, NULL },
647 { "get-package-property", 0x021f, 0, NULL, NULL },
648 { "cpeek", 0x0220, 0, NULL, NULL },
649 { "wpeek", 0x0221, 0, NULL, NULL },
650 { "lpeek", 0x0222, 0, NULL, NULL },
651 { "cpoke", 0x0223, 0, NULL, NULL },
652 { "wpoke", 0x0224, 0, NULL, NULL },
653 { "lpoke", 0x0225, 0, NULL, NULL },
654 { "lwflip", 0x0226, 0, NULL, NULL },
655 { "lbflip", 0x0227, 0, NULL, NULL },
656 { "lbflips", 0x0228, 0, NULL, NULL },
657 { "adr-mask", 0x0229, 0, NULL, NULL },
658 { "rb@", 0x0230, 0, NULL, NULL },
659 { "rb!", 0x0231, 0, NULL, NULL },
660 { "rw@", 0x0232, 0, NULL, NULL },
661 { "rw!", 0x0233, 0, NULL, NULL },
662 { "rl@", 0x0234, 0, NULL, NULL },
663 { "rl!", 0x0235, 0, NULL, NULL },
664 { "wbflips", 0x0236, 0, NULL, NULL },
665 { "lwflips", 0x0237, 0, NULL, NULL },
666 { "probe", 0x0238, 0, NULL, NULL },
667 { "probe-virtual", 0x0239, 0, NULL, NULL },
668 { "child", 0x023b, 0, NULL, NULL },
669 { "peer", 0x023c, 0, NULL, NULL },
670 { "next-property", 0x023d, 0, NULL, NULL },
671 { "byte-load", 0x023e, 0, NULL, NULL },
672 { "set-args", 0x023f, 0, NULL, NULL },
673 { "left-parse-string", 0x0240, 0, NULL, NULL },
674 /* 64-bit FCode extensions */
675 { "bxjoin", 0x0241, 0, NULL, NULL },
676 { "<l@", 0x0242, 0, NULL, NULL },
677 { "lxjoin", 0x0243, 0, NULL, NULL },
678 { "rx@", 0x022e, 0, NULL, NULL },
679 { "rx!", 0x022f, 0, NULL, NULL },
680 { "wxjoin", 0x0244, 0, NULL, NULL },
681 { "x,", 0x0245, 0, NULL, NULL },
682 { "x@", 0x0246, 0, NULL, NULL },
683 { "x!", 0x0247, 0, NULL, NULL },
684 { "/x", 0x0248, 0, NULL, NULL },
685 { "/x*", 0x0249, 0, NULL, NULL },
686 { "xa+", 0x024a, 0, NULL, NULL },
687 { "xa1+", 0x024b, 0, NULL, NULL },
688 { "xbflip", 0x024c, 0, NULL, NULL },
689 { "xbflips", 0x024d, 0, NULL, NULL },
690 { "xbsplit", 0x024e, 0, NULL, NULL },
691 { "xlflip", 0x024f, 0, NULL, NULL },
692 { "xlflips", 0x0250, 0, NULL, NULL },
693 { "xlsplit", 0x0251, 0, NULL, NULL },
694 { "xwflip", 0x0252, 0, NULL, NULL },
695 { "xwflips", 0x0253, 0, NULL, NULL },
696 { "xwsplit", 0x0254, 0, NULL, NULL },
697 { NULL, 0, 0, NULL, NULL }
698 };
699
700 /*
701 * Default macros -- can be overridden by colon definitions.
702 */
703 static struct macro macros[] = {
704 { "eval", "evaluate", 0, NULL, NULL }, /* Build a more balanced tree */
705 { "(.)", "dup abs <# u#s swap sign u#>", 0, NULL, NULL },
706 { "<<", "lshift", 0, NULL, NULL },
707 { ">>", "rshift", 0, NULL, NULL },
708 { "?", "@ .", 0, NULL, NULL },
709 { "1+", "1 +", 0, NULL, NULL },
710 { "1-", "1 -", 0, NULL, NULL },
711 { "2+", "2 +", 0, NULL, NULL },
712 { "2-", "2 -", 0, NULL, NULL },
713 { "abort\"", "-2 throw", 0, NULL, NULL },
714 { "accept", "span @ -rot expect span @ swap span !", 0, NULL, NULL },
715 { "allot", "0 max 0 ?do 0 c, loop", 0, NULL, NULL },
716 { "blank", "bl fill", 0, NULL, NULL },
717 { "/c*", "chars", 0, NULL, NULL },
718 { "ca1+", "char+", 0, NULL, NULL },
719 { "carret", "b(lit) 00 00 00 h# 0d", 0, NULL, NULL },
720 { ".d", "base @ swap d# 0a base ! . base !", 0, NULL, NULL },
721 { "decode-bytes", ">r over r@ + swap r@ - rot r>", 0, NULL, NULL },
722 { "3drop", "drop 2drop", 0, NULL, NULL },
723 { "3dup", "2 pick 2 pick 2 pick", 0, NULL, NULL },
724 { "erase", "0 fill", 0, NULL, NULL },
725 { "false", "0", 0, NULL, NULL },
726 { ".h", "base @ swap d# 10 base ! . base !", 0, NULL, NULL },
727 { "linefeed", "b(lit) 00 00 00 d# 0a", 0, NULL, NULL },
728 { "/n*", "cells", 0, NULL, NULL },
729 { "na1+", "cell+", 0, NULL, NULL },
730 { "not", "invert", 0, NULL, NULL },
731 { "s.", "(.) type space", 0, NULL, NULL },
732 { "space", "bl emit", 0, NULL, NULL },
733 { "spaces", "0 max 0 ?do space loop", 0, NULL, NULL },
734 { "struct", "0", 0, NULL, NULL },
735 { "true", "-1", 0, NULL, NULL },
736 { "(u,)", "<# u#s u#>", 0, NULL, NULL },
737 { NULL, NULL, 0, NULL, NULL }
738 };
739
740 /*
741 * Utility functions.
742 */
743
744 /*
745 * ASCII -> long int converter, eats `.'s
746 */
747 #define strtol(x, y, z) cvt(x, y, z)
748 static Cell
749 cvt(const char *s, char **e, int base)
750 {
751 Cell v = 0;
752 int c, n = 0;
753
754 c = *s;
755 if (c == '-') { n = 1; s++; }
756
757 for (c = *s; (c = *s); s++) {
758
759 /* Ignore `.' */
760 if (c == '.')
761 continue;
762 if (c >= '0' && c <= '9')
763 c -= '0';
764 else if (c >= 'a' && c <= 'f')
765 c += 10 - 'a';
766 else if (c >= 'A' && c <= 'F')
767 c += 10 - 'A';
768 if (c >= base)
769 break;
770 v *= base;
771 v += c;
772 }
773 if (e)
774 *e = __UNCONST(s);
775 if (n)
776 return (-v);
777 return (v);
778 }
779
780 /*
781 * Parser stack control functions.
782 */
783
784 static void
785 push(Cell val)
786 {
787 if (debug > 1)
788 printf("push %lx\n", (long)val);
789 parse_stack[parse_stack_ptr++] = val;
790 if (parse_stack_ptr >= PSTKSIZ)
791 errx(EXIT_FAILURE, "Parse stack overflow");
792 }
793
794 static Cell
795 pop(void)
796 {
797 ASSERT(parse_stack_ptr);
798 if (debug > 1)
799 printf("pop %lx\n", (long)parse_stack[parse_stack_ptr-1]);
800 return parse_stack[--parse_stack_ptr];
801 }
802
803 static int
804 depth(void)
805 {
806 return (parse_stack_ptr);
807 }
808
809 /*
810 * Insert fcode into dictionary.
811 */
812 static int
813 fadd(struct fcode *dict, struct fcode *new)
814 {
815 int res = strcmp(dict->name, new->name);
816
817 new->type = FCODE;
818 ASSERT(dict->type == FCODE);
819 if (!res) {
820 /*
821 * Duplicate entry. Give the old name the new FCode
822 * number.
823 */
824 dict->num = new->num;
825 return (0);
826 }
827 if (res < 0) {
828 if (dict->l)
829 return fadd(dict->l, new);
830 else {
831 if (debug > 5)
832 printf("fadd: new FCode `%s' is %lx\n",
833 new->name, new->num);
834 new->l = new->r = NULL;
835 dict->l = new;
836 }
837 } else {
838 if (dict->r)
839 return fadd(dict->r, new);
840 else {
841 if (debug > 5)
842 printf("fadd: new FCode `%s' is %lx\n",
843 new->name, new->num);
844 new->l = new->r = NULL;
845 dict->r = new;
846 }
847 }
848 return (1);
849 }
850
851 /*
852 * Look for a code in the dictionary.
853 */
854 static struct fcode *
855 flookup(struct fcode *dict, const char *str)
856 {
857 int res;
858 if (!dict) return (dict);
859
860 res = strcmp(dict->name, str);
861 ASSERT(dict->type == FCODE);
862 if (debug > 5)
863 printf("flookup: `%s' and `%s' %s match\n",
864 str, dict->name, res?"don't":"do");
865 if (!res) return (dict);
866 if (res < 0)
867 return (flookup(dict->l, str));
868 else
869 return (flookup(dict->r, str));
870
871 }
872
873 /*
874 * Insert alias into macros.
875 */
876 static int
877 aadd(struct macro *dict, struct macro *new)
878 {
879 int res = strcmp(dict->name, new->name);
880
881 new->type = MACRO;
882 ASSERT(dict->type == MACRO);
883 if (!res) {
884 /* Duplicate name. Replace the old macro */
885 dict->equiv = new->equiv;
886 /* We can't free the old equiv since it may be static data. */
887 return (0);
888 }
889 if (res < 0) {
890 if (dict->l)
891 return aadd(dict->l, new);
892 else {
893 new->l = new->r = NULL;
894 dict->l = new;
895 if (debug > 5)
896 printf("aadd: new alias `%s' to `%s'\n",
897 new->name, new->equiv);
898 }
899 } else {
900 if (dict->r)
901 return aadd(dict->r, new);
902 else {
903 new->l = new->r = NULL;
904 dict->r = new;
905 if (debug > 5)
906 printf("aadd: new alias `%s' to `%s'\n",
907 new->name, new->equiv);
908 }
909 }
910 return (1);
911 }
912
913 /*
914 * Look for a macro in the aliases.
915 */
916 static struct macro *
917 alookup(struct macro *dict, const char *str)
918 {
919 int res;
920 if (!dict) return (dict);
921
922 ASSERT(dict->type == MACRO);
923 res = strcmp(dict->name, str);
924 if (!res) return (dict);
925 if (res < 0)
926 return (alookup(dict->l, str));
927 else
928 return (alookup(dict->r, str));
929
930 }
931
932 /*
933 * Bootstrap the dictionary and then install
934 * all the standard FCodes.
935 */
936 static void
937 initdic(void)
938 {
939 struct fcode *code = fcodes;
940 struct macro *alias = macros;
941
942 ASSERT(dictionary == NULL);
943 code->l = code->r = NULL;
944 dictionary = code;
945 code->type = FCODE;
946
947 while ((++code)->name) {
948 if(!fadd(dictionary, code)) {
949 warnx("%s: duplicate dictionary entry `%s'", __func__,
950 code->name);
951 }
952 }
953
954 ASSERT(aliases == NULL);
955 aliases = alias;
956 alias->l = alias->r = NULL;
957 alias->type = MACRO;
958 while ((++alias)->name) {
959 if(!aadd(aliases, alias)) {
960 warnx("%s: duplicate macro entry `%s'", __func__,
961 alias->name);
962 }
963 }
964
965 }
966
967 static int
968 apply_macros(YY_BUFFER_STATE yinput, const char *str)
969 {
970 struct macro *xform = alookup(aliases, str);
971
972 if (xform) {
973 YY_BUFFER_STATE newbuf;
974
975 if (debug > 1)
976 printf("Expanding %s to %s\n", str, xform->equiv);
977
978 newbuf = yy_scan_string(xform->equiv);
979 yy_switch_to_buffer(newbuf);
980 tokenize(newbuf);
981 yy_switch_to_buffer(yinput);
982 yy_delete_buffer(newbuf);
983 }
984 return (xform != NULL);
985 }
986
987 static void
988 usage(void)
989 {
990 (void)fprintf(stderr, "usage: %s [-d level] [-o outfile] infile\n",
991 getprogname());
992 exit(EXIT_FAILURE);
993 }
994
995 int
996 main(int argc, char *argv[])
997 {
998 int ch;
999 FILE *inf;
1000 struct fcode_header *fheader;
1001 YY_BUFFER_STATE inbuf;
1002 const char *hdrtype = "version1";
1003 int i;
1004
1005 outf = 1; /* stdout */
1006
1007 while ((ch = getopt(argc, argv, "d:o:")) != -1)
1008 switch(ch) {
1009 case 'd':
1010 mark_fload = 1;
1011 debug = atol(optarg);
1012 break;
1013 case 'o':
1014 outfile = optarg;
1015 break;
1016 default:
1017 usage();
1018 }
1019 argc -= optind;
1020 argv += optind;
1021
1022 if (argc != 1)
1023 usage();
1024
1025 infile = argv[0];
1026
1027 /*
1028 * Initialization stuff.
1029 */
1030 initdic();
1031 outbufsiz = BUFCLICK;
1032 fheader = emalloc(outbufsiz);
1033 outbuf = (void *)fheader;
1034 outpos = 0;
1035 emit(hdrtype);
1036 outpos = sizeof(*fheader);
1037
1038 /*
1039 * Do it.
1040 */
1041 if ((inf = fopen(infile, "r")) == NULL)
1042 err(EXIT_FAILURE, "Cannot open `%s'", infile);
1043
1044 inbuf = yy_create_buffer(inf, YY_BUF_SIZE);
1045 yy_switch_to_buffer(inbuf);
1046 tokenize(inbuf);
1047 yy_delete_buffer(inbuf);
1048 fclose(inf);
1049 if (need_end0) emit("end0");
1050
1051 /* Now calculate length and checksum and stick them in the header */
1052 fheader->format = 0x08;
1053 fheader->length = htonl(outpos);
1054 fheader->checksum = 0;
1055 for (i = sizeof(*fheader); i<outpos; i++)
1056 fheader->checksum += (unsigned char)outbuf[i];
1057 fheader->checksum = htons(fheader->checksum);
1058
1059 if ((outf = open(outfile, O_WRONLY|O_CREAT|O_TRUNC, 0666)) == -1)
1060 err(EXIT_FAILURE, "Cannot open `%s'", outfile);
1061
1062 if (write(outf, outbuf, outpos) != outpos) {
1063 int serrno = errno;
1064 close(outf);
1065 unlink(outfile);
1066 errc(EXIT_FAILURE, serrno, "write error");
1067 }
1068 close(outf);
1069 return EXIT_SUCCESS;
1070 };
1071
1072 /*
1073 * Tokenize one file. This is a separate function so it can
1074 * be called recursively to parse multiple levels of include files.
1075 */
1076
1077 static void
1078 tokenize(YY_BUFFER_STATE yinput)
1079 {
1080 FILE *inf;
1081 YY_BUFFER_STATE inbuf;
1082 TOKEN *token;
1083 const char *last_token = "";
1084 struct fcode *fcode;
1085 int pos, off;
1086
1087 while ((token = yylex()) != NULL) {
1088 switch (token->type) {
1089 case TOK_NUMBER:
1090 STATE(token->text, "TOK_NUMBER");
1091 {
1092 char *end;
1093 Cell value;
1094
1095 if (tokenizer) {
1096 push(strtol(token->text, &end, 16));
1097 break;
1098 }
1099 value = strtol(token->text, &end, numbase);
1100 if (*end != 0)
1101 token_err(yylineno, infile, yytext,
1102 "illegal number conversion");
1103
1104 /*
1105 * If this is a 64-bit value we need to store two literals
1106 * and issue a `lxjoin' to combine them. But that's a future
1107 * project.
1108 */
1109 emit("b(lit)");
1110 spit((value>>24)&0x0ff);
1111 spit((value>>16)&0x0ff);
1112 spit((value>>8)&0x0ff);
1113 spit(value&0x0ff);
1114 if ((value>>32) != value && (value>>32) != 0 &&
1115 (value>>32) != -1) {
1116 emit("b(lit)");
1117 spit((value>>56)&0x0ff);
1118 spit((value>>48)&0x0ff);
1119 spit((value>>40)&0x0ff);
1120 spit((value>>32)&0x0ff);
1121 emit("lxjoin");
1122 }
1123 }
1124 break;
1125 case TOK_C_LIT:
1126 STATE(token->text, "TOK_C_LIT");
1127 emit("b(lit)");
1128 spit(0);
1129 spit(0);
1130 spit(0);
1131 spit(token->text[1]);
1132 break;
1133 case TOK_STRING_LIT:
1134 STATE(token->text, "TOK_STRING_LIT:");
1135 {
1136 size_t len;
1137 char *p = token->text;
1138
1139 ++p; /* Skip the quote */
1140 len = strlen(++p); /* Skip the 1st space */
1141
1142 #define ERR_TOOLONG \
1143 token_err(yylineno, infile, yytext, "string length %zu too long", len)
1144
1145 if (len > 255)
1146 ERR_TOOLONG;
1147
1148 if (p[len-1] == ')' ||
1149 p[len-1] == '"') {
1150 p[len-1] = 0;
1151 }
1152 emit("b(\")");
1153 sspit(p);
1154 }
1155 break;
1156 case TOK_PSTRING:
1157 STATE(token->text, "TOK_PSTRING:");
1158 {
1159 size_t len;
1160 char *p = token->text;
1161
1162 if (*p++ == '.') p++; /* Skip over delimiter */
1163 p++; /* Skip over space/tab */
1164
1165 len = strlen(p);
1166 if (len > 255)
1167 ERR_TOOLONG;
1168
1169 if (p[len-1] == ')' ||
1170 p[len-1] == '"') {
1171 p[len-1] = 0;
1172 }
1173 emit("b(\")");
1174 sspit(p);
1175 emit("type");
1176 }
1177 break;
1178 case TOK_ABORT_S:
1179 STATE(token->text, "TOK_PSTRING:");
1180 {
1181 size_t len;
1182 Cell value = -2;
1183 char *p = token->text;
1184
1185 while (*p++ != ' '); /* Skip to the string */
1186
1187 len = strlen(p);
1188 if (len > 255)
1189 ERR_TOOLONG;
1190
1191 if (p[len-1] == '"') {
1192 p[len-1] = 0;
1193 }
1194 emit("b?branch");
1195 push(outpos);
1196 offspit(0);
1197 emit("b(\")");
1198 sspit(p);
1199 emit("type");
1200 emit("cr");
1201 emit("b(lit)");
1202 spit((value>>24)&0x0ff);
1203 spit((value>>16)&0x0ff);
1204 spit((value>>8)&0x0ff);
1205 spit(value&0x0ff);
1206 emit("throw");
1207 emit("b(>resolve)");
1208 pos = outpos;
1209 outpos = pop();
1210 off = pos - outpos;
1211 offspit(off);
1212 outpos = pos;
1213 }
1214 break;
1215
1216 case TOK_TOKENIZE:
1217 STATE(token->text, "TOK_TOKENIZE");
1218 /* The next pass should tokenize the FCODE number */
1219 emit("b(')");
1220 break;
1221 case TOK_COMMENT:
1222 STATE(token->text, "TOK_COMMENT:");
1223 do {
1224 off = input();
1225 } while ((off != ')') && (off != '\n') &&
1226 (off != EOF));
1227 break;
1228 case TOK_COLON:
1229 STATE(token->text, "TOK_COLON:");
1230
1231 token = yylex();
1232 if (token == NULL)
1233 token_err(yylineno, infile, yytext,
1234 "EOF in colon definition");
1235
1236 /* Add new code to dictionary */
1237 fcode = emalloc(sizeof(*fcode));
1238 fcode->num = nextfcode++;
1239 fcode->name = estrdup(token->text);
1240 if (!fadd(dictionary, fcode)) {
1241 /* Duplicate definition. Free the memory. */
1242 if (debug)
1243 printf("%s: duplicate FCode\n",
1244 token->text);
1245 free(__UNCONST(fcode->name));
1246 free(fcode);
1247 }
1248 if (debug)
1249 printf("Adding %s to dictionary\n", token->text);
1250 if (state == 0)
1251 emit("new-token");
1252 else {
1253 if (state == TOK_EXTERNAL)
1254 emit("external-token");
1255 else
1256 /* Here we have a choice of new-token or named-token */
1257 emit("named-token");
1258 sspit(token->text);
1259 }
1260 spit(fcode->num);
1261 emit("b(:)");
1262 last_token = fcode->name;
1263 defining = 1;
1264 break;
1265 case TOK_SEMICOLON:
1266 STATE(token->text, "TOK_SEMICOLON:");
1267 emit("b(;)");
1268 defining = 0;
1269 if (depth()) {
1270 token_err(yylineno, infile, NULL,
1271 "Warning: stack depth %d at end of %s\n",
1272 depth(), last_token);
1273 }
1274 last_token = "";
1275 break;
1276
1277 /* These are special */
1278 case TOK_AGAIN:
1279 STATE(token->text, "TOK_AGAIN");
1280 emit("bbranch");
1281 pos = pop();
1282 pos = pos - outpos;
1283 offspit(pos);
1284 break;
1285 case TOK_ALIAS:
1286 STATE(token->text, "TOK_ALIAS");
1287 {
1288 struct macro *alias;
1289
1290 token = yylex();
1291 if (token == NULL) {
1292 warnx("EOF in alias definition");
1293 return;
1294 }
1295 if (token->type != TOK_OTHER) {
1296 warnx("ENDCOMMENT aliasing weird token type %d",
1297 token->type);
1298 }
1299 alias = emalloc(sizeof(*alias));
1300 alias->name = estrdup(token->text);
1301 token = yylex();
1302 if (token == NULL) {
1303 warnx("EOF in alias definition");
1304 free(__UNCONST(alias->name));
1305 free(alias);
1306 return;
1307 }
1308 alias->equiv = estrdup(token->text);
1309 if (!aadd(aliases, alias)) {
1310 free(__UNCONST(alias->name));
1311 free(alias);
1312 }
1313 }
1314 break;
1315 case TOK_GETTOKEN:
1316 STATE(token->text, "TOK_GETTOKEN");
1317 /* This is caused by ['] */
1318 emit("b(')");
1319 token = yylex();
1320 if (token == NULL) {
1321 warnx("EOF in [']");
1322 return;
1323 }
1324 if ((fcode = flookup(dictionary, token->text)) == NULL)
1325 errx(EXIT_FAILURE, "[']: %s not found",
1326 token->text);
1327 spit(fcode->num);
1328 break;
1329 case TOK_ASCII:
1330 STATE(token->text, "TOK_ASCII");
1331 token = yylex();
1332 if (token == NULL)
1333 errx(EXIT_FAILURE, "EOF after \"ascii\"");
1334 emit("b(lit)");
1335 spit(0);
1336 spit(0);
1337 spit(0);
1338 spit(token->text[0]);
1339 break;
1340 case TOK_BEGIN:
1341 STATE(token->text, "TOK_BEGIN");
1342 emit("b(<mark)");
1343 push(outpos);
1344 break;
1345 case TOK_BUFFER:
1346 STATE(token->text, "TOK_BUFFER");
1347
1348 token = yylex();
1349 if (token == NULL) {
1350 warnx("EOF in colon definition");
1351 return;
1352 }
1353
1354 /* Add new code to dictionary */
1355 fcode = emalloc(sizeof(*fcode));
1356 fcode->num = nextfcode++;
1357 fcode->name = estrdup(token->text);
1358 fadd(dictionary, fcode);
1359
1360 if (state == 0)
1361 emit("new-token");
1362 else {
1363 if (state == TOK_EXTERNAL)
1364 emit("external-token");
1365 else
1366 /* Here we have a choice of new-token or named-token */
1367 emit("named-token");
1368 sspit(token->text);
1369 }
1370 spit(fcode->num);
1371 emit("b(buffer:)");
1372 break;
1373 case TOK_CASE:
1374 STATE(token->text, "TOK_CASE");
1375 emit("b(case)");
1376 push(0);
1377 break;
1378 case TOK_CONSTANT:
1379 STATE(token->text, "TOK_CONSTANT");
1380
1381 token = yylex();
1382 if (token == NULL) {
1383 warnx("EOF in constant definition");
1384 return;
1385 }
1386
1387 /* Add new code to dictionary */
1388 fcode = emalloc(sizeof(*fcode));
1389 fcode->num = nextfcode++;
1390 fcode->name = estrdup(token->text);
1391 fadd(dictionary, fcode);
1392
1393 if (state == 0)
1394 emit("new-token");
1395 else {
1396 if (state == TOK_EXTERNAL)
1397 emit("external-token");
1398 else
1399 /* Here we have a choice of new-token or named-token */
1400 emit("named-token");
1401 sspit(token->text);
1402 }
1403 spit(fcode->num);
1404 emit("b(constant)");
1405 break;
1406 case TOK_CONTROL:
1407 STATE(token->text, "TOK_CONTROL");
1408 token = yylex();
1409 if (token == NULL)
1410 errx(EXIT_FAILURE, "EOF after \"ascii\"");
1411 emit("b(lit)");
1412 spit(0);
1413 spit(0);
1414 spit(0);
1415 spit(token->text[0]&0x1f);
1416 break;
1417 case TOK_CREATE:
1418 STATE(token->text, "TOK_CREATE");
1419 /* Don't know what this does or if it's right */
1420 token = yylex();
1421 if (token == NULL) {
1422 warnx("EOF in create definition");
1423 return;
1424 }
1425
1426 /* Add new code to dictionary */
1427 fcode = emalloc(sizeof(*fcode));
1428 fcode->num = nextfcode++;
1429 fcode->name = estrdup(token->text);
1430 fadd(dictionary, fcode);
1431
1432 if (state == 0)
1433 emit("new-token");
1434 else {
1435 if (state == TOK_EXTERNAL)
1436 emit("external-token");
1437 else
1438 /* Here we have a choice of new-token or named-token */
1439 emit("named-token");
1440 sspit(token->text);
1441 }
1442 spit(fcode->num);
1443 emit("b(create)");
1444 break;
1445 case TOK_DECIMAL:
1446 STATE(token->text, "TOK_DECIMAL");
1447 if (token->text[1] != '#') {
1448 if (defining) {
1449 emit("b(lit)");
1450 spit(0);
1451 spit(0);
1452 spit(0);
1453 spit(10);
1454 emit("base");
1455 emit("!");
1456 } else
1457 numbase = TOK_DECIMAL;
1458 } else {
1459 char *end;
1460 Cell value;
1461
1462 token = yylex();
1463 if (token == NULL) {
1464 warnx("EOF after d#");
1465 return;
1466 }
1467 if (token->type == TOK_OTHER) {
1468 if (strcmp("-1", token->text) == 0) {
1469 emit(token->text);
1470 break;
1471 }
1472 }
1473 value = strtol(token->text, &end, 10);
1474 if (*end != 0)
1475 token_err(yylineno, infile, NULL,
1476 "Illegal number conversion: %s", token->text);
1477
1478 /*
1479 * If this is a 64-bit value we need to store two literals
1480 * and issue a `lxjoin' to combine them. But that's a future
1481 * project.
1482 */
1483 emit("b(lit)");
1484 spit((value>>24)&0x0ff);
1485 spit((value>>16)&0x0ff);
1486 spit((value>>8)&0x0ff);
1487 spit(value&0x0ff);
1488 if ((value>>32) != value && (value>>32) != 0) {
1489 emit("b(lit)");
1490 spit((value>>56)&0x0ff);
1491 spit((value>>48)&0x0ff);
1492 spit((value>>40)&0x0ff);
1493 spit((value>>32)&0x0ff);
1494 emit("lxjoin");
1495 }
1496 }
1497 break;
1498 case TOK_DEFER:
1499 STATE(token->text, "TOK_DEFER");
1500 /* Don't know what this does or if it's right */
1501 token = yylex();
1502 if (token == NULL) {
1503 warnx("EOF in colon definition");
1504 return;
1505 }
1506
1507 /* Add new code to dictionary */
1508 fcode = emalloc(sizeof(*fcode));
1509 fcode->num = nextfcode++;
1510 fcode->name = estrdup(token->text);
1511 fadd(dictionary, fcode);
1512
1513 if (state == 0)
1514 emit("new-token");
1515 else {
1516 if (state == TOK_EXTERNAL)
1517 emit("external-token");
1518 else
1519 /* Here we have a choice of new-token or named-token */
1520 emit("named-token");
1521 sspit(token->text);
1522 }
1523 spit(fcode->num);
1524 emit("b(defer)");
1525 break;
1526 case TOK_DO:
1527 STATE(token->text, "TOK_DO");
1528 /*
1529 * From the 1275 spec. B is branch location, T is branch target.
1530 *
1531 * b(do) offset1 ... b(loop) offset2 ...
1532 * b(do) offset1 ... b(+loop) offset2 ...
1533 * b(?do) offset1 ... b(loop) offset2 ...
1534 * b(?do) offset1 ... b(+loop) offset2 ...
1535 * ^ ^
1536 * B1 ^ ^ T1
1537 * T2 B2
1538 *
1539 * How we do this is we generate the b(do) or b(?do), spit out a
1540 * zero offset while remembering b1 and t2. Then we call tokenize()
1541 * to generate the body. When tokenize() finds a b(loop) or b(+loop),
1542 * it generates the FCode and returns, with outpos at b2. We then
1543 * calculate the offsets, put them in the right slots and finishup.
1544 */
1545
1546 if (token->text[0] == '?')
1547 emit("b(?do)");
1548 else
1549 emit("b(do)");
1550 push(outpos);
1551 offspit(0); /* Place holder for later */
1552 push(outpos);
1553 break;
1554 case TOK_END0:
1555 STATE(token->text, "TOK_END0");
1556 emit("end0");
1557 /* Remember we already generated end0 */
1558 need_end0 = 0;
1559 break;
1560 case TOK_ELSE:
1561 STATE(token->text, "TOK_ELSE");
1562 /* Get where we need to patch */
1563 off = pop();
1564 emit("bbranch");
1565 /* Save where we are now. */
1566 push(outpos);
1567 offspit(0); /* Place holder for later */
1568 emit("b(>resolve)");
1569 /* Rewind and patch the if branch */
1570 pos = outpos;
1571 outpos = off;
1572 off = pos - off;
1573 offspit(off); /* Place holder for later */
1574 /* revert to the end */
1575 outpos = pos;
1576 break;
1577 case TOK_ENDCASE:
1578 STATE(token->text, "TOK_ENDCASE:");
1579 emit("b(endcase)");
1580 pos = outpos; /* Remember where we need to branch to */
1581
1582 /* Thread our way backwards and install proper offsets */
1583 off = pop();
1584 while (off) {
1585 int disp;
1586 int next;
1587
1588 /* Move to this offset */
1589 outpos = off;
1590 /* Load next offset to process */
1591 disp = (signed char)(outbuf[outpos]);
1592 if (offsetsize == 16) {
1593 disp = (disp << 8) |
1594 (unsigned char)outbuf[outpos+1];
1595 }
1596 next = outpos + disp;
1597 if (debug > -3)
1598 printf("Next endof: %x at %x\n",
1599 disp, next);
1600
1601 /* process this offset */
1602 off = pos - outpos;
1603 offspit(off);
1604 if ((off = disp))
1605 off = next;
1606 }
1607 outpos = pos;
1608 break;
1609 case TOK_ENDOF:
1610 STATE(token->text, "TOK_ENDOF");
1611 off = pop();
1612 emit("b(endof)");
1613 /*
1614 * Save back pointer in the offset field so we can traverse
1615 * the linked list and patch it in the endcase.
1616 */
1617 pos = pop(); /* get position of prev link. */
1618 push(outpos); /* save position of this link. */
1619 if (pos)
1620 /* save potision of prev link. */
1621 offspit(pos - outpos);
1622 else
1623 /* This is the first statement */
1624 offspit(0);
1625 pos = outpos;
1626 /* Now point the offset from b(of) here. */
1627 outpos = off;
1628 off = pos - off;
1629 offspit(off);
1630 /* Restore position */
1631 outpos = pos;
1632 break;
1633 case TOK_EXTERNAL:
1634 STATE(token->text, "TOK_EXTERNAL");
1635 state = TOK_EXTERNAL;
1636 break;
1637 case TOK_FCODE_VERSION2:
1638 /* This is actually a tokenizer directive. */
1639 STATE(token->text, "TOK_FCODE_VERSION2");
1640 offsetsize = 16;
1641 pos = outpos;
1642 outpos = 0;
1643 emit("start1");
1644 outpos = pos;
1645 break;
1646 case TOK_FCODE_END:
1647 /*
1648 * Another tokenizer directive.
1649 *
1650 * This should generate end0 and finish filling in
1651 * the FCode header. But that's all done in main().
1652 */
1653 STATE(token->text, "TOK_FCODE_END");
1654 return;
1655 case TOK_FIELD:
1656 STATE(token->text, "TOK_FIELD");
1657
1658 token = yylex();
1659 if (token == NULL) {
1660 warnx("EOF in field definition");
1661 return;
1662 }
1663
1664 /* Add new code to dictionary */
1665 fcode = emalloc(sizeof(*fcode));
1666 fcode->num = nextfcode++;
1667 fcode->name = estrdup(token->text);
1668 fadd(dictionary, fcode);
1669
1670 if (state == 0)
1671 emit("new-token");
1672 else {
1673 if (state == TOK_EXTERNAL)
1674 emit("external-token");
1675 else
1676 /* Here we have a choice of new-token or named-token */
1677 emit("named-token");
1678 sspit(token->text);
1679 }
1680 spit(fcode->num);
1681 emit("b(field)");
1682 break;
1683
1684 case TOK_HEX:
1685 STATE(token->text, "TOK_HEX");
1686 if (token->text[1] != '#') {
1687 if (defining) {
1688 emit("b(lit)");
1689 spit(0);
1690 spit(0);
1691 spit(0);
1692 spit(16);
1693 emit("base");
1694 emit("!");
1695 } else
1696 numbase = TOK_HEX;
1697 } else {
1698 char *end;
1699 Cell value;
1700
1701 token = yylex();
1702 if (token == NULL) {
1703 warnx("EOF after h#");
1704 return;
1705 }
1706 value = strtol(token->text, &end, 16);
1707 if (*end != 0)
1708 errx(EXIT_FAILURE, "Illegal number"
1709 " conversion:%s:%d: %s\n",
1710 infile, yylineno, yytext);
1711 /*
1712 * If this is a 64-bit value we need to store two literals
1713 * and issue a `lxjoin' to combine them. But that's a future
1714 * project.
1715 */
1716 emit("b(lit)");
1717 spit((value>>24)&0x0ff);
1718 spit((value>>16)&0x0ff);
1719 spit((value>>8)&0x0ff);
1720 spit(value&0x0ff);
1721 if ((value>>32) != value && (value>>32) != 0) {
1722 emit("b(lit)");
1723 spit((value>>56)&0x0ff);
1724 spit((value>>48)&0x0ff);
1725 spit((value>>40)&0x0ff);
1726 spit((value>>32)&0x0ff);
1727 emit("lxjoin");
1728 }
1729 }
1730 break;
1731 case TOK_HEADERLESS:
1732 STATE(token->text, "TOK_HEADERLESS");
1733 state = 0;
1734 break;
1735 case TOK_HEADERS:
1736 STATE(token->text, "TOK_HEADERS");
1737 state = TOK_HEADERS;
1738 break;
1739 case TOK_IF:
1740 STATE(token->text, "TOK_IF");
1741 /*
1742 * Similar to do but simpler since we only deal w/one branch.
1743 */
1744 emit("b?branch");
1745 push(outpos);
1746 offspit(0); /* Place holder for later */
1747 break;
1748 case TOK_LEAVE:
1749 STATE(token->text, "TOK_LEAVE");
1750 emit("b(leave)");
1751 break;
1752 case TOK_LOOP:
1753 STATE(token->text, "TOK_LOOP");
1754
1755 if (token->text[0] == '+')
1756 emit("b(+loop)");
1757 else
1758 emit("b(loop)");
1759 /* First do backwards branch of loop */
1760 pos = pop();
1761 off = pos - outpos;
1762 offspit(off);
1763 /* Now do forward branch of do */
1764 pos = outpos;
1765 outpos = pop();
1766 off = pos - outpos;
1767 spit(off);
1768 /* Restore output position */
1769 outpos = pos;
1770 break;
1771 case TOK_OCTAL:
1772 STATE(token->text, "TOK_OCTAL");
1773 if (token->text[1] != '#') {
1774 if (defining) {
1775 spit(16);
1776 emit("base");
1777 emit("!");
1778 } else
1779 numbase = TOK_OCTAL;
1780 } else {
1781 char *end;
1782 Cell value;
1783
1784 token = yylex();
1785 if (token == NULL) {
1786 warnx("EOF after o#");
1787 return;
1788 }
1789 value = strtol(token->text, &end, 8);
1790 if (*end != 0) {
1791 errx(EXIT_FAILURE, "Illegal number"
1792 " conversion:%s:%d: %s\n",
1793 infile, yylineno, yytext);
1794 }
1795 /*
1796 * If this is a 64-bit value we need to store two literals
1797 * and issue a `lxjoin' to combine them. But that's a future
1798 * project.
1799 */
1800 emit("b(lit)");
1801 spit((value>>24)&0x0ff);
1802 spit((value>>16)&0x0ff);
1803 spit((value>>8)&0x0ff);
1804 spit(value&0x0ff);
1805 if ((value>>32) != value && (value>>32) != 0) {
1806 emit("b(lit)");
1807 spit((value>>56)&0x0ff);
1808 spit((value>>48)&0x0ff);
1809 spit((value>>40)&0x0ff);
1810 spit((value>>32)&0x0ff);
1811 emit("lxjoin");
1812 }
1813 }
1814 break;
1815 case TOK_OF:
1816 STATE(token->text, "TOK_OF");
1817 /*
1818 * Let's hope I get the semantics right.
1819 *
1820 * The `of' behaves almost the same as an
1821 * `if'. The difference is that `endof'
1822 * takes a branch offset to the associated
1823 * `endcase'. Here we will generate a temporary
1824 * offset of the `of' associated with the `endof'.
1825 * Then in `endcase' we should be pointing just
1826 * after the offset of the last `endof' so we
1827 * calculate the offset and thread our way backwards
1828 * searching for the previous `b(case)' or `b(endof)'.
1829 */
1830 emit("b(of)");
1831 push(outpos);
1832 offspit(0); /* Place holder for later */
1833 break;
1834 case TOK_OFFSET16:
1835 STATE(token->text, "TOK_OFFSET16");
1836 offsetsize = 16;
1837 emit("offset16");
1838 break;
1839 case TOK_REPEAT:
1840 STATE(token->text, "TOK_REPEAT");
1841 emit("bbranch");
1842 pos = pop();
1843 off = pop();
1844 /* First the offset for the branch back to the begin */
1845 off -= outpos;
1846 offspit(off);
1847 emit("b(>resolve)");
1848 /* Now point the offset of the while here. */
1849 off = outpos;
1850 outpos = pos;
1851 pos = off - pos;
1852 offspit(pos);
1853 /* Return to the end of the output */
1854 outpos = off;
1855 break;
1856 case TOK_STARTX:
1857 /* Put a "startX" at addr 0. */
1858 STATE(token->text, "TOK_FCODE_VERSION2");
1859 offsetsize = 16;
1860 pos = outpos;
1861 outpos = 0;
1862 emit(token->text);
1863 outpos = pos;
1864 break;
1865 case TOK_THEN:
1866 STATE(token->text, "TOK_THEN");
1867 emit("b(>resolve)");
1868 pos = outpos;
1869 outpos = pop();
1870 off = pos - outpos;
1871 offspit(off);
1872 outpos = pos;
1873 break;
1874 case TOK_TO:
1875 STATE(token->text, "TOK_TO");
1876 /* The next pass should tokenize the FCODE number */
1877 emit("b(to)");
1878 break;
1879 case TOK_UNTIL:
1880 STATE(token->text, "TOK_UNTIL");
1881 emit("b?branch");
1882 pos = pop();
1883 pos -= outpos;
1884 offspit(pos);
1885 break;
1886 case TOK_VALUE:
1887 STATE(token->text, "TOK_VALUE");
1888
1889 token = yylex();
1890 if (token == NULL) {
1891 warnx("EOF in value definition");
1892 return;
1893 }
1894
1895 /* Add new code to dictionary */
1896 fcode = emalloc(sizeof(*fcode));
1897 fcode->num = nextfcode++;
1898 fcode->name = estrdup(token->text);
1899 fadd(dictionary, fcode);
1900
1901 if (state == 0)
1902 emit("new-token");
1903 else {
1904 if (state == TOK_EXTERNAL)
1905 emit("external-token");
1906 else
1907 /* Here we have a choice of new-token or named-token */
1908 emit("named-token");
1909 sspit(token->text);
1910 }
1911 spit(fcode->num);
1912 emit("b(value)");
1913 break;
1914 case TOK_VARIABLE:
1915 STATE(token->text, "TOK_VARIABLE");
1916
1917 token = yylex();
1918 if (token == NULL) {
1919 warnx("EOF in variable definition");
1920 return;
1921 }
1922
1923 /* Add new code to dictionary */
1924 fcode = emalloc(sizeof(*fcode));
1925 fcode->num = nextfcode++;
1926 fcode->name = estrdup(token->text);
1927 fadd(dictionary, fcode);
1928
1929 if (state == 0)
1930 emit("new-token");
1931 else {
1932 if (state == TOK_EXTERNAL)
1933 emit("external-token");
1934 else
1935 /* Here we have a choice of new-token or named-token */
1936 emit("named-token");
1937 sspit(token->text);
1938 }
1939 spit(fcode->num);
1940 emit("b(variable)");
1941 break;
1942 case TOK_VERSION1:
1943 /* This is actually a tokenizer directive. */
1944 STATE(token->text, "TOK_FCODE_VERSION1");
1945 offsetsize = 8;
1946 pos = outpos;
1947 outpos = 0;
1948 emit("version1");
1949 outpos = pos;
1950 break;
1951 case TOK_WHILE:
1952 STATE(token->text, "TOK_WHILE");
1953 emit("b?branch");
1954 push(outpos);
1955 offspit(0);
1956 break;
1957
1958 /* Tokenizer directives */
1959 case TOK_BEGTOK:
1960 STATE(token->text, "TOK_BEGTOK");
1961 tokenizer = 1;
1962 break;
1963 case TOK_EMIT_BYTE:
1964 STATE(token->text, "TOK_EMIT_BYTE");
1965 spit(pop());
1966 break;
1967 case TOK_ENDTOK:
1968 STATE(token->text, "TOK_ENDTOK");
1969 tokenizer = 0;
1970 break;
1971 case TOK_FLOAD:
1972 {
1973 char *oldinfile = infile;
1974
1975 STATE(token->text, "TOK_FLOAD");
1976 /* Parse a different file for a while */
1977 token = yylex();
1978 if ((inf = fopen(token->text, "r")) == NULL) {
1979 warn("Cannot open `%s'", token->text);
1980 break;
1981 }
1982 infile = estrdup(token->text);
1983 if (mark_fload) {
1984 /*
1985 * Insert commands to print out the
1986 * filename into the instruction
1987 * stream
1988 */
1989 emit("b(\")");
1990 sspit("fload-ing ");
1991 emit("type");
1992 emit("b(\")");
1993 sspit(infile);
1994 emit("type");
1995 emit("cr");
1996 emit(".s");
1997 }
1998 inbuf = yy_create_buffer(inf, YY_BUF_SIZE);
1999 yy_switch_to_buffer(inbuf);
2000
2001 printf("======= fload file %s\n", infile);
2002 tokenize(inbuf);
2003 printf("======= done file %s\n", infile);
2004 yy_switch_to_buffer(yinput);
2005 yy_delete_buffer(inbuf);
2006 fclose(inf);
2007 if (mark_fload) {
2008 /*
2009 * Insert commands to print out the
2010 * filename into the instruction
2011 * stream
2012 */
2013 emit("b(\")");
2014 sspit("fload-ed ");
2015 emit("type");
2016 emit("b(\")");
2017 sspit(infile);
2018 emit("type");
2019 emit("cr");
2020 emit(".s");
2021 emit("cr");
2022 }
2023 free(infile);
2024 infile = oldinfile;
2025 }
2026 break;
2027 case TOK_OTHER:
2028 STATE(token->text, "TOK_OTHER");
2029 if (apply_macros(yinput, token->text))
2030 break;
2031 if (emit(token->text)) {
2032 #if 0
2033 /*
2034 * Call an external command
2035 *
2036 * XXXXX assumes it will always find the command
2037 */
2038 sspit(token->text);
2039 emit("$find");
2040 emit("drop");
2041 emit("execute");
2042 #else
2043 token_err(yylineno, infile, yytext,
2044 "%s: undefined token `%s'\n",
2045 __func__, token->text);
2046 #endif
2047 }
2048 break;
2049 default:
2050 /* Nothing */ ;
2051 }
2052 }
2053 return;
2054 }
2055
2056 /*
2057 * print a tokenizer error message
2058 */
2059 static void
2060 token_err(int lineno, const char *file, const char *text, const char *fmt, ...)
2061 {
2062 va_list ap;
2063
2064 va_start(ap, fmt);
2065 fprintf(stderr, "%s: ", getprogname());
2066 if (file)
2067 (void)fprintf(stderr, "%s,%d: ", file, lineno);
2068 if (fmt)
2069 (void)vfprintf(stderr, fmt, ap);
2070 fputc('\n', stderr);
2071 if (text)
2072 fprintf(stderr, "\t%s", text);
2073 va_end(ap);
2074 exit(EXIT_FAILURE);
2075 }
2076
2077 /*
2078 * Lookup fcode string in dictionary and spit it out.
2079 *
2080 * Fcode must be in dictionary. No alias conversion done.
2081 */
2082 static int
2083 emit(const char *str)
2084 {
2085 struct fcode *code;
2086 if ((code = flookup(dictionary, str)))
2087 spit(code->num);
2088 if (debug > 1) {
2089 if (code)
2090 printf("emitting `%s'\n", code->name);
2091 else
2092 printf("emit: not found `%s'\n", str);
2093 }
2094 return (code == NULL);
2095 }
2096
2097 /*
2098 * Spit out an integral value as a series of FCodes.
2099 *
2100 * It will spit out one zero byte or as many bytes as are
2101 * non-zero.
2102 */
2103 static int
2104 spit(long n)
2105 {
2106 int count = 1;
2107
2108 if (n >> 8)
2109 count += spit(n >> 8);
2110 if ((size_t)outpos >= outbufsiz) {
2111 while ((size_t)outpos >= outbufsiz) outbufsiz += BUFCLICK;
2112 outbuf = erealloc(outbuf, outbufsiz);
2113 }
2114 if (debug > 3) printf("%lx: spitting %2.2x\n", outpos, (unsigned char)n);
2115 outbuf[outpos++] = n;
2116 return (count);
2117 }
2118
2119 /*
2120 * Spit out an FCode string.
2121 */
2122 static void
2123 sspit(const char *s)
2124 {
2125 int len = strlen(s);
2126
2127 if (len > 255) {
2128 warnx("string length %d too long", len);
2129 return;
2130 }
2131 if (debug > 2)
2132 printf("sspit: len %d str `%s'\n", len, s);
2133 spit(len);
2134 while (len--)
2135 spit(*s++);
2136 }
2137
2138 /*
2139 * Spit out an offset. Offsets can be 8 or 16 bits.
2140 * Bail if the value overflows. This is a little complicated since
2141 * offsets can be negative numbers.
2142 */
2143 static int
2144 offspit(long n)
2145 {
2146
2147 if (offsetsize == 16) {
2148 volatile int16_t off16 = n;
2149
2150 if (n != off16)
2151 token_err(yylineno, infile, NULL,
2152 "Offset16 offset overflow: %lx != %x\n",
2153 n, off16);
2154 spit((n>>8) & 0xff);
2155 return spit(n & 0xff);
2156 } else {
2157 volatile int8_t off8 = n;
2158
2159 if (n != off8)
2160 token_err(yylineno, infile, NULL,
2161 "Offset8 offset overflow: %lx != %x\n",
2162 n, off8);
2163 return spit(n & 0x0ffL);
2164 }
2165 }
2166
2167 int
2168 yywrap(void)
2169 {
2170 /* Always generate EOF */
2171 return (1);
2172 }
2173