yacc.y revision 1.25 1 1.25 tnozaki /* $NetBSD: yacc.y,v 1.25 2009/01/02 00:20:23 tnozaki Exp $ */
2 1.2 itojun
3 1.2 itojun %{
4 1.2 itojun /*-
5 1.2 itojun * Copyright (c) 1993
6 1.2 itojun * The Regents of the University of California. All rights reserved.
7 1.2 itojun *
8 1.2 itojun * This code is derived from software contributed to Berkeley by
9 1.2 itojun * Paul Borman at Krystal Technologies.
10 1.2 itojun *
11 1.2 itojun * Redistribution and use in source and binary forms, with or without
12 1.2 itojun * modification, are permitted provided that the following conditions
13 1.2 itojun * are met:
14 1.2 itojun * 1. Redistributions of source code must retain the above copyright
15 1.2 itojun * notice, this list of conditions and the following disclaimer.
16 1.2 itojun * 2. Redistributions in binary form must reproduce the above copyright
17 1.2 itojun * notice, this list of conditions and the following disclaimer in the
18 1.2 itojun * documentation and/or other materials provided with the distribution.
19 1.22 agc * 3. Neither the name of the University nor the names of its contributors
20 1.2 itojun * may be used to endorse or promote products derived from this software
21 1.2 itojun * without specific prior written permission.
22 1.2 itojun *
23 1.2 itojun * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
24 1.2 itojun * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
25 1.2 itojun * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
26 1.2 itojun * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
27 1.2 itojun * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
28 1.2 itojun * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
29 1.2 itojun * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
30 1.2 itojun * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
31 1.2 itojun * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
32 1.2 itojun * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
33 1.2 itojun * SUCH DAMAGE.
34 1.2 itojun */
35 1.2 itojun
36 1.23 lukem #if HAVE_NBTOOL_CONFIG_H
37 1.23 lukem #include "nbtool_config.h"
38 1.7 tv #endif
39 1.7 tv
40 1.2 itojun #include <sys/cdefs.h>
41 1.18 christos #ifndef lint
42 1.2 itojun #if 0
43 1.2 itojun static char sccsid[] = "@(#)yacc.y 8.1 (Berkeley) 6/6/93";
44 1.2 itojun static char rcsid[] = "$FreeBSD$";
45 1.2 itojun #else
46 1.25 tnozaki __RCSID("$NetBSD: yacc.y,v 1.25 2009/01/02 00:20:23 tnozaki Exp $");
47 1.2 itojun #endif
48 1.18 christos #endif /* not lint */
49 1.10 bjh21
50 1.10 bjh21 #include <sys/types.h>
51 1.10 bjh21 #include <netinet/in.h> /* Needed by <arpa/inet.h> on NetBSD 1.5. */
52 1.10 bjh21 #include <arpa/inet.h> /* Needed for htonl on POSIX systems. */
53 1.2 itojun
54 1.8 tv #include <err.h>
55 1.15 tshiozak #include "locale/runetype.h"
56 1.25 tnozaki #include <locale.h>
57 1.2 itojun #include <stddef.h>
58 1.2 itojun #include <stdio.h>
59 1.2 itojun #include <stdlib.h>
60 1.2 itojun #include <string.h>
61 1.2 itojun #include <unistd.h>
62 1.15 tshiozak #include <ctype.h>
63 1.2 itojun
64 1.2 itojun #include "ldef.h"
65 1.7 tv
66 1.4 thorpej const char *locale_file = "<stdout>";
67 1.2 itojun
68 1.2 itojun rune_map maplower = { { 0, }, };
69 1.2 itojun rune_map mapupper = { { 0, }, };
70 1.2 itojun rune_map types = { { 0, }, };
71 1.2 itojun
72 1.17 tshiozak _NBRuneLocale new_locale = { { 0, }, };
73 1.2 itojun
74 1.17 tshiozak __nbrune_t charsetbits = (__nbrune_t)0x00000000;
75 1.2 itojun #if 0
76 1.17 tshiozak __nbrune_t charsetmask = (__nbrune_t)0x0000007f;
77 1.2 itojun #endif
78 1.17 tshiozak __nbrune_t charsetmask = (__nbrune_t)0xffffffff;
79 1.2 itojun
80 1.2 itojun void set_map __P((rune_map *, rune_list *, u_int32_t));
81 1.2 itojun void set_digitmap __P((rune_map *, rune_list *));
82 1.2 itojun void add_map __P((rune_map *, rune_list *, u_int32_t));
83 1.2 itojun
84 1.2 itojun int main __P((int, char *[]));
85 1.25 tnozaki void usage __P((void));
86 1.2 itojun int yyerror __P((const char *s));
87 1.2 itojun void *xmalloc __P((unsigned int sz));
88 1.2 itojun u_int32_t *xlalloc __P((unsigned int sz));
89 1.2 itojun u_int32_t *xrelalloc __P((u_int32_t *old, unsigned int sz));
90 1.2 itojun void dump_tables __P((void));
91 1.2 itojun int yyparse __P((void));
92 1.2 itojun extern int yylex __P((void));
93 1.25 tnozaki
94 1.25 tnozaki /* mklocaledb.c */
95 1.25 tnozaki extern void mklocaledb __P((const char *, FILE *, FILE *));
96 1.25 tnozaki
97 1.2 itojun %}
98 1.2 itojun
/* Semantic value carried by tokens and non-terminals. */
%union	{
	__nbrune_t	rune;	/* RUNE */
	int		i;	/* LIST */
	char		*str;	/* VARIABLE, STRING */

	rune_list	*list;	/* list, map */
}

/* Tokens are declared in the same order as before so their numbers are unchanged. */
%token	<rune>	RUNE
%token		LBRK RBRK THRU MAPLOWER MAPUPPER DIGITMAP
%token	<i>	LIST
%token	<str>	VARIABLE
%token		CHARSET ENCODING INVALID
%token	<str>	STRING

%type	<list>	list map
123 1.2 itojun
124 1.2 itojun
125 1.2 itojun %%
126 1.2 itojun
/*
 * Start symbol: a source is either empty or a table.  The tables are
 * written out once the whole table has been reduced.
 */
locale	: /* empty */
	| table
		{
			dump_tables();
		}
	;
131 1.2 itojun
/* A table is one or more entries. */
table	: entry
	| table entry
	;
135 1.2 itojun
/*
 * One statement of the locale source: the encoding name, the variable
 * data, a charset selection, the invalid rune, a character-class list, or
 * one of the case/digit maps.
 */
entry	: ENCODING STRING
		{
			/*
			 * rl_encoding is later printed with %s, so the name
			 * has to leave room for the terminating NUL.
			 * strncpy() zero-fills the rest of the field.
			 */
			if (strlen($2) >= sizeof(new_locale.rl_encoding))
				errx(1, "ENCODING name too long: %s", $2);
			strncpy(new_locale.rl_encoding, $2,
			    sizeof(new_locale.rl_encoding));
		}
	| VARIABLE
		{
			/* The length includes the terminating NUL. */
			new_locale.rl_variable = strdup($1);
			if (new_locale.rl_variable == NULL)
				err(1, "unable to copy VARIABLE data");
			new_locale.rl_variable_len = strlen($1) + 1;
		}
	| CHARSET RUNE
		{
			charsetbits = $2;
			charsetmask = 0x0000007f;
		}
	| CHARSET RUNE RUNE
		{
			charsetbits = $2;
			charsetmask = $3;
		}
	| CHARSET STRING
		{
			size_t len = strlen($2);
			int final;

			/* The last character is needed; an empty string has none. */
			if (len == 0)
				errx(1, "CHARSET string must not be empty");

			final = $2[len - 1] & 0x7f;
			charsetbits = final << 24;
			if ($2[0] == '$') {
				charsetmask = 0x00007f7f;
				/*
				 * strchr() also matches the terminating NUL,
				 * so make sure a second character exists.
				 */
				if ($2[1] != '\0' && strchr(",-./", $2[1]))
					charsetbits |= 0x80;
				/*
				 * NOTE(review): final was masked with 0x7f
				 * above, so this range test can never be
				 * true; left as found.
				 */
				if (0xd0 <= final && final <= 0xdf)
					charsetmask |= 0x007f0000;
			} else {
				charsetmask = 0x0000007f;
				if (strchr(",-./", $2[0]))
					charsetbits |= 0x80;
				if (len == 2 && $2[0] == '!')
					charsetbits |= ((0x80 | $2[0]) << 16);
			}

			/*
			 * special rules
			 */
			if (charsetbits == ('B' << 24)
			    && charsetmask == 0x0000007f) {
				/*ASCII: 94B*/
				charsetbits = 0;
				charsetmask = 0x0000007f;
			} else if (charsetbits == (('A' << 24) | 0x80)
			    && charsetmask == 0x0000007f) {
				/*Latin1: 96A*/
				charsetbits = 0x80;
				charsetmask = 0x0000007f;
			}
		}
	| INVALID RUNE
		{
			new_locale.rl_invalid_rune = $2;
		}
	| LIST list
		{
			set_map(&types, $2, $1);
		}
	| MAPLOWER map
		{
			set_map(&maplower, $2, 0);
		}
	| MAPUPPER map
		{
			set_map(&mapupper, $2, 0);
		}
	| DIGITMAP map
		{
			set_digitmap(&types, $2);
		}
	;
189 1.2 itojun
/*
 * A list of runes and rune ranges.  Each item becomes one rune_list node
 * pushed on the front of the list, so the value of the rule is the node
 * for the item parsed last.  Nodes come from xmalloc(), which aborts
 * instead of returning NULL.  map is cleared because set_map() reads it
 * from the head node.
 */
list	: RUNE
		{
			$$ = (rune_list *)xmalloc(sizeof(rune_list));
			$$->min = ($1 & charsetmask) | charsetbits;
			$$->max = ($1 & charsetmask) | charsetbits;
			$$->map = 0;
			$$->next = 0;
		}
	| RUNE THRU RUNE
		{
			$$ = (rune_list *)xmalloc(sizeof(rune_list));
			$$->min = ($1 & charsetmask) | charsetbits;
			$$->max = ($3 & charsetmask) | charsetbits;
			$$->map = 0;
			$$->next = 0;
		}
	| list RUNE
		{
			$$ = (rune_list *)xmalloc(sizeof(rune_list));
			$$->min = ($2 & charsetmask) | charsetbits;
			$$->max = ($2 & charsetmask) | charsetbits;
			$$->map = 0;
			$$->next = $1;
		}
	| list RUNE THRU RUNE
		{
			$$ = (rune_list *)xmalloc(sizeof(rune_list));
			$$->min = ($2 & charsetmask) | charsetbits;
			$$->max = ($4 & charsetmask) | charsetbits;
			$$->map = 0;
			$$->next = $1;
		}
	;
219 1.2 itojun
/*
 * A list of bracketed mappings: either one rune to one target, or a range
 * of runes to consecutive targets starting at the rune after the colon.
 * Each mapping becomes one rune_list node pushed on the front of the list.
 * Source runes are masked with charsetmask/charsetbits here; the target is
 * stored as read.  Nodes come from xmalloc(), which aborts instead of
 * returning NULL.
 */
map	: LBRK RUNE RUNE RBRK
		{
			$$ = (rune_list *)xmalloc(sizeof(rune_list));
			$$->min = ($2 & charsetmask) | charsetbits;
			$$->max = ($2 & charsetmask) | charsetbits;
			$$->map = $3;
			$$->next = 0;
		}
	| map LBRK RUNE RUNE RBRK
		{
			$$ = (rune_list *)xmalloc(sizeof(rune_list));
			$$->min = ($3 & charsetmask) | charsetbits;
			$$->max = ($3 & charsetmask) | charsetbits;
			$$->map = $4;
			$$->next = $1;
		}
	| LBRK RUNE THRU RUNE ':' RUNE RBRK
		{
			$$ = (rune_list *)xmalloc(sizeof(rune_list));
			$$->min = ($2 & charsetmask) | charsetbits;
			$$->max = ($4 & charsetmask) | charsetbits;
			$$->map = $6;
			$$->next = 0;
		}
	| map LBRK RUNE THRU RUNE ':' RUNE RBRK
		{
			$$ = (rune_list *)xmalloc(sizeof(rune_list));
			$$->min = ($3 & charsetmask) | charsetbits;
			$$->max = ($5 & charsetmask) | charsetbits;
			$$->map = $7;
			$$->next = $1;
		}
	;
253 1.2 itojun %%
254 1.2 itojun
/* Set by -d; makes dump_tables() also print the tables on stderr. */
int	 debug = 0;
/* Output stream; NULL until -o opens a file or main() falls back to stdout. */
FILE	*ofile;
257 1.2 itojun
258 1.2 itojun int
259 1.2 itojun main(ac, av)
260 1.2 itojun int ac;
261 1.2 itojun char *av[];
262 1.2 itojun {
263 1.2 itojun int x;
264 1.25 tnozaki const char *locale_type;
265 1.2 itojun
266 1.2 itojun extern char *optarg;
267 1.2 itojun extern int optind;
268 1.2 itojun
269 1.25 tnozaki locale_type = NULL;
270 1.25 tnozaki while ((x = getopt(ac, av, "do:t:")) != EOF) {
271 1.2 itojun switch(x) {
272 1.2 itojun case 'd':
273 1.2 itojun debug = 1;
274 1.2 itojun break;
275 1.2 itojun case 'o':
276 1.2 itojun locale_file = optarg;
277 1.8 tv if ((ofile = fopen(locale_file, "w")) == 0)
278 1.5 thorpej err(1, "unable to open output file %s", locale_file);
279 1.2 itojun break;
280 1.25 tnozaki case 't':
281 1.25 tnozaki locale_type = optarg;
282 1.25 tnozaki break;
283 1.2 itojun default:
284 1.25 tnozaki usage();
285 1.2 itojun }
286 1.2 itojun }
287 1.2 itojun
288 1.2 itojun switch (ac - optind) {
289 1.2 itojun case 0:
290 1.2 itojun break;
291 1.2 itojun case 1:
292 1.5 thorpej if (freopen(av[optind], "r", stdin) == 0)
293 1.5 thorpej err(1, "unable to open input file %s", av[optind]);
294 1.2 itojun break;
295 1.2 itojun default:
296 1.25 tnozaki usage();
297 1.25 tnozaki }
298 1.25 tnozaki
299 1.25 tnozaki if (ofile == NULL)
300 1.25 tnozaki ofile = stdout;
301 1.25 tnozaki if (locale_type != NULL && strcasecmp(locale_type, "CTYPE")) {
302 1.25 tnozaki mklocaledb(locale_type, stdin, ofile);
303 1.25 tnozaki return 0;
304 1.2 itojun }
305 1.25 tnozaki
306 1.17 tshiozak for (x = 0; x < _NB_CACHED_RUNES; ++x) {
307 1.2 itojun mapupper.map[x] = x;
308 1.2 itojun maplower.map[x] = x;
309 1.2 itojun }
310 1.25 tnozaki
311 1.17 tshiozak new_locale.rl_invalid_rune = _NB_DEFAULT_INVALID_RUNE;
312 1.17 tshiozak memcpy(new_locale.rl_magic, _NB_RUNE_MAGIC_1, sizeof(new_locale.rl_magic));
313 1.2 itojun
314 1.2 itojun yyparse();
315 1.2 itojun
316 1.2 itojun return 0;
317 1.25 tnozaki
318 1.25 tnozaki }
319 1.25 tnozaki
/* Print the command synopsis on stderr and exit with status 1. */
void
usage(void)
{
	fputs("usage: mklocale [-d] [-o output] [-t type] [source]\n",
	    stderr);
	exit(1);
}
328 1.2 itojun
/*
 * Parser error hook: write the message and a newline on stderr.
 * Always returns 0.
 */
int
yyerror(const char *s)
{
	fputs(s, stderr);
	fputc('\n', stderr);
	return 0;
}
337 1.2 itojun
/*
 * malloc() wrapper that never returns NULL: on failure it reports the
 * error with perror() and aborts.
 */
void *
xmalloc(unsigned int sz)
{
	void *mem;

	mem = malloc(sz);
	if (mem == NULL) {
		perror("xmalloc");
		abort();
	}
	return mem;
}
349 1.2 itojun
/*
 * Allocate an array of `sz' u_int32_t values.  Never returns NULL: a
 * request whose byte size does not fit in size_t, or a failed malloc(),
 * is reported on stderr and the program aborts.
 */
u_int32_t *
xlalloc(unsigned int sz)
{
	u_int32_t *r;

	/* Refuse counts whose byte size would wrap around. */
	if (sz > (size_t)-1 / sizeof(*r)) {
		fprintf(stderr, "xlalloc: allocation size overflow\n");
		abort();
	}

	r = malloc(sz * sizeof(*r));
	if (r == NULL) {
		perror("xlalloc");
		abort();
	}
	return r;
}
361 1.2 itojun
/*
 * Resize the u_int32_t array `old' to hold `sz' values and return the new
 * address.  Never returns NULL: a request whose byte size does not fit in
 * size_t, or a failed realloc(), is reported on stderr and the program
 * aborts.
 */
u_int32_t *
xrelalloc(u_int32_t *old, unsigned int sz)
{
	u_int32_t *r;

	/* Refuse counts whose byte size would wrap around. */
	if (sz > (size_t)-1 / sizeof(*r)) {
		fprintf(stderr, "xrelalloc: allocation size overflow\n");
		abort();
	}

	r = realloc(old, sz * sizeof(*r));
	if (r == NULL) {
		perror("xrelalloc");
		abort();
	}
	return r;
}
375 1.2 itojun
376 1.2 itojun void
377 1.2 itojun set_map(map, list, flag)
378 1.2 itojun rune_map *map;
379 1.2 itojun rune_list *list;
380 1.2 itojun u_int32_t flag;
381 1.2 itojun {
382 1.2 itojun list->map &= charsetmask;
383 1.2 itojun list->map |= charsetbits;
384 1.2 itojun while (list) {
385 1.2 itojun rune_list *nlist = list->next;
386 1.2 itojun add_map(map, list, flag);
387 1.2 itojun list = nlist;
388 1.2 itojun }
389 1.2 itojun }
390 1.2 itojun
391 1.2 itojun void
392 1.2 itojun set_digitmap(map, list)
393 1.2 itojun rune_map *map;
394 1.2 itojun rune_list *list;
395 1.2 itojun {
396 1.17 tshiozak __nbrune_t i;
397 1.2 itojun
398 1.2 itojun while (list) {
399 1.2 itojun rune_list *nlist = list->next;
400 1.2 itojun for (i = list->min; i <= list->max; ++i) {
401 1.2 itojun if (list->map + (i - list->min)) {
402 1.2 itojun rune_list *tmp = (rune_list *)xmalloc(sizeof(rune_list));
403 1.2 itojun tmp->min = i;
404 1.2 itojun tmp->max = i;
405 1.2 itojun add_map(map, tmp, list->map + (i - list->min));
406 1.2 itojun }
407 1.2 itojun }
408 1.2 itojun free(list);
409 1.2 itojun list = nlist;
410 1.2 itojun }
411 1.2 itojun }
412 1.2 itojun
413 1.2 itojun void
414 1.2 itojun add_map(map, list, flag)
415 1.2 itojun rune_map *map;
416 1.2 itojun rune_list *list;
417 1.2 itojun u_int32_t flag;
418 1.2 itojun {
419 1.17 tshiozak __nbrune_t i;
420 1.2 itojun rune_list *lr = 0;
421 1.2 itojun rune_list *r;
422 1.17 tshiozak __nbrune_t run;
423 1.2 itojun
424 1.17 tshiozak while (list->min < _NB_CACHED_RUNES && list->min <= list->max) {
425 1.2 itojun if (flag)
426 1.2 itojun map->map[list->min++] |= flag;
427 1.2 itojun else
428 1.2 itojun map->map[list->min++] = list->map++;
429 1.2 itojun }
430 1.2 itojun
431 1.2 itojun if (list->min > list->max) {
432 1.2 itojun free(list);
433 1.2 itojun return;
434 1.2 itojun }
435 1.2 itojun
436 1.2 itojun run = list->max - list->min + 1;
437 1.2 itojun
438 1.2 itojun if (!(r = map->root) || (list->max < r->min - 1)
439 1.2 itojun || (!flag && list->max == r->min - 1)) {
440 1.2 itojun if (flag) {
441 1.2 itojun list->types = xlalloc(run);
442 1.2 itojun for (i = 0; i < run; ++i)
443 1.2 itojun list->types[i] = flag;
444 1.2 itojun }
445 1.2 itojun list->next = map->root;
446 1.2 itojun map->root = list;
447 1.2 itojun return;
448 1.2 itojun }
449 1.2 itojun
450 1.2 itojun for (r = map->root; r && r->max + 1 < list->min; r = r->next)
451 1.2 itojun lr = r;
452 1.2 itojun
453 1.2 itojun if (!r) {
454 1.2 itojun /*
455 1.2 itojun * We are off the end.
456 1.2 itojun */
457 1.2 itojun if (flag) {
458 1.2 itojun list->types = xlalloc(run);
459 1.2 itojun for (i = 0; i < run; ++i)
460 1.2 itojun list->types[i] = flag;
461 1.2 itojun }
462 1.2 itojun list->next = 0;
463 1.2 itojun lr->next = list;
464 1.2 itojun return;
465 1.2 itojun }
466 1.2 itojun
467 1.2 itojun if (list->max < r->min - 1) {
468 1.2 itojun /*
469 1.2 itojun * We come before this range and we do not intersect it.
470 1.2 itojun * We are not before the root node, it was checked before the loop
471 1.2 itojun */
472 1.2 itojun if (flag) {
473 1.2 itojun list->types = xlalloc(run);
474 1.2 itojun for (i = 0; i < run; ++i)
475 1.2 itojun list->types[i] = flag;
476 1.2 itojun }
477 1.2 itojun list->next = lr->next;
478 1.2 itojun lr->next = list;
479 1.2 itojun return;
480 1.2 itojun }
481 1.2 itojun
482 1.2 itojun /*
483 1.2 itojun * At this point we have found that we at least intersect with
484 1.2 itojun * the range pointed to by `r', we might intersect with one or
485 1.2 itojun * more ranges beyond `r' as well.
486 1.2 itojun */
487 1.2 itojun
488 1.2 itojun if (!flag && list->map - list->min != r->map - r->min) {
489 1.2 itojun /*
490 1.2 itojun * There are only two cases when we are doing case maps and
491 1.2 itojun * our maps needn't have the same offset. When we are adjoining
492 1.2 itojun * but not intersecting.
493 1.2 itojun */
494 1.2 itojun if (list->max + 1 == r->min) {
495 1.2 itojun lr->next = list;
496 1.2 itojun list->next = r;
497 1.2 itojun return;
498 1.2 itojun }
499 1.2 itojun if (list->min - 1 == r->max) {
500 1.2 itojun list->next = r->next;
501 1.2 itojun r->next = list;
502 1.2 itojun return;
503 1.2 itojun }
504 1.2 itojun fprintf(stderr, "Error: conflicting map entries\n");
505 1.2 itojun exit(1);
506 1.2 itojun }
507 1.2 itojun
508 1.2 itojun if (list->min >= r->min && list->max <= r->max) {
509 1.2 itojun /*
510 1.2 itojun * Subset case.
511 1.2 itojun */
512 1.2 itojun
513 1.2 itojun if (flag) {
514 1.2 itojun for (i = list->min; i <= list->max; ++i)
515 1.2 itojun r->types[i - r->min] |= flag;
516 1.2 itojun }
517 1.2 itojun free(list);
518 1.2 itojun return;
519 1.2 itojun }
520 1.2 itojun if (list->min <= r->min && list->max >= r->max) {
521 1.2 itojun /*
522 1.2 itojun * Superset case. Make him big enough to hold us.
523 1.2 itojun * We might need to merge with the guy after him.
524 1.2 itojun */
525 1.2 itojun if (flag) {
526 1.2 itojun list->types = xlalloc(list->max - list->min + 1);
527 1.2 itojun
528 1.2 itojun for (i = list->min; i <= list->max; ++i)
529 1.2 itojun list->types[i - list->min] = flag;
530 1.2 itojun
531 1.2 itojun for (i = r->min; i <= r->max; ++i)
532 1.2 itojun list->types[i - list->min] |= r->types[i - r->min];
533 1.2 itojun
534 1.2 itojun free(r->types);
535 1.2 itojun r->types = list->types;
536 1.2 itojun } else {
537 1.2 itojun r->map = list->map;
538 1.2 itojun }
539 1.2 itojun r->min = list->min;
540 1.2 itojun r->max = list->max;
541 1.2 itojun free(list);
542 1.2 itojun } else if (list->min < r->min) {
543 1.2 itojun /*
544 1.2 itojun * Our tail intersects his head.
545 1.2 itojun */
546 1.2 itojun if (flag) {
547 1.2 itojun list->types = xlalloc(r->max - list->min + 1);
548 1.2 itojun
549 1.2 itojun for (i = r->min; i <= r->max; ++i)
550 1.2 itojun list->types[i - list->min] = r->types[i - r->min];
551 1.2 itojun
552 1.2 itojun for (i = list->min; i < r->min; ++i)
553 1.2 itojun list->types[i - list->min] = flag;
554 1.2 itojun
555 1.2 itojun for (i = r->min; i <= list->max; ++i)
556 1.2 itojun list->types[i - list->min] |= flag;
557 1.2 itojun
558 1.2 itojun free(r->types);
559 1.2 itojun r->types = list->types;
560 1.2 itojun } else {
561 1.2 itojun r->map = list->map;
562 1.2 itojun }
563 1.2 itojun r->min = list->min;
564 1.2 itojun free(list);
565 1.2 itojun return;
566 1.2 itojun } else {
567 1.2 itojun /*
568 1.2 itojun * Our head intersects his tail.
569 1.2 itojun * We might need to merge with the guy after him.
570 1.2 itojun */
571 1.2 itojun if (flag) {
572 1.2 itojun r->types = xrelalloc(r->types, list->max - r->min + 1);
573 1.2 itojun
574 1.2 itojun for (i = list->min; i <= r->max; ++i)
575 1.2 itojun r->types[i - r->min] |= flag;
576 1.2 itojun
577 1.2 itojun for (i = r->max+1; i <= list->max; ++i)
578 1.2 itojun r->types[i - r->min] = flag;
579 1.2 itojun }
580 1.2 itojun r->max = list->max;
581 1.2 itojun free(list);
582 1.2 itojun }
583 1.2 itojun
584 1.2 itojun /*
585 1.2 itojun * Okay, check to see if we grew into the next guy(s)
586 1.2 itojun */
587 1.2 itojun while ((lr = r->next) && r->max >= lr->min) {
588 1.2 itojun if (flag) {
589 1.2 itojun if (r->max >= lr->max) {
590 1.2 itojun /*
591 1.2 itojun * Good, we consumed all of him.
592 1.2 itojun */
593 1.2 itojun for (i = lr->min; i <= lr->max; ++i)
594 1.2 itojun r->types[i - r->min] |= lr->types[i - lr->min];
595 1.2 itojun } else {
596 1.2 itojun /*
597 1.2 itojun * "append" him on to the end of us.
598 1.2 itojun */
599 1.2 itojun r->types = xrelalloc(r->types, lr->max - r->min + 1);
600 1.2 itojun
601 1.2 itojun for (i = lr->min; i <= r->max; ++i)
602 1.2 itojun r->types[i - r->min] |= lr->types[i - lr->min];
603 1.2 itojun
604 1.2 itojun for (i = r->max+1; i <= lr->max; ++i)
605 1.2 itojun r->types[i - r->min] = lr->types[i - lr->min];
606 1.2 itojun
607 1.2 itojun r->max = lr->max;
608 1.2 itojun }
609 1.2 itojun } else {
610 1.2 itojun if (lr->max > r->max)
611 1.2 itojun r->max = lr->max;
612 1.2 itojun }
613 1.2 itojun
614 1.2 itojun r->next = lr->next;
615 1.2 itojun
616 1.2 itojun if (flag)
617 1.2 itojun free(lr->types);
618 1.2 itojun free(lr);
619 1.2 itojun }
620 1.2 itojun }
621 1.2 itojun
622 1.2 itojun void
623 1.2 itojun dump_tables()
624 1.2 itojun {
625 1.5 thorpej int x, n;
626 1.2 itojun rune_list *list;
627 1.2 itojun _FileRuneLocale file_new_locale;
628 1.25 tnozaki FILE *fp = ofile;
629 1.2 itojun
630 1.2 itojun memset(&file_new_locale, 0, sizeof(file_new_locale));
631 1.2 itojun
632 1.2 itojun /*
633 1.2 itojun * See if we can compress some of the istype arrays
634 1.2 itojun */
635 1.2 itojun for(list = types.root; list; list = list->next) {
636 1.2 itojun list->map = list->types[0];
637 1.2 itojun for (x = 1; x < list->max - list->min + 1; ++x) {
638 1.2 itojun if (list->types[x] != list->map) {
639 1.2 itojun list->map = 0;
640 1.2 itojun break;
641 1.2 itojun }
642 1.2 itojun }
643 1.2 itojun }
644 1.2 itojun
645 1.9 tshiozak memcpy(&file_new_locale.frl_magic, new_locale.rl_magic,
646 1.9 tshiozak sizeof(file_new_locale.frl_magic));
647 1.9 tshiozak memcpy(&file_new_locale.frl_encoding, new_locale.rl_encoding,
648 1.9 tshiozak sizeof(file_new_locale.frl_encoding));
649 1.2 itojun
650 1.9 tshiozak file_new_locale.frl_invalid_rune = htonl(new_locale.rl_invalid_rune);
651 1.2 itojun
652 1.2 itojun /*
653 1.2 itojun * Fill in our tables. Do this in network order so that
654 1.2 itojun * diverse machines have a chance of sharing data.
655 1.2 itojun * (Machines like Crays cannot share with little machines due to
656 1.2 itojun * word size. Sigh. We tried.)
657 1.2 itojun */
658 1.17 tshiozak for (x = 0; x < _NB_CACHED_RUNES; ++x) {
659 1.9 tshiozak file_new_locale.frl_runetype[x] = htonl(types.map[x]);
660 1.9 tshiozak file_new_locale.frl_maplower[x] = htonl(maplower.map[x]);
661 1.9 tshiozak file_new_locale.frl_mapupper[x] = htonl(mapupper.map[x]);
662 1.2 itojun }
663 1.2 itojun
664 1.2 itojun /*
665 1.2 itojun * Count up how many ranges we will need for each of the extents.
666 1.2 itojun */
667 1.2 itojun list = types.root;
668 1.2 itojun
669 1.2 itojun while (list) {
670 1.9 tshiozak new_locale.rl_runetype_ext.rr_nranges++;
671 1.2 itojun list = list->next;
672 1.2 itojun }
673 1.9 tshiozak file_new_locale.frl_runetype_ext.frr_nranges =
674 1.9 tshiozak htonl(new_locale.rl_runetype_ext.rr_nranges);
675 1.2 itojun
676 1.2 itojun list = maplower.root;
677 1.2 itojun
678 1.2 itojun while (list) {
679 1.9 tshiozak new_locale.rl_maplower_ext.rr_nranges++;
680 1.2 itojun list = list->next;
681 1.2 itojun }
682 1.9 tshiozak file_new_locale.frl_maplower_ext.frr_nranges =
683 1.9 tshiozak htonl(new_locale.rl_maplower_ext.rr_nranges);
684 1.2 itojun
685 1.2 itojun list = mapupper.root;
686 1.2 itojun
687 1.2 itojun while (list) {
688 1.9 tshiozak new_locale.rl_mapupper_ext.rr_nranges++;
689 1.2 itojun list = list->next;
690 1.2 itojun }
691 1.9 tshiozak file_new_locale.frl_mapupper_ext.frr_nranges =
692 1.9 tshiozak htonl(new_locale.rl_mapupper_ext.rr_nranges);
693 1.2 itojun
694 1.9 tshiozak file_new_locale.frl_variable_len = htonl(new_locale.rl_variable_len);
695 1.2 itojun
696 1.2 itojun /*
697 1.2 itojun * Okay, we are now ready to write the new locale file.
698 1.2 itojun */
699 1.2 itojun
700 1.2 itojun /*
701 1.2 itojun * PART 1: The _RuneLocale structure
702 1.2 itojun */
703 1.5 thorpej if (fwrite((char *)&file_new_locale, sizeof(file_new_locale), 1, fp) != 1)
704 1.5 thorpej err(1, "writing _RuneLocale to %s", locale_file);
705 1.2 itojun /*
706 1.2 itojun * PART 2: The runetype_ext structures (not the actual tables)
707 1.2 itojun */
708 1.5 thorpej for (list = types.root, n = 0; list != NULL; list = list->next, n++) {
709 1.2 itojun _FileRuneEntry re;
710 1.2 itojun
711 1.20 tshiozak memset(&re, 0, sizeof(re));
712 1.9 tshiozak re.fre_min = htonl(list->min);
713 1.9 tshiozak re.fre_max = htonl(list->max);
714 1.9 tshiozak re.fre_map = htonl(list->map);
715 1.2 itojun
716 1.5 thorpej if (fwrite((char *)&re, sizeof(re), 1, fp) != 1)
717 1.5 thorpej err(1, "writing runetype_ext #%d to %s", n, locale_file);
718 1.2 itojun }
719 1.2 itojun /*
720 1.2 itojun * PART 3: The maplower_ext structures
721 1.2 itojun */
722 1.5 thorpej for (list = maplower.root, n = 0; list != NULL; list = list->next, n++) {
723 1.2 itojun _FileRuneEntry re;
724 1.2 itojun
725 1.20 tshiozak memset(&re, 0, sizeof(re));
726 1.9 tshiozak re.fre_min = htonl(list->min);
727 1.9 tshiozak re.fre_max = htonl(list->max);
728 1.9 tshiozak re.fre_map = htonl(list->map);
729 1.2 itojun
730 1.5 thorpej if (fwrite((char *)&re, sizeof(re), 1, fp) != 1)
731 1.5 thorpej err(1, "writing maplower_ext #%d to %s", n, locale_file);
732 1.2 itojun }
733 1.2 itojun /*
734 1.2 itojun * PART 4: The mapupper_ext structures
735 1.2 itojun */
736 1.5 thorpej for (list = mapupper.root, n = 0; list != NULL; list = list->next, n++) {
737 1.2 itojun _FileRuneEntry re;
738 1.2 itojun
739 1.20 tshiozak memset(&re, 0, sizeof(re));
740 1.9 tshiozak re.fre_min = htonl(list->min);
741 1.9 tshiozak re.fre_max = htonl(list->max);
742 1.9 tshiozak re.fre_map = htonl(list->map);
743 1.2 itojun
744 1.5 thorpej if (fwrite((char *)&re, sizeof(re), 1, fp) != 1)
745 1.5 thorpej err(1, "writing mapupper_ext #%d to %s", n, locale_file);
746 1.2 itojun }
747 1.2 itojun /*
748 1.2 itojun * PART 5: The runetype_ext tables
749 1.2 itojun */
750 1.5 thorpej for (list = types.root, n = 0; list != NULL; list = list->next, n++) {
751 1.2 itojun for (x = 0; x < list->max - list->min + 1; ++x)
752 1.2 itojun list->types[x] = htonl(list->types[x]);
753 1.2 itojun
754 1.2 itojun if (!list->map) {
755 1.2 itojun if (fwrite((char *)list->types,
756 1.2 itojun (list->max - list->min + 1) * sizeof(u_int32_t),
757 1.5 thorpej 1, fp) != 1)
758 1.5 thorpej err(1, "writing runetype_ext table #%d to %s", n, locale_file);
759 1.2 itojun }
760 1.2 itojun }
761 1.2 itojun /*
762 1.2 itojun * PART 5: And finally the variable data
763 1.2 itojun */
764 1.9 tshiozak if (new_locale.rl_variable_len != 0 &&
765 1.9 tshiozak fwrite((char *)new_locale.rl_variable,
766 1.9 tshiozak new_locale.rl_variable_len, 1, fp) != 1)
767 1.5 thorpej err(1, "writing variable data to %s", locale_file);
768 1.2 itojun fclose(fp);
769 1.2 itojun
770 1.2 itojun if (!debug)
771 1.2 itojun return;
772 1.2 itojun
773 1.9 tshiozak if (new_locale.rl_encoding[0])
774 1.9 tshiozak fprintf(stderr, "ENCODING %s\n", new_locale.rl_encoding);
775 1.9 tshiozak if (new_locale.rl_variable)
776 1.2 itojun fprintf(stderr, "VARIABLE %s\n",
777 1.9 tshiozak (char *)new_locale.rl_variable);
778 1.2 itojun
779 1.2 itojun fprintf(stderr, "\nMAPLOWER:\n\n");
780 1.2 itojun
781 1.17 tshiozak for (x = 0; x < _NB_CACHED_RUNES; ++x) {
782 1.2 itojun if (isprint(maplower.map[x]))
783 1.2 itojun fprintf(stderr, " '%c'", (int)maplower.map[x]);
784 1.2 itojun else if (maplower.map[x])
785 1.2 itojun fprintf(stderr, "%04x", maplower.map[x]);
786 1.2 itojun else
787 1.2 itojun fprintf(stderr, "%4x", 0);
788 1.2 itojun if ((x & 0xf) == 0xf)
789 1.2 itojun fprintf(stderr, "\n");
790 1.2 itojun else
791 1.2 itojun fprintf(stderr, " ");
792 1.2 itojun }
793 1.2 itojun fprintf(stderr, "\n");
794 1.2 itojun
795 1.2 itojun for (list = maplower.root; list; list = list->next)
796 1.2 itojun fprintf(stderr, "\t%04x - %04x : %04x\n", list->min, list->max, list->map);
797 1.2 itojun
798 1.2 itojun fprintf(stderr, "\nMAPUPPER:\n\n");
799 1.2 itojun
800 1.17 tshiozak for (x = 0; x < _NB_CACHED_RUNES; ++x) {
801 1.2 itojun if (isprint(mapupper.map[x]))
802 1.2 itojun fprintf(stderr, " '%c'", (int)mapupper.map[x]);
803 1.2 itojun else if (mapupper.map[x])
804 1.2 itojun fprintf(stderr, "%04x", mapupper.map[x]);
805 1.2 itojun else
806 1.2 itojun fprintf(stderr, "%4x", 0);
807 1.2 itojun if ((x & 0xf) == 0xf)
808 1.2 itojun fprintf(stderr, "\n");
809 1.2 itojun else
810 1.2 itojun fprintf(stderr, " ");
811 1.2 itojun }
812 1.2 itojun fprintf(stderr, "\n");
813 1.2 itojun
814 1.2 itojun for (list = mapupper.root; list; list = list->next)
815 1.2 itojun fprintf(stderr, "\t%04x - %04x : %04x\n", list->min, list->max, list->map);
816 1.2 itojun
817 1.2 itojun
818 1.2 itojun fprintf(stderr, "\nTYPES:\n\n");
819 1.2 itojun
820 1.17 tshiozak for (x = 0; x < _NB_CACHED_RUNES; ++x) {
821 1.2 itojun u_int32_t r = types.map[x];
822 1.2 itojun
823 1.2 itojun if (r) {
824 1.2 itojun if (isprint(x))
825 1.2 itojun fprintf(stderr, " '%c':%2d", x, (int)(r & 0xff));
826 1.2 itojun else
827 1.2 itojun fprintf(stderr, "%04x:%2d", x, (int)(r & 0xff));
828 1.2 itojun
829 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_A) ? "alph" : "");
830 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_C) ? "ctrl" : "");
831 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_D) ? "dig" : "");
832 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_G) ? "graf" : "");
833 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_L) ? "low" : "");
834 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_P) ? "punc" : "");
835 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_S) ? "spac" : "");
836 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_U) ? "upp" : "");
837 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_X) ? "xdig" : "");
838 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_B) ? "blnk" : "");
839 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_R) ? "prnt" : "");
840 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_I) ? "ideo" : "");
841 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_T) ? "spec" : "");
842 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_Q) ? "phon" : "");
843 1.2 itojun fprintf(stderr, "\n");
844 1.2 itojun }
845 1.2 itojun }
846 1.2 itojun
847 1.2 itojun for (list = types.root; list; list = list->next) {
848 1.2 itojun if (list->map && list->min + 3 < list->max) {
849 1.2 itojun u_int32_t r = list->map;
850 1.2 itojun
851 1.2 itojun fprintf(stderr, "%04x:%2d", list->min, r & 0xff);
852 1.2 itojun
853 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_A) ? "alph" : "");
854 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_C) ? "ctrl" : "");
855 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_D) ? "dig" : "");
856 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_G) ? "graf" : "");
857 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_L) ? "low" : "");
858 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_P) ? "punc" : "");
859 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_S) ? "spac" : "");
860 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_U) ? "upp" : "");
861 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_X) ? "xdig" : "");
862 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_B) ? "blnk" : "");
863 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_R) ? "prnt" : "");
864 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_I) ? "ideo" : "");
865 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_T) ? "spec" : "");
866 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_Q) ? "phon" : "");
867 1.2 itojun fprintf(stderr, "\n...\n");
868 1.2 itojun
869 1.2 itojun fprintf(stderr, "%04x:%2d", list->max, r & 0xff);
870 1.2 itojun
871 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_A) ? "alph" : "");
872 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_C) ? "ctrl" : "");
873 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_D) ? "dig" : "");
874 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_G) ? "graf" : "");
875 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_L) ? "low" : "");
876 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_P) ? "punc" : "");
877 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_S) ? "spac" : "");
878 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_U) ? "upp" : "");
879 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_X) ? "xdig" : "");
880 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_B) ? "blnk" : "");
881 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_R) ? "prnt" : "");
882 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_I) ? "ideo" : "");
883 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_T) ? "spec" : "");
884 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_Q) ? "phon" : "");
885 1.16 tshiozak fprintf(stderr, " %1u", (unsigned)((r & _RUNETYPE_SWM)>>_RUNETYPE_SWS));
886 1.2 itojun fprintf(stderr, "\n");
887 1.2 itojun } else
888 1.2 itojun for (x = list->min; x <= list->max; ++x) {
889 1.2 itojun u_int32_t r = ntohl(list->types[x - list->min]);
890 1.2 itojun
891 1.2 itojun if (r) {
892 1.2 itojun fprintf(stderr, "%04x:%2d", x, (int)(r & 0xff));
893 1.2 itojun
894 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_A) ? "alph" : "");
895 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_C) ? "ctrl" : "");
896 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_D) ? "dig" : "");
897 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_G) ? "graf" : "");
898 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_L) ? "low" : "");
899 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_P) ? "punc" : "");
900 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_S) ? "spac" : "");
901 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_U) ? "upp" : "");
902 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_X) ? "xdig" : "");
903 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_B) ? "blnk" : "");
904 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_R) ? "prnt" : "");
905 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_I) ? "ideo" : "");
906 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_T) ? "spec" : "");
907 1.16 tshiozak fprintf(stderr, " %4s", (r & _RUNETYPE_Q) ? "phon" : "");
908 1.16 tshiozak fprintf(stderr, " %1u", (unsigned)((r & _RUNETYPE_SWM)>>_RUNETYPE_SWS));
909 1.2 itojun fprintf(stderr, "\n");
910 1.2 itojun }
911 1.2 itojun }
912 1.2 itojun }
913 1.2 itojun }
914