gettext.c revision 1.28 1 /* $NetBSD: gettext.c,v 1.28 2012/07/30 23:04:42 yamt Exp $ */
2
3 /*-
4 * Copyright (c) 2000, 2001 Citrus Project,
5 * All rights reserved.
6 *
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions
9 * are met:
10 * 1. Redistributions of source code must retain the above copyright
11 * notice, this list of conditions and the following disclaimer.
12 * 2. Redistributions in binary form must reproduce the above copyright
13 * notice, this list of conditions and the following disclaimer in the
14 * documentation and/or other materials provided with the distribution.
15 *
16 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
17 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
20 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
21 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
22 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
23 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
24 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
25 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26 * SUCH DAMAGE.
27 *
28 * $Citrus: xpg4dl/FreeBSD/lib/libintl/gettext.c,v 1.31 2001/09/27 15:18:45 yamt Exp $
29 */
30
31 #include <sys/cdefs.h>
32 __RCSID("$NetBSD: gettext.c,v 1.28 2012/07/30 23:04:42 yamt Exp $");
33
34 #include <sys/param.h>
35 #include <sys/stat.h>
36 #include <sys/mman.h>
37 #include <sys/uio.h>
38
39 #include <assert.h>
40 #include <fcntl.h>
41 #include <stdio.h>
42 #include <stdlib.h>
43 #include <unistd.h>
44 #include <string.h>
45 #if 0
46 #include <util.h>
47 #endif
48 #include <libintl.h>
49 #include <locale.h>
50 #include "libintl_local.h"
51 #include "plural_parser.h"
52 #include "pathnames.h"
53
54 static const char *lookup_category(int);
55 static const char *split_locale(const char *);
56 static const char *lookup_mofile(char *, size_t, const char *, const char *,
57 const char *, const char *,
58 struct domainbinding *);
59 static uint32_t flip(uint32_t, uint32_t);
60 static int validate(void *, struct mohandle *);
61 static int mapit(const char *, struct domainbinding *);
62 static int unmapit(struct domainbinding *);
63 static const char *lookup_hash(const char *, struct domainbinding *, size_t *);
64 static const char *lookup_bsearch(const char *, struct domainbinding *,
65 size_t *);
66 static const char *lookup(const char *, struct domainbinding *, size_t *);
67 static const char *get_lang_env(const char *);
68
69 /*
70 * shortcut functions. the main implementation resides in dcngettext().
71 */
72 char *
73 gettext(const char *msgid)
74 {
75
76 return dcngettext(NULL, msgid, NULL, 1UL, LC_MESSAGES);
77 }
78
79 char *
80 dgettext(const char *domainname, const char *msgid)
81 {
82
83 return dcngettext(domainname, msgid, NULL, 1UL, LC_MESSAGES);
84 }
85
86 char *
87 dcgettext(const char *domainname, const char *msgid, int category)
88 {
89
90 return dcngettext(domainname, msgid, NULL, 1UL, category);
91 }
92
93 char *
94 ngettext(const char *msgid1, const char *msgid2, unsigned long int n)
95 {
96
97 return dcngettext(NULL, msgid1, msgid2, n, LC_MESSAGES);
98 }
99
100 char *
101 dngettext(const char *domainname, const char *msgid1, const char *msgid2,
102 unsigned long int n)
103 {
104
105 return dcngettext(domainname, msgid1, msgid2, n, LC_MESSAGES);
106 }
107
108 /*
109 * dcngettext() -
110 * lookup internationalized message on database locale/category/domainname
111 * (like ja_JP.eucJP/LC_MESSAGES/domainname).
112 * if n equals to 1, internationalized message will be looked up for msgid1.
113 * otherwise, message will be looked up for msgid2.
114 * if the lookup fails, the function will return msgid1 or msgid2 as is.
115 *
116 * Even though the return type is "char *", caller should not rewrite the
117 * region pointed to by the return value (should be "const char *", but can't
118 * change it for compatibility with other implementations).
119 *
120 * by default (if domainname == NULL), domainname is taken from the value set
121 * by textdomain(). usually name of the application (like "ls") is used as
122 * domainname. category is usually LC_MESSAGES.
123 *
124 * the code reads in *.mo files generated by GNU gettext. *.mo is a host-
125 * endian encoded file. both endians are supported here, as the files are in
126 * /usr/share/locale! (or we should move those files into /usr/libdata)
127 */
128
129 static const char *
130 lookup_category(int category)
131 {
132
133 switch (category) {
134 case LC_COLLATE: return "LC_COLLATE";
135 case LC_CTYPE: return "LC_CTYPE";
136 case LC_MONETARY: return "LC_MONETARY";
137 case LC_NUMERIC: return "LC_NUMERIC";
138 case LC_TIME: return "LC_TIME";
139 case LC_MESSAGES: return "LC_MESSAGES";
140 }
141 return NULL;
142 }
143
144 /*
145 * XPG syntax: language[_territory[.codeset]][@modifier]
146 * XXX boundary check on "result" is lacking
147 */
148 static const char *
149 split_locale(const char *lname)
150 {
151 char buf[BUFSIZ], tmp[BUFSIZ];
152 char *l, *t, *c, *m;
153 static char result[BUFSIZ];
154
155 memset(result, 0, sizeof(result));
156
157 if (strlen(lname) + 1 > sizeof(buf)) {
158 fail:
159 return lname;
160 }
161
162 strlcpy(buf, lname, sizeof(buf));
163 m = strrchr(buf, '@');
164 if (m)
165 *m++ = '\0';
166 c = strrchr(buf, '.');
167 if (c)
168 *c++ = '\0';
169 t = strrchr(buf, '_');
170 if (t)
171 *t++ = '\0';
172 l = buf;
173 if (strlen(l) == 0)
174 goto fail;
175 if (c && !t)
176 goto fail;
177
178 if (m) {
179 if (t) {
180 if (c) {
181 snprintf(tmp, sizeof(tmp), "%s_%s.%s@%s",
182 l, t, c, m);
183 strlcat(result, tmp, sizeof(result));
184 strlcat(result, ":", sizeof(result));
185 }
186 snprintf(tmp, sizeof(tmp), "%s_%s@%s", l, t, m);
187 strlcat(result, tmp, sizeof(result));
188 strlcat(result, ":", sizeof(result));
189 }
190 snprintf(tmp, sizeof(tmp), "%s@%s", l, m);
191 strlcat(result, tmp, sizeof(result));
192 strlcat(result, ":", sizeof(result));
193 }
194 if (t) {
195 if (c) {
196 snprintf(tmp, sizeof(tmp), "%s_%s.%s", l, t, c);
197 strlcat(result, tmp, sizeof(result));
198 strlcat(result, ":", sizeof(result));
199 }
200 snprintf(tmp, sizeof(tmp), "%s_%s", l, t);
201 strlcat(result, tmp, sizeof(result));
202 strlcat(result, ":", sizeof(result));
203 }
204 strlcat(result, l, sizeof(result));
205
206 return result;
207 }
208
209 static const char *
210 lookup_mofile(char *buf, size_t len, const char *dir, const char *lpath,
211 const char *category, const char *domainname,
212 struct domainbinding *db)
213 {
214 struct stat st;
215 char *p, *q;
216 char lpath_tmp[BUFSIZ];
217
218 /*
219 * LANGUAGE is a colon separated list of locale names.
220 */
221
222 strlcpy(lpath_tmp, lpath, sizeof(lpath_tmp));
223 q = lpath_tmp;
224 /* CONSTCOND */
225 while (1) {
226 p = strsep(&q, ":");
227 if (!p)
228 break;
229 if (!*p)
230 continue;
231
232 /* don't mess with default locales */
233 if (strcmp(p, "C") == 0 || strcmp(p, "POSIX") == 0)
234 return NULL;
235
236 /* validate pathname */
237 if (strchr(p, '/') || strchr(category, '/'))
238 continue;
239 #if 1 /*?*/
240 if (strchr(domainname, '/'))
241 continue;
242 #endif
243
244 snprintf(buf, len, "%s/%s/%s/%s.mo", dir, p,
245 category, domainname);
246 if (stat(buf, &st) < 0)
247 continue;
248 if ((st.st_mode & S_IFMT) != S_IFREG)
249 continue;
250
251 if (mapit(buf, db) == 0)
252 return buf;
253 }
254
255 return NULL;
256 }
257
258 static uint32_t
259 flip(uint32_t v, uint32_t magic)
260 {
261
262 if (magic == MO_MAGIC)
263 return v;
264 else if (magic == MO_MAGIC_SWAPPED) {
265 v = ((v >> 24) & 0xff) | ((v >> 8) & 0xff00) |
266 ((v << 8) & 0xff0000) | ((v << 24) & 0xff000000);
267 return v;
268 } else {
269 abort();
270 /*NOTREACHED*/
271 }
272 }
273
274 static int
275 validate(void *arg, struct mohandle *mohandle)
276 {
277 char *p;
278
279 p = (char *)arg;
280 if (p < (char *)mohandle->addr ||
281 p > (char *)mohandle->addr + mohandle->len)
282 return 0;
283 else
284 return 1;
285 }
286
287 /*
288 * calculate the step value if the hash value is conflicted.
289 */
290 static __inline uint32_t
291 calc_collision_step(uint32_t hashval, uint32_t hashsize)
292 {
293 _DIAGASSERT(hashsize>2);
294 return (hashval % (hashsize - 2)) + 1;
295 }
296
297 /*
298 * calculate the next index while conflicting.
299 */
300 static __inline uint32_t
301 calc_next_index(uint32_t curidx, uint32_t hashsize, uint32_t step)
302 {
303 return curidx+step - (curidx >= hashsize-step ? hashsize : 0);
304 }
305
306 static int
307 get_sysdep_string_table(struct mosysdepstr_h **table_h, uint32_t *ofstable,
308 uint32_t nstrings, uint32_t magic, char *base)
309 {
310 unsigned int i;
311 int j, count;
312 size_t l;
313 struct mosysdepstr *table;
314
315 for (i=0; i<nstrings; i++) {
316 /* get mosysdepstr record */
317 /* LINTED: ignore the alignment problem. */
318 table = (struct mosysdepstr *)(base + flip(ofstable[i], magic));
319 /* count number of segments */
320 count = 0;
321 while (flip(table->segs[count++].ref, magic) != MO_LASTSEG)
322 ;
323 /* get table */
324 l = sizeof(struct mosysdepstr_h) +
325 sizeof(struct mosysdepsegentry_h) * (count-1);
326 table_h[i] = (struct mosysdepstr_h *)malloc(l);
327 if (!table_h[i])
328 return -1;
329 memset(table_h[i], 0, l);
330 table_h[i]->off = (const char *)(base + flip(table->off, magic));
331 for (j=0; j<count; j++) {
332 table_h[i]->segs[j].len =
333 flip(table->segs[j].len, magic);
334 table_h[i]->segs[j].ref =
335 flip(table->segs[j].ref, magic);
336 }
337 /* LINTED: ignore the alignment problem. */
338 table = (struct mosysdepstr *)&table->segs[count];
339 }
340 return 0;
341 }
342
343 static int
344 expand_sysdep(struct mohandle *mohandle, struct mosysdepstr_h *str)
345 {
346 int i;
347 const char *src;
348 char *dst;
349
350 /* check whether already expanded */
351 if (str->expanded)
352 return 0;
353
354 /* calc total length */
355 str->expanded_len = 1;
356 for (i=0; /*CONSTCOND*/1; i++) {
357 str->expanded_len += str->segs[i].len;
358 if (str->segs[i].ref == MO_LASTSEG)
359 break;
360 str->expanded_len +=
361 mohandle->mo.mo_sysdep_segs[str->segs[i].ref].len;
362 }
363 /* expand */
364 str->expanded = malloc(str->expanded_len);
365 if (!str->expanded)
366 return -1;
367 src = str->off;
368 dst = str->expanded;
369 for (i=0; /*CONSTCOND*/1; i++) {
370 memcpy(dst, src, str->segs[i].len);
371 src += str->segs[i].len;
372 dst += str->segs[i].len;
373 if (str->segs[i].ref == MO_LASTSEG)
374 break;
375 memcpy(dst, mohandle->mo.mo_sysdep_segs[str->segs[i].ref].str,
376 mohandle->mo.mo_sysdep_segs[str->segs[i].ref].len);
377 dst += mohandle->mo.mo_sysdep_segs[str->segs[i].ref].len;
378 }
379 *dst = '\0';
380
381 return 0;
382 }
383
384 static void
385 insert_to_hash(uint32_t *htable, uint32_t hsize, const char *str, uint32_t ref)
386 {
387 uint32_t hashval, idx, step;
388
389 hashval = __intl_string_hash(str);
390 step = calc_collision_step(hashval, hsize);
391 idx = hashval % hsize;
392
393 while (htable[idx])
394 idx = calc_next_index(idx, hsize, step);
395
396 htable[idx] = ref;
397 }
398
399 static int
400 setup_sysdep_stuffs(struct mo *mo, struct mohandle *mohandle, char *base)
401 {
402 uint32_t magic;
403 struct moentry *stable;
404 size_t l;
405 unsigned int i;
406 char *v;
407 uint32_t *ofstable;
408
409 magic = mo->mo_magic;
410
411 mohandle->mo.mo_sysdep_nsegs = flip(mo->mo_sysdep_nsegs, magic);
412 mohandle->mo.mo_sysdep_nstring = flip(mo->mo_sysdep_nstring, magic);
413
414 if (mohandle->mo.mo_sysdep_nstring == 0)
415 return 0;
416
417 /* check hash size */
418 if (mohandle->mo.mo_hsize <= 2 ||
419 mohandle->mo.mo_hsize <
420 (mohandle->mo.mo_nstring + mohandle->mo.mo_sysdep_nstring))
421 return -1;
422
423 /* get sysdep segments */
424 l = sizeof(struct mosysdepsegs_h) * mohandle->mo.mo_sysdep_nsegs;
425 mohandle->mo.mo_sysdep_segs = (struct mosysdepsegs_h *)malloc(l);
426 if (!mohandle->mo.mo_sysdep_segs)
427 return -1;
428 /* LINTED: ignore the alignment problem. */
429 stable = (struct moentry *)(base + flip(mo->mo_sysdep_segoff, magic));
430 for (i=0; i<mohandle->mo.mo_sysdep_nsegs; i++) {
431 v = base + flip(stable[i].off, magic);
432 mohandle->mo.mo_sysdep_segs[i].str =
433 __intl_sysdep_get_string_by_tag(
434 v,
435 &mohandle->mo.mo_sysdep_segs[i].len);
436 }
437
438 /* get sysdep string table */
439 mohandle->mo.mo_sysdep_otable =
440 (struct mosysdepstr_h **)calloc(mohandle->mo.mo_sysdep_nstring,
441 sizeof(struct mosysdepstr_h *));
442 if (!mohandle->mo.mo_sysdep_otable)
443 return -1;
444 /* LINTED: ignore the alignment problem. */
445 ofstable = (uint32_t *)(base + flip(mo->mo_sysdep_otable, magic));
446 if (get_sysdep_string_table(mohandle->mo.mo_sysdep_otable, ofstable,
447 mohandle->mo.mo_sysdep_nstring, magic,
448 base))
449 return -1;
450 mohandle->mo.mo_sysdep_ttable =
451 (struct mosysdepstr_h **)calloc(mohandle->mo.mo_sysdep_nstring,
452 sizeof(struct mosysdepstr_h *));
453 if (!mohandle->mo.mo_sysdep_ttable)
454 return -1;
455 /* LINTED: ignore the alignment problem. */
456 ofstable = (uint32_t *)(base + flip(mo->mo_sysdep_ttable, magic));
457 if (get_sysdep_string_table(mohandle->mo.mo_sysdep_ttable, ofstable,
458 mohandle->mo.mo_sysdep_nstring, magic,
459 base))
460 return -1;
461
462 /* update hash */
463 for (i=0; i<mohandle->mo.mo_sysdep_nstring; i++) {
464 if (expand_sysdep(mohandle, mohandle->mo.mo_sysdep_otable[i]))
465 return -1;
466 insert_to_hash(mohandle->mo.mo_htable,
467 mohandle->mo.mo_hsize,
468 mohandle->mo.mo_sysdep_otable[i]->expanded,
469 (i+1) | MO_HASH_SYSDEP_MASK);
470 }
471
472 return 0;
473 }
474
475 int
476 mapit(const char *path, struct domainbinding *db)
477 {
478 int fd;
479 struct stat st;
480 char *base;
481 uint32_t magic, revision, flags = 0;
482 struct moentry *otable, *ttable;
483 const uint32_t *htable;
484 struct moentry_h *p;
485 struct mo *mo;
486 size_t l, headerlen;
487 unsigned int i;
488 char *v;
489 struct mohandle *mohandle = &db->mohandle;
490
491 if (mohandle->addr && mohandle->addr != MAP_FAILED &&
492 mohandle->mo.mo_magic)
493 return 0; /*already opened*/
494
495 unmapit(db);
496
497 #if 0
498 if (secure_path(path) != 0)
499 goto fail;
500 #endif
501 if (stat(path, &st) < 0)
502 goto fail;
503 if ((st.st_mode & S_IFMT) != S_IFREG || st.st_size > GETTEXT_MMAP_MAX)
504 goto fail;
505 fd = open(path, O_RDONLY);
506 if (fd < 0)
507 goto fail;
508 if (read(fd, &magic, sizeof(magic)) != sizeof(magic) ||
509 (magic != MO_MAGIC && magic != MO_MAGIC_SWAPPED)) {
510 close(fd);
511 goto fail;
512 }
513 if (read(fd, &revision, sizeof(revision)) != sizeof(revision)) {
514 close(fd);
515 goto fail;
516 }
517 switch (flip(revision, magic)) {
518 case MO_MAKE_REV(0, 0):
519 break;
520 case MO_MAKE_REV(0, 1):
521 case MO_MAKE_REV(1, 1):
522 flags |= MO_F_SYSDEP;
523 break;
524 default:
525 close(fd);
526 goto fail;
527 }
528 mohandle->addr = mmap(NULL, (size_t)st.st_size, PROT_READ,
529 MAP_FILE | MAP_SHARED, fd, (off_t)0);
530 if (!mohandle->addr || mohandle->addr == MAP_FAILED) {
531 close(fd);
532 goto fail;
533 }
534 close(fd);
535 mohandle->len = (size_t)st.st_size;
536
537 base = mohandle->addr;
538 mo = (struct mo *)mohandle->addr;
539
540 /* flip endian. do not flip magic number! */
541 mohandle->mo.mo_magic = mo->mo_magic;
542 mohandle->mo.mo_revision = flip(mo->mo_revision, magic);
543 mohandle->mo.mo_nstring = flip(mo->mo_nstring, magic);
544 mohandle->mo.mo_hsize = flip(mo->mo_hsize, magic);
545 mohandle->mo.mo_flags = flags;
546
547 /* validate otable/ttable */
548 /* LINTED: ignore the alignment problem. */
549 otable = (struct moentry *)(base + flip(mo->mo_otable, magic));
550 /* LINTED: ignore the alignment problem. */
551 ttable = (struct moentry *)(base + flip(mo->mo_ttable, magic));
552 if (!validate(otable, mohandle) ||
553 !validate(&otable[mohandle->mo.mo_nstring], mohandle)) {
554 unmapit(db);
555 goto fail;
556 }
557 if (!validate(ttable, mohandle) ||
558 !validate(&ttable[mohandle->mo.mo_nstring], mohandle)) {
559 unmapit(db);
560 goto fail;
561 }
562
563 /* allocate [ot]table, and convert to normal pointer representation. */
564 l = sizeof(struct moentry_h) * mohandle->mo.mo_nstring;
565 mohandle->mo.mo_otable = (struct moentry_h *)malloc(l);
566 if (!mohandle->mo.mo_otable) {
567 unmapit(db);
568 goto fail;
569 }
570 mohandle->mo.mo_ttable = (struct moentry_h *)malloc(l);
571 if (!mohandle->mo.mo_ttable) {
572 unmapit(db);
573 goto fail;
574 }
575 p = mohandle->mo.mo_otable;
576 for (i = 0; i < mohandle->mo.mo_nstring; i++) {
577 p[i].len = flip(otable[i].len, magic);
578 p[i].off = base + flip(otable[i].off, magic);
579
580 if (!validate(p[i].off, mohandle) ||
581 !validate(p[i].off + p[i].len + 1, mohandle)) {
582 unmapit(db);
583 goto fail;
584 }
585 }
586 p = mohandle->mo.mo_ttable;
587 for (i = 0; i < mohandle->mo.mo_nstring; i++) {
588 p[i].len = flip(ttable[i].len, magic);
589 p[i].off = base + flip(ttable[i].off, magic);
590
591 if (!validate(p[i].off, mohandle) ||
592 !validate(p[i].off + p[i].len + 1, mohandle)) {
593 unmapit(db);
594 goto fail;
595 }
596 }
597 /* allocate htable, and convert it to the host order. */
598 if (mohandle->mo.mo_hsize > 2) {
599 l = sizeof(uint32_t) * mohandle->mo.mo_hsize;
600 mohandle->mo.mo_htable = (uint32_t *)malloc(l);
601 if (!mohandle->mo.mo_htable) {
602 unmapit(db);
603 goto fail;
604 }
605 /* LINTED: ignore the alignment problem. */
606 htable = (const uint32_t *)(base+flip(mo->mo_hoffset, magic));
607 for (i=0; i < mohandle->mo.mo_hsize; i++) {
608 mohandle->mo.mo_htable[i] = flip(htable[i], magic);
609 if (mohandle->mo.mo_htable[i] >=
610 mohandle->mo.mo_nstring+1) {
611 /* illegal string number. */
612 unmapit(db);
613 goto fail;
614 }
615 }
616 }
617 /* grab MIME-header and charset field */
618 mohandle->mo.mo_header = lookup("", db, &headerlen);
619 if (mohandle->mo.mo_header)
620 v = strstr(mohandle->mo.mo_header, "charset=");
621 else
622 v = NULL;
623 if (v) {
624 mohandle->mo.mo_charset = strdup(v + 8);
625 if (!mohandle->mo.mo_charset)
626 goto fail;
627 v = strchr(mohandle->mo.mo_charset, '\n');
628 if (v)
629 *v = '\0';
630 }
631 if (!mohandle->mo.mo_header ||
632 _gettext_parse_plural(&mohandle->mo.mo_plural,
633 &mohandle->mo.mo_nplurals,
634 mohandle->mo.mo_header, headerlen))
635 mohandle->mo.mo_plural = NULL;
636
637 /*
638 * XXX check charset, reject it if we are unable to support the charset
639 * with the current locale.
640 * for example, if we are using euc-jp locale and we are looking at
641 * *.mo file encoded by euc-kr (charset=euc-kr), we should reject
642 * the *.mo file as we cannot support it.
643 */
644
645 /* system dependent string support */
646 if ((mohandle->mo.mo_flags & MO_F_SYSDEP) != 0) {
647 if (setup_sysdep_stuffs(mo, mohandle, base)) {
648 unmapit(db);
649 goto fail;
650 }
651 }
652
653 return 0;
654
655 fail:
656 return -1;
657 }
658
659 static void
660 free_sysdep_table(struct mosysdepstr_h **table, uint32_t nstring)
661 {
662 uint32_t i;
663
664 for (i=0; i<nstring; i++) {
665 if (table[i]) {
666 if (table[i]->expanded)
667 free(table[i]->expanded);
668 free(table[i]);
669 }
670 }
671 free(table);
672 }
673
674 static int
675 unmapit(struct domainbinding *db)
676 {
677 struct mohandle *mohandle = &db->mohandle;
678
679 /* unmap if there's already mapped region */
680 if (mohandle->addr && mohandle->addr != MAP_FAILED)
681 munmap(mohandle->addr, mohandle->len);
682 mohandle->addr = NULL;
683 if (mohandle->mo.mo_otable)
684 free(mohandle->mo.mo_otable);
685 if (mohandle->mo.mo_ttable)
686 free(mohandle->mo.mo_ttable);
687 if (mohandle->mo.mo_charset)
688 free(mohandle->mo.mo_charset);
689 if (mohandle->mo.mo_htable)
690 free(mohandle->mo.mo_htable);
691 if (mohandle->mo.mo_sysdep_segs)
692 free(mohandle->mo.mo_sysdep_segs);
693 if (mohandle->mo.mo_sysdep_otable) {
694 free_sysdep_table(mohandle->mo.mo_sysdep_otable,
695 mohandle->mo.mo_sysdep_nstring);
696 }
697 if (mohandle->mo.mo_sysdep_ttable) {
698 free_sysdep_table(mohandle->mo.mo_sysdep_ttable,
699 mohandle->mo.mo_sysdep_nstring);
700 }
701 if (mohandle->mo.mo_plural)
702 _gettext_free_plural(mohandle->mo.mo_plural);
703 memset(&mohandle->mo, 0, sizeof(mohandle->mo));
704 return 0;
705 }
706
707 /* ARGSUSED */
708 static const char *
709 lookup_hash(const char *msgid, struct domainbinding *db, size_t *rlen)
710 {
711 struct mohandle *mohandle = &db->mohandle;
712 uint32_t idx, hashval, step, strno;
713 size_t len;
714 struct mosysdepstr_h *sysdep_otable, *sysdep_ttable;
715
716 if (mohandle->mo.mo_hsize <= 2 || mohandle->mo.mo_htable == NULL)
717 return NULL;
718
719 hashval = __intl_string_hash(msgid);
720 step = calc_collision_step(hashval, mohandle->mo.mo_hsize);
721 idx = hashval % mohandle->mo.mo_hsize;
722 len = strlen(msgid);
723 while (/*CONSTCOND*/1) {
724 strno = mohandle->mo.mo_htable[idx];
725 if (strno == 0) {
726 /* unexpected miss */
727 return NULL;
728 }
729 strno--;
730 if ((strno & MO_HASH_SYSDEP_MASK) == 0) {
731 /* system independent strings */
732 if (len <= mohandle->mo.mo_otable[strno].len &&
733 !strcmp(msgid, mohandle->mo.mo_otable[strno].off)) {
734 /* hit */
735 if (rlen)
736 *rlen =
737 mohandle->mo.mo_ttable[strno].len;
738 return mohandle->mo.mo_ttable[strno].off;
739 }
740 } else {
741 /* system dependent strings */
742 strno &= ~MO_HASH_SYSDEP_MASK;
743 sysdep_otable = mohandle->mo.mo_sysdep_otable[strno];
744 sysdep_ttable = mohandle->mo.mo_sysdep_ttable[strno];
745 if (len <= sysdep_otable->expanded_len &&
746 !strcmp(msgid, sysdep_otable->expanded)) {
747 /* hit */
748 if (expand_sysdep(mohandle, sysdep_ttable))
749 /* memory exhausted */
750 return NULL;
751 if (rlen)
752 *rlen = sysdep_ttable->expanded_len;
753 return sysdep_ttable->expanded;
754 }
755 }
756 idx = calc_next_index(idx, mohandle->mo.mo_hsize, step);
757 }
758 /*NOTREACHED*/
759 }
760
761 static const char *
762 lookup_bsearch(const char *msgid, struct domainbinding *db, size_t *rlen)
763 {
764 int top, bottom, middle, omiddle;
765 int n;
766 struct mohandle *mohandle = &db->mohandle;
767
768 top = 0;
769 bottom = mohandle->mo.mo_nstring;
770 omiddle = -1;
771 /* CONSTCOND */
772 while (1) {
773 if (top > bottom)
774 break;
775 middle = (top + bottom) / 2;
776 /* avoid possible infinite loop, when the data is not sorted */
777 if (omiddle == middle)
778 break;
779 if ((size_t)middle >= mohandle->mo.mo_nstring)
780 break;
781
782 n = strcmp(msgid, mohandle->mo.mo_otable[middle].off);
783 if (n == 0) {
784 if (rlen)
785 *rlen = mohandle->mo.mo_ttable[middle].len;
786 return (const char *)mohandle->mo.mo_ttable[middle].off;
787 }
788 else if (n < 0)
789 bottom = middle;
790 else
791 top = middle;
792 omiddle = middle;
793 }
794
795 return NULL;
796 }
797
798 static const char *
799 lookup(const char *msgid, struct domainbinding *db, size_t *rlen)
800 {
801 const char *v;
802
803 v = lookup_hash(msgid, db, rlen);
804 if (v)
805 return v;
806
807 return lookup_bsearch(msgid, db, rlen);
808 }
809
810 static const char *
811 get_lang_env(const char *category_name)
812 {
813 const char *lang;
814
815 /*
816 * 1. see LANGUAGE variable first.
817 *
818 * LANGUAGE is a GNU extension.
819 * It's a colon separated list of locale names.
820 */
821 lang = getenv("LANGUAGE");
822 if (lang)
823 return lang;
824
825 /*
826 * 2. if LANGUAGE isn't set, see LC_ALL, LC_xxx, LANG.
827 *
828 * It's essentially setlocale(LC_xxx, NULL).
829 */
830 lang = getenv("LC_ALL");
831 if (!lang)
832 lang = getenv(category_name);
833 if (!lang)
834 lang = getenv("LANG");
835
836 if (!lang)
837 return 0; /* error */
838
839 return split_locale(lang);
840 }
841
842 static const char *
843 get_indexed_string(const char *str, size_t len, unsigned long idx)
844 {
845 while (idx > 0) {
846 if (len <= 1)
847 return str;
848 if (*str == '\0')
849 idx--;
850 if (len > 0) {
851 str++;
852 len--;
853 }
854 }
855 return str;
856 }
857
858 #define _NGETTEXT_DEFAULT(msgid1, msgid2, n) \
859 ((char *)__UNCONST((n) == 1 ? (msgid1) : (msgid2)))
860
861 char *
862 dcngettext(const char *domainname, const char *msgid1, const char *msgid2,
863 unsigned long int n, int category)
864 {
865 const char *msgid;
866 char path[PATH_MAX];
867 const char *lpath;
868 static char olpath[PATH_MAX];
869 const char *cname = NULL;
870 const char *v;
871 static char *ocname = NULL;
872 static char *odomainname = NULL;
873 struct domainbinding *db;
874 unsigned long plural_index = 0;
875 size_t len;
876
877 if (!domainname)
878 domainname = __current_domainname;
879 cname = lookup_category(category);
880 if (!domainname || !cname)
881 goto fail;
882
883 lpath = get_lang_env(cname);
884 if (!lpath)
885 goto fail;
886
887 for (db = __bindings; db; db = db->next)
888 if (strcmp(db->domainname, domainname) == 0)
889 break;
890 if (!db) {
891 if (!bindtextdomain(domainname, _PATH_TEXTDOMAIN))
892 goto fail;
893 db = __bindings;
894 }
895
896 /* resolve relative path */
897 /* XXX not necessary? */
898 if (db->path[0] != '/') {
899 char buf[PATH_MAX];
900
901 if (getcwd(buf, sizeof(buf)) == 0)
902 goto fail;
903 if (strlcat(buf, "/", sizeof(buf)) >= sizeof(buf))
904 goto fail;
905 if (strlcat(buf, db->path, sizeof(buf)) >= sizeof(buf))
906 goto fail;
907 strlcpy(db->path, buf, sizeof(db->path));
908 }
909
910 /* don't bother looking it up if the values are the same */
911 if (odomainname && strcmp(domainname, odomainname) == 0 &&
912 ocname && strcmp(cname, ocname) == 0 && strcmp(lpath, olpath) == 0 &&
913 db->mohandle.mo.mo_magic)
914 goto found;
915
916 /* try to find appropriate file, from $LANGUAGE */
917 if (lookup_mofile(path, sizeof(path), db->path, lpath, cname,
918 domainname, db) == NULL)
919 goto fail;
920
921 if (odomainname)
922 free(odomainname);
923 if (ocname)
924 free(ocname);
925 odomainname = strdup(domainname);
926 ocname = strdup(cname);
927 if (!odomainname || !ocname) {
928 if (odomainname)
929 free(odomainname);
930 if (ocname)
931 free(ocname);
932 odomainname = ocname = NULL;
933 }
934 else
935 strlcpy(olpath, lpath, sizeof(olpath));
936
937 found:
938 if (db->mohandle.mo.mo_plural) {
939 plural_index =
940 _gettext_calculate_plural(db->mohandle.mo.mo_plural, n);
941 if (plural_index >= db->mohandle.mo.mo_nplurals)
942 plural_index = 0;
943 msgid = msgid1;
944 } else
945 msgid = _NGETTEXT_DEFAULT(msgid1, msgid2, n);
946
947 if (msgid == NULL)
948 return NULL;
949
950 v = lookup(msgid, db, &len);
951 if (v) {
952 if (db->mohandle.mo.mo_plural)
953 v = get_indexed_string(v, len, plural_index);
954 /*
955 * convert the translated message's encoding.
956 *
957 * special case:
958 * a result of gettext("") shouldn't need any conversion.
959 */
960 if (msgid[0])
961 v = __gettext_iconv(v, db);
962
963 /*
964 * Given the amount of printf-format security issues, it may
965 * be a good idea to validate if the original msgid and the
966 * translated message format string carry the same printf-like
967 * format identifiers.
968 */
969
970 msgid = v;
971 }
972
973 return (char *)__UNCONST(msgid);
974
975 fail:
976 return _NGETTEXT_DEFAULT(msgid1, msgid2, n);
977 }
978