PR tree-ssa/57385
[official-gcc.git] / intl / dcigettext.c
bloba8d4a14d273b153b117b507ec76356635ccd876e
1 /* Implementation of the internal dcigettext function.
2 Copyright (C) 1995-1999, 2000-2003 Free Software Foundation, Inc.
4 This program is free software; you can redistribute it and/or modify it
5 under the terms of the GNU Library General Public License as published
6 by the Free Software Foundation; either version 2, or (at your option)
7 any later version.
9 This program is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12 Library General Public License for more details.
14 You should have received a copy of the GNU Library General Public
15 License along with this program; if not, write to the Free Software
16 Foundation, Inc., 51 Franklin Street - Fifth Floor, Boston, MA 02110-1301,
17 USA. */
19 /* Tell glibc's <string.h> to provide a prototype for mempcpy().
20 This must come before <config.h> because <config.h> may include
21 <features.h>, and once <features.h> has been included, it's too late. */
22 #ifndef _GNU_SOURCE
23 # define _GNU_SOURCE 1
24 #endif
26 #ifdef HAVE_CONFIG_H
27 # include <config.h>
28 #endif
30 #include <sys/types.h>
32 #ifdef __GNUC__
33 # define alloca __builtin_alloca
34 # define HAVE_ALLOCA 1
35 #else
36 # ifdef _MSC_VER
37 # include <malloc.h>
38 # define alloca _alloca
39 # else
40 # if defined HAVE_ALLOCA_H || defined _LIBC
41 # include <alloca.h>
42 # else
43 # ifdef _AIX
44 #pragma alloca
45 # else
46 # ifndef alloca
47 char *alloca ();
48 # endif
49 # endif
50 # endif
51 # endif
52 #endif
54 #include <errno.h>
55 #ifndef errno
56 extern int errno;
57 #endif
58 #ifndef __set_errno
59 # define __set_errno(val) errno = (val)
60 #endif
62 #include <stddef.h>
63 #include <stdlib.h>
64 #include <string.h>
66 #if defined HAVE_UNISTD_H || defined _LIBC
67 # include <unistd.h>
68 #endif
70 #include <locale.h>
72 #ifdef _LIBC
73 /* Guess whether integer division by zero raises signal SIGFPE.
74 Set to 1 only if you know for sure. In case of doubt, set to 0. */
75 # if defined __alpha__ || defined __arm__ || defined __i386__ \
76 || defined __m68k__ || defined __s390__
77 # define INTDIV0_RAISES_SIGFPE 1
78 # else
79 # define INTDIV0_RAISES_SIGFPE 0
80 # endif
81 #endif
82 #if !INTDIV0_RAISES_SIGFPE
83 # include <signal.h>
84 #endif
86 #if defined HAVE_SYS_PARAM_H || defined _LIBC
87 # include <sys/param.h>
88 #endif
90 #include "gettextP.h"
91 #include "plural-exp.h"
92 #ifdef _LIBC
93 # include <libintl.h>
94 #else
95 # include "libgnuintl.h"
96 #endif
97 #include "hash-string.h"
99 /* Thread safety. */
100 #ifdef _LIBC
101 # include <bits/libc-lock.h>
102 #else
103 /* Provide dummy implementation if this is outside glibc. */
104 # define __libc_lock_define_initialized(CLASS, NAME)
105 # define __libc_lock_lock(NAME)
106 # define __libc_lock_unlock(NAME)
107 # define __libc_rwlock_define_initialized(CLASS, NAME)
108 # define __libc_rwlock_rdlock(NAME)
109 # define __libc_rwlock_unlock(NAME)
110 #endif
112 /* Alignment of types. */
113 #if defined __GNUC__ && __GNUC__ >= 2
114 # define alignof(TYPE) __alignof__ (TYPE)
115 #else
116 # define alignof(TYPE) \
117 ((int) &((struct { char dummy1; TYPE dummy2; } *) 0)->dummy2)
118 #endif
120 /* The internal variables in the standalone libintl.a must have different
121 names than the internal variables in GNU libc, otherwise programs
122 using libintl.a cannot be linked statically. */
123 #if !defined _LIBC
124 # define _nl_default_default_domain libintl_nl_default_default_domain
125 # define _nl_current_default_domain libintl_nl_current_default_domain
126 # define _nl_default_dirname libintl_nl_default_dirname
127 # define _nl_domain_bindings libintl_nl_domain_bindings
128 #endif
130 /* Some compilers, like SunOS4 cc, don't have offsetof in <stddef.h>. */
131 #ifndef offsetof
132 # define offsetof(type,ident) ((size_t)&(((type*)0)->ident))
133 #endif
135 /* @@ end of prolog @@ */
137 #ifdef _LIBC
138 /* Rename the non ANSI C functions. This is required by the standard
139 because some ANSI C functions will require linking with this object
140 file and the name space must not be polluted. */
141 # define getcwd __getcwd
142 # ifndef stpcpy
143 # define stpcpy __stpcpy
144 # endif
145 # define tfind __tfind
146 #else
147 # if !defined HAVE_GETCWD
148 char *getwd ();
149 # define getcwd(buf, max) getwd (buf)
150 # else
151 char *getcwd ();
152 # endif
153 # ifndef HAVE_STPCPY
154 static char *stpcpy PARAMS ((char *dest, const char *src));
155 # endif
156 # ifndef HAVE_MEMPCPY
157 static void *mempcpy PARAMS ((void *dest, const void *src, size_t n));
158 # endif
159 #endif
161 /* Amount to increase buffer size by in each try. */
162 #define PATH_INCR 32
164 /* The following is from pathmax.h. */
165 /* Non-POSIX BSD systems might have gcc's limits.h, which doesn't define
166 PATH_MAX but might cause redefinition warnings when sys/param.h is
167 later included (as on MORE/BSD 4.3). */
168 #if defined _POSIX_VERSION || (defined HAVE_LIMITS_H && !defined __GNUC__)
169 # include <limits.h>
170 #endif
172 #ifndef _POSIX_PATH_MAX
173 # define _POSIX_PATH_MAX 255
174 #endif
176 #if !defined PATH_MAX && defined _PC_PATH_MAX
177 # define PATH_MAX (pathconf ("/", _PC_PATH_MAX) < 1 ? 1024 : pathconf ("/", _PC_PATH_MAX))
178 #endif
180 /* Don't include sys/param.h if it already has been. */
181 #if defined HAVE_SYS_PARAM_H && !defined PATH_MAX && !defined MAXPATHLEN
182 # include <sys/param.h>
183 #endif
185 #if !defined PATH_MAX && defined MAXPATHLEN
186 # define PATH_MAX MAXPATHLEN
187 #endif
189 #ifndef PATH_MAX
190 # define PATH_MAX _POSIX_PATH_MAX
191 #endif
/* Pathname support.
   ISSLASH(C)           tests whether C is a directory separator character.
   IS_ABSOLUTE_PATH(P)  tests whether P is an absolute path.  If it is not,
                        it may be concatenated to a directory pathname.
   IS_PATH_WITH_DIR(P)  tests whether P contains a directory specification.
   Each macro may evaluate its argument more than once, so pass only
   side-effect free expressions.  */
#if defined _WIN32 || defined __WIN32__ || defined __EMX__ || defined __DJGPP__
  /* Win32, OS/2, DOS: both slash kinds separate directories and a leading
     "X:" drive designator also makes a name absolute.  */
# define ISSLASH(C) ((C) == '/' || (C) == '\\')
# define HAS_DEVICE(P) \
    ((((P)[0] >= 'A' && (P)[0] <= 'Z') || ((P)[0] >= 'a' && (P)[0] <= 'z')) \
     && (P)[1] == ':')
# define IS_ABSOLUTE_PATH(P) (ISSLASH ((P)[0]) || HAS_DEVICE (P))
# define IS_PATH_WITH_DIR(P) \
    (strchr (P, '/') != NULL || strchr (P, '\\') != NULL || HAS_DEVICE (P))
#else
  /* Unix */
# define ISSLASH(C) ((C) == '/')
# define IS_ABSOLUTE_PATH(P) ISSLASH ((P)[0])
# define IS_PATH_WITH_DIR(P) (strchr (P, '/') != NULL)
#endif
215 /* This is the type used for the search tree where known translations
216 are stored. */
217 struct known_translation_t
219 /* Domain in which to search. */
220 char *domainname;
222 /* The category. */
223 int category;
225 /* State of the catalog counter at the point the string was found. */
226 int counter;
228 /* Catalog where the string was found. */
229 struct loaded_l10nfile *domain;
231 /* And finally the translation. */
232 const char *translation;
233 size_t translation_length;
235 /* Pointer to the string in question. */
236 char msgid[ZERO];
239 /* Root of the search tree with known translations. We can use this
240 only if the system provides the `tsearch' function family. */
241 #if defined HAVE_TSEARCH || defined _LIBC
242 # include <search.h>
244 static void *root;
246 # ifdef _LIBC
247 # define tsearch __tsearch
248 # endif
250 /* Function to compare two entries in the table of known translations. */
251 static int transcmp PARAMS ((const void *p1, const void *p2));
252 static int
253 transcmp (p1, p2)
254 const void *p1;
255 const void *p2;
257 const struct known_translation_t *s1;
258 const struct known_translation_t *s2;
259 int result;
261 s1 = (const struct known_translation_t *) p1;
262 s2 = (const struct known_translation_t *) p2;
264 result = strcmp (s1->msgid, s2->msgid);
265 if (result == 0)
267 result = strcmp (s1->domainname, s2->domainname);
268 if (result == 0)
269 /* We compare the category last (though this is the cheapest
270 operation) since it is hopefully always the same (namely
271 LC_MESSAGES). */
272 result = s1->category - s2->category;
275 return result;
277 #endif
279 #ifndef INTVARDEF
280 # define INTVARDEF(name)
281 #endif
282 #ifndef INTUSE
283 # define INTUSE(name) name
284 #endif
286 /* Name of the default domain used for gettext(3) prior to any call to
287 textdomain(3). The default value for this is "messages". */
288 const char _nl_default_default_domain[] attribute_hidden = "messages";
290 /* Value used as the default domain for gettext(3). */
291 const char *_nl_current_default_domain attribute_hidden
292 = _nl_default_default_domain;
294 /* Contains the default location of the message catalogs. */
295 #if defined __EMX__
296 extern const char _nl_default_dirname[];
297 #else
298 const char _nl_default_dirname[] = LOCALEDIR;
299 INTVARDEF (_nl_default_dirname)
300 #endif
302 /* List with bindings of specific domains created by bindtextdomain()
303 calls. */
304 struct binding *_nl_domain_bindings;
306 /* Prototypes for local functions. */
307 static char *plural_lookup PARAMS ((struct loaded_l10nfile *domain,
308 unsigned long int n,
309 const char *translation,
310 size_t translation_len))
311 internal_function;
312 static const char *guess_category_value PARAMS ((int category,
313 const char *categoryname))
314 internal_function;
315 #ifdef _LIBC
316 # include "../locale/localeinfo.h"
317 # define category_to_name(category) _nl_category_names[category]
318 #else
319 static const char *category_to_name PARAMS ((int category)) internal_function;
320 #endif
/* For those losing systems which don't have `alloca' we have to add
   some additional code emulating it.  Without a real alloca, `alloca'
   becomes `malloc' and every block handed out is remembered in a
   `struct block_list' so FREE_BLOCKS can release it later.  */
#ifdef HAVE_ALLOCA
/* Nothing has to be done.  */
# define freea(p) /* nothing */
# define ADD_BLOCK(list, address) /* nothing */
# define FREE_BLOCKS(list) /* nothing */
#else
struct block_list
{
  void *address;
  struct block_list *next;
};
/* Push ADDR onto the front of LIST.  */
# define ADD_BLOCK(list, addr)                                                \
  do {                                                                        \
    struct block_list *newp = (struct block_list *) malloc (sizeof (*newp));  \
    /* If we cannot get a free block we cannot add the new element to         \
       the list.  */                                                          \
    if (newp != NULL) {                                                       \
      newp->address = (addr);                                                 \
      newp->next = (list);                                                    \
      (list) = newp;                                                          \
    }                                                                         \
  } while (0)
/* Free every recorded block and its list node; LIST ends up NULL.  */
# define FREE_BLOCKS(list)                                                    \
  do {                                                                        \
    while ((list) != NULL) {                                                  \
      struct block_list *old = (list);                                        \
      (list) = (list)->next;                                                  \
      free (old->address);                                                    \
      free (old);                                                             \
    }                                                                         \
  } while (0)
# undef alloca
# define alloca(size) (malloc (size))
# define freea(p) free (p)
#endif  /* have alloca */
#ifdef _LIBC
/* List of blocks allocated for translations.  Each block starts with a
   link to the next one; the payload follows in DATA.  */
typedef struct transmem_list
{
  struct transmem_list *next;
  char data[ZERO];
} transmem_block_t;
static struct transmem_list *transmem_list;
#else
/* Outside glibc no list is kept; a block is just raw bytes.  */
typedef unsigned char transmem_block_t;
#endif
375 /* Names for the libintl functions are a problem. They must not clash
376 with existing names and they should follow ANSI C. But this source
377 code is also used in GNU C Library where the names have a __
378 prefix. So we have to make a difference here. */
379 #ifdef _LIBC
380 # define DCIGETTEXT __dcigettext
381 #else
382 # define DCIGETTEXT libintl_dcigettext
383 #endif
385 /* Lock variable to protect the global data in the gettext implementation. */
386 #ifdef _LIBC
387 __libc_rwlock_define_initialized (, _nl_state_lock attribute_hidden)
388 #endif
/* We must check whether the binary runs SUID or SGID.  glibc provides an
   easier method for this, so the two builds differ here.
   Outside glibc the result is cached in `enable_secure':
     0  not determined yet,
     1  real and effective ids differ (secure mode),
    -1  ids match.
   DETERMINE_SECURE expands to an `if' statement; use it as a statement
   of its own.  */
#ifdef _LIBC
# define ENABLE_SECURE __libc_enable_secure
# define DETERMINE_SECURE
#else
# ifndef HAVE_GETUID
#  define getuid() 0
# endif
# ifndef HAVE_GETGID
#  define getgid() 0
# endif
# ifndef HAVE_GETEUID
#  define geteuid() getuid()
# endif
# ifndef HAVE_GETEGID
#  define getegid() getgid()
# endif
static int enable_secure;
# define ENABLE_SECURE (enable_secure == 1)
# define DETERMINE_SECURE \
  if (enable_secure == 0)                                                     \
    {                                                                         \
      if (getuid () != geteuid () || getgid () != getegid ())                 \
        enable_secure = 1;                                                    \
      else                                                                    \
        enable_secure = -1;                                                   \
    }
#endif
420 /* Get the function to evaluate the plural expression. */
421 #include "eval-plural.h"
423 /* Look up MSGID in the DOMAINNAME message catalog for the current
424 CATEGORY locale and, if PLURAL is nonzero, search over string
425 depending on the plural form determined by N. */
426 char *
427 DCIGETTEXT (domainname, msgid1, msgid2, plural, n, category)
428 const char *domainname;
429 const char *msgid1;
430 const char *msgid2;
431 int plural;
432 unsigned long int n;
433 int category;
435 #ifndef HAVE_ALLOCA
436 struct block_list *block_list = NULL;
437 #endif
438 struct loaded_l10nfile *domain;
439 struct binding *binding;
440 const char *categoryname;
441 const char *categoryvalue;
442 char *dirname, *xdomainname;
443 char *single_locale;
444 char *retval;
445 size_t retlen;
446 int saved_errno;
447 #if defined HAVE_TSEARCH || defined _LIBC
448 struct known_translation_t *search;
449 struct known_translation_t **foundp = NULL;
450 size_t msgid_len;
451 #endif
452 size_t domainname_len;
454 /* If no real MSGID is given return NULL. */
455 if (msgid1 == NULL)
456 return NULL;
458 #ifdef _LIBC
459 if (category < 0 || category >= __LC_LAST || category == LC_ALL)
460 /* Bogus. */
461 return (plural == 0
462 ? (char *) msgid1
463 /* Use the Germanic plural rule. */
464 : n == 1 ? (char *) msgid1 : (char *) msgid2);
465 #endif
467 __libc_rwlock_rdlock (_nl_state_lock);
469 /* If DOMAINNAME is NULL, we are interested in the default domain. If
470 CATEGORY is not LC_MESSAGES this might not make much sense but the
471 definition left this undefined. */
472 if (domainname == NULL)
473 domainname = _nl_current_default_domain;
475 /* OS/2 specific: backward compatibility with older libintl versions */
476 #ifdef LC_MESSAGES_COMPAT
477 if (category == LC_MESSAGES_COMPAT)
478 category = LC_MESSAGES;
479 #endif
481 #if defined HAVE_TSEARCH || defined _LIBC
482 msgid_len = strlen (msgid1) + 1;
484 /* Try to find the translation among those which we found at
485 some time. */
486 search = (struct known_translation_t *)
487 alloca (offsetof (struct known_translation_t, msgid) + msgid_len);
488 memcpy (search->msgid, msgid1, msgid_len);
489 search->domainname = (char *) domainname;
490 search->category = category;
492 foundp = (struct known_translation_t **) tfind (search, &root, transcmp);
493 freea (search);
494 if (foundp != NULL && (*foundp)->counter == _nl_msg_cat_cntr)
496 /* Now deal with plural. */
497 if (plural)
498 retval = plural_lookup ((*foundp)->domain, n, (*foundp)->translation,
499 (*foundp)->translation_length);
500 else
501 retval = (char *) (*foundp)->translation;
503 __libc_rwlock_unlock (_nl_state_lock);
504 return retval;
506 #endif
508 /* Preserve the `errno' value. */
509 saved_errno = errno;
511 /* See whether this is a SUID binary or not. */
512 DETERMINE_SECURE;
514 /* First find matching binding. */
515 for (binding = _nl_domain_bindings; binding != NULL; binding = binding->next)
517 int compare = strcmp (domainname, binding->domainname);
518 if (compare == 0)
519 /* We found it! */
520 break;
521 if (compare < 0)
523 /* It is not in the list. */
524 binding = NULL;
525 break;
529 if (binding == NULL)
530 dirname = (char *) INTUSE(_nl_default_dirname);
531 else if (IS_ABSOLUTE_PATH (binding->dirname))
532 dirname = binding->dirname;
533 else
535 /* We have a relative path. Make it absolute now. */
536 size_t dirname_len = strlen (binding->dirname) + 1;
537 size_t path_max;
538 char *ret;
540 path_max = (unsigned int) PATH_MAX;
541 path_max += 2; /* The getcwd docs say to do this. */
543 for (;;)
545 dirname = (char *) alloca (path_max + dirname_len);
546 ADD_BLOCK (block_list, dirname);
548 __set_errno (0);
549 ret = getcwd (dirname, path_max);
550 if (ret != NULL || errno != ERANGE)
551 break;
553 path_max += path_max / 2;
554 path_max += PATH_INCR;
557 if (ret == NULL)
558 /* We cannot get the current working directory. Don't signal an
559 error but simply return the default string. */
560 goto return_untranslated;
562 stpcpy (stpcpy (strchr (dirname, '\0'), "/"), binding->dirname);
565 /* Now determine the symbolic name of CATEGORY and its value. */
566 categoryname = category_to_name (category);
567 categoryvalue = guess_category_value (category, categoryname);
569 domainname_len = strlen (domainname);
570 xdomainname = (char *) alloca (strlen (categoryname)
571 + domainname_len + 5);
572 ADD_BLOCK (block_list, xdomainname);
574 stpcpy (mempcpy (stpcpy (stpcpy (xdomainname, categoryname), "/"),
575 domainname, domainname_len),
576 ".mo");
578 /* Creating working area. */
579 single_locale = (char *) alloca (strlen (categoryvalue) + 1);
580 ADD_BLOCK (block_list, single_locale);
583 /* Search for the given string. This is a loop because we perhaps
584 got an ordered list of languages to consider for the translation. */
585 while (1)
587 /* Make CATEGORYVALUE point to the next element of the list. */
588 while (categoryvalue[0] != '\0' && categoryvalue[0] == ':')
589 ++categoryvalue;
590 if (categoryvalue[0] == '\0')
592 /* The whole contents of CATEGORYVALUE has been searched but
593 no valid entry has been found. We solve this situation
594 by implicitly appending a "C" entry, i.e. no translation
595 will take place. */
596 single_locale[0] = 'C';
597 single_locale[1] = '\0';
599 else
601 char *cp = single_locale;
602 while (categoryvalue[0] != '\0' && categoryvalue[0] != ':')
603 *cp++ = *categoryvalue++;
604 *cp = '\0';
606 /* When this is a SUID binary we must not allow accessing files
607 outside the dedicated directories. */
608 if (ENABLE_SECURE && IS_PATH_WITH_DIR (single_locale))
609 /* Ingore this entry. */
610 continue;
613 /* If the current locale value is C (or POSIX) we don't load a
614 domain. Return the MSGID. */
615 if (strcmp (single_locale, "C") == 0
616 || strcmp (single_locale, "POSIX") == 0)
617 break;
619 /* Find structure describing the message catalog matching the
620 DOMAINNAME and CATEGORY. */
621 domain = _nl_find_domain (dirname, single_locale, xdomainname, binding);
623 if (domain != NULL)
625 retval = _nl_find_msg (domain, binding, msgid1, &retlen);
627 if (retval == NULL)
629 int cnt;
631 for (cnt = 0; domain->successor[cnt] != NULL; ++cnt)
633 retval = _nl_find_msg (domain->successor[cnt], binding,
634 msgid1, &retlen);
636 if (retval != NULL)
638 domain = domain->successor[cnt];
639 break;
644 if (retval != NULL)
646 /* Found the translation of MSGID1 in domain DOMAIN:
647 starting at RETVAL, RETLEN bytes. */
648 FREE_BLOCKS (block_list);
649 #if defined HAVE_TSEARCH || defined _LIBC
650 if (foundp == NULL)
652 /* Create a new entry and add it to the search tree. */
653 struct known_translation_t *newp;
655 newp = (struct known_translation_t *)
656 malloc (offsetof (struct known_translation_t, msgid)
657 + msgid_len + domainname_len + 1);
658 if (newp != NULL)
660 newp->domainname =
661 mempcpy (newp->msgid, msgid1, msgid_len);
662 memcpy (newp->domainname, domainname, domainname_len + 1);
663 newp->category = category;
664 newp->counter = _nl_msg_cat_cntr;
665 newp->domain = domain;
666 newp->translation = retval;
667 newp->translation_length = retlen;
669 /* Insert the entry in the search tree. */
670 foundp = (struct known_translation_t **)
671 tsearch (newp, &root, transcmp);
672 if (foundp == NULL
673 || __builtin_expect (*foundp != newp, 0))
674 /* The insert failed. */
675 free (newp);
678 else
680 /* We can update the existing entry. */
681 (*foundp)->counter = _nl_msg_cat_cntr;
682 (*foundp)->domain = domain;
683 (*foundp)->translation = retval;
684 (*foundp)->translation_length = retlen;
686 #endif
687 __set_errno (saved_errno);
689 /* Now deal with plural. */
690 if (plural)
691 retval = plural_lookup (domain, n, retval, retlen);
693 __libc_rwlock_unlock (_nl_state_lock);
694 return retval;
699 return_untranslated:
700 /* Return the untranslated MSGID. */
701 FREE_BLOCKS (block_list);
702 __libc_rwlock_unlock (_nl_state_lock);
703 #ifndef _LIBC
704 if (!ENABLE_SECURE)
706 extern void _nl_log_untranslated PARAMS ((const char *logfilename,
707 const char *domainname,
708 const char *msgid1,
709 const char *msgid2,
710 int plural));
711 const char *logfilename = getenv ("GETTEXT_LOG_UNTRANSLATED");
713 if (logfilename != NULL && logfilename[0] != '\0')
714 _nl_log_untranslated (logfilename, domainname, msgid1, msgid2, plural);
716 #endif
717 __set_errno (saved_errno);
718 return (plural == 0
719 ? (char *) msgid1
720 /* Use the Germanic plural rule. */
721 : n == 1 ? (char *) msgid1 : (char *) msgid2);
/* Look up MSGID in the catalog DOMAIN_FILE and return its translation.
   The catalog is loaded first when DOMAIN_FILE->decided is 0.  Returns
   NULL when the catalog has no data or holds no entry for MSGID.  On
   success the length of the returned data is stored in *LENGTHP.
   DOMAINBINDING may be NULL.  When built with _LIBC or HAVE_ICONV and a
   converter is active, the converted text is cached in domain->conv_tab
   and returned instead of the raw catalog text.  */
725 char *
726 internal_function
727 _nl_find_msg (domain_file, domainbinding, msgid, lengthp)
728 struct loaded_l10nfile *domain_file;
729 struct binding *domainbinding;
730 const char *msgid;
731 size_t *lengthp;
733 struct loaded_domain *domain;
734 nls_uint32 nstrings;
735 size_t act;
736 char *result;
737 size_t resultlen;
739 if (domain_file->decided == 0)
740 _nl_load_domain (domain_file, domainbinding);
742 if (domain_file->data == NULL)
743 return NULL;
745 domain = (struct loaded_domain *) domain_file->data;
747 nstrings = domain->nstrings;
749 /* Locate the MSGID and its translation. */
750 if (domain->hash_tab != NULL)
752 /* Use the hashing table. */
753 nls_uint32 len = strlen (msgid);
754 nls_uint32 hash_val = hash_string (msgid);
755 nls_uint32 idx = hash_val % domain->hash_size;
/* NOTE(review): the step computation below requires hash_size > 2;
   nothing in this function checks it -- confirm the loader does. */
756 nls_uint32 incr = 1 + (hash_val % (domain->hash_size - 2));
758 while (1)
760 nls_uint32 nstr =
761 W (domain->must_swap_hash_tab, domain->hash_tab[idx]);
763 if (nstr == 0)
764 /* Hash table entry is empty. */
765 return NULL;
/* Stored indices are offset by one so that 0 can mean "empty". */
767 nstr--;
769 /* Compare msgid with the original string at index nstr.
770 We compare the lengths with >=, not ==, because plural entries
771 are represented by strings with an embedded NUL. */
772 if (nstr < nstrings
773 ? W (domain->must_swap, domain->orig_tab[nstr].length) >= len
774 && (strcmp (msgid,
775 domain->data + W (domain->must_swap,
776 domain->orig_tab[nstr].offset))
777 == 0)
778 : domain->orig_sysdep_tab[nstr - nstrings].length > len
779 && (strcmp (msgid,
780 domain->orig_sysdep_tab[nstr - nstrings].pointer)
781 == 0))
783 act = nstr;
784 goto found;
/* Advance the probe position by INCR, wrapping at hash_size. */
787 if (idx >= domain->hash_size - incr)
788 idx -= domain->hash_size - incr;
789 else
790 idx += incr;
792 /* NOTREACHED */
794 else
796 /* Try the default method: binary search in the sorted array of
797 messages. */
798 size_t top, bottom;
800 bottom = 0;
801 top = nstrings;
802 while (bottom < top)
804 int cmp_val;
806 act = (bottom + top) / 2;
807 cmp_val = strcmp (msgid, (domain->data
808 + W (domain->must_swap,
809 domain->orig_tab[act].offset)));
810 if (cmp_val < 0)
811 top = act;
812 else if (cmp_val > 0)
813 bottom = act + 1;
814 else
815 goto found;
817 /* No translation was found. */
818 return NULL;
821 found:
822 /* The translation was found at index ACT. If we have to convert the
823 string to use a different character set, this is the time. */
/* Indices below NSTRINGS refer to the static tables of the file, the
   remaining ones to the system dependent string tables. */
824 if (act < nstrings)
826 result = (char *)
827 (domain->data + W (domain->must_swap, domain->trans_tab[act].offset));
828 resultlen = W (domain->must_swap, domain->trans_tab[act].length) + 1;
830 else
832 result = (char *) domain->trans_sysdep_tab[act - nstrings].pointer;
833 resultlen = domain->trans_sysdep_tab[act - nstrings].length;
836 #if defined _LIBC || HAVE_ICONV
837 if (domain->codeset_cntr
838 != (domainbinding != NULL ? domainbinding->codeset_cntr : 0))
840 /* The domain's codeset has changed through bind_textdomain_codeset()
841 since the message catalog was initialized or last accessed. We
842 have to reinitialize the converter. */
843 _nl_free_domain_conv (domain);
844 _nl_init_domain_conv (domain_file, domain, domainbinding);
847 if (
848 # ifdef _LIBC
849 domain->conv != (__gconv_t) -1
850 # else
851 # if HAVE_ICONV
852 domain->conv != (iconv_t) -1
853 # endif
854 # endif
857 /* We are supposed to do a conversion. First allocate an
858 appropriate table with the same structure as the table
859 of translations in the file, where we can put the pointers
860 to the converted strings in.
861 There is a slight complication with plural entries. They
862 are represented by consecutive NUL terminated strings. We
863 handle this case by converting RESULTLEN bytes, including
864 NULs. */
866 if (domain->conv_tab == NULL
867 && ((domain->conv_tab =
868 (char **) calloc (nstrings + domain->n_sysdep_strings,
869 sizeof (char *)))
870 == NULL))
871 /* Mark that we didn't succeed allocating a table. */
872 domain->conv_tab = (char **) -1;
874 if (__builtin_expect (domain->conv_tab == (char **) -1, 0))
875 /* Nothing we can do, no more memory. */
876 goto converted;
878 if (domain->conv_tab[act] == NULL)
880 /* We haven't used this string so far, so it is not
881 translated yet. Do this now. */
882 /* We use a bit more efficient memory handling.
883 We allocate always larger blocks which get used over
884 time. This is faster than many small allocations. */
885 __libc_lock_define_initialized (static, lock)
886 # define INITIAL_BLOCK_SIZE 4080
887 static unsigned char *freemem;
888 static size_t freemem_size;
890 const unsigned char *inbuf;
891 unsigned char *outbuf;
892 int malloc_count;
893 # ifndef _LIBC
894 transmem_block_t *transmem_list = NULL;
895 # endif
897 __libc_lock_lock (lock);
/* Each converted string is stored as a size_t length followed by the
   bytes, so the output starts sizeof (size_t) into the free area. */
899 inbuf = (const unsigned char *) result;
900 outbuf = freemem + sizeof (size_t);
902 malloc_count = 0;
903 while (1)
905 transmem_block_t *newmem;
906 # ifdef _LIBC
907 size_t non_reversible;
908 int res;
910 if (freemem_size < sizeof (size_t))
911 goto resize_freemem;
913 res = __gconv (domain->conv,
914 &inbuf, inbuf + resultlen,
915 &outbuf,
916 outbuf + freemem_size - sizeof (size_t),
917 &non_reversible);
919 if (res == __GCONV_OK || res == __GCONV_EMPTY_INPUT)
920 break;
922 if (res != __GCONV_FULL_OUTPUT)
924 __libc_lock_unlock (lock);
925 goto converted;
/* Output buffer too small: restart from the beginning of the input. */
928 inbuf = result;
929 # else
930 # if HAVE_ICONV
931 const char *inptr = (const char *) inbuf;
932 size_t inleft = resultlen;
933 char *outptr = (char *) outbuf;
934 size_t outleft;
936 if (freemem_size < sizeof (size_t))
937 goto resize_freemem;
939 outleft = freemem_size - sizeof (size_t);
940 if (iconv (domain->conv,
941 (ICONV_CONST char **) &inptr, &inleft,
942 &outptr, &outleft)
943 != (size_t) (-1))
945 outbuf = (unsigned char *) outptr;
946 break;
948 if (errno != E2BIG)
950 __libc_lock_unlock (lock);
951 goto converted;
953 # endif
954 # endif
956 resize_freemem:
957 /* We must allocate a new buffer or resize the old one. */
/* NOTE(review): in the _LIBC branch below transmem_list->next is read
   after realloc () was called on transmem_list -- confirm that the old
   pointer may still be dereferenced there. */
958 if (malloc_count > 0)
960 ++malloc_count;
961 freemem_size = malloc_count * INITIAL_BLOCK_SIZE;
962 newmem = (transmem_block_t *) realloc (transmem_list,
963 freemem_size);
964 # ifdef _LIBC
965 if (newmem != NULL)
966 transmem_list = transmem_list->next;
967 else
969 struct transmem_list *old = transmem_list;
971 transmem_list = transmem_list->next;
972 free (old);
974 # endif
976 else
978 malloc_count = 1;
979 freemem_size = INITIAL_BLOCK_SIZE;
980 newmem = (transmem_block_t *) malloc (freemem_size);
982 if (__builtin_expect (newmem == NULL, 0))
984 freemem = NULL;
985 freemem_size = 0;
986 __libc_lock_unlock (lock);
987 goto converted;
990 # ifdef _LIBC
991 /* Add the block to the list of blocks we have to free
992 at some point. */
993 newmem->next = transmem_list;
994 transmem_list = newmem;
996 freemem = newmem->data;
997 freemem_size -= offsetof (struct transmem_list, data);
998 # else
999 transmem_list = newmem;
1000 freemem = newmem;
1001 # endif
1003 outbuf = freemem + sizeof (size_t);
1006 /* We have now in our buffer a converted string. Put this
1007 into the table of conversions. */
1008 *(size_t *) freemem = outbuf - freemem - sizeof (size_t);
1009 domain->conv_tab[act] = (char *) freemem;
1010 /* Shrink freemem, but keep it aligned. */
1011 freemem_size -= outbuf - freemem;
1012 freemem = outbuf;
1013 freemem += freemem_size & (alignof (size_t) - 1);
1014 freemem_size = freemem_size & ~ (alignof (size_t) - 1);
1016 __libc_lock_unlock (lock);
1019 /* Now domain->conv_tab[act] contains the translation of all
1020 the plural variants. */
1021 result = domain->conv_tab[act] + sizeof (size_t);
1022 resultlen = *(size_t *) domain->conv_tab[act];
1025 converted:
1026 /* The result string is converted. */
1028 #endif /* _LIBC || HAVE_ICONV */
1030 *lengthp = resultlen;
1031 return result;
1035 /* Look up a plural variant. */
1036 static char *
1037 internal_function
1038 plural_lookup (domain, n, translation, translation_len)
1039 struct loaded_l10nfile *domain;
1040 unsigned long int n;
1041 const char *translation;
1042 size_t translation_len;
1044 struct loaded_domain *domaindata = (struct loaded_domain *) domain->data;
1045 unsigned long int index;
1046 const char *p;
1048 index = plural_eval (domaindata->plural, n);
1049 if (index >= domaindata->nplurals)
1050 /* This should never happen. It means the plural expression and the
1051 given maximum value do not match. */
1052 index = 0;
1054 /* Skip INDEX strings at TRANSLATION. */
1055 p = translation;
1056 while (index-- > 0)
1058 #ifdef _LIBC
1059 p = __rawmemchr (p, '\0');
1060 #else
1061 p = strchr (p, '\0');
1062 #endif
1063 /* And skip over the NUL byte. */
1064 p++;
1066 if (p >= translation + translation_len)
1067 /* This should never happen. It means the plural expression
1068 evaluated to a value larger than the number of variants
1069 available for MSGID1. */
1070 return (char *) translation;
1072 return (char *) p;
1075 #ifndef _LIBC
1076 /* Return string representation of locale CATEGORY. */
1077 static const char *
1078 internal_function
1079 category_to_name (category)
1080 int category;
1082 const char *retval;
1084 switch (category)
1086 #ifdef LC_COLLATE
1087 case LC_COLLATE:
1088 retval = "LC_COLLATE";
1089 break;
1090 #endif
1091 #ifdef LC_CTYPE
1092 case LC_CTYPE:
1093 retval = "LC_CTYPE";
1094 break;
1095 #endif
1096 #ifdef LC_MONETARY
1097 case LC_MONETARY:
1098 retval = "LC_MONETARY";
1099 break;
1100 #endif
1101 #ifdef LC_NUMERIC
1102 case LC_NUMERIC:
1103 retval = "LC_NUMERIC";
1104 break;
1105 #endif
1106 #ifdef LC_TIME
1107 case LC_TIME:
1108 retval = "LC_TIME";
1109 break;
1110 #endif
1111 #ifdef LC_MESSAGES
1112 case LC_MESSAGES:
1113 retval = "LC_MESSAGES";
1114 break;
1115 #endif
1116 #ifdef LC_RESPONSE
1117 case LC_RESPONSE:
1118 retval = "LC_RESPONSE";
1119 break;
1120 #endif
1121 #ifdef LC_ALL
1122 case LC_ALL:
1123 /* This might not make sense but is perhaps better than any other
1124 value. */
1125 retval = "LC_ALL";
1126 break;
1127 #endif
1128 default:
1129 /* If you have a better idea for a default value let me know. */
1130 retval = "LC_XXX";
1133 return retval;
1135 #endif
1137 /* Guess value of current locale from value of the environment variables. */
1138 static const char *
1139 internal_function
1140 guess_category_value (category, categoryname)
1141 int category;
1142 const char *categoryname;
1144 const char *language;
1145 const char *retval;
1147 /* The highest priority value is the `LANGUAGE' environment
1148 variable. But we don't use the value if the currently selected
1149 locale is the C locale. This is a GNU extension. */
1150 language = getenv ("LANGUAGE");
1151 if (language != NULL && language[0] == '\0')
1152 language = NULL;
1154 /* We have to proceed with the POSIX methods of looking to `LC_ALL',
1155 `LC_xxx', and `LANG'. On some systems this can be done by the
1156 `setlocale' function itself. */
1157 #ifdef _LIBC
1158 retval = __current_locale_name (category);
1159 #else
1160 retval = _nl_locale_name (category, categoryname);
1161 #endif
1163 /* Ignore LANGUAGE if the locale is set to "C" because
1164 1. "C" locale usually uses the ASCII encoding, and most international
1165 messages use non-ASCII characters. These characters get displayed
1166 as question marks (if using glibc's iconv()) or as invalid 8-bit
1167 characters (because other iconv()s refuse to convert most non-ASCII
1168 characters to ASCII). In any case, the output is ugly.
1169 2. The precise output of some programs in the "C" locale is specified
1170 by POSIX and should not depend on environment variables like
1171 "LANGUAGE". We allow such programs to use gettext(). */
1172 return language != NULL && strcmp (retval, "C") != 0 ? language : retval;
1175 /* @@ begin of epilog @@ */
1177 /* We don't want libintl.a to depend on any other library. So we
1178 avoid the non-standard function stpcpy. In GNU C Library this
1179 function is available, though. Also allow the symbol HAVE_STPCPY
1180 to be defined. */
1181 #if !_LIBC && !HAVE_STPCPY
/* Copy the string SRC, including its terminating NUL, to DEST and
   return a pointer to the NUL byte written into DEST.  */
static char *
stpcpy (dest, src)
     char *dest;
     const char *src;
{
  while ((*dest++ = *src++) != '\0')
    /* Do nothing. */ ;
  /* DEST was advanced past the NUL; step back onto it.  */
  return dest - 1;
}
1191 #endif
1193 #if !_LIBC && !HAVE_MEMPCPY
/* Copy N bytes from SRC to DEST and return a pointer to the byte
   following the last byte written.  */
static void *
mempcpy (dest, src, n)
     void *dest;
     const void *src;
     size_t n;
{
  return (void *) ((char *) memcpy (dest, src, n) + n);
}
1202 #endif
1205 #ifdef _LIBC
1206 /* If we want to free all resources we have to do some work at
1207 program's end. */
1208 libc_freeres_fn (free_mem)
1210 void *old;
1212 while (_nl_domain_bindings != NULL)
1214 struct binding *oldp = _nl_domain_bindings;
1215 _nl_domain_bindings = _nl_domain_bindings->next;
1216 if (oldp->dirname != INTUSE(_nl_default_dirname))
1217 /* Yes, this is a pointer comparison. */
1218 free (oldp->dirname);
1219 free (oldp->codeset);
1220 free (oldp);
1223 if (_nl_current_default_domain != _nl_default_default_domain)
1224 /* Yes, again a pointer comparison. */
1225 free ((char *) _nl_current_default_domain);
1227 /* Remove the search tree with the known translations. */
1228 __tdestroy (root, free);
1229 root = NULL;
1231 while (transmem_list != NULL)
1233 old = transmem_list;
1234 transmem_list = transmem_list->next;
1235 free (old);
1238 #endif