1 /* Implementation of the internal dcigettext function.
2 Copyright (C) 1995-2005, 2006, 2007 Free Software Foundation, Inc.
3 This file is part of the GNU C Library.
5 The GNU C Library is free software; you can redistribute it and/or
6 modify it under the terms of the GNU Lesser General Public
7 License as published by the Free Software Foundation; either
8 version 2.1 of the License, or (at your option) any later version.
10 The GNU C Library is distributed in the hope that it will be useful,
11 but WITHOUT ANY WARRANTY; without even the implied warranty of
12 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 Lesser General Public License for more details.
15 You should have received a copy of the GNU Lesser General Public
16 License along with the GNU C Library; if not, write to the Free
17 Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
20 /* Tell glibc's <string.h> to provide a prototype for mempcpy().
21 This must come before <config.h> because <config.h> may include
22 <features.h>, and once <features.h> has been included, it's too late. */
24 # define _GNU_SOURCE 1
31 #include <sys/types.h>
34 # define alloca __builtin_alloca
35 # define HAVE_ALLOCA 1
37 # if defined HAVE_ALLOCA_H || defined _LIBC
55 # define __set_errno(val) errno = (val)
62 #if defined HAVE_UNISTD_H || defined _LIBC
68 #if defined HAVE_SYS_PARAM_H || defined _LIBC
69 # include <sys/param.h>
73 #include "plural-exp.h"
77 # include "libgnuintl.h"
79 #include "hash-string.h"
81 /* Thread safety. */
83 # include <bits/libc-lock.h>
85 /* Provide dummy implementation if this is outside glibc. */
86 # define __libc_lock_define_initialized(CLASS, NAME)
87 # define __libc_lock_lock(NAME)
88 # define __libc_lock_unlock(NAME)
89 # define __libc_rwlock_define_initialized(CLASS, NAME)
90 # define __libc_rwlock_rdlock(NAME)
91 # define __libc_rwlock_unlock(NAME)
94 /* Alignment of types. */
95 #if defined __GNUC__ && __GNUC__ >= 2
96 # define alignof(TYPE) __alignof__ (TYPE)
98 # define alignof(TYPE) \
99 ((int) &((struct { char dummy1; TYPE dummy2; } *) 0)->dummy2)
102 /* The internal variables in the standalone libintl.a must have different
103 names than the internal variables in GNU libc, otherwise programs
104 using libintl.a cannot be linked statically. */
106 # define _nl_default_default_domain libintl_nl_default_default_domain
107 # define _nl_current_default_domain libintl_nl_current_default_domain
108 # define _nl_default_dirname libintl_nl_default_dirname
109 # define _nl_domain_bindings libintl_nl_domain_bindings
112 /* Some compilers, like SunOS4 cc, don't have offsetof in <stddef.h>. */
114 # define offsetof(type,ident) ((size_t)&(((type*)0)->ident))
117 /* @@ end of prolog @@ */
120 /* Rename the non ANSI C functions. This is required by the standard
121 because some ANSI C functions will require linking with this object
122 file and the name space must not be polluted. */
123 # define getcwd __getcwd
125 # define stpcpy __stpcpy
127 # define tfind __tfind
129 # if !defined HAVE_GETCWD
131 # define getcwd(buf, max) getwd (buf)
136 static char *stpcpy
PARAMS ((char *dest
, const char *src
));
138 # ifndef HAVE_MEMPCPY
139 static void *mempcpy
PARAMS ((void *dest
, const void *src
, size_t n
));
143 /* Amount to increase buffer size by in each try. */
146 /* The following is from pathmax.h. */
147 /* Non-POSIX BSD systems might have gcc's limits.h, which doesn't define
148 PATH_MAX but might cause redefinition warnings when sys/param.h is
149 later included (as on MORE/BSD 4.3). */
150 #if defined _POSIX_VERSION || (defined HAVE_LIMITS_H && !defined __GNUC__)
154 #ifndef _POSIX_PATH_MAX
155 # define _POSIX_PATH_MAX 255
158 #if !defined PATH_MAX && defined _PC_PATH_MAX
159 # define PATH_MAX (pathconf ("/", _PC_PATH_MAX) < 1 ? 1024 : pathconf ("/", _PC_PATH_MAX))
162 /* Don't include sys/param.h if it already has been. */
163 #if defined HAVE_SYS_PARAM_H && !defined PATH_MAX && !defined MAXPATHLEN
164 # include <sys/param.h>
167 #if !defined PATH_MAX && defined MAXPATHLEN
168 # define PATH_MAX MAXPATHLEN
172 # define PATH_MAX _POSIX_PATH_MAX
175 /* Whether to support different locales in different threads. */
176 #if defined _LIBC || HAVE_NL_LOCALE_NAME
177 # define HAVE_PER_THREAD_LOCALE
180 /* This is the type used for the search tree where known translations are stored. */
182 struct known_translation_t
184 /* Domain in which to search. */
185 const char *domainname
;
190 #ifdef HAVE_PER_THREAD_LOCALE
191 /* Name of the relevant locale category, or "" for the global locale. */
192 const char *localename
;
195 /* State of the catalog counter at the point the string was found. */
198 /* Catalog where the string was found. */
199 struct loaded_l10nfile
*domain
;
201 /* And finally the translation. */
202 const char *translation
;
203 size_t translation_length
;
205 /* Pointer to the string in question. */
209 /* Root of the search tree with known translations. We can use this
210 only if the system provides the `tsearch' function family. */
211 #if defined HAVE_TSEARCH || defined _LIBC
217 # define tsearch __tsearch
220 /* Function to compare two entries in the table of known translations. */
221 static int transcmp
PARAMS ((const void *p1
, const void *p2
));
227 const struct known_translation_t
*s1
;
228 const struct known_translation_t
*s2
;
231 s1
= (const struct known_translation_t
*) p1
;
232 s2
= (const struct known_translation_t
*) p2
;
234 result
= strcmp (s1
->msgid
, s2
->msgid
);
237 result
= strcmp (s1
->domainname
, s2
->domainname
);
240 #ifdef HAVE_PER_THREAD_LOCALE
241 result
= strcmp (s1
->localename
, s2
->localename
);
244 /* We compare the category last (though this is the cheapest
245 operation) since it is hopefully always the same (namely LC_MESSAGES). */
247 result
= s1
->category
- s2
->category
;
255 /* Name of the default domain used for gettext(3) prior to any call to
256 textdomain(3). The default value for this is "messages". */
257 const char _nl_default_default_domain
[] attribute_hidden
= "messages";
259 /* Value used as the default domain for gettext(3). */
260 const char *_nl_current_default_domain attribute_hidden
261 = _nl_default_default_domain
;
263 /* Contains the default location of the message catalogs. */
266 extern const char _nl_default_dirname
[];
267 libc_hidden_proto (_nl_default_dirname
)
269 const char _nl_default_dirname
[] = LOCALEDIR
;
271 libc_hidden_data_def (_nl_default_dirname
)
274 /* List with bindings of specific domains created by bindtextdomain() calls. */
276 struct binding
*_nl_domain_bindings
;
278 /* Prototypes for local functions. */
279 static char *plural_lookup
PARAMS ((struct loaded_l10nfile
*domain
,
281 const char *translation
,
282 size_t translation_len
))
284 static const char *guess_category_value
PARAMS ((int category
,
285 const char *categoryname
))
288 # include "../locale/localeinfo.h"
289 # define category_to_name(category) \
290 _nl_category_names.str + _nl_category_name_idxs[category]
292 static const char *category_to_name
PARAMS ((int category
)) internal_function
;
296 /* For those losing systems which don't have `alloca' we have to add
297 some additional code emulating it. */
299 /* Nothing has to be done. */
300 # define freea(p) /* nothing */
301 # define ADD_BLOCK(list, address) /* nothing */
302 # define FREE_BLOCKS(list) /* nothing */
307 struct block_list
*next
;
309 # define ADD_BLOCK(list, addr) \
311 struct block_list *newp = (struct block_list *) malloc (sizeof (*newp)); \
312 /* If we cannot get a free block we cannot add the new element to \
314 if (newp != NULL) { \
315 newp->address = (addr); \
316 newp->next = (list); \
320 # define FREE_BLOCKS(list) \
322 while (list != NULL) { \
323 struct block_list *old = list; \
325 free (old->address); \
330 # define alloca(size) (malloc (size))
331 # define freea(p) free (p)
332 #endif /* have alloca */
336 /* List of blocks allocated for translations. */
337 typedef struct transmem_list
339 struct transmem_list
*next
;
342 static struct transmem_list
*transmem_list
;
344 typedef unsigned char transmem_block_t
;
346 #if defined _LIBC || HAVE_ICONV
347 static const char *get_output_charset
PARAMS ((struct binding
*domainbinding
))
352 /* Names for the libintl functions are a problem. They must not clash
353 with existing names and they should follow ANSI C. But this source
354 code is also used in the GNU C Library, where the names have a __
355 prefix. So we have to make a distinction here. */
357 # define DCIGETTEXT __dcigettext
359 # define DCIGETTEXT libintl_dcigettext
362 /* Lock variable to protect the global data in the gettext implementation. */
364 __libc_rwlock_define_initialized (, _nl_state_lock attribute_hidden
)
367 /* Checking whether the binary runs SUID must be done, and glibc provides
368 easier methods for this; therefore we make a distinction here. */
370 # define ENABLE_SECURE __libc_enable_secure
371 # define DETERMINE_SECURE
379 # ifndef HAVE_GETEUID
380 # define geteuid() getuid()
382 # ifndef HAVE_GETEGID
383 # define getegid() getgid()
385 static int enable_secure
;
386 # define ENABLE_SECURE (enable_secure == 1)
387 # define DETERMINE_SECURE \
388 if (enable_secure == 0) \
390 if (getuid () != geteuid () || getgid () != getegid ()) \
393 enable_secure = -1; \
397 /* Get the function to evaluate the plural expression. */
398 #include "plural-eval.c"
400 /* Look up MSGID in the DOMAINNAME message catalog for the current
401 CATEGORY locale and, if PLURAL is nonzero, search over string
402 depending on the plural form determined by N. */
404 DCIGETTEXT (domainname
, msgid1
, msgid2
, plural
, n
, category
)
405 const char *domainname
;
413 struct block_list
*block_list
= NULL
;
415 struct loaded_l10nfile
*domain
;
416 struct binding
*binding
;
417 const char *categoryname
;
418 const char *categoryvalue
;
419 char *dirname
, *xdomainname
;
424 #if defined HAVE_TSEARCH || defined _LIBC
425 struct known_translation_t
*search
;
426 struct known_translation_t
**foundp
= NULL
;
428 # ifdef HAVE_PER_THREAD_LOCALE
429 const char *localename
;
432 size_t domainname_len
;
434 /* If no real MSGID is given return NULL. */
439 if (category
< 0 || category
>= __LC_LAST
|| category
== LC_ALL
)
443 /* Use the Germanic plural rule. */
444 : n
== 1 ? (char *) msgid1
: (char *) msgid2
);
447 __libc_rwlock_rdlock (_nl_state_lock
);
449 /* If DOMAINNAME is NULL, we are interested in the default domain. If
450 CATEGORY is not LC_MESSAGES this might not make much sense but the
451 definition left this undefined. */
452 if (domainname
== NULL
)
453 domainname
= _nl_current_default_domain
;
455 #if defined HAVE_TSEARCH || defined _LIBC
456 msgid_len
= strlen (msgid1
) + 1;
458 /* Try to find the translation among those which we found at some time. */
460 search
= (struct known_translation_t
*)
461 alloca (offsetof (struct known_translation_t
, msgid
) + msgid_len
);
462 memcpy (search
->msgid
, msgid1
, msgid_len
);
463 search
->domainname
= domainname
;
464 search
->category
= category
;
465 # ifdef HAVE_PER_THREAD_LOCALE
467 localename
= __current_locale_name (category
);
469 search
->localename
= localename
;
472 /* Since tfind/tsearch manage a balanced tree, concurrent tfind and
473 tsearch calls can be fatal. */
474 __libc_rwlock_define_initialized (static, tree_lock
);
475 __libc_rwlock_rdlock (tree_lock
);
477 foundp
= (struct known_translation_t
**) tfind (search
, &root
, transcmp
);
479 __libc_rwlock_unlock (tree_lock
);
482 if (foundp
!= NULL
&& (*foundp
)->counter
== _nl_msg_cat_cntr
)
484 /* Now deal with plural. */
486 retval
= plural_lookup ((*foundp
)->domain
, n
, (*foundp
)->translation
,
487 (*foundp
)->translation_length
);
489 retval
= (char *) (*foundp
)->translation
;
491 __libc_rwlock_unlock (_nl_state_lock
);
496 /* Preserve the `errno' value. */
499 /* See whether this is a SUID binary or not. */
502 /* First find matching binding. */
503 for (binding
= _nl_domain_bindings
; binding
!= NULL
; binding
= binding
->next
)
505 int compare
= strcmp (domainname
, binding
->domainname
);
511 /* It is not in the list. */
518 dirname
= (char *) _nl_default_dirname
;
519 else if (binding
->dirname
[0] == '/')
520 dirname
= binding
->dirname
;
523 /* We have a relative path. Make it absolute now. */
524 size_t dirname_len
= strlen (binding
->dirname
) + 1;
528 path_max
= (unsigned int) PATH_MAX
;
529 path_max
+= 2; /* The getcwd docs say to do this. */
533 dirname
= (char *) alloca (path_max
+ dirname_len
);
534 ADD_BLOCK (block_list
, dirname
);
537 ret
= getcwd (dirname
, path_max
);
538 if (ret
!= NULL
|| errno
!= ERANGE
)
541 path_max
+= path_max
/ 2;
542 path_max
+= PATH_INCR
;
547 /* We cannot get the current working directory. Don't signal an
548 error but simply return the default string. */
549 FREE_BLOCKS (block_list
);
550 __libc_rwlock_unlock (_nl_state_lock
);
551 __set_errno (saved_errno
);
554 /* Use the Germanic plural rule. */
555 : n
== 1 ? (char *) msgid1
: (char *) msgid2
);
558 stpcpy (stpcpy (strchr (dirname
, '\0'), "/"), binding
->dirname
);
561 /* Now determine the symbolic name of CATEGORY and its value. */
562 categoryname
= category_to_name (category
);
563 categoryvalue
= guess_category_value (category
, categoryname
);
565 domainname_len
= strlen (domainname
);
566 xdomainname
= (char *) alloca (strlen (categoryname
)
567 + domainname_len
+ 5);
568 ADD_BLOCK (block_list
, xdomainname
);
570 stpcpy (mempcpy (stpcpy (stpcpy (xdomainname
, categoryname
), "/"),
571 domainname
, domainname_len
),
574 /* Creating working area. */
575 single_locale
= (char *) alloca (strlen (categoryvalue
) + 1);
576 ADD_BLOCK (block_list
, single_locale
);
579 /* Search for the given string. This is a loop because we perhaps
580 got an ordered list of languages to consider for the translation. */
583 /* Make CATEGORYVALUE point to the next element of the list. */
584 while (categoryvalue
[0] != '\0' && categoryvalue
[0] == ':')
586 if (categoryvalue
[0] == '\0')
588 /* The whole contents of CATEGORYVALUE has been searched but
589 no valid entry has been found. We solve this situation
590 by implicitly appending a "C" entry, i.e. no translation will take place. */
592 single_locale
[0] = 'C';
593 single_locale
[1] = '\0';
597 char *cp
= single_locale
;
598 while (categoryvalue
[0] != '\0' && categoryvalue
[0] != ':')
599 *cp
++ = *categoryvalue
++;
602 /* When this is a SUID binary we must not allow accessing files
603 outside the dedicated directories. */
604 if (ENABLE_SECURE
&& strchr (single_locale
, '/') != NULL
)
605 /* Ignore this entry. */
609 /* If the current locale value is C (or POSIX) we don't load a
610 domain. Return the MSGID. */
611 if (strcmp (single_locale
, "C") == 0
612 || strcmp (single_locale
, "POSIX") == 0)
615 FREE_BLOCKS (block_list
);
616 __libc_rwlock_unlock (_nl_state_lock
);
617 __set_errno (saved_errno
);
620 /* Use the Germanic plural rule. */
621 : n
== 1 ? (char *) msgid1
: (char *) msgid2
);
625 /* Find structure describing the message catalog matching the
626 DOMAINNAME and CATEGORY. */
627 domain
= _nl_find_domain (dirname
, single_locale
, xdomainname
, binding
);
631 retval
= _nl_find_msg (domain
, binding
, msgid1
, 1, &retlen
);
637 for (cnt
= 0; domain
->successor
[cnt
] != NULL
; ++cnt
)
639 retval
= _nl_find_msg (domain
->successor
[cnt
], binding
,
644 domain
= domain
->successor
[cnt
];
650 /* Returning -1 means that some resource problem exists
651 (likely memory) and that the strings could not be
652 converted. Return the original strings. */
653 if (__builtin_expect (retval
== (char *) -1, 0))
658 /* Found the translation of MSGID1 in domain DOMAIN:
659 starting at RETVAL, RETLEN bytes. */
660 FREE_BLOCKS (block_list
);
661 #if defined HAVE_TSEARCH || defined _LIBC
664 /* Create a new entry and add it to the search tree. */
666 struct known_translation_t
*newp
;
668 size
= offsetof (struct known_translation_t
, msgid
)
669 + msgid_len
+ domainname_len
+ 1;
670 # ifdef HAVE_PER_THREAD_LOCALE
671 size
+= strlen (localename
) + 1;
673 newp
= (struct known_translation_t
*) malloc (size
);
676 char *new_domainname
;
677 # ifdef HAVE_PER_THREAD_LOCALE
678 char *new_localename
;
681 new_domainname
= mempcpy (newp
->msgid
, msgid1
, msgid_len
);
682 memcpy (new_domainname
, domainname
, domainname_len
+ 1);
683 # ifdef HAVE_PER_THREAD_LOCALE
684 new_localename
= new_domainname
+ domainname_len
+ 1;
685 strcpy (new_localename
, localename
);
687 newp
->domainname
= new_domainname
;
688 newp
->category
= category
;
689 # ifdef HAVE_PER_THREAD_LOCALE
690 newp
->localename
= new_localename
;
692 newp
->counter
= _nl_msg_cat_cntr
;
693 newp
->domain
= domain
;
694 newp
->translation
= retval
;
695 newp
->translation_length
= retlen
;
697 __libc_rwlock_wrlock (tree_lock
);
699 /* Insert the entry in the search tree. */
700 foundp
= (struct known_translation_t
**)
701 tsearch (newp
, &root
, transcmp
);
703 __libc_rwlock_unlock (tree_lock
);
706 || __builtin_expect (*foundp
!= newp
, 0))
707 /* The insert failed. */
713 /* We can update the existing entry. */
714 (*foundp
)->counter
= _nl_msg_cat_cntr
;
715 (*foundp
)->domain
= domain
;
716 (*foundp
)->translation
= retval
;
717 (*foundp
)->translation_length
= retlen
;
720 __set_errno (saved_errno
);
722 /* Now deal with plural. */
724 retval
= plural_lookup (domain
, n
, retval
, retlen
);
726 __libc_rwlock_unlock (_nl_state_lock
);
737 _nl_find_msg (domain_file
, domainbinding
, msgid
, convert
, lengthp
)
738 struct loaded_l10nfile
*domain_file
;
739 struct binding
*domainbinding
;
744 struct loaded_domain
*domain
;
750 if (domain_file
->decided
<= 0)
751 _nl_load_domain (domain_file
, domainbinding
);
753 if (domain_file
->data
== NULL
)
756 domain
= (struct loaded_domain
*) domain_file
->data
;
758 nstrings
= domain
->nstrings
;
760 /* Locate the MSGID and its translation. */
761 if (domain
->hash_tab
!= NULL
)
763 /* Use the hashing table. */
764 nls_uint32 len
= strlen (msgid
);
765 nls_uint32 hash_val
= __hash_string (msgid
);
766 nls_uint32 idx
= hash_val
% domain
->hash_size
;
767 nls_uint32 incr
= 1 + (hash_val
% (domain
->hash_size
- 2));
772 W (domain
->must_swap_hash_tab
, domain
->hash_tab
[idx
]);
775 /* Hash table entry is empty. */
780 /* Compare msgid with the original string at index nstr.
781 We compare the lengths with >=, not ==, because plural entries
782 are represented by strings with an embedded NUL. */
784 ? W (domain
->must_swap
, domain
->orig_tab
[nstr
].length
) >= len
786 domain
->data
+ W (domain
->must_swap
,
787 domain
->orig_tab
[nstr
].offset
))
789 : domain
->orig_sysdep_tab
[nstr
- nstrings
].length
> len
791 domain
->orig_sysdep_tab
[nstr
- nstrings
].pointer
)
798 if (idx
>= domain
->hash_size
- incr
)
799 idx
-= domain
->hash_size
- incr
;
807 /* Try the default method: binary search in the sorted array of messages. */
817 act
= (bottom
+ top
) / 2;
818 cmp_val
= strcmp (msgid
, (domain
->data
819 + W (domain
->must_swap
,
820 domain
->orig_tab
[act
].offset
)));
823 else if (cmp_val
> 0)
828 /* No translation was found. */
833 /* The translation was found at index ACT. If we have to convert the
834 string to use a different character set, this is the time. */
838 (domain
->data
+ W (domain
->must_swap
, domain
->trans_tab
[act
].offset
));
839 resultlen
= W (domain
->must_swap
, domain
->trans_tab
[act
].length
) + 1;
843 result
= (char *) domain
->trans_sysdep_tab
[act
- nstrings
].pointer
;
844 resultlen
= domain
->trans_sysdep_tab
[act
- nstrings
].length
;
847 #if defined _LIBC || HAVE_ICONV
850 /* We are supposed to do a conversion. */
851 const char *encoding
= get_output_charset (domainbinding
);
853 /* Search whether a table with converted translations for this
854 encoding has already been allocated. */
855 size_t nconversions
= domain
->nconversions
;
856 struct converted_domain
*convd
= NULL
;
859 for (i
= nconversions
; i
> 0; )
862 if (strcmp (domain
->conversions
[i
].encoding
, encoding
) == 0)
864 convd
= &domain
->conversions
[i
];
871 /* Allocate a table for the converted translations for this encoding. */
873 struct converted_domain
*new_conversions
=
874 (struct converted_domain
*)
875 realloc (domain
->conversions
,
876 (nconversions
+ 1) * sizeof (struct converted_domain
));
878 if (__builtin_expect (new_conversions
== NULL
, 0))
879 /* Nothing we can do, no more memory. We cannot use the
880 translation because it might be encoded incorrectly. */
883 domain
->conversions
= new_conversions
;
885 /* Copy the 'encoding' string to permanent storage. */
886 encoding
= strdup (encoding
);
887 if (__builtin_expect (encoding
== NULL
, 0))
888 /* Nothing we can do, no more memory. We cannot use the
889 translation because it might be encoded incorrectly. */
892 convd
= &new_conversions
[nconversions
];
893 convd
->encoding
= encoding
;
895 /* Find out about the character set the file is encoded with.
896 This can be found (in textual form) in the entry "". If this
897 entry does not exist or if this does not contain the 'charset='
898 information, we will assume the charset matches the one the
899 current locale and we don't have to perform any conversion. */
901 convd
->conv
= (__gconv_t
) -1;
904 convd
->conv
= (iconv_t
) -1;
911 /* Get the header entry. This is a recursion, but it doesn't
912 reallocate domain->conversions because we pass convert = 0. */
914 _nl_find_msg (domain_file
, domainbinding
, "", 0, &nullentrylen
);
916 if (nullentry
!= NULL
)
918 const char *charsetstr
;
920 charsetstr
= strstr (nullentry
, "charset=");
921 if (charsetstr
!= NULL
)
925 const char *outcharset
;
927 charsetstr
+= strlen ("charset=");
928 len
= strcspn (charsetstr
, " \t\n");
930 charset
= (char *) alloca (len
+ 1);
931 # if defined _LIBC || HAVE_MEMPCPY
932 *((char *) mempcpy (charset
, charsetstr
, len
)) = '\0';
934 memcpy (charset
, charsetstr
, len
);
938 outcharset
= encoding
;
941 /* We always want to use transliteration. */
942 outcharset
= norm_add_slashes (outcharset
, "TRANSLIT");
943 charset
= norm_add_slashes (charset
, "");
944 int r
= __gconv_open (outcharset
, charset
, &convd
->conv
,
946 if (__builtin_expect (r
!= __GCONV_OK
, 0))
948 /* If the output encoding is the same there is
949 nothing to do. Otherwise do not use the
950 translation at all. */
951 if (__builtin_expect (r
!= __GCONV_NULCONV
, 1))
953 free ((char *) encoding
);
957 convd
->conv
= (__gconv_t
) -1;
961 /* When using GNU libc >= 2.2 or GNU libiconv >= 1.5,
962 we want to use transliteration. */
963 # if (__GLIBC__ == 2 && __GLIBC_MINOR__ >= 2) || __GLIBC__ > 2 \
964 || _LIBICONV_VERSION >= 0x0105
965 if (strchr (outcharset
, '/') == NULL
)
969 len
= strlen (outcharset
);
970 tmp
= (char *) alloca (len
+ 10 + 1);
971 memcpy (tmp
, outcharset
, len
);
972 memcpy (tmp
+ len
, "//TRANSLIT", 10 + 1);
975 convd
->conv
= iconv_open (outcharset
, charset
);
981 convd
->conv
= iconv_open (outcharset
, charset
);
989 convd
->conv_tab
= NULL
;
990 /* Here domain->conversions is still == new_conversions. */
991 domain
->nconversions
++;
996 convd
->conv
!= (__gconv_t
) -1
999 convd
->conv
!= (iconv_t
) -1
1004 /* We are supposed to do a conversion. First allocate an
1005 appropriate table with the same structure as the table
1006 of translations in the file, where we can put the pointers
1007 to the converted strings in.
1008 There is a slight complication with plural entries. They
1009 are represented by consecutive NUL terminated strings. We
1010 handle this case by converting RESULTLEN bytes, including NULs. */
1013 if (convd
->conv_tab
== NULL
1014 && ((convd
->conv_tab
=
1015 (char **) calloc (nstrings
+ domain
->n_sysdep_strings
,
1018 /* Mark that we didn't succeed allocating a table. */
1019 convd
->conv_tab
= (char **) -1;
1021 if (__builtin_expect (convd
->conv_tab
== (char **) -1, 0))
1022 /* Nothing we can do, no more memory. We cannot use the
1023 translation because it might be encoded incorrectly. */
1026 if (convd
->conv_tab
[act
] == NULL
)
1028 /* We haven't used this string so far, so it is not
1029 translated yet. Do this now. */
1030 /* We use somewhat more efficient memory handling:
1031 we always allocate larger blocks which get used over
1032 time. This is faster than many small allocations. */
1033 __libc_lock_define_initialized (static, lock
)
1034 # define INITIAL_BLOCK_SIZE 4080
1035 static unsigned char *freemem
;
1036 static size_t freemem_size
;
1038 const unsigned char *inbuf
;
1039 unsigned char *outbuf
;
1042 transmem_block_t
*transmem_list
= NULL
;
1045 __libc_lock_lock (lock
);
1047 inbuf
= (const unsigned char *) result
;
1048 outbuf
= freemem
+ sizeof (size_t);
1053 transmem_block_t
*newmem
;
1055 size_t non_reversible
;
1058 if (freemem_size
< sizeof (size_t))
1059 goto resize_freemem
;
1061 res
= __gconv (convd
->conv
,
1062 &inbuf
, inbuf
+ resultlen
,
1064 outbuf
+ freemem_size
- sizeof (size_t),
1067 if (res
== __GCONV_OK
|| res
== __GCONV_EMPTY_INPUT
)
1070 if (res
!= __GCONV_FULL_OUTPUT
)
1072 /* We should not use the translation at all, it
1073 is incorrectly encoded. */
1074 __libc_lock_unlock (lock
);
1078 inbuf
= (const unsigned char *) result
;
1081 const char *inptr
= (const char *) inbuf
;
1082 size_t inleft
= resultlen
;
1083 char *outptr
= (char *) outbuf
;
1086 if (freemem_size
< sizeof (size_t))
1087 goto resize_freemem
;
1089 outleft
= freemem_size
- sizeof (size_t);
1090 if (iconv (convd
->conv
,
1091 (ICONV_CONST
char **) &inptr
, &inleft
,
1095 outbuf
= (unsigned char *) outptr
;
1100 __libc_lock_unlock (lock
);
1107 /* We must allocate a new buffer or resize the old one. */
1108 if (malloc_count
> 0)
1111 freemem_size
= malloc_count
* INITIAL_BLOCK_SIZE
;
1112 newmem
= (transmem_block_t
*) realloc (transmem_list
,
1116 transmem_list
= transmem_list
->next
;
1119 struct transmem_list
*old
= transmem_list
;
1121 transmem_list
= transmem_list
->next
;
1129 freemem_size
= INITIAL_BLOCK_SIZE
;
1130 newmem
= (transmem_block_t
*) malloc (freemem_size
);
1132 if (__builtin_expect (newmem
== NULL
, 0))
1136 __libc_lock_unlock (lock
);
1141 /* Add the block to the list of blocks we have to free at some point. */
1143 newmem
->next
= transmem_list
;
1144 transmem_list
= newmem
;
1146 freemem
= (unsigned char *) newmem
->data
;
1147 freemem_size
-= offsetof (struct transmem_list
, data
);
1149 transmem_list
= newmem
;
1153 outbuf
= freemem
+ sizeof (size_t);
1156 /* We have now in our buffer a converted string. Put this
1157 into the table of conversions. */
1158 *(size_t *) freemem
= outbuf
- freemem
- sizeof (size_t);
1159 convd
->conv_tab
[act
] = (char *) freemem
;
1160 /* Shrink freemem, but keep it aligned. */
1161 freemem_size
-= outbuf
- freemem
;
1163 freemem
+= freemem_size
& (alignof (size_t) - 1);
1164 freemem_size
= freemem_size
& ~ (alignof (size_t) - 1);
1166 __libc_lock_unlock (lock
);
1169 /* Now convd->conv_tab[act] contains the translation of all
1170 the plural variants. */
1171 result
= convd
->conv_tab
[act
] + sizeof (size_t);
1172 resultlen
= *(size_t *) convd
->conv_tab
[act
];
1176 /* The result string is converted. */
1178 #endif /* _LIBC || HAVE_ICONV */
1180 *lengthp
= resultlen
;
1185 /* Look up a plural variant. */
1188 plural_lookup (domain
, n
, translation
, translation_len
)
1189 struct loaded_l10nfile
*domain
;
1190 unsigned long int n
;
1191 const char *translation
;
1192 size_t translation_len
;
1194 struct loaded_domain
*domaindata
= (struct loaded_domain
*) domain
->data
;
1195 unsigned long int index
;
1198 index
= plural_eval (domaindata
->plural
, n
);
1199 if (index
>= domaindata
->nplurals
)
1200 /* This should never happen. It means the plural expression and the
1201 given maximum value do not match. */
1204 /* Skip INDEX strings at TRANSLATION. */
1209 p
= __rawmemchr (p
, '\0');
1211 p
= strchr (p
, '\0');
1213 /* And skip over the NUL byte. */
1216 if (p
>= translation
+ translation_len
)
1217 /* This should never happen. It means the plural expression
1218 evaluated to a value larger than the number of variants
1219 available for MSGID1. */
1220 return (char *) translation
;
1226 /* Return string representation of locale CATEGORY. */
1229 category_to_name (category
)
1238 retval
= "LC_COLLATE";
1243 retval
= "LC_CTYPE";
1248 retval
= "LC_MONETARY";
1253 retval
= "LC_NUMERIC";
1263 retval
= "LC_MESSAGES";
1268 retval
= "LC_RESPONSE";
1273 /* This might not make sense but is perhaps better than any other value. */
1279 /* If you have a better idea for a default value let me know. */
1287 /* Guess value of current locale from value of the environment variables. */
1290 guess_category_value (category
, categoryname
)
1292 const char *categoryname
;
1294 const char *language
;
1297 /* The highest priority value is the `LANGUAGE' environment
1298 variable. But we don't use the value if the currently selected
1299 locale is the C locale. This is a GNU extension. */
1300 language
= getenv ("LANGUAGE");
1301 if (language
!= NULL
&& language
[0] == '\0')
1304 /* We have to proceed with the POSIX methods of looking to `LC_ALL',
1305 `LC_xxx', and `LANG'. On some systems this can be done by the
1306 `setlocale' function itself. */
1308 retval
= __current_locale_name (category
);
1310 retval
= _nl_locale_name (category
, categoryname
);
1313 return language
!= NULL
&& strcmp (retval
, "C") != 0 ? language
: retval
;
1316 #if defined _LIBC || HAVE_ICONV
1317 /* Returns the output charset. */
1320 get_output_charset (domainbinding
)
1321 struct binding
*domainbinding
;
1323 /* The output charset should normally be determined by the locale. But
1324 sometimes the locale is not used or not correctly set up, so we provide
1325 a possibility for the user to override this: the OUTPUT_CHARSET
1326 environment variable. Moreover, the value specified through
1327 bind_textdomain_codeset overrides both. */
1328 if (domainbinding
!= NULL
&& domainbinding
->codeset
!= NULL
)
1329 return domainbinding
->codeset
;
1332 /* For speed reasons, we look at the value of OUTPUT_CHARSET only
1333 once. This is a user variable that is not supposed to change
1334 during a program run. */
1335 static char *output_charset_cache
;
1336 static int output_charset_cached
;
1338 if (!output_charset_cached
)
1340 const char *value
= getenv ("OUTPUT_CHARSET");
1342 if (value
!= NULL
&& value
[0] != '\0')
1344 size_t len
= strlen (value
) + 1;
1345 char *value_copy
= (char *) malloc (len
);
1347 if (value_copy
!= NULL
)
1348 memcpy (value_copy
, value
, len
);
1349 output_charset_cache
= value_copy
;
1351 output_charset_cached
= 1;
1354 if (output_charset_cache
!= NULL
)
1355 return output_charset_cache
;
1359 return _NL_CURRENT (LC_CTYPE
, CODESET
);
/* Prototype for locale_charset (), which is called immediately below.
   PARAMS takes its argument list wrapped in an extra pair of
   parentheses, so the declaration must close both of them. */
1362 extern const char *locale_charset
PARAMS ((void));
1363 return locale_charset ();
1371 /* @@ begin of epilog @@ */
1373 /* We don't want libintl.a to depend on any other library. So we
1374 avoid the non-standard function stpcpy. In GNU C Library this
1375 function is available, though. Also allow the symbol HAVE_STPCPY to be defined. */
1377 #if !_LIBC && !HAVE_STPCPY
1383 while ((*dest
++ = *src
++) != '\0')
1389 #if !_LIBC && !HAVE_MEMPCPY
1391 mempcpy (dest
, src
, n
)
1396 return (void *) ((char *) memcpy (dest
, src
, n
) + n
);
1402 /* If we want to free all resources we have to do some work at program's end. */
1404 libc_freeres_fn (free_mem
)
1408 while (_nl_domain_bindings
!= NULL
)
1410 struct binding
*oldp
= _nl_domain_bindings
;
1411 _nl_domain_bindings
= _nl_domain_bindings
->next
;
1412 if (oldp
->dirname
!= _nl_default_dirname
)
1413 /* Yes, this is a pointer comparison. */
1414 free (oldp
->dirname
);
1415 free (oldp
->codeset
);
1419 if (_nl_current_default_domain
!= _nl_default_default_domain
)
1420 /* Yes, again a pointer comparison. */
1421 free ((char *) _nl_current_default_domain
);
1423 /* Remove the search tree with the known translations. */
1424 __tdestroy (root
, free
);
1427 while (transmem_list
!= NULL
)
1429 old
= transmem_list
;
1430 transmem_list
= transmem_list
->next
;