1 /* Handle configuration data.
2 Copyright (C) 1997-2021 Free Software Foundation, Inc.
3 This file is part of the GNU C Library.
4 Contributed by Ulrich Drepper <drepper@cygnus.com>, 1997.
6 The GNU C Library is free software; you can redistribute it and/or
7 modify it under the terms of the GNU Lesser General Public
8 License as published by the Free Software Foundation; either
9 version 2.1 of the License, or (at your option) any later version.
11 The GNU C Library is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 Lesser General Public License for more details.
16 You should have received a copy of the GNU Lesser General Public
17 License along with the GNU C Library; if not, see
18 <https://www.gnu.org/licenses/>. */
29 #include <stdio_ext.h>
33 #include <sys/param.h>
34 #include <sys/types.h>
36 #include <libc-lock.h>
37 #include <gconv_int.h>
40 /* This is the default path where we look for module lists. */
41 static const char default_gconv_path
[] = GCONV_PATH
;
43 /* Type to represent search path. */
50 /* The path elements, as determined by the __gconv_get_path function.
51 All path elements end in a slash. */
52 struct path_elem
*__gconv_path_elem
;
53 /* Maximum length of a single path element in __gconv_path_elem. */
54 size_t __gconv_max_path_elem_len
;
56 /* We use the following struct if we couldn't allocate memory. */
57 static const struct path_elem empty_path_elem
= { NULL
, 0 };
59 /* Name of the file containing the module information in the directories
60 along the path. */
61 static const char gconv_conf_filename
[] = "gconv-modules";
62 static const char gconv_conf_dirname
[] = "gconv-modules.d";
64 /* Filename extension for the modules. */
66 # define MODULE_EXT ".so"
68 static const char gconv_module_ext
[] = MODULE_EXT
;
70 /* We have a few builtin transformations. */
71 static struct gconv_module builtin_modules
[] =
73 #define BUILTIN_TRANSFORMATION(From, To, Cost, Name, Fct, BtowcFct, \
74 MinF, MaxF, MinT, MaxT) \
76 .from_string = From, \
82 #define BUILTIN_ALIAS(From, To)
84 #include "gconv_builtin.h"
86 #undef BUILTIN_TRANSFORMATION
90 static const char builtin_aliases
[] =
92 #define BUILTIN_TRANSFORMATION(From, To, Cost, Name, Fct, BtowcFct, \
93 MinF, MaxF, MinT, MaxT)
94 #define BUILTIN_ALIAS(From, To) From "\0" To "\0"
96 #include "gconv_builtin.h"
98 #undef BUILTIN_TRANSFORMATION
102 #include <libio/libioP.h>
103 #define __getdelim(line, len, c, fp) _IO_getdelim (line, len, c, fp)
106 /* Value of the GCONV_PATH environment variable. */
107 const char *__gconv_path_envvar
;
110 /* Test whether there is already a matching module known. */
112 detect_conflict (const char *alias
)
114 struct gconv_module
*node
= __gconv_modules_db
;
118 int cmpres
= strcmp (alias
, node
->from_string
);
121 /* We have a conflict. */
133 /* The actual code to add aliases. */
135 add_alias2 (const char *from
, const char *to
, const char *wp
, void *modules
)
137 /* Test whether this alias conflicts with any available module. */
138 if (detect_conflict (from
))
139 /* It does conflict, don't add the alias. */
142 struct gconv_alias
*new_alias
= (struct gconv_alias
*)
143 malloc (sizeof (struct gconv_alias
) + (wp
- from
));
144 if (new_alias
!= NULL
)
148 new_alias
->fromname
= memcpy ((char *) new_alias
149 + sizeof (struct gconv_alias
),
151 new_alias
->toname
= new_alias
->fromname
+ (to
- from
);
153 inserted
= (void **) __tsearch (new_alias
, &__gconv_alias_db
,
154 __gconv_alias_compare
);
155 if (inserted
== NULL
|| *inserted
!= new_alias
)
156 /* Something went wrong, free this entry. */
164 add_alias (char *rp
, void *modules
)
166 /* We now expect two more strings. The strings are normalized
167 (converted to UPPER case) and stored in the alias database. */
168 char *from
, *to
, *wp
;
170 while (__isspace_l (*rp
, _nl_C_locobj_ptr
))
173 while (*rp
!= '\0' && !__isspace_l (*rp
, _nl_C_locobj_ptr
))
174 *wp
++ = __toupper_l (*rp
++, _nl_C_locobj_ptr
);
176 /* There is no `to' string on the line. Ignore it. */
180 while (__isspace_l (*rp
, _nl_C_locobj_ptr
))
182 while (*rp
!= '\0' && !__isspace_l (*rp
, _nl_C_locobj_ptr
))
183 *wp
++ = __toupper_l (*rp
++, _nl_C_locobj_ptr
);
185 /* No `to' string, ignore the line. */
189 add_alias2 (from
, to
, wp
, modules
);
193 /* Insert a data structure for a new module in the search tree. */
195 insert_module (struct gconv_module
*newp
, int tobefreed
)
197 struct gconv_module
**rootp
= &__gconv_modules_db
;
199 while (*rootp
!= NULL
)
201 struct gconv_module
*root
= *rootp
;
204 cmpres
= strcmp (newp
->from_string
, root
->from_string
);
207 /* Both strings are identical. Insert the string at the
208 end of the `same' list if it is not already there. */
209 while (strcmp (newp
->from_string
, root
->from_string
) != 0
210 || strcmp (newp
->to_string
, root
->to_string
) != 0)
220 /* This is not a new conversion. But maybe the cost is
221 better. */
222 if (newp
->cost_hi
< root
->cost_hi
223 || (newp
->cost_hi
== root
->cost_hi
224 && newp
->cost_lo
< root
->cost_lo
))
226 newp
->left
= root
->left
;
227 newp
->right
= root
->right
;
228 newp
->same
= root
->same
;
243 rootp
= &root
->right
;
246 /* Plug in the new node here. */
251 /* Add new module. */
253 add_module (char *rp
, const char *directory
, size_t dir_len
, void **modules
,
254 size_t *nmodules
, int modcounter
)
256 /* We expect now
257 1. `from' name
258 2. `to' name
259 3. filename of the module
260 4. an optional cost value
261 */
262 struct gconv_alias fake_alias
;
263 struct gconv_module
*new_module
;
264 char *from
, *to
, *module
, *wp
;
268 while (__isspace_l (*rp
, _nl_C_locobj_ptr
))
271 while (*rp
!= '\0' && !__isspace_l (*rp
, _nl_C_locobj_ptr
))
273 *rp
= __toupper_l (*rp
, _nl_C_locobj_ptr
);
280 while (__isspace_l (*rp
, _nl_C_locobj_ptr
))
282 while (*rp
!= '\0' && !__isspace_l (*rp
, _nl_C_locobj_ptr
))
283 *wp
++ = __toupper_l (*rp
++, _nl_C_locobj_ptr
);
289 while (__isspace_l (*rp
, _nl_C_locobj_ptr
));
291 while (*rp
!= '\0' && !__isspace_l (*rp
, _nl_C_locobj_ptr
))
295 /* There is no cost, use one by default. */
301 /* There might be a cost value. */
305 cost_hi
= strtol (rp
, &endp
, 10);
306 if (rp
== endp
|| cost_hi
< 1)
307 /* No useful information. */
311 if (module
[0] == '\0')
312 /* No module name given. */
314 if (module
[0] == '/')
317 /* See whether we must add the ending. */
319 if (wp
- module
< (ptrdiff_t) sizeof (gconv_module_ext
)
320 || memcmp (wp
- sizeof (gconv_module_ext
), gconv_module_ext
,
321 sizeof (gconv_module_ext
)) != 0)
322 /* We must add the module extension. */
323 need_ext
= sizeof (gconv_module_ext
) - 1;
325 /* See whether we have already an alias with this name defined. */
326 fake_alias
.fromname
= strndupa (from
, to
- from
);
328 if (__tfind (&fake_alias
, &__gconv_alias_db
, __gconv_alias_compare
) != NULL
)
329 /* This module duplicates an alias. */
332 new_module
= (struct gconv_module
*) calloc (1,
333 sizeof (struct gconv_module
)
335 + dir_len
+ need_ext
);
336 if (new_module
!= NULL
)
340 new_module
->from_string
= tmp
= (char *) (new_module
+ 1);
341 tmp
= __mempcpy (tmp
, from
, to
- from
);
343 new_module
->to_string
= tmp
;
344 tmp
= __mempcpy (tmp
, to
, module
- to
);
346 new_module
->cost_hi
= cost_hi
;
347 new_module
->cost_lo
= modcounter
;
349 new_module
->module_name
= tmp
;
352 tmp
= __mempcpy (tmp
, directory
, dir_len
);
354 tmp
= __mempcpy (tmp
, module
, wp
- module
);
357 memcpy (tmp
- 1, gconv_module_ext
, sizeof (gconv_module_ext
));
359 /* Now insert the new module data structure in our search tree. */
360 insert_module (new_module
, 1);
365 /* Read the next configuration file. */
367 read_conf_file (const char *filename
, const char *directory
, size_t dir_len
,
368 void **modules
, size_t *nmodules
)
370 /* Note the file is opened with cancellation in the I/O functions
371 disabled. */
372 FILE *fp
= fopen (filename
, "rce");
375 static int modcounter
;
377 /* Don't complain if a file is not present or readable, simply silently
378 ignore it. */
382 /* No threads reading from this stream. */
383 __fsetlocking (fp
, FSETLOCKING_BYCALLER
);
385 /* Process the known entries of the file. Comments start with `#' and
386 end with the end of the line. Empty lines are ignored. */
387 while (!__feof_unlocked (fp
))
389 char *rp
, *endp
, *word
;
390 ssize_t n
= __getdelim (&line
, &line_len
, '\n', fp
);
392 /* An error occurred. */
396 /* Terminate the line (excluding comments or newline) by a NUL byte
397 to simplify the following code. */
398 endp
= strchr (rp
, '#');
402 if (rp
[n
- 1] == '\n')
405 while (__isspace_l (*rp
, _nl_C_locobj_ptr
))
408 /* If this is an empty line go on with the next one. */
413 while (*rp
!= '\0' && !__isspace_l (*rp
, _nl_C_locobj_ptr
))
416 if (rp
- word
== sizeof ("alias") - 1
417 && memcmp (word
, "alias", sizeof ("alias") - 1) == 0)
418 add_alias (rp
, *modules
);
419 else if (rp
- word
== sizeof ("module") - 1
420 && memcmp (word
, "module", sizeof ("module") - 1) == 0)
421 add_module (rp
, directory
, dir_len
, modules
, nmodules
, modcounter
++);
423 /* Otherwise ignore the line. */
432 /* Determine the directories we are looking for data in. This function should
433 only be called from __gconv_read_conf. */
435 __gconv_get_path (void)
437 struct path_elem
*result
;
439 /* This function is only ever called when __gconv_path_elem is NULL. */
440 result
= __gconv_path_elem
;
441 assert (result
== NULL
);
443 /* Determine the complete path first. */
445 size_t gconv_path_len
;
453 if (__gconv_path_envvar
== NULL
)
455 /* No user-defined path. Make a modifiable copy of the
456 default path. */
457 gconv_path
= strdupa (default_gconv_path
);
458 gconv_path_len
= sizeof (default_gconv_path
);
464 /* Append the default path to the user-defined path. */
465 size_t user_len
= strlen (__gconv_path_envvar
);
467 gconv_path_len
= user_len
+ 1 + sizeof (default_gconv_path
);
468 gconv_path
= alloca (gconv_path_len
);
469 __mempcpy (__mempcpy (__mempcpy (gconv_path
, __gconv_path_envvar
,
472 default_gconv_path
, sizeof (default_gconv_path
));
473 cwd
= __getcwd (NULL
, 0);
474 cwdlen
= __glibc_unlikely (cwd
== NULL
) ? 0 : strlen (cwd
);
476 assert (default_gconv_path
[0] == '/');
478 /* In a first pass we calculate the number of elements. */
480 cp
= strchr (gconv_path
, ':');
487 cp
= strchr (cp
+ 1, ':');
490 /* Allocate the memory for the result. */
491 result
= malloc ((nelems
+ 1)
492 * sizeof (struct path_elem
)
493 + gconv_path_len
+ nelems
494 + (nelems
- 1) * (cwdlen
+ 1));
497 char *strspace
= (char *) &result
[nelems
+ 1];
500 /* Separate the individual parts. */
501 __gconv_max_path_elem_len
= 0;
502 elem
= __strtok_r (gconv_path
, ":", &gconv_path
);
503 assert (elem
!= NULL
);
506 result
[n
].name
= strspace
;
509 assert (cwd
!= NULL
);
510 strspace
= __mempcpy (strspace
, cwd
, cwdlen
);
513 strspace
= __stpcpy (strspace
, elem
);
514 if (strspace
[-1] != '/')
517 result
[n
].len
= strspace
- result
[n
].name
;
518 if (result
[n
].len
> __gconv_max_path_elem_len
)
519 __gconv_max_path_elem_len
= result
[n
].len
;
524 while ((elem
= __strtok_r (NULL
, ":", &gconv_path
)) != NULL
);
526 result
[n
].name
= NULL
;
530 __gconv_path_elem
= result
?: (struct path_elem
*) &empty_path_elem
;
536 /* Read all configuration files found in the user-specified and the default
537 path. This function should only be called once during the program's
538 lifetime. It disregards locking and synchronization because its only
539 caller, __gconv_load_conf, handles this. */
541 __gconv_read_conf (void)
543 void *modules
= NULL
;
545 int save_errno
= errno
;
548 /* First see whether we should use the cache. */
549 if (__gconv_load_cache () == 0)
551 /* Yes, we are done. */
552 __set_errno (save_errno
);
557 /* Find out where we have to look. */
560 for (cnt
= 0; __gconv_path_elem
[cnt
].name
!= NULL
; ++cnt
)
562 #define BUF_LEN elem_len + sizeof (gconv_conf_dirname)
564 const char *elem
= __gconv_path_elem
[cnt
].name
;
565 size_t elem_len
= __gconv_path_elem
[cnt
].len
;
568 /* No slash needs to be inserted between elem and gconv_conf_filename;
569 elem already ends in a slash. */
570 buf
= alloca (BUF_LEN
);
571 char *cp
= __mempcpy (__mempcpy (buf
, elem
, elem_len
),
572 gconv_conf_filename
, sizeof (gconv_conf_filename
));
574 /* Read the gconv-modules configuration file first. */
575 read_conf_file (buf
, elem
, elem_len
, &modules
, &nmodules
);
577 /* Next, see if there is a gconv-modules.d directory containing
578 configuration files and if it is non-empty. */
584 DIR *confdir
= __opendir (buf
);
588 while ((ent
= __readdir (confdir
)) != NULL
)
590 if (ent
->d_type
!= DT_REG
)
593 size_t len
= strlen (ent
->d_name
);
594 const char *suffix
= ".conf";
596 if (len
> strlen (suffix
)
597 && strcmp (ent
->d_name
+ len
- strlen (suffix
), suffix
) == 0)
599 /* LEN <= PATH_MAX so this alloca is not unbounded. */
600 char *conf
= alloca (BUF_LEN
+ len
+ 1);
601 cp
= stpcpy (conf
, buf
);
602 sprintf (cp
, "/%s", ent
->d_name
);
603 read_conf_file (conf
, elem
, elem_len
, &modules
, &nmodules
);
606 __closedir (confdir
);
611 /* Add the internal modules. */
612 for (cnt
= 0; cnt
< sizeof (builtin_modules
) / sizeof (builtin_modules
[0]);
615 struct gconv_alias fake_alias
;
617 fake_alias
.fromname
= (char *) builtin_modules
[cnt
].from_string
;
619 if (__tfind (&fake_alias
, &__gconv_alias_db
, __gconv_alias_compare
)
621 /* It'll conflict so don't add it. */
624 insert_module (&builtin_modules
[cnt
], 0);
627 /* Add aliases for builtin conversions. */
628 const char *cp
= builtin_aliases
;
631 const char *from
= cp
;
632 const char *to
= __rawmemchr (from
, '\0') + 1;
633 cp
= __rawmemchr (to
, '\0') + 1;
635 add_alias2 (from
, to
, cp
, modules
);
639 /* Restore the error number. */
640 __set_errno (save_errno
);
644 /* This "once" variable is used to do a one-time load of the configuration. */
645 __libc_once_define (static, once
);
648 /* Read all configuration files found in the user-specified and the default
649 path, but do it only "once" using __gconv_read_conf to do the actual
650 work. This is the function that must be called when reading iconv
651 configuration. */
653 __gconv_load_conf (void)
655 __libc_once (once
, __gconv_read_conf
);
659 /* Free all resources if necessary. */
660 libc_freeres_fn (free_mem
)
662 if (__gconv_path_elem
!= NULL
&& __gconv_path_elem
!= &empty_path_elem
)
663 free ((void *) __gconv_path_elem
);