opendirat: don’t depend on openat-safer
[gnulib.git] / lib / c32rtomb.c
blobc899af1b2e1797d931a18b7c57196af6d9c80ddf
1 /* Convert 32-bit wide character to multibyte character.
2 Copyright (C) 2020-2024 Free Software Foundation, Inc.
4 This file is free software: you can redistribute it and/or modify
5 it under the terms of the GNU Lesser General Public License as
6 published by the Free Software Foundation; either version 2.1 of the
7 License, or (at your option) any later version.
9 This file is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 GNU Lesser General Public License for more details.
14 You should have received a copy of the GNU Lesser General Public License
15 along with this program. If not, see <https://www.gnu.org/licenses/>. */
17 /* Written by Bruno Haible <bruno@clisp.org>, 2020. */
19 #include <config.h>
21 /* Specification. */
22 #include <uchar.h>
24 #include <errno.h>
25 #include <wchar.h>
27 #include "attribute.h" /* FALLTHROUGH */
28 #include "localcharset.h"
29 #include "streq.h"
31 #if GL_CHAR32_T_IS_UNICODE
32 # include "lc-charset-unicode.h"
33 #endif
35 size_t
36 c32rtomb (char *s, char32_t wc, mbstate_t *ps)
37 #undef c32rtomb
39 #if HAVE_WORKING_MBRTOC32 && HAVE_WORKING_C32RTOMB
41 # if C32RTOMB_RETVAL_BUG
42 if (s == NULL)
43 /* We know the NUL wide character corresponds to the NUL character. */
44 return 1;
45 # endif
47 return c32rtomb (s, wc, ps);
49 #elif _GL_SMALL_WCHAR_T
51 if (s == NULL)
52 return wcrtomb (NULL, 0, ps);
53 else
55 /* Special-case all encodings that may produce wide character values
56 > WCHAR_MAX. */
57 const char *encoding = locale_charset ();
58 if (STREQ_OPT (encoding, "UTF-8", 'U', 'T', 'F', '-', '8', 0, 0, 0, 0))
60 /* Special-case the UTF-8 encoding. Assume that the wide-character
61 encoding in a UTF-8 locale is UCS-2 or, equivalently, UTF-16. */
62 if (wc < 0x80)
64 s[0] = (unsigned char) wc;
65 return 1;
67 else
69 int count;
71 if (wc < 0x800)
72 count = 2;
73 else if (wc < 0x10000)
75 if (wc < 0xd800 || wc >= 0xe000)
76 count = 3;
77 else
79 errno = EILSEQ;
80 return (size_t)(-1);
83 else if (wc < 0x110000)
84 count = 4;
85 else
87 errno = EILSEQ;
88 return (size_t)(-1);
91 switch (count) /* note: code falls through cases! */
93 case 4: s[3] = 0x80 | (wc & 0x3f); wc = wc >> 6; wc |= 0x10000;
94 FALLTHROUGH;
95 case 3: s[2] = 0x80 | (wc & 0x3f); wc = wc >> 6; wc |= 0x800;
96 FALLTHROUGH;
97 case 2: s[1] = 0x80 | (wc & 0x3f); wc = wc >> 6; wc |= 0xc0;
98 /*case 1:*/ s[0] = wc;
100 return count;
103 else
105 if ((wchar_t) wc == wc)
106 return wcrtomb (s, (wchar_t) wc, ps);
107 else
109 errno = EILSEQ;
110 return (size_t)(-1);
115 #else
117 /* char32_t and wchar_t are equivalent. */
118 # if GL_CHAR32_T_IS_UNICODE && GL_CHAR32_T_VS_WCHAR_T_NEEDS_CONVERSION
119 if (wc != 0)
121 wc = unicode_to_locale_encoding (wc);
122 if (wc == 0)
124 errno = EILSEQ;
125 return (size_t)(-1);
128 # endif
129 return wcrtomb (s, (wchar_t) wc, ps);
131 #endif