1 /* Copyright (C) 1999-2017 Free Software Foundation, Inc.
2 This file is part of the GNU C Library.
4 The GNU C Library is free software; you can redistribute it and/or
5 modify it under the terms of the GNU Lesser General Public
6 License as published by the Free Software Foundation; either
7 version 2.1 of the License, or (at your option) any later version.
9 The GNU C Library is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12 Lesser General Public License for more details.
14 You should have received a copy of the GNU Lesser General Public
15 License along with the GNU C Library; if not, see
16 <http://www.gnu.org/licenses/>.
18 As a special exception, if you link the code in this file with
19 files compiled with a GNU compiler to produce an executable,
20 that does not cause the resulting executable to be covered by
21 the GNU Lesser General Public License. This exception does not
22 however invalidate any other reasons why the executable file
23 might be covered by the GNU Lesser General Public License.
24 This exception applies to code released by its copyright holders
25 in files containing the exception. */
35 #include <locale/localeinfo.h>
36 #include <wcsmbs/wcsmbsload.h>
37 #include <iconv/gconv_int.h>
38 #include <shlib-compat.h>
42 /* Prototypes of libio's codecvt functions. */
/* Forward declarations of the seven file-local conversion callbacks.
   They are declared ahead of use so that the __libio_codecvt table can
   take their addresses; each one is defined later in this file.

   NOTE(review): the do_out declaration as shown here has no
   `__mbstate_t *statep' parameter although the definition takes one
   right after `codecvt' -- a line appears to be missing from this
   listing; confirm against the pristine file.  */
43 static enum __codecvt_result
do_out (struct _IO_codecvt
*codecvt
,
45 const wchar_t *from_start
,
46 const wchar_t *from_end
,
47 const wchar_t **from_stop
, char *to_start
,
48 char *to_end
, char **to_stop
);
/* do_unshift: same parameter list as its definition (codecvt, statep and
   the output buffer triple to_start / to_end / to_stop).  */
49 static enum __codecvt_result
do_unshift (struct _IO_codecvt
*codecvt
,
50 __mbstate_t
*statep
, char *to_start
,
51 char *to_end
, char **to_stop
);
/* do_in: NOTE(review): the definition additionally takes
   `__mbstate_t *statep' and `const char *from_end'; both are absent
   from the declaration as shown here -- lines appear to be missing from
   this listing; confirm against the pristine file.  */
52 static enum __codecvt_result
do_in (struct _IO_codecvt
*codecvt
,
54 const char *from_start
,
56 const char **from_stop
, wchar_t *to_start
,
57 wchar_t *to_end
, wchar_t **to_stop
);
/* The remaining four callbacks return plain int values.  */
58 static int do_encoding (struct _IO_codecvt
*codecvt
);
59 static int do_length (struct _IO_codecvt
*codecvt
, __mbstate_t
*statep
,
60 const char *from_start
,
61 const char *from_end
, _IO_size_t max
);
62 static int do_max_length (struct _IO_codecvt
*codecvt
);
63 static int do_always_noconv (struct _IO_codecvt
*codecvt
);
66 /* The functions used in `codecvt' for libio are always the same. */
/* Template codecvt object.  Every __codecvt_do_* slot is bound to the
   static function of the matching name in this file and the destructor
   slot is NULL.  _IO_fwide copies this whole object into a stream's
   codecvt (`*cc = __libio_codecvt') before filling in the per-stream
   conversion data, so the fields not named here start out
   zero-initialized, as for any designated initializer.

   NOTE(review): the opening brace, closing brace and terminating
   semicolon of the initializer are not visible in this listing.  */
67 const struct _IO_codecvt __libio_codecvt
=
69 .__codecvt_destr
= NULL
, /* Destructor, never used. */
70 .__codecvt_do_out
= do_out
,
71 .__codecvt_do_unshift
= do_unshift
,
72 .__codecvt_do_in
= do_in
,
73 .__codecvt_do_encoding
= do_encoding
,
74 .__codecvt_do_always_noconv
= do_always_noconv
,
75 .__codecvt_do_length
= do_length
,
76 .__codecvt_do_max_length
= do_max_length
80 /* Return orientation of stream. If mode is nonzero try to change
81 the orientation first. */
/* Parameters:
     fp    stream whose orientation is queried or set.
     mode  requested orientation; only its sign matters, because it is
	   clamped to -1, 0 or 1 before anything else happens.

   When the wide-oriented set-up below runs, it points fp->_codecvt at
   the codecvt object embedded in fp->_wide_data, resets the wide buffer
   pointers, clears both saved conversion states, installs the
   conversion steps obtained from __wcsmbs_clone_conv, and switches the
   stream to its wide vtable.

   NOTE(review): the return type, the function braces, the tests that
   decide whether the set-up runs, and all return statements are not
   visible in this listing; the comments below describe only the
   statements that are.  */
84 _IO_fwide (_IO_FILE
*fp
, int mode
)
86 /* Normalize the value. */
87 mode
= mode
< 0 ? -1 : (mode
== 0 ? 0 : 1);
/* Compatibility check, compiled only when the GLIBC_2_0..GLIBC_2_1
   symbol-version range is supported: it fires when the address of
   _IO_stdin_used is NULL and fp is one of the three standard streams.
   The statement executed in that case and the closing #endif are not
   visible in this listing.  */
89 #if SHLIB_COMPAT (libc, GLIBC_2_0, GLIBC_2_1)
90 if (__builtin_expect (&_IO_stdin_used
== NULL
, 0)
91 && (fp
== _IO_stdin
|| fp
== _IO_stdout
|| fp
== _IO_stderr
))
92 /* This is for a stream in the glibc 2.0 format. */
96 /* The orientation already has been determined. */
98 /* Or the caller simply wants to know about the current orientation. */
102 /* Set the orientation appropriately. */
/* cc and fp->_codecvt both end up pointing at the codecvt object stored
   inside the stream's wide data.  */
105 struct _IO_codecvt
*cc
= fp
->_codecvt
= &fp
->_wide_data
->_codecvt
;
/* Move the wide read pointer to the end of the read area and the wide
   write pointer back to the write base.  */
107 fp
->_wide_data
->_IO_read_ptr
= fp
->_wide_data
->_IO_read_end
;
108 fp
->_wide_data
->_IO_write_ptr
= fp
->_wide_data
->_IO_write_base
;
110 /* Get the character conversion functions based on the currently
111 selected locale for LC_CTYPE. */
113 /* Clear the state. We start all over again. */
114 memset (&fp
->_wide_data
->_IO_state
, '\0', sizeof (__mbstate_t
));
115 memset (&fp
->_wide_data
->_IO_last_state
, '\0', sizeof (__mbstate_t
));
/* Obtain the conversion steps.  Only single-step conversions are
   accepted: the code below initializes nothing but __data[0] for each
   direction, and the two asserts enforce that precondition.  */
117 struct gconv_fcts fcts
;
118 __wcsmbs_clone_conv (&fcts
);
119 assert (fcts
.towc_nsteps
== 1);
120 assert (fcts
.tomb_nsteps
== 1);
122 /* The functions are always the same. */
123 *cc
= __libio_codecvt
;
/* Input direction (__cd_in): uses the `towc' steps.  The single data
   slot gets a zero invocation counter, is marked for internal use, and
   is flagged as the last step.  */
125 cc
->__cd_in
.__cd
.__nsteps
= fcts
.towc_nsteps
;
126 cc
->__cd_in
.__cd
.__steps
= fcts
.towc
;
128 cc
->__cd_in
.__cd
.__data
[0].__invocation_counter
= 0;
129 cc
->__cd_in
.__cd
.__data
[0].__internal_use
= 1;
130 cc
->__cd_in
.__cd
.__data
[0].__flags
= __GCONV_IS_LAST
;
131 cc
->__cd_in
.__cd
.__data
[0].__statep
= &fp
->_wide_data
->_IO_state
;
/* Output direction (__cd_out): uses the `tomb' steps and is set up the
   same way, except that __GCONV_TRANSLIT is also set in the flags.
   Both directions are initially given the same state object,
   fp->_wide_data->_IO_state; the do_* callbacks in this file overwrite
   __statep with their own statep argument on every call.  */
133 cc
->__cd_out
.__cd
.__nsteps
= fcts
.tomb_nsteps
;
134 cc
->__cd_out
.__cd
.__steps
= fcts
.tomb
;
136 cc
->__cd_out
.__cd
.__data
[0].__invocation_counter
= 0;
137 cc
->__cd_out
.__cd
.__data
[0].__internal_use
= 1;
138 cc
->__cd_out
.__cd
.__data
[0].__flags
139 = __GCONV_IS_LAST
| __GCONV_TRANSLIT
;
140 cc
->__cd_out
.__cd
.__data
[0].__statep
= &fp
->_wide_data
->_IO_state
;
143 /* From now on use the wide character callback functions. */
144 _IO_JUMPS_FILE_plus (fp
) = fp
->_wide_data
->_wide_vtable
;
147 /* Set the mode now. */
/* Convert wide characters starting at FROM_START (up to FROM_END) into
   the byte buffer TO_START..TO_END by running the first output
   conversion step of CODECVT (__cd_out).

   The step's output window and state pointer are overwritten with
   TO_START, TO_END and STATEP before the call.  Afterwards *FROM_STOP
   receives the position up to which the step advanced through the
   input and *TO_STOP receives the step's final output position.

   Visible status mapping:
     __GCONV_EMPTY_INPUT                             -> __codecvt_ok
     __GCONV_FULL_OUTPUT, __GCONV_INCOMPLETE_INPUT   -> __codecvt_partial
     (a further branch)                              -> __codecvt_error

   NOTE(review): the trailing `to_stop' parameter, the function braces,
   the declaration of `status', the tail of the DL_CALL_FCT argument
   list, the switch head with its break/default labels and the return
   statement are not visible in this listing; presumably `result' is
   what gets returned -- confirm against the pristine file.  */
154 static enum __codecvt_result
155 do_out (struct _IO_codecvt
*codecvt
, __mbstate_t
*statep
,
156 const wchar_t *from_start
, const wchar_t *from_end
,
157 const wchar_t **from_stop
, char *to_start
, char *to_end
,
160 enum __codecvt_result result
;
162 struct __gconv_step
*gs
= codecvt
->__cd_out
.__cd
.__steps
;
/* Byte-wise cursor over the wide input; its address is handed to the
   conversion step below and its value is read back into *from_stop
   afterwards.  */
165 const unsigned char *from_start_copy
= (unsigned char *) from_start
;
167 codecvt
->__cd_out
.__cd
.__data
[0].__outbuf
= (unsigned char *) to_start
;
168 codecvt
->__cd_out
.__cd
.__data
[0].__outbufend
= (unsigned char *) to_end
;
169 codecvt
->__cd_out
.__cd
.__data
[0].__statep
= statep
;
171 __gconv_fct fct
= gs
->__fct
;
/* Special handling for steps that come with a shared-object handle; the
   guarded statement is not visible in this listing.  */
173 if (gs
->__shlib_handle
!= NULL
)
177 status
= DL_CALL_FCT (fct
,
178 (gs
, codecvt
->__cd_out
.__cd
.__data
, &from_start_copy
,
179 (const unsigned char *) from_end
, NULL
,
/* Report how far the conversion got on both the input and the output
   side.  */
182 *from_stop
= (wchar_t *) from_start_copy
;
183 *to_stop
= (char *) codecvt
->__cd_out
.__cd
.__data
[0].__outbuf
;
188 case __GCONV_EMPTY_INPUT
:
189 result
= __codecvt_ok
;
192 case __GCONV_FULL_OUTPUT
:
193 case __GCONV_INCOMPLETE_INPUT
:
194 result
= __codecvt_partial
;
198 result
= __codecvt_error
;
/* Run the first output conversion step of CODECVT (__cd_out) without
   any input: the input start, input end and the following argument are
   all NULL, and the call ends with `&dummy, 1, 0'.  Output goes to
   TO_START..TO_END using STATEP as the conversion state; *TO_STOP
   receives the step's final output position.

   NOTE(review): presumably the `1' selects the step's flush mode so
   that any pending shift sequence is emitted -- confirm against the
   gconv step-function contract.

   Visible status mapping:
     __GCONV_EMPTY_INPUT                             -> __codecvt_ok
     __GCONV_FULL_OUTPUT, __GCONV_INCOMPLETE_INPUT   -> __codecvt_partial
     (a further branch)                              -> __codecvt_error

   NOTE(review): the function braces, the declarations of `status' and
   `dummy', the switch head with its break/default labels and the return
   statement are not visible in this listing.  */
206 static enum __codecvt_result
207 do_unshift (struct _IO_codecvt
*codecvt
, __mbstate_t
*statep
,
208 char *to_start
, char *to_end
, char **to_stop
)
210 enum __codecvt_result result
;
212 struct __gconv_step
*gs
= codecvt
->__cd_out
.__cd
.__steps
;
216 codecvt
->__cd_out
.__cd
.__data
[0].__outbuf
= (unsigned char *) to_start
;
217 codecvt
->__cd_out
.__cd
.__data
[0].__outbufend
= (unsigned char *) to_end
;
218 codecvt
->__cd_out
.__cd
.__data
[0].__statep
= statep
;
220 __gconv_fct fct
= gs
->__fct
;
/* Special handling for steps that come with a shared-object handle; the
   guarded statement is not visible in this listing.  */
222 if (gs
->__shlib_handle
!= NULL
)
226 status
= DL_CALL_FCT (fct
,
227 (gs
, codecvt
->__cd_out
.__cd
.__data
, NULL
, NULL
,
228 NULL
, &dummy
, 1, 0));
230 *to_stop
= (char *) codecvt
->__cd_out
.__cd
.__data
[0].__outbuf
;
235 case __GCONV_EMPTY_INPUT
:
236 result
= __codecvt_ok
;
239 case __GCONV_FULL_OUTPUT
:
240 case __GCONV_INCOMPLETE_INPUT
:
241 result
= __codecvt_partial
;
245 result
= __codecvt_error
;
/* Convert bytes starting at FROM_START (up to FROM_END) into the wide
   character buffer TO_START..TO_END by running the first input
   conversion step of CODECVT (__cd_in).

   The step's output window and state pointer are overwritten with
   TO_START, TO_END and STATEP before the call.  Afterwards *FROM_STOP
   receives the position up to which the step advanced through the
   input and *TO_STOP receives the step's final output position.

   Visible status mapping:
     __GCONV_EMPTY_INPUT                             -> __codecvt_ok
     __GCONV_FULL_OUTPUT, __GCONV_INCOMPLETE_INPUT   -> __codecvt_partial
     (a further branch)                              -> __codecvt_error

   NOTE(review): the function braces, the declaration of `status', the
   tail of the DL_CALL_FCT argument list, the switch head with its
   break/default labels and the return statement are not visible in this
   listing.  */
253 static enum __codecvt_result
254 do_in (struct _IO_codecvt
*codecvt
, __mbstate_t
*statep
,
255 const char *from_start
, const char *from_end
, const char **from_stop
,
256 wchar_t *to_start
, wchar_t *to_end
, wchar_t **to_stop
)
258 enum __codecvt_result result
;
260 struct __gconv_step
*gs
= codecvt
->__cd_in
.__cd
.__steps
;
/* Cursor over the input bytes; its address is handed to the conversion
   step below and its value is read back into *from_stop afterwards.  */
263 const unsigned char *from_start_copy
= (unsigned char *) from_start
;
265 codecvt
->__cd_in
.__cd
.__data
[0].__outbuf
= (unsigned char *) to_start
;
266 codecvt
->__cd_in
.__cd
.__data
[0].__outbufend
= (unsigned char *) to_end
;
267 codecvt
->__cd_in
.__cd
.__data
[0].__statep
= statep
;
269 __gconv_fct fct
= gs
->__fct
;
/* Special handling for steps that come with a shared-object handle; the
   guarded statement is not visible in this listing.  */
271 if (gs
->__shlib_handle
!= NULL
)
275 status
= DL_CALL_FCT (fct
,
276 (gs
, codecvt
->__cd_in
.__cd
.__data
, &from_start_copy
,
277 (const unsigned char *) from_end
, NULL
,
/* Report how far the conversion got on both the input and the output
   side.  */
280 *from_stop
= (const char *) from_start_copy
;
281 *to_stop
= (wchar_t *) codecvt
->__cd_in
.__cd
.__data
[0].__outbuf
;
286 case __GCONV_EMPTY_INPUT
:
287 result
= __codecvt_ok
;
290 case __GCONV_FULL_OUTPUT
:
291 case __GCONV_INCOMPLETE_INPUT
:
292 result
= __codecvt_partial
;
296 result
= __codecvt_error
;
/* Describe the external encoding using the first input conversion step
   of CODECVT.  Three cases are distinguished, in this order:
     1. the step is stateful;
     2. the step's minimum and maximum input sizes per character
	differ;
     3. otherwise the size is constant, and that size
	(__min_needed_from) is returned.

   NOTE(review): the return type, the function braces and the values
   produced for cases 1 and 2 are not visible in this listing.  */
305 do_encoding (struct _IO_codecvt
*codecvt
)
307 /* See whether the encoding is stateful. */
308 if (codecvt
->__cd_in
.__cd
.__steps
[0].__stateful
)
310 /* Fortunately not. Now determine the input bytes for the conversion
311 necessary for each wide character. */
312 if (codecvt
->__cd_in
.__cd
.__steps
[0].__min_needed_from
313 != codecvt
->__cd_in
.__cd
.__steps
[0].__max_needed_from
)
314 /* Not a constant value. */
317 return codecvt
->__cd_in
.__cd
.__steps
[0].__min_needed_from
;
/* Callback installed in the __codecvt_do_always_noconv slot of
   __libio_codecvt.

   NOTE(review): only the signature is visible in this listing; the
   return type and the body are missing, so the returned value cannot be
   documented from here.  */
322 do_always_noconv (struct _IO_codecvt
*codecvt
)
/* Measure how many input bytes starting at FROM_START (up to FROM_END)
   the first input conversion step of CODECVT consumes when its output
   is limited to MAX elements of the scratch buffer `to_buf'.  STATEP is
   installed as the step's conversion state.  The visible computation
   sets `result' to the distance, in bytes, between the final input
   cursor and FROM_START.

   NOTE(review): the return type, the function braces, the declarations
   of `result' and `to_buf', the head of the call through `fct', the
   tail of its argument list and the return statement are not visible in
   this listing.  If `to_buf' is a variable-length array sized by MAX, a
   large MAX could exhaust the stack -- confirm against the pristine
   file.  */
329 do_length (struct _IO_codecvt
*codecvt
, __mbstate_t
*statep
,
330 const char *from_start
, const char *from_end
, _IO_size_t max
)
/* Input cursor; its address is passed to the conversion step below.  */
333 const unsigned char *cp
= (const unsigned char *) from_start
;
335 struct __gconv_step
*gs
= codecvt
->__cd_in
.__cd
.__steps
;
/* Point the step's output window at the scratch buffer; the output end
   is placed MAX elements past its start.  */
338 codecvt
->__cd_in
.__cd
.__data
[0].__outbuf
= (unsigned char *) to_buf
;
339 codecvt
->__cd_in
.__cd
.__data
[0].__outbufend
= (unsigned char *) &to_buf
[max
];
340 codecvt
->__cd_in
.__cd
.__data
[0].__statep
= statep
;
342 __gconv_fct fct
= gs
->__fct
;
/* Special handling for steps that come with a shared-object handle; the
   guarded statement is not visible in this listing.  */
344 if (gs
->__shlib_handle
!= NULL
)
349 (gs
, codecvt
->__cd_in
.__cd
.__data
, &cp
,
350 (const unsigned char *) from_end
, NULL
,
/* Number of input bytes between the cursor and the start of input.  */
353 result
= cp
- (const unsigned char *) from_start
;
/* Return the __max_needed_from value of the first input conversion step
   of CODECVT.

   NOTE(review): the return type and the function braces are not visible
   in this listing; the forward declaration earlier in the file gives
   the type as `static int'.  */
360 do_max_length (struct _IO_codecvt
*codecvt
)
362 return codecvt
->__cd_in
.__cd
.__steps
[0].__max_needed_from
;