1 /* Access functions for CNS 11643 handling.
2 Copyright (C) 1998-2020 Free Software Foundation, Inc.
3 This file is part of the GNU C Library.
4 Contributed by Ulrich Drepper <drepper@cygnus.com>, 1998.
6 The GNU C Library is free software; you can redistribute it and/or
7 modify it under the terms of the GNU Lesser General Public
8 License as published by the Free Software Foundation; either
9 version 2.1 of the License, or (at your option) any later version.
11 The GNU C Library is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 Lesser General Public License for more details.
16 You should have received a copy of the GNU Lesser General Public
17 License along with the GNU C Library; if not, see
18 <https://www.gnu.org/licenses/>. */
23 /* Table for CNS 11643, plane 1 to UCS4 conversion. */
24 extern const uint16_t __cns11643l1_to_ucs4_tab
[];
25 /* Table for CNS 11643, plane 2 to UCS4 conversion. */
26 extern const uint16_t __cns11643l2_to_ucs4_tab
[];
27 /* Table for CNS 11643, plane 3 to UCS4 conversion. */
28 extern const uint32_t __cns11643l3_to_ucs4_tab
[];
29 /* Table for CNS 11643, plane 4 to UCS4 conversion. */
30 extern const uint32_t __cns11643l4_to_ucs4_tab
[];
31 /* Table for CNS 11643, plane 5 to UCS4 conversion. */
32 extern const uint32_t __cns11643l5_to_ucs4_tab
[];
33 /* Table for CNS 11643, plane 6 to UCS4 conversion. */
34 extern const uint32_t __cns11643l6_to_ucs4_tab
[];
35 /* Table for CNS 11643, plane 7 to UCS4 conversion. */
36 extern const uint32_t __cns11643l7_to_ucs4_tab
[];
37 /* Table for CNS 11643, plane 15 (old) to UCS4 conversion. */
38 extern const uint32_t __cns11643l15_to_ucs4_tab
[];
41 static inline uint32_t
42 __attribute ((always_inline
))
43 cns11643_to_ucs4 (const unsigned char **s
, size_t avail
, unsigned char offset
)
45 unsigned char ch
= *(*s
);
51 if (ch
< offset
|| (ch
- offset
) <= 0x20 || (ch
- offset
) > 0x30)
52 return __UNKNOWN_10646_CHAR
;
58 if ((ch2
- offset
) <= 0x20 || (ch2
- offset
) >= 0x7f)
59 return __UNKNOWN_10646_CHAR
;
62 if ((ch3
- offset
) <= 0x20 || (ch3
- offset
) >= 0x7f)
63 return __UNKNOWN_10646_CHAR
;
65 idx
= (ch2
- 0x21 - offset
) * 94 + (ch3
- 0x21 - offset
);
67 switch (ch
- 0x20 - offset
)
71 return __UNKNOWN_10646_CHAR
;
72 result
= __cns11643l1_to_ucs4_tab
[idx
];
76 return __UNKNOWN_10646_CHAR
;
77 result
= __cns11643l2_to_ucs4_tab
[idx
];
81 return __UNKNOWN_10646_CHAR
;
82 result
= __cns11643l3_to_ucs4_tab
[idx
];
86 return __UNKNOWN_10646_CHAR
;
87 result
= __cns11643l4_to_ucs4_tab
[idx
];
91 return __UNKNOWN_10646_CHAR
;
92 result
= __cns11643l5_to_ucs4_tab
[idx
];
96 return __UNKNOWN_10646_CHAR
;
97 result
= __cns11643l6_to_ucs4_tab
[idx
];
101 return __UNKNOWN_10646_CHAR
;
102 result
= __cns11643l7_to_ucs4_tab
[idx
];
106 return __UNKNOWN_10646_CHAR
;
107 result
= __cns11643l15_to_ucs4_tab
[idx
];
110 return __UNKNOWN_10646_CHAR
;
116 result
= __UNKNOWN_10646_CHAR
;
122 /* Tables for the UCS4 -> CNS conversion. */
123 extern const char __cns11643l1_from_ucs4_tab1
[][2];
124 extern const char __cns11643l1_from_ucs4_tab2
[][2];
125 extern const char __cns11643l1_from_ucs4_tab3
[][2];
126 extern const char __cns11643l1_from_ucs4_tab4
[][2];
127 extern const char __cns11643l1_from_ucs4_tab5
[][2];
128 extern const char __cns11643l1_from_ucs4_tab6
[][2];
129 extern const char __cns11643l1_from_ucs4_tab7
[][2];
130 extern const char __cns11643l1_from_ucs4_tab8
[][2];
131 extern const char __cns11643l1_from_ucs4_tab9
[][2];
132 extern const char __cns11643l1_from_ucs4_tab10
[][2];
133 extern const char __cns11643l1_from_ucs4_tab11
[][2];
134 extern const char __cns11643l1_from_ucs4_tab12
[][2];
135 extern const char __cns11643l1_from_ucs4_tab13
[][2];
136 extern const char __cns11643l1_from_ucs4_tab14
[][2];
137 extern const char __cns11643_from_ucs4p0_tab
[][3];
138 extern const char __cns11643_from_ucs4p2_tab
[][3];
139 extern const char __cns11643_from_ucs4p2c_tab
[][3];
143 __attribute ((always_inline
))
144 ucs4_to_cns11643 (uint32_t wch
, unsigned char *s
, size_t avail
)
146 unsigned int ch
= (unsigned int) wch
;
148 const char *cp
= buf
;
154 cp
= __cns11643l1_from_ucs4_tab1
[ch
- 0xa7];
156 case 0x2c7 ... 0x2d9:
157 cp
= __cns11643l1_from_ucs4_tab2
[ch
- 0x2c7];
159 case 0x391 ... 0x3c9:
160 cp
= __cns11643l1_from_ucs4_tab3
[ch
- 0x391];
162 case 0x2013 ... 0x203e:
163 cp
= __cns11643l1_from_ucs4_tab4
[ch
- 0x2013];
174 case 0x2160 ... 0x2169:
176 buf
[1] = '\x2b' + (ch
- 0x2160);
178 case 0x2170 ... 0x2179:
180 buf
[1] = '\x35' + (ch
- 0x2170);
182 case 0x2190 ... 0x2199:
183 cp
= __cns11643l1_from_ucs4_tab5
[ch
- 0x2190];
185 case 0x2215 ... 0x2267:
186 cp
= __cns11643l1_from_ucs4_tab6
[ch
- 0x2215];
194 case 0x2400 ... 0x2421:
195 cp
= __cns11643l1_from_ucs4_tab7
[ch
- 0x2400];
197 case 0x2460 ... 0x247d:
198 cp
= __cns11643l1_from_ucs4_tab8
[ch
- 0x2460];
200 case 0x2500 ... 0x2642:
201 cp
= __cns11643l1_from_ucs4_tab9
[ch
- 0x2500];
203 case 0x3000 ... 0x3029:
204 cp
= __cns11643l1_from_ucs4_tab10
[ch
- 0x3000];
209 case 0x3105 ... 0x3129:
211 buf
[1] = '\x47' + (ch
- 0x3105);
216 case 0x338e ... 0x33d5:
217 cp
= __cns11643l1_from_ucs4_tab11
[ch
- 0x338e];
219 case 0x4e00 ... 0x9f9c:
220 cp
= __cns11643l1_from_ucs4_tab12
[ch
- 0x4e00];
223 /* Let's try the other planes. */
225 case 0x3400 ... 0x4dff:
226 case 0x9f9d ... 0x9fa5:
227 /* Let's try the other planes. */
229 cp
= __cns11643_from_ucs4p0_tab
[ch
- 0x3400];
235 case 0xfe30 ... 0xfe6b:
236 cp
= __cns11643l1_from_ucs4_tab13
[ch
- 0xfe30];
238 case 0xff01 ... 0xff5d:
239 cp
= __cns11643l1_from_ucs4_tab14
[ch
- 0xff01];
250 case 0x20000 ... 0x2a6d6:
252 cp
= __cns11643_from_ucs4p2_tab
[ch
- 0x20000];
254 case 0x2f800 ... 0x2fa1d:
256 cp
= __cns11643_from_ucs4p2c_tab
[ch
- 0x2f800];
259 return __UNKNOWN_10646_CHAR
;
263 return __UNKNOWN_10646_CHAR
;