1 /* Access functions for KS C 5601-1992 based encoding conversion.
2 Copyright (C) 1998, 1999, 2000 Free Software Foundation, Inc.
3 This file is part of the GNU C Library.
5 The GNU C Library is free software; you can redistribute it and/or
6 modify it under the terms of the GNU Lesser General Public
7 License as published by the Free Software Foundation; either
8 version 2.1 of the License, or (at your option) any later version.
10 The GNU C Library is distributed in the hope that it will be useful,
11 but WITHOUT ANY WARRANTY; without even the implied warranty of
12 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 Lesser General Public License for more details.
15 You should have received a copy of the GNU Lesser General Public
16 License along with the GNU C Library; if not, write to the Free
17 Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
02111-1307 USA.  */
/* Element counts used as array bounds by the table declarations in this
   header: KSC5601_HANGUL sizes __ksc5601_hangul_to_ucs, KSC5601_HANJA sizes
   both Hanja tables, and KSC5601_SYMBOL sizes __ksc5601_sym_from_ucs.  */
23 #define KSC5601_HANGUL 2350
24 #define KSC5601_HANJA 4888
25 #define KSC5601_SYMBOL 988
30 /* Structure to map from UCS to KSC.  This structure should be packed.  */
38 /* Conversion tables.  The *_to_ucs arrays hold uint16_t entries and are
   indexed by a position derived from the KS C 5601 code; the *_from_ucs
   arrays hold struct map entries whose ucs and val[2] members are read by
   the ucs4_to_ksc5601_* helpers.  The tables are only declared here
   (extern); their definitions are not part of this listing.  Note that
   __ksc5601_sym_to_ucs is declared without a bound.  */
39 extern const uint16_t __ksc5601_hangul_to_ucs
[KSC5601_HANGUL
];
40 extern const uint16_t __ksc5601_sym_to_ucs
[];
41 extern const struct map __ksc5601_sym_from_ucs
[KSC5601_SYMBOL
];
42 extern const uint16_t __ksc5601_hanja_to_ucs
[KSC5601_HANJA
];
43 extern const struct map __ksc5601_hanja_from_ucs
[KSC5601_HANJA
];
/* Convert the two-byte KS C 5601 character starting at *S to UCS4.
   OFFSET is subtracted from each input byte before the range checks and
   the table-index computation.  Returns __UNKNOWN_10646_CHAR when a byte
   falls outside the accepted range; when a table entry is zero, *S is
   moved back by two and __UNKNOWN_10646_CHAR is the result.
   NOTE(review): this listing omits several lines of the function (braces,
   the declarations of ch2 and idx, whatever is done with AVAIL, and some
   branch conditions) -- confirm the details against the complete file.  */
46 static inline uint32_t
47 ksc5601_to_ucs4 (const unsigned char **s
, size_t avail
, unsigned char offset
)
49 unsigned char ch
= **s
;
53 /* row 94(0x7e) and row 41(0x49) are user-defined area in KS C 5601 */
/* The first byte, after removing OFFSET, must lie in 0x21..0x7d and must
   not be 0x49.  */
55 if (ch
< offset
|| (ch
- offset
) <= 0x20 || (ch
- offset
) >= 0x7e
56 || (ch
- offset
) == 0x49)
57 return __UNKNOWN_10646_CHAR
;
/* The second byte, after removing OFFSET, must lie in 0x21..0x7e.  */
63 if (ch2
< offset
|| (ch2
- offset
) <= 0x20 || (ch2
- offset
) >= 0x7f)
64 return __UNKNOWN_10646_CHAR
;
/* Linear position in the 94-column code table:
   (first byte - 0x21) * 94 + (second byte - 0x21).  */
66 idx
= (ch
- offset
- 0x21) * 94 + (ch2
- offset
- 0x21);
68 /* 1410 = 15 * 94 , 3760 = 40 * 94
69 Hangul in KS C 5601 : row 16 - row 40 */
73 if (idx
>= 1410 && idx
< 1410 + KSC5601_HANGUL
)
74 return (__ksc5601_hangul_to_ucs
[idx
- 1410]
75 ?: (*s
-= 2, __UNKNOWN_10646_CHAR
));
77 /* Hanja : row 42 - row 93 : 3854 = 94 * (42-1) */
/* NOTE(review): the condition guarding this Hanja lookup is not visible
   in this listing.  */
78 return (__ksc5601_hanja_to_ucs
[idx
- 3854]
79 ?: (*s
-= 2, __UNKNOWN_10646_CHAR
));
/* Symbol table lookup, indexed by idx directly.  NOTE(review): its
   guarding condition is not visible in this listing.  */
81 return __ksc5601_sym_to_ucs
[idx
] ?: (*s
-= 2, __UNKNOWN_10646_CHAR
);
84 return __UNKNOWN_10646_CHAR
;
/* Write the two-byte KS C 5601 code for the UCS4 value WCH into S by
   locating WCH in __ksc5601_hangul_to_ucs.  Visible here: the upper search
   bound starts at the last table index, candidates are read from entry m,
   and the output bytes are derived from m itself.  The visible failure
   path returns __UNKNOWN_10646_CHAR.
   NOTE(review): the return type, the loop that updates m, the use of
   AVAIL and the success return are missing from this listing; presumably
   a binary search over a sorted table -- confirm.  */
88 ucs4_to_ksc5601_hangul (uint32_t wch
, unsigned char *s
, size_t avail
)
91 int u
= KSC5601_HANGUL
- 1;
97 try = (uint32_t) __ksc5601_hangul_to_ucs
[m
];
/* m counts positions in the Hangul table, 94 per row.  The row byte is
   biased by 0x30 rather than 0x21; presumably 0x21 + 15 because the
   Hangul rows start at row 16 -- confirm.  */
107 s
[0] = (m
/ 94) + 0x30;
108 s
[1] = (m
% 94) + 0x21;
114 return __UNKNOWN_10646_CHAR
;
/* Write the two-byte KS C 5601 code for the UCS4 value WCH into S using
   __ksc5601_hanja_from_ucs.  Visible here: the upper search bound starts
   at the last table index, the ucs member of entry m is the candidate, and
   the two val bytes of entry m are copied to S.  The visible failure path
   returns __UNKNOWN_10646_CHAR.
   NOTE(review): the return type, the loop that updates m, the use of
   AVAIL and the success return are missing from this listing; presumably
   a binary search keyed on the ucs member -- confirm.  */
119 ucs4_to_ksc5601_hanja (uint32_t wch
, unsigned char *s
, size_t avail
)
122 int u
= KSC5601_HANJA
- 1;
128 try = (uint32_t) __ksc5601_hanja_from_ucs
[m
].ucs
;
/* The table entry stores the encoded bytes directly.  */
138 s
[0] = __ksc5601_hanja_from_ucs
[m
].val
[0];
139 s
[1] = __ksc5601_hanja_from_ucs
[m
].val
[1];
145 return __UNKNOWN_10646_CHAR
;
/* Write the two-byte KS C 5601 code for the UCS4 value WCH into S using
   __ksc5601_sym_from_ucs.  Visible here: the upper search bound starts at
   the last table index, the ucs member of entry m is the candidate, and
   the two val bytes of entry m are copied to S.  The visible failure path
   returns __UNKNOWN_10646_CHAR.
   NOTE(review): the return type, the loop that updates m, the use of
   AVAIL and the success return are missing from this listing; presumably
   a binary search keyed on the ucs member -- confirm.  */
149 ucs4_to_ksc5601_sym (uint32_t wch
, unsigned char *s
, size_t avail
)
152 int u
= KSC5601_SYMBOL
- 1;
158 try = __ksc5601_sym_from_ucs
[m
].ucs
;
/* The table entry stores the encoded bytes directly.  */
168 s
[0] = __ksc5601_sym_from_ucs
[m
].val
[0];
169 s
[1] = __ksc5601_sym_from_ucs
[m
].val
[1];
175 return __UNKNOWN_10646_CHAR
;
/* Convert the UCS4 value WCH to KS C 5601 by dispatching on its range:
     0xac00..0xd7a3                     -> ucs4_to_ksc5601_hangul
     0x4e00..0x9fff or 0xf900..0xfa0b   -> ucs4_to_ksc5601_hanja
     any other value                    -> ucs4_to_ksc5601_sym
   S and AVAIL are passed through unchanged and the selected helper's
   result is returned.
   NOTE(review): the return-type line and the braces of this function are
   missing from this listing.  */
180 ucs4_to_ksc5601 (uint32_t wch
, unsigned char *s
, size_t avail
)
182 if (wch
>= 0xac00 && wch
<= 0xd7a3)
183 return ucs4_to_ksc5601_hangul (wch
, s
, avail
);
184 else if ((wch
>= 0x4e00 && wch
<= 0x9fff)
185 || (wch
>= 0xf900 && wch
<= 0xfa0b))
186 return ucs4_to_ksc5601_hanja (wch
, s
, avail
);
188 return ucs4_to_ksc5601_sym (wch
, s
, avail
);
191 #endif /* ksc5601.h */