1 /* Access functions for KS C 5601-1992 based encoding conversion.
2 Copyright (C) 1998, 1999 Free Software Foundation, Inc.
3 This file is part of the GNU C Library.
5 The GNU C Library is free software; you can redistribute it and/or
6 modify it under the terms of the GNU Library General Public License as
7 published by the Free Software Foundation; either version 2 of the
8 License, or (at your option) any later version.
10 The GNU C Library is distributed in the hope that it will be useful,
11 but WITHOUT ANY WARRANTY; without even the implied warranty of
12 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 Library General Public License for more details.
15 You should have received a copy of the GNU Library General Public
16 License along with the GNU C Library; see the file COPYING.LIB. If not,
17 write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
18 Boston, MA 02111-1307, USA. */
/* Entry counts for the KS C 5601 conversion tables declared in this
   header.  Each constant is used as an array bound in the extern table
   declarations and, minus one, as the initial upper index `u' in the
   matching ucs4_to_ksc5601_* routine. */
/* Bound of __ksc5601_hangul_to_ucs. */
23 #define KSC5601_HANGUL 2350
/* Bound of __ksc5601_hanja_to_ucs and __ksc5601_hanja_from_ucs. */
24 #define KSC5601_HANJA 4888
/* Bound of __ksc5601_sym_from_ucs. */
25 #define KSC5601_SYMBOL 986
30 /* Structure to map from UCS to KSC. This structure should be packed. */
38 /* Conversion tables.  They are only declared (extern) here.  The
   *_to_ucs arrays hold uint16_t values indexed by a KS C 5601 position;
   the *_from_ucs arrays hold struct map entries whose `ucs' member is
   compared against the wanted character and whose `val[0]'/`val[1]'
   members supply the two output bytes. */
/* Indexed with (idx - 1410) by ksc5601_to_ucs4 and with the table
   position m by ucs4_to_ksc5601_hangul. */
39 extern const uint16_t __ksc5601_hangul_to_ucs
[KSC5601_HANGUL
];
/* Declared without a bound; indexed directly with idx by
   ksc5601_to_ucs4. */
40 extern const uint16_t __ksc5601_sym_to_ucs
[];
/* Read by ucs4_to_ksc5601_sym. */
41 extern const struct map __ksc5601_sym_from_ucs
[KSC5601_SYMBOL
];
/* Indexed with (idx - 3854) by ksc5601_to_ucs4. */
42 extern const uint16_t __ksc5601_hanja_to_ucs
[KSC5601_HANJA
];
/* Read by ucs4_to_ksc5601_hanja. */
43 extern const struct map __ksc5601_hanja_from_ucs
[KSC5601_HANJA
];
/* Convert the two-byte KS C 5601 character found at **s to UCS4.

   s       address of the input pointer.  The lead byte is read through
           **s; when a looked-up table entry is 0 the visible code moves
           *s back by 2.
   avail   NOTE(review): no use of this parameter is visible in this
           listing -- confirm against the full source.
   offset  value subtracted from both bytes before the range checks and
           the index computation.

   Returns the UCS value taken from one of the *_to_ucs tables, or
   __UNKNOWN_10646_CHAR when a byte is out of range or the table entry
   is 0.

   NOTE(review): this listing omits several source lines (the braces, the
   declarations of ch2 and idx, the assignment of ch2, the conditions in
   front of the Hanja and symbol lookups, and whatever advances *s).  The
   comments below describe only what is visible. */
46 static inline uint32_t
47 ksc5601_to_ucs4 (const unsigned char **s
, size_t avail
, unsigned char offset
)
49 unsigned char ch
= **s
;
53 /* Rows 94 (0x7e) and 41 (0x49) are user-defined areas in KS C 5601. */
/* Accept the lead byte only if, after removing offset, it lies in
   0x21..0x7d and is not 0x49. */
55 if (ch
< offset
|| (ch
- offset
) <= 0x20 || (ch
- offset
) >= 0x7e
56 || (ch
- offset
) == 0x49)
57 return __UNKNOWN_10646_CHAR
;
/* Accept the trail byte only if, after removing offset, it lies in
   0x21..0x7e. */
63 if (ch2
< offset
|| (ch2
- offset
) <= 0x20 || (ch2
- offset
) >= 0x7f)
64 return __UNKNOWN_10646_CHAR
;
/* Linear position: 94 cells per row, rows and cells both counted from
   0x21. */
66 idx
= (ch
- offset
- 0x21) * 94 + (ch2
- offset
- 0x21);
68 /* 1410 = 15 * 94 , 3760 = 40 * 94
69 Hangul in KS C 5601 : row 16 - row 40 */
/* `a ?: b' is the GNU conditional with omitted middle operand: it yields
   a when a is nonzero, otherwise b.  Here b rewinds *s by 2 and yields
   __UNKNOWN_10646_CHAR; presumably this undoes an earlier `*s += 2' that
   is not visible in this listing -- confirm. */
73 if (idx
>= 1410 && idx
< 1410 + KSC5601_HANGUL
)
74 return (__ksc5601_hangul_to_ucs
[idx
- 1410]
75 ?: ((*s
) -= 2, __UNKNOWN_10646_CHAR
));
77 /* Hanja : row 42 - row 93 : 3854 = 94 * (42-1) */
/* NOTE(review): the condition guarding this lookup is not visible. */
78 return (__ksc5601_hanja_to_ucs
[idx
- 3854]
79 ?: ((*s
) -= 2, __UNKNOWN_10646_CHAR
));
/* Symbol lookup, indexed with idx directly.
   NOTE(review): the condition guarding this lookup is not visible. */
81 return __ksc5601_sym_to_ucs
[idx
] ?: ((*s
) -= 2, __UNKNOWN_10646_CHAR
);
/* Fallback when none of the lookups above returned. */
83 return __UNKNOWN_10646_CHAR
;
/* Encode the UCS4 value wch as a KS C 5601 Hangul byte pair in s[0] and
   s[1].

   The visible code starts an upper index u at the last entry of
   __ksc5601_hangul_to_ucs, reads entry m of that table into `try', and
   derives both output bytes from the table position m.  The final
   statement returns __UNKNOWN_10646_CHAR.

   NOTE(review): the return type, the declarations of m and try, the
   search loop and its comparison against wch, any use of avail, and the
   success return value are not visible in this listing.  Presumably this
   is a binary search over the table -- confirm against the full
   source. */
87 ucs4_to_ksc5601_hangul (uint32_t wch
, unsigned char *s
, size_t avail
)
90 int u
= KSC5601_HANGUL
- 1;
96 try = (uint32_t) __ksc5601_hangul_to_ucs
[m
];
/* Row byte: 94 entries per row.  0x30 equals 0x21 + 15, which matches the
   15-row (1410 = 15 * 94) Hangul offset used in ksc5601_to_ucs4. */
106 s
[0] = (m
/ 94) + 0x30;
/* Cell byte within the row, counted from 0x21. */
107 s
[1] = (m
% 94) + 0x21;
113 return __UNKNOWN_10646_CHAR
;
/* Encode the UCS4 value wch as a KS C 5601 Hanja byte pair in s[0] and
   s[1].

   The visible code starts an upper index u at the last entry of
   __ksc5601_hanja_from_ucs, reads the `ucs' member of entry m into `try',
   and copies that entry's val[0] and val[1] into the output.  The final
   statement returns __UNKNOWN_10646_CHAR.

   NOTE(review): the return type, the declarations of m and try, the
   search loop and its comparison against wch, any use of avail, and the
   success return value are not visible in this listing.  Presumably this
   is a binary search keyed on `ucs' -- confirm against the full
   source. */
118 ucs4_to_ksc5601_hanja (uint32_t wch
, unsigned char *s
, size_t avail
)
121 int u
= KSC5601_HANJA
- 1;
127 try = (uint32_t) __ksc5601_hanja_from_ucs
[m
].ucs
;
/* The output bytes come straight from the table entry. */
137 s
[0] = __ksc5601_hanja_from_ucs
[m
].val
[0];
138 s
[1] = __ksc5601_hanja_from_ucs
[m
].val
[1];
144 return __UNKNOWN_10646_CHAR
;
/* Encode the UCS4 value wch as a KS C 5601 symbol byte pair in s[0] and
   s[1].

   The visible code starts an upper index u at the last entry of
   __ksc5601_sym_from_ucs, reads the `ucs' member of entry m into `try',
   and copies that entry's val[0] and val[1] into the output.  The final
   statement returns __UNKNOWN_10646_CHAR.

   NOTE(review): the return type, the declarations of m and try, the
   search loop and its comparison against wch, any use of avail, and the
   success return value are not visible in this listing.  Presumably this
   is a binary search keyed on `ucs' -- confirm against the full
   source. */
148 ucs4_to_ksc5601_sym (uint32_t wch
, unsigned char *s
, size_t avail
)
151 int u
= KSC5601_SYMBOL
- 1;
157 try = __ksc5601_sym_from_ucs
[m
].ucs
;
/* The output bytes come straight from the table entry. */
167 s
[0] = __ksc5601_sym_from_ucs
[m
].val
[0];
168 s
[1] = __ksc5601_sym_from_ucs
[m
].val
[1];
174 return __UNKNOWN_10646_CHAR
;
/* Encode the UCS4 value wch as KS C 5601 by dispatching on its code
   range and passing wch, s and avail through unchanged:

     0xac00..0xd7a3                    -> ucs4_to_ksc5601_hangul
     0x4e00..0x9fff, 0xf900..0xfa0b    -> ucs4_to_ksc5601_hanja
     the remaining return              -> ucs4_to_ksc5601_sym

   The result is whatever the selected helper returns.

   NOTE(review): the return type, the braces and the line introducing the
   last return (presumably a plain `else') are not visible in this
   listing. */
179 ucs4_to_ksc5601 (uint32_t wch
, unsigned char *s
, size_t avail
)
181 if (wch
>= 0xac00 && wch
<= 0xd7a3)
182 return ucs4_to_ksc5601_hangul (wch
, s
, avail
);
183 else if ((wch
>= 0x4e00 && wch
<= 0x9fff)
184 || (wch
>= 0xf900 && wch
<= 0xfa0b))
185 return ucs4_to_ksc5601_hanja (wch
, s
, avail
);
187 return ucs4_to_ksc5601_sym (wch
, s
, avail
);
190 #endif /* ksc5601.h */