2 * Wine internal Unicode definitions
4 * Copyright 2000 Alexandre Julliard
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2.1 of the License, or (at your option) any later version.
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, write to the Free Software
18 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
21 #ifndef __WINE_UNICODE_H
22 #define __WINE_UNICODE_H
27 /* code page info common to SBCS and DBCS */
30 unsigned int codepage
; /* codepage id */
31 unsigned int char_size
; /* char size (1 or 2 bytes) */
32 WCHAR def_char
; /* default char value (can be double-byte) */
33 WCHAR def_unicode_char
; /* default Unicode char value */
34 const char *name
; /* code page name */
40 const WCHAR
*cp2uni
; /* code page -> Unicode map */
41 const unsigned char *uni2cp_low
; /* Unicode -> code page map */
42 const unsigned short *uni2cp_high
;
48 const WCHAR
*cp2uni
; /* code page -> Unicode map */
49 const unsigned char *cp2uni_leadbytes
;
50 const unsigned short *uni2cp_low
; /* Unicode -> code page map */
51 const unsigned short *uni2cp_high
;
52 unsigned char lead_bytes
[12]; /* lead bytes ranges */
58 struct sbcs_table sbcs
;
59 struct dbcs_table dbcs
;
62 extern const union cptable
*cp_get_table( unsigned int codepage
);
63 extern const union cptable
*cp_enum_table( unsigned int index
);
65 extern int cp_mbstowcs( const union cptable
*table
, int flags
,
66 const char *src
, int srclen
,
67 WCHAR
*dst
, int dstlen
);
68 extern int cp_wcstombs( const union cptable
*table
, int flags
,
69 const WCHAR
*src
, int srclen
,
70 char *dst
, int dstlen
, const char *defchar
, int *used
);
71 extern int utf8_wcstombs( const WCHAR
*src
, int srclen
, char *dst
, int dstlen
);
72 extern int utf8_mbstowcs( int flags
, const char *src
, int srclen
, WCHAR
*dst
, int dstlen
);
74 extern int strcmpiW( const WCHAR
*str1
, const WCHAR
*str2
);
75 extern int strncmpiW( const WCHAR
*str1
, const WCHAR
*str2
, int n
);
76 extern WCHAR
*strstrW( const WCHAR
*str
, const WCHAR
*sub
);
77 extern long int strtolW( const WCHAR
*nptr
, WCHAR
**endptr
, int base
);
78 extern unsigned long int strtoulW( const WCHAR
*nptr
, WCHAR
**endptr
, int base
);
80 static inline int is_dbcs_leadbyte( const union cptable
*table
, unsigned char ch
)
82 return (table
->info
.char_size
== 2) && (table
->dbcs
.cp2uni_leadbytes
[ch
]);
85 static inline WCHAR
tolowerW( WCHAR ch
)
87 extern const WCHAR casemap_lower
[];
88 return ch
+ casemap_lower
[casemap_lower
[ch
>> 8] + (ch
& 0xff)];
91 static inline WCHAR
toupperW( WCHAR ch
)
93 extern const WCHAR casemap_upper
[];
94 return ch
+ casemap_upper
[casemap_upper
[ch
>> 8] + (ch
& 0xff)];
97 /* the character type contains the C1_* flags in the low 12 bits */
98 /* and the C2_* type in the high 4 bits */
99 static inline unsigned short get_char_typeW( WCHAR ch
)
101 extern const unsigned short wctype_table
[];
102 return wctype_table
[wctype_table
[ch
>> 8] + (ch
& 0xff)];
105 inline static int iscntrlW( WCHAR wc
)
107 return get_char_typeW(wc
) & C1_CNTRL
;
110 inline static int ispunctW( WCHAR wc
)
112 return get_char_typeW(wc
) & C1_PUNCT
;
115 inline static int isspaceW( WCHAR wc
)
117 return get_char_typeW(wc
) & C1_SPACE
;
120 inline static int isdigitW( WCHAR wc
)
122 return get_char_typeW(wc
) & C1_DIGIT
;
125 inline static int isxdigitW( WCHAR wc
)
127 return get_char_typeW(wc
) & C1_XDIGIT
;
130 inline static int islowerW( WCHAR wc
)
132 return get_char_typeW(wc
) & C1_LOWER
;
135 inline static int isupperW( WCHAR wc
)
137 return get_char_typeW(wc
) & C1_UPPER
;
140 inline static int isalnumW( WCHAR wc
)
142 return get_char_typeW(wc
) & (C1_ALPHA
|C1_DIGIT
|C1_LOWER
|C1_UPPER
);
145 inline static int isalphaW( WCHAR wc
)
147 return get_char_typeW(wc
) & (C1_ALPHA
|C1_LOWER
|C1_UPPER
);
150 inline static int isgraphW( WCHAR wc
)
152 return get_char_typeW(wc
) & (C1_ALPHA
|C1_PUNCT
|C1_DIGIT
|C1_LOWER
|C1_UPPER
);
155 inline static int isprintW( WCHAR wc
)
157 return get_char_typeW(wc
) & (C1_ALPHA
|C1_BLANK
|C1_PUNCT
|C1_DIGIT
|C1_LOWER
|C1_UPPER
);
160 /* some useful string manipulation routines */
162 static inline unsigned int strlenW( const WCHAR
*str
)
164 #if defined(__i386__) && defined(__GNUC__)
166 __asm__
__volatile__( "cld\n\t"
170 : "=c" (res
), "=&D" (dummy
)
171 : "0" (0xffffffff), "1" (str
), "a" (0) );
174 const WCHAR
*s
= str
;
180 static inline WCHAR
*strcpyW( WCHAR
*dst
, const WCHAR
*src
)
182 #if defined(__i386__) && defined(__GNUC__)
183 int dummy1
, dummy2
, dummy3
;
184 __asm__
__volatile__( "cld\n"
187 "testw %%ax,%%ax\n\t"
189 : "=&S" (dummy1
), "=&D" (dummy2
), "=&a" (dummy3
)
190 : "0" (src
), "1" (dst
)
194 while ((*p
++ = *src
++));
199 static inline int strcmpW( const WCHAR
*str1
, const WCHAR
*str2
)
201 while (*str1
&& (*str1
== *str2
)) { str1
++; str2
++; }
202 return *str1
- *str2
;
205 static inline int strncmpW( const WCHAR
*str1
, const WCHAR
*str2
, int n
)
207 if (n
<= 0) return 0;
208 while ((--n
> 0) && *str1
&& (*str1
== *str2
)) { str1
++; str2
++; }
209 return *str1
- *str2
;
212 static inline WCHAR
*strncpyW( WCHAR
*str1
, const WCHAR
*str2
, int n
)
215 while (n
-- > 0) if (!(*str1
++ = *str2
++)) break;
216 while (n
-- > 0) *str1
++ = 0;
220 static inline WCHAR
*strcatW( WCHAR
*dst
, const WCHAR
*src
)
222 strcpyW( dst
+ strlenW(dst
), src
);
226 static inline WCHAR
*strchrW( const WCHAR
*str
, WCHAR ch
)
228 for ( ; *str
; str
++) if (*str
== ch
) return (WCHAR
*)str
;
232 static inline WCHAR
*strrchrW( const WCHAR
*str
, WCHAR ch
)
235 for ( ; *str
; str
++) if (*str
== ch
) ret
= (WCHAR
*)str
;
239 static inline WCHAR
*strlwrW( WCHAR
*str
)
242 while ((*str
= tolowerW(*str
))) str
++;
246 static inline WCHAR
*struprW( WCHAR
*str
)
249 while ((*str
= toupperW(*str
))) str
++;
253 static inline long int atolW( const WCHAR
*str
)
255 return strtolW( str
, (WCHAR
**)0, 10 );
258 static inline int atoiW( const WCHAR
*str
)
260 return (int)atolW( str
);
263 #endif /* __WINE_UNICODE_H */