1 /* Copyright (C) 1991,92,93,95,96,97,98,99,2001,2002,2004,2007-2009,2011,2012
2 Free Software Foundation, Inc.
3 This file is part of the GNU C Library.
5 The GNU C Library is free software; you can redistribute it and/or
6 modify it under the terms of the GNU Lesser General Public
7 License as published by the Free Software Foundation; either
8 version 2.1 of the License, or (at your option) any later version.
10 The GNU C Library is distributed in the hope that it will be useful,
11 but WITHOUT ANY WARRANTY; without even the implied warranty of
12 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 Lesser General Public License for more details.
15 You should have received a copy of the GNU Lesser General Public
16 License along with the GNU C Library; if not, see
17 <http://www.gnu.org/licenses/>. */
20 * ISO C99 Standard 7.4: Character handling <ctype.h>
27 #include <bits/types.h>
32 /* These are all the characteristics of characters.
33 If there get to be more than 16 distinct characteristics,
34 many things must be changed that use `unsigned short int's.
36 The characteristics are stored always in network byte order (big
37 endian). We define the bit value interpretations here dependent on the
38 machine's byte order. */
41 # if __BYTE_ORDER == __BIG_ENDIAN
/* Big endian: the mask for characteristic BIT is simply bit BIT.  */
42 # define _ISbit(bit) (1 << (bit))
43 # else /* __BYTE_ORDER == __LITTLE_ENDIAN */
/* Little endian: bits 0-7 are moved up by 8 and bits 8-15 down by 8,
   i.e. the two bytes of the 16-bit mask are exchanged, so that the
   mask lines up with table entries stored in big-endian order.  */
44 # define _ISbit(bit) ((bit) < 8 ? ((1 << (bit)) << 8) : ((1 << (bit)) >> 8))
49 _ISupper
= _ISbit (0), /* UPPERCASE. */
50 _ISlower
= _ISbit (1), /* lowercase. */
51 _ISalpha
= _ISbit (2), /* Alphabetic. */
52 _ISdigit
= _ISbit (3), /* Numeric. */
53 _ISxdigit
= _ISbit (4), /* Hexadecimal numeric. */
54 _ISspace
= _ISbit (5), /* Whitespace. */
55 _ISprint
= _ISbit (6), /* Printing. */
56 _ISgraph
= _ISbit (7), /* Graphical. */
57 _ISblank
= _ISbit (8), /* Blank (usually SPC and TAB). */
58 _IScntrl
= _ISbit (9), /* Control character. */
59 _ISpunct
= _ISbit (10), /* Punctuation. */
60 _ISalnum
= _ISbit (11) /* Alphanumeric. */
64 /* These are defined in ctype-info.c.
65 The declarations here must match those in localeinfo.h.
67 In the thread-specific locale model (see `uselocale' in <locale.h>)
68 we cannot use global variables for these as was done in the past.
69 Instead, the following accessor functions return the address of
70 each variable, which is local to the current thread if multithreaded.
72 These point into arrays of 384, so they can be indexed by any `unsigned
73 char' value [0,255]; by EOF (-1); or by any `signed char' value
74 [-128,-1). ISO C requires that the ctype functions work for `unsigned
75 char' values and for EOF; we also support negative `signed char' values
76 for broken old programs. The case conversion arrays are of `int's
77 rather than `unsigned char's because tolower (EOF) must be EOF, which
78 doesn't fit into an `unsigned char'. But today more important is that
79 the arrays are also used for multi-byte character sets. */
/* Address of the pointer to the character-class table; its
   `unsigned short int' entries are tested against the _IS* masks.  */
80 extern const unsigned short int **__ctype_b_loc (void)
81 __THROW
__attribute__ ((__const__
));
/* Address of the pointer to the lowercase conversion table.  */
82 extern const __int32_t
**__ctype_tolower_loc (void)
83 __THROW
__attribute__ ((__const__
));
/* Address of the pointer to the uppercase conversion table.  */
84 extern const __int32_t
**__ctype_toupper_loc (void)
85 __THROW
__attribute__ ((__const__
));
/* Nonzero iff C has at least one of the characteristics in the mask
   TYPE: index the table obtained through __ctype_b_loc with C and
   test the TYPE bits.  C is evaluated exactly once.  */
89 # define __isctype(c, type) \
90 ((*__ctype_b_loc ())[(int) (c)] & (unsigned short int) type)
91 #elif defined __USE_EXTERN_INLINES
92 # define __isctype_f(type) \
94 is##type (int __c) __THROW \
96 return (*__ctype_b_loc ())[(int) (__c)] & (unsigned short int) _IS##type; \
100 #define __isascii(c) (((c) & ~0x7f) == 0) /* If C is a 7 bit value. */
101 #define __toascii(c) ((c) & 0x7f) /* Mask off high bits. */
/* Declare the external function NAME, taking and returning `int'.  */
103 #define __exctype(name) extern int name (int) __THROW
105 __BEGIN_NAMESPACE_STD
107 /* The following names are all functions:
108 int isCHARACTERISTIC(int c);
109 which return nonzero iff C has CHARACTERISTIC.
110 For the meaning of the characteristic names, see the `enum' above. */
121 __exctype (isxdigit
);
124 /* Return the lowercase version of C. */
125 extern int tolower (int __c
) __THROW
;
127 /* Return the uppercase version of C. */
128 extern int toupper (int __c
) __THROW
;
133 /* ISO C99 introduced one new function. */
135 __BEGIN_NAMESPACE_C99
143 /* Test C for a set of character classes according to MASK. */
144 extern int isctype (int __c
, int __mask
) __THROW
;
147 #if defined __USE_SVID || defined __USE_MISC || defined __USE_XOPEN
149 /* Return nonzero iff C is in the ASCII set
150 (i.e., is no more than 7 bits wide). */
151 extern int isascii (int __c
) __THROW
;
153 /* Return the part of C that is in the ASCII set
154 (i.e., the low-order 7 bits of C). */
155 extern int toascii (int __c
) __THROW
;
157 /* These are the same as `toupper' and `tolower' except that they do not
158 check the argument for being in the range of a `char'. */
159 __exctype (_toupper
);
160 __exctype (_tolower
);
161 #endif /* Use SVID, misc, or X/Open. */
163 /* This code is needed for the optimized mapping functions. */
164 #define __tobody(c, f, a, args) \
167 if (sizeof (c) > 1) \
169 if (__builtin_constant_p (c)) \
172 __res = __c < -128 || __c > 255 ? __c : (a)[__c]; \
178 __res = (a)[(int) (c)]; \
181 #if !defined __NO_CTYPE
197 # elif defined __isctype
/* Macro forms of the classification functions: each one tests the
   matching _IS* mask for C through __isctype.  */
198 # define isalnum(c) __isctype((c), _ISalnum)
199 # define isalpha(c) __isctype((c), _ISalpha)
200 # define iscntrl(c) __isctype((c), _IScntrl)
201 # define isdigit(c) __isctype((c), _ISdigit)
202 # define islower(c) __isctype((c), _ISlower)
203 # define isgraph(c) __isctype((c), _ISgraph)
204 # define isprint(c) __isctype((c), _ISprint)
205 # define ispunct(c) __isctype((c), _ISpunct)
206 # define isspace(c) __isctype((c), _ISspace)
207 # define isupper(c) __isctype((c), _ISupper)
208 # define isxdigit(c) __isctype((c), _ISxdigit)
210 # define isblank(c) __isctype((c), _ISblank)
214 # ifdef __USE_EXTERN_INLINES
216 __NTH (tolower (int __c
))
218 return __c
>= -128 && __c
< 256 ? (*__ctype_tolower_loc ())[__c
] : __c
;
222 __NTH (toupper (int __c
))
224 return __c
>= -128 && __c
< 256 ? (*__ctype_toupper_loc ())[__c
] : __c
;
/* When optimizing with GCC 2 or later in C (not C++), expand tolower
   and toupper through __tobody, handing it the table pointer obtained
   from __ctype_tolower_loc or __ctype_toupper_loc respectively.  */
228 # if __GNUC__ >= 2 && defined __OPTIMIZE__ && !defined __cplusplus
229 # define tolower(c) __tobody (c, tolower, *__ctype_tolower_loc (), (c))
230 # define toupper(c) __tobody (c, toupper, *__ctype_toupper_loc (), (c))
231 # endif /* Optimizing gcc */
233 # if defined __USE_SVID || defined __USE_MISC || defined __USE_XOPEN
/* Macro forms of isascii and toascii.  */
234 # define isascii(c) __isascii (c)
235 # define toascii(c) __toascii (c)
/* Unchecked case conversions: the conversion table is indexed with C
   directly, with no range check on C.  */
237 # define _tolower(c) ((int) (*__ctype_tolower_loc ())[(int) (c)])
238 # define _toupper(c) ((int) (*__ctype_toupper_loc ())[(int) (c)])
241 #endif /* Not __NO_CTYPE. */
244 #ifdef __USE_XOPEN2K8
245 /* The concept of one static locale per category is not very well
246 thought out. Many applications will need to process their data using
247 information from several different locales. Another application is
248 the implementation of the internationalization handling in the
249 upcoming ISO C++ standard library. To support this, another set of
250 the functions using locale data exists, each taking an additional argument.
253 Attention: all these functions are *not* standardized in any form.
254 This is a proof-of-concept implementation. */
256 /* Structure for reentrant locale using functions. This is an
257 (almost) opaque type for the user level programs. */
258 # include <xlocale.h>
260 /* These definitions are similar to the ones above but all functions
261 take as an argument a handle for the locale which shall be used. */
/* Nonzero iff C has at least one of the characteristics in the mask
   TYPE according to the __ctype_b table of LOCALE.  */
262 # define __isctype_l(c, type, locale) \
263 ((locale)->__ctype_b[(int) (c)] & (unsigned short int) type)
/* Declare the external function NAME, taking an `int' and a locale
   handle and returning `int'.  */
265 # define __exctype_l(name) \
266 extern int name (int, __locale_t) __THROW
268 /* The following names are all functions:
269 int isCHARACTERISTIC(int c, locale_t locale);
270 which return nonzero iff C has CHARACTERISTIC.
271 For the meaning of the characteristic names, see the `enum' above. */
272 __exctype_l (isalnum_l
);
273 __exctype_l (isalpha_l
);
274 __exctype_l (iscntrl_l
);
275 __exctype_l (isdigit_l
);
276 __exctype_l (islower_l
);
277 __exctype_l (isgraph_l
);
278 __exctype_l (isprint_l
);
279 __exctype_l (ispunct_l
);
280 __exctype_l (isspace_l
);
281 __exctype_l (isupper_l
);
282 __exctype_l (isxdigit_l
);
284 __exctype_l (isblank_l
);
287 /* Return the lowercase version of C in locale L. */
288 extern int __tolower_l (int __c
, __locale_t __l
) __THROW
;
289 extern int tolower_l (int __c
, __locale_t __l
) __THROW
;
291 /* Return the uppercase version of C in locale L. */
292 extern int __toupper_l (int __c
, __locale_t __l
) __THROW
;
293 extern int toupper_l (int __c
, __locale_t __l
) __THROW
;
/* When optimizing with GCC 2 or later in C (not C++), expand the
   locale-taking case conversions through __tobody, using the
   __ctype_tolower and __ctype_toupper tables of LOCALE.  tolower_l and
   toupper_l simply forward to the double-underscore forms.  */
295 # if __GNUC__ >= 2 && defined __OPTIMIZE__ && !defined __cplusplus
296 # define __tolower_l(c, locale) \
297 __tobody (c, __tolower_l, (locale)->__ctype_tolower, (c, locale))
298 # define __toupper_l(c, locale) \
299 __tobody (c, __toupper_l, (locale)->__ctype_toupper, (c, locale))
300 # define tolower_l(c, locale) __tolower_l ((c), (locale))
301 # define toupper_l(c, locale) __toupper_l ((c), (locale))
302 # endif /* Optimizing gcc */
/* Macro forms of the locale-taking classification tests: each one
   tests the matching _IS* mask for C in locale L through __isctype_l.  */
306 # define __isalnum_l(c,l) __isctype_l((c), _ISalnum, (l))
307 # define __isalpha_l(c,l) __isctype_l((c), _ISalpha, (l))
308 # define __iscntrl_l(c,l) __isctype_l((c), _IScntrl, (l))
309 # define __isdigit_l(c,l) __isctype_l((c), _ISdigit, (l))
310 # define __islower_l(c,l) __isctype_l((c), _ISlower, (l))
311 # define __isgraph_l(c,l) __isctype_l((c), _ISgraph, (l))
312 # define __isprint_l(c,l) __isctype_l((c), _ISprint, (l))
313 # define __ispunct_l(c,l) __isctype_l((c), _ISpunct, (l))
314 # define __isspace_l(c,l) __isctype_l((c), _ISspace, (l))
315 # define __isupper_l(c,l) __isctype_l((c), _ISupper, (l))
316 # define __isxdigit_l(c,l) __isctype_l((c), _ISxdigit, (l))
318 # define __isblank_l(c,l) __isctype_l((c), _ISblank, (l))
320 # if defined __USE_SVID || defined __USE_MISC
/* The ASCII tests do not consult the locale: L is evaluated by the
   comma operator and its value discarded, and the result is that of
   the plain __isascii / __toascii macro applied to C.  */
321 # define __isascii_l(c,l) ((l), __isascii (c))
322 # define __toascii_l(c,l) ((l), __toascii (c))
/* Public names for the locale-taking tests; each forwards to the
   double-underscore macro of the same name.  */
325 # define isalnum_l(c,l) __isalnum_l ((c), (l))
326 # define isalpha_l(c,l) __isalpha_l ((c), (l))
327 # define iscntrl_l(c,l) __iscntrl_l ((c), (l))
328 # define isdigit_l(c,l) __isdigit_l ((c), (l))
329 # define islower_l(c,l) __islower_l ((c), (l))
330 # define isgraph_l(c,l) __isgraph_l ((c), (l))
331 # define isprint_l(c,l) __isprint_l ((c), (l))
332 # define ispunct_l(c,l) __ispunct_l ((c), (l))
333 # define isspace_l(c,l) __isspace_l ((c), (l))
334 # define isupper_l(c,l) __isupper_l ((c), (l))
335 # define isxdigit_l(c,l) __isxdigit_l ((c), (l))
337 # define isblank_l(c,l) __isblank_l ((c), (l))
339 # if defined __USE_SVID || defined __USE_MISC
/* Likewise for the ASCII helpers.  */
340 # define isascii_l(c,l) __isascii_l ((c), (l))
341 # define toascii_l(c,l) __toascii_l ((c), (l))
344 # endif /* Not __NO_CTYPE. */
346 #endif /* Use POSIX 2008. */