lgl/c-ctype.h

   1 /* Character handling in C locale.
   2
   3    These functions work like the corresponding functions in <ctype.h>,
   4    except that they have the C (POSIX) locale hardwired, whereas the
   5    <ctype.h> functions' behaviour depends on the current locale set via
   6    setlocale.
   7
   8    Copyright (C) 2000-2003, 2006 Free Software Foundation, Inc.
   9
  10 This program is free software; you can redistribute it and/or modify
  11 it under the terms of the GNU Lesser General Public License as published by
  12 the Free Software Foundation; either version 2.1 of the License, or
  13 (at your option) any later version.
  14
  15 This program is distributed in the hope that it will be useful,
  16 but WITHOUT ANY WARRANTY; without even the implied warranty of
  17 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  18 GNU Lesser General Public License for more details.
  19
  20 You should have received a copy of the GNU Lesser General Public License
  21 along with this program; if not, write to the Free Software Foundation,
  22 Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.  */
  23
  24 #ifndef C_CTYPE_H
  25 #define C_CTYPE_H
  26
  27 #include <stdbool.h>
  28
  29
  30 #ifdef __cplusplus
  31 extern "C" {
  32 #endif
  33
  34
  35 /* The functions defined in this file assume the "C" locale and a character
  36    set without diacritics (ASCII-US or EBCDIC-US or something like that).
  37    Even if the "C" locale on a particular system is an extension of the ASCII
  38    character set (like on BeOS, where it is UTF-8, or on AmigaOS, where it
  39    is ISO-8859-1), the functions in this file recognize only the ASCII
  40    characters.  */
  41
  42
  43 /* Check whether the ASCII optimizations apply. */
  44
  45 /* ANSI C89 (and ISO C99 5.2.1.3 too) already guarantees that
  46    '0', '1', ..., '9' have consecutive integer values.  */
     /* Hence this flag is defined unconditionally, unlike the letter-range
        flags, which are only defined after a compile-time check.  */
  47 #define C_CTYPE_CONSECUTIVE_DIGITS 1
  48
  49 #if ('A' <= 'Z') \
  50     && ('A' + 1 == 'B') && ('B' + 1 == 'C') && ('C' + 1 == 'D') \
  51     && ('D' + 1 == 'E') && ('E' + 1 == 'F') && ('F' + 1 == 'G') \
  52     && ('G' + 1 == 'H') && ('H' + 1 == 'I') && ('I' + 1 == 'J') \
  53     && ('J' + 1 == 'K') && ('K' + 1 == 'L') && ('L' + 1 == 'M') \
  54     && ('M' + 1 == 'N') && ('N' + 1 == 'O') && ('O' + 1 == 'P') \
  55     && ('P' + 1 == 'Q') && ('Q' + 1 == 'R') && ('R' + 1 == 'S') \
  56     && ('S' + 1 == 'T') && ('T' + 1 == 'U') && ('U' + 1 == 'V') \
  57     && ('V' + 1 == 'W') && ('W' + 1 == 'X') && ('X' + 1 == 'Y') \
  58     && ('Y' + 1 == 'Z')
     /* Every adjacent pair of uppercase letters differs by exactly 1, so
        'A'..'Z' form one contiguous range and a simple range test suffices.
        When the check fails the flag stays undefined, and later `#if' tests
        of it evaluate it as 0.  */
  59 #define C_CTYPE_CONSECUTIVE_UPPERCASE 1
  60 #endif
  61
  62 #if ('a' <= 'z') \
  63     && ('a' + 1 == 'b') && ('b' + 1 == 'c') && ('c' + 1 == 'd') \
  64     && ('d' + 1 == 'e') && ('e' + 1 == 'f') && ('f' + 1 == 'g') \
  65     && ('g' + 1 == 'h') && ('h' + 1 == 'i') && ('i' + 1 == 'j') \
  66     && ('j' + 1 == 'k') && ('k' + 1 == 'l') && ('l' + 1 == 'm') \
  67     && ('m' + 1 == 'n') && ('n' + 1 == 'o') && ('o' + 1 == 'p') \
  68     && ('p' + 1 == 'q') && ('q' + 1 == 'r') && ('r' + 1 == 's') \
  69     && ('s' + 1 == 't') && ('t' + 1 == 'u') && ('u' + 1 == 'v') \
  70     && ('v' + 1 == 'w') && ('w' + 1 == 'x') && ('x' + 1 == 'y') \
  71     && ('y' + 1 == 'z')
     /* Every adjacent pair of lowercase letters differs by exactly 1, so
        'a'..'z' form one contiguous range and a simple range test suffices.
        When the check fails the flag stays undefined, and later `#if' tests
        of it evaluate it as 0.  */
  72 #define C_CTYPE_CONSECUTIVE_LOWERCASE 1
  73 #endif
  74
  75 #if (' ' == 32) && ('!' == 33) && ('"' == 34) && ('#' == 35) \
  76     && ('%' == 37) && ('&' == 38) && ('\'' == 39) && ('(' == 40) \
  77     && (')' == 41) && ('*' == 42) && ('+' == 43) && (',' == 44) \
  78     && ('-' == 45) && ('.' == 46) && ('/' == 47) && ('0' == 48) \
  79     && ('1' == 49) && ('2' == 50) && ('3' == 51) && ('4' == 52) \
  80     && ('5' == 53) && ('6' == 54) && ('7' == 55) && ('8' == 56) \
  81     && ('9' == 57) && (':' == 58) && (';' == 59) && ('<' == 60) \
  82     && ('=' == 61) && ('>' == 62) && ('?' == 63) && ('A' == 65) \
  83     && ('B' == 66) && ('C' == 67) && ('D' == 68) && ('E' == 69) \
  84     && ('F' == 70) && ('G' == 71) && ('H' == 72) && ('I' == 73) \
  85     && ('J' == 74) && ('K' == 75) && ('L' == 76) && ('M' == 77) \
  86     && ('N' == 78) && ('O' == 79) && ('P' == 80) && ('Q' == 81) \
  87     && ('R' == 82) && ('S' == 83) && ('T' == 84) && ('U' == 85) \
  88     && ('V' == 86) && ('W' == 87) && ('X' == 88) && ('Y' == 89) \
  89     && ('Z' == 90) && ('[' == 91) && ('\\' == 92) && (']' == 93) \
  90     && ('^' == 94) && ('_' == 95) && ('a' == 97) && ('b' == 98) \
  91     && ('c' == 99) && ('d' == 100) && ('e' == 101) && ('f' == 102) \
  92     && ('g' == 103) && ('h' == 104) && ('i' == 105) && ('j' == 106) \
  93     && ('k' == 107) && ('l' == 108) && ('m' == 109) && ('n' == 110) \
  94     && ('o' == 111) && ('p' == 112) && ('q' == 113) && ('r' == 114) \
  95     && ('s' == 115) && ('t' == 116) && ('u' == 117) && ('v' == 118) \
  96     && ('w' == 119) && ('x' == 120) && ('y' == 121) && ('z' == 122) \
  97     && ('{' == 123) && ('|' == 124) && ('}' == 125) && ('~' == 126)
  98 /* The character set is ASCII or one of its variants or extensions, not EBCDIC.
  99    Testing the value of '\n' and '\r' is not relevant.  */
     /* The test covers codes 32..126 except 36, 64 and 96, which are skipped;
        presumably because '$', '@' and '`' are not part of the basic C
        character set and so cannot be written portably in a `#if'.  */
 100 #define C_CTYPE_ASCII 1
 101 #endif
 102
 103
 104 /* Function declarations.
        Each takes the character as an int.  The predicates return bool; the
        two case converters return int.  The trailing notes summarise the macro
        forms defined later in this header; the out-of-line definitions are not
        visible here and are presumed to agree with them.  */
 105
 106 extern bool c_isascii (int c); /* not locale dependent */
 107
 108 extern bool c_isalnum (int c);  /* '0'..'9', 'A'..'Z' or 'a'..'z' */
 109 extern bool c_isalpha (int c);  /* 'A'..'Z' or 'a'..'z' */
 110 extern bool c_isblank (int c);  /* ' ' or '\t' */
 111 extern bool c_iscntrl (int c);  /* ASCII: 0x00..0x1f or 0x7f */
 112 extern bool c_isdigit (int c);  /* '0'..'9' */
 113 extern bool c_islower (int c);  /* 'a'..'z' */
 114 extern bool c_isgraph (int c);  /* ASCII: '!'..'~' */
 115 extern bool c_isprint (int c);  /* ASCII: ' '..'~' */
 116 extern bool c_ispunct (int c);  /* graphic but not alphanumeric */
 117 extern bool c_isspace (int c);  /* ' ', '\t', '\n', '\v', '\f' or '\r' */
 118 extern bool c_isupper (int c);  /* 'A'..'Z' */
 119 extern bool c_isxdigit (int c); /* '0'..'9', 'A'..'F' or 'a'..'f' */
 120
 121 extern int c_tolower (int c);   /* 'A'..'Z' -> 'a'..'z', others unchanged */
 122 extern int c_toupper (int c);   /* 'a'..'z' -> 'A'..'Z', others unchanged */
 123
 124
 125 #if defined __GNUC__ && defined __OPTIMIZE__ && !defined __OPTIMIZE_SIZE__ && !defined NO_C_CTYPE_MACROS
 126
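 127 /* Macro versions of the functions declared above, written as GNU C
        statement expressions.  Some of them use ASCII-specific shortcuts.  */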
 128
 129 #undef c_isascii
     /* Yields 1 if C lies in 0x00..0x7f, else 0.  The argument is copied into
        a local first, so it is evaluated exactly once.  */
 130 #define c_isascii(c) \
 131   ({ int __c = (c); \
 132      (__c >= 0x00 && __c <= 0x7f); \
 133    })
 134
 135 #if C_CTYPE_CONSECUTIVE_DIGITS \
 136     && C_CTYPE_CONSECUTIVE_UPPERCASE && C_CTYPE_CONSECUTIVE_LOWERCASE
     /* The macro form needs digits and both letter cases to be contiguous
        ranges; when they are not, no macro is defined here.  */
 137 #if C_CTYPE_ASCII
     /* ASCII: 'A' is 65 and 'a' is 97, so the two cases differ only in bit
        0x20.  Clearing that bit folds 'a'..'z' onto 'A'..'Z', letting one
        range test cover both cases.  */
 138 #undef c_isalnum
 139 #define c_isalnum(c) \
 140   ({ int __c = (c); \
 141      ((__c >= '0' && __c <= '9') \
 142       || ((__c & ~0x20) >= 'A' && (__c & ~0x20) <= 'Z')); \
 143    })
 144 #else
     /* Contiguous but not ASCII: test the three ranges separately.  */
 145 #undef c_isalnum
 146 #define c_isalnum(c) \
 147   ({ int __c = (c); \
 148      ((__c >= '0' && __c <= '9') \
 149       || (__c >= 'A' && __c <= 'Z') \
 150       || (__c >= 'a' && __c <= 'z')); \
 151    })
 152 #endif
 153 #endif
 154
 155 #if C_CTYPE_CONSECUTIVE_UPPERCASE && C_CTYPE_CONSECUTIVE_LOWERCASE
     /* The macro form needs both letter cases to be contiguous ranges.  */
 156 #if C_CTYPE_ASCII
     /* ASCII: clearing bit 0x20 folds 'a'..'z' (97..122) onto 'A'..'Z'
        (65..90), so a single range test recognises both cases.  */
 157 #undef c_isalpha
 158 #define c_isalpha(c) \
 159   ({ int __c = (c); \
 160      ((__c & ~0x20) >= 'A' && (__c & ~0x20) <= 'Z'); \
 161    })
 162 #else
     /* Contiguous but not ASCII: test each case range separately.  */
 163 #undef c_isalpha
 164 #define c_isalpha(c) \
 165   ({ int __c = (c); \
 166      ((__c >= 'A' && __c <= 'Z') || (__c >= 'a' && __c <= 'z')); \
 167    })
 168 #endif
 169 #endif
 170
 171 #undef c_isblank
     /* Yields 1 if C is a space or a horizontal tab, else 0.  Defined without
        any character-set condition because it compares against the character
        constants directly.  C is evaluated exactly once.  */
 172 #define c_isblank(c) \
 173   ({ int __c = (c); \
 174      (__c == ' ' || __c == '\t'); \
 175    })
 176
 177 #if C_CTYPE_ASCII
 178 #undef c_iscntrl
     /* ASCII only.  (C & ~0x1f) == 0 means no bit above the low five is set,
        i.e. C is in 0x00..0x1f; 0x7f is accepted as the one control code
        outside that range.  C is evaluated exactly once.  */
 179 #define c_iscntrl(c) \
 180   ({ int __c = (c); \
 181      ((__c & ~0x1f) == 0 || __c == 0x7f); \
 182    })
 183 #endif
 184
 185 #if C_CTYPE_CONSECUTIVE_DIGITS
 186 #undef c_isdigit
     /* Yields 1 if C is in '0'..'9', else 0.  A range test is valid because
        the digits are contiguous.  C is evaluated exactly once.  */
 187 #define c_isdigit(c) \
 188   ({ int __c = (c); \
 189      (__c >= '0' && __c <= '9'); \
 190    })
 191 #endif
 192
 193 #if C_CTYPE_CONSECUTIVE_LOWERCASE
 194 #undef c_islower
     /* Yields 1 if C is in 'a'..'z', else 0.  Only defined when the lowercase
        letters are contiguous.  C is evaluated exactly once.  */
 195 #define c_islower(c) \
 196   ({ int __c = (c); \
 197      (__c >= 'a' && __c <= 'z'); \
 198    })
 199 #endif
 200
 201 #if C_CTYPE_ASCII
 202 #undef c_isgraph
     /* ASCII only.  Yields 1 if C is in '!'..'~' (33..126), i.e. printable
        and not the space character; else 0.  C is evaluated exactly once.  */
 203 #define c_isgraph(c) \
 204   ({ int __c = (c); \
 205      (__c >= '!' && __c <= '~'); \
 206    })
 207 #endif
 208
 209 #if C_CTYPE_ASCII
 210 #undef c_isprint
     /* ASCII only.  Yields 1 if C is in ' '..'~' (32..126), else 0.  Differs
        from c_isgraph only in also accepting the space character.  C is
        evaluated exactly once.  */
 211 #define c_isprint(c) \
 212   ({ int __c = (c); \
 213      (__c >= ' ' && __c <= '~'); \
 214    })
 215 #endif
 216
 217 #if C_CTYPE_ASCII
 218 #undef c_ispunct
     /* ASCII only.  Yields 1 if C is graphic but not alphanumeric, else 0.
        The temporary is named _c rather than __c on purpose: the c_isgraph
        and c_isalnum macros expand to `int __c = (argument)', so passing a
        variable called __c would make that declaration initialise itself
        from its own indeterminate value.  */
 219 #define c_ispunct(c) \
 220   ({ int _c = (c); \
 221      (c_isgraph (_c) && ! c_isalnum (_c)); \
 222    })
 223 #endif
 224
 225 #undef c_isspace
     /* Yields 1 if C is space, tab, newline, vertical tab, form feed or
        carriage return, else 0.  Defined without any character-set condition
        because it compares against the character constants directly.  C is
        evaluated exactly once.  */
 226 #define c_isspace(c) \
 227   ({ int __c = (c); \
 228      (__c == ' ' || __c == '\t' \
 229       || __c == '\n' || __c == '\v' || __c == '\f' || __c == '\r'); \
 230    })
 231
 232 #if C_CTYPE_CONSECUTIVE_UPPERCASE
 233 #undef c_isupper
     /* Yields 1 if C is in 'A'..'Z', else 0.  Only defined when the uppercase
        letters are contiguous.  C is evaluated exactly once.  */
 234 #define c_isupper(c) \
 235   ({ int __c = (c); \
 236      (__c >= 'A' && __c <= 'Z'); \
 237    })
 238 #endif
 239
 240 #if C_CTYPE_CONSECUTIVE_DIGITS \
 241     && C_CTYPE_CONSECUTIVE_UPPERCASE && C_CTYPE_CONSECUTIVE_LOWERCASE
     /* The macro form needs digits and both letter cases to be contiguous,
        so that 'A'..'F' and 'a'..'f' are valid range tests.  */
 242 #if C_CTYPE_ASCII
     /* ASCII: clearing bit 0x20 folds 'a'..'f' onto 'A'..'F', so one range
        test recognises the hexadecimal letters in either case.  */
 243 #undef c_isxdigit
 244 #define c_isxdigit(c) \
 245   ({ int __c = (c); \
 246      ((__c >= '0' && __c <= '9') \
 247       || ((__c & ~0x20) >= 'A' && (__c & ~0x20) <= 'F')); \
 248    })
 249 #else
     /* Contiguous but not ASCII: test the three ranges separately.  */
 250 #undef c_isxdigit
 251 #define c_isxdigit(c) \
 252   ({ int __c = (c); \
 253      ((__c >= '0' && __c <= '9') \
 254       || (__c >= 'A' && __c <= 'F') \
 255       || (__c >= 'a' && __c <= 'f')); \
 256    })
 257 #endif
 258 #endif
 259
 260 #if C_CTYPE_CONSECUTIVE_UPPERCASE && C_CTYPE_CONSECUTIVE_LOWERCASE
     /* Both converters need both letter cases to be contiguous, so that the
        offset of a letter from 'A' equals the offset of its counterpart
        from 'a'.  */
 261 #undef c_tolower
     /* Maps 'A'..'Z' to the corresponding lowercase letter; any other value
        is returned unchanged.  C is evaluated exactly once.  */
 262 #define c_tolower(c) \
 263   ({ int __c = (c); \
 264      (__c >= 'A' && __c <= 'Z' ? __c - 'A' + 'a' : __c); \
 265    })
 266 #undef c_toupper
     /* Maps 'a'..'z' to the corresponding uppercase letter; any other value
        is returned unchanged.  C is evaluated exactly once.  */
 267 #define c_toupper(c) \
 268   ({ int __c = (c); \
 269      (__c >= 'a' && __c <= 'z' ? __c - 'a' + 'A' : __c); \
 270    })
 271 #endif
 272
 273 #endif /* optimizing for speed */
 274
 275
 276 #ifdef __cplusplus
 277 }
 278 #endif
 279
 280 #endif /* C_CTYPE_H */