Lib/locale.py

   1 """ Locale support.
   2
   3     The module provides low-level access to the C lib's locale APIs
   4     and adds high level number formatting APIs as well as a locale
   5     aliasing engine to complement these.
   6
   7     The aliasing engine includes support for many commonly used locale
   8     names and maps them to values suitable for passing to the C lib's
   9     setlocale() function. It also includes default encodings for all
  10     supported locale names.
  11
  12 """
  13
  14 import sys
  15 import encodings
  16 import encodings.aliases
  17 import re
  18 import operator
  19 import functools
  20
  21 # Try importing the _locale module.
  22 #
  23 # If this fails, fall back on a basic 'C' locale emulation.
  24
# Yuck:  LC_MESSAGES is non-standard:  can't tell whether it exists before
# trying the import.  So __all__ is also fiddled at the end of the file.
#
# Names exported by "from locale import *".  LC_MESSAGES is deliberately
# not listed here, for the reason given above.
__all__ = ["getlocale", "getdefaultlocale", "getpreferredencoding", "Error",
           "setlocale", "resetlocale", "localeconv", "strcoll", "strxfrm",
           "str", "atof", "atoi", "format", "format_string", "currency",
           "normalize", "LC_CTYPE", "LC_COLLATE", "LC_TIME", "LC_MONETARY",
           "LC_NUMERIC", "LC_ALL", "CHAR_MAX"]
  32
  33 try:
  34
  35     from _locale import *
  36
  37 except ImportError:
  38
  39     # Locale emulation
  40
  41     CHAR_MAX = 127
  42     LC_ALL = 6
  43     LC_COLLATE = 3
  44     LC_CTYPE = 0
  45     LC_MESSAGES = 5
  46     LC_MONETARY = 4
  47     LC_NUMERIC = 1
  48     LC_TIME = 2
  49     Error = ValueError
  50
  51     def localeconv():
  52         """ localeconv() -> dict.
  53             Returns numeric and monetary locale-specific parameters.
  54         """
  55         # 'C' locale default values
  56         return {'grouping': [127],
  57                 'currency_symbol': '',
  58                 'n_sign_posn': 127,
  59                 'p_cs_precedes': 127,
  60                 'n_cs_precedes': 127,
  61                 'mon_grouping': [],
  62                 'n_sep_by_space': 127,
  63                 'decimal_point': '.',
  64                 'negative_sign': '',
  65                 'positive_sign': '',
  66                 'p_sep_by_space': 127,
  67                 'int_curr_symbol': '',
  68                 'p_sign_posn': 127,
  69                 'thousands_sep': '',
  70                 'mon_thousands_sep': '',
  71                 'frac_digits': 127,
  72                 'mon_decimal_point': '',
  73                 'int_frac_digits': 127}
  74
  75     def setlocale(category, value=None):
  76         """ setlocale(integer,string=None) -> string.
  77             Activates/queries locale processing.
  78         """
  79         if value not in (None, '', 'C'):
  80             raise Error, '_locale emulation only supports "C" locale'
  81         return 'C'
  82
  83     def strcoll(a,b):
  84         """ strcoll(string,string) -> int.
  85             Compares two strings according to the locale.
  86         """
  87         return cmp(a,b)
  88
  89     def strxfrm(s):
  90         """ strxfrm(string) -> string.
  91             Returns a string that behaves for cmp locale-aware.
  92         """
  93         return s
  94
  95
  96 _localeconv = localeconv
  97
  98 # With this dict, you can override some items of localeconv's return value.
  99 # This is useful for testing purposes.
 100 _override_localeconv = {}
 101
 102 @functools.wraps(_localeconv)
 103 def localeconv():
 104     d = _localeconv()
 105     if _override_localeconv:
 106         d.update(_override_localeconv)
 107     return d
 108
 109
 110 ### Number formatting APIs
 111
 112 # Author: Martin von Loewis
 113 # improved by Georg Brandl
 114
 115 # Iterate over grouping intervals
 116 def _grouping_intervals(grouping):
 117     last_interval = None
 118     for interval in grouping:
 119         # if grouping is -1, we are done
 120         if interval == CHAR_MAX:
 121             return
 122         # 0: re-use last group ad infinitum
 123         if interval == 0:
 124             if last_interval is None:
 125                 raise ValueError("invalid grouping")
 126             while True:
 127                 yield last_interval
 128         yield interval
 129         last_interval = interval
 130
 131 #perform the grouping from right to left
 132 def _group(s, monetary=False):
 133     conv = localeconv()
 134     thousands_sep = conv[monetary and 'mon_thousands_sep' or 'thousands_sep']
 135     grouping = conv[monetary and 'mon_grouping' or 'grouping']
 136     if not grouping:
 137         return (s, 0)
 138     result = ""
 139     seps = 0
 140     if s[-1] == ' ':
 141         stripped = s.rstrip()
 142         right_spaces = s[len(stripped):]
 143         s = stripped
 144     else:
 145         right_spaces = ''
 146     left_spaces = ''
 147     groups = []
 148     for interval in _grouping_intervals(grouping):
 149         if not s or s[-1] not in "0123456789":
 150             # only non-digit characters remain (sign, spaces)
 151             left_spaces = s
 152             s = ''
 153             break
 154         groups.append(s[-interval:])
 155         s = s[:-interval]
 156     if s:
 157         groups.append(s)
 158     groups.reverse()
 159     return (
 160         left_spaces + thousands_sep.join(groups) + right_spaces,
 161         len(thousands_sep) * (len(groups) - 1)
 162     )
 163
 164 # Strip a given amount of excess padding from the given string
 165 def _strip_padding(s, amount):
 166     lpos = 0
 167     while amount and s[lpos] == ' ':
 168         lpos += 1
 169         amount -= 1
 170     rpos = len(s) - 1
 171     while amount and s[rpos] == ' ':
 172         rpos -= 1
 173         amount -= 1
 174     return s[lpos:rpos+1]
 175
# Matches one %-style conversion specifier: '%', an optional "(key)"
# mapping key, optional modifiers (flags, width, precision, length;
# captured as group 'modifiers') and the conversion character.  The
# conversion character may itself be '%', so "%%" matches as well.
_percent_re = re.compile(r'%(?:\((?P<key>.*?)\))?'
                         r'(?P<modifiers>[-#0-9 +*.hlL]*?)[eEfFgGdiouxXcrs%]')
 178
 179 def format(percent, value, grouping=False, monetary=False, *additional):
 180     """Returns the locale-aware substitution of a %? specifier
 181     (percent).
 182
 183     additional is for format strings which contain one or more
 184     '*' modifiers."""
 185     # this is only for one-percent-specifier strings and this should be checked
 186     match = _percent_re.match(percent)
 187     if not match or len(match.group())!= len(percent):
 188         raise ValueError(("format() must be given exactly one %%char "
 189                          "format specifier, %s not valid") % repr(percent))
 190     return _format(percent, value, grouping, monetary, *additional)
 191
 192 def _format(percent, value, grouping=False, monetary=False, *additional):
 193     if additional:
 194         formatted = percent % ((value,) + additional)
 195     else:
 196         formatted = percent % value
 197     # floats and decimal ints need special action!
 198     if percent[-1] in 'eEfFgG':
 199         seps = 0
 200         parts = formatted.split('.')
 201         if grouping:
 202             parts[0], seps = _group(parts[0], monetary=monetary)
 203         decimal_point = localeconv()[monetary and 'mon_decimal_point'
 204                                               or 'decimal_point']
 205         formatted = decimal_point.join(parts)
 206         if seps:
 207             formatted = _strip_padding(formatted, seps)
 208     elif percent[-1] in 'diu':
 209         seps = 0
 210         if grouping:
 211             formatted, seps = _group(formatted, monetary=monetary)
 212         if seps:
 213             formatted = _strip_padding(formatted, seps)
 214     return formatted
 215
 216 def format_string(f, val, grouping=False):
 217     """Formats a string in the same way that the % formatting would use,
 218     but takes the current locale into account.
 219     Grouping is applied if the third parameter is true."""
 220     percents = list(_percent_re.finditer(f))
 221     new_f = _percent_re.sub('%s', f)
 222
 223     if isinstance(val, tuple):
 224         new_val = list(val)
 225         i = 0
 226         for perc in percents:
 227             starcount = perc.group('modifiers').count('*')
 228             new_val[i] = format(perc.group(), new_val[i], grouping, False, *new_val[i+1:i+1+starcount])
 229             del new_val[i+1:i+1+starcount]
 230             i += (1 + starcount)
 231         val = tuple(new_val)
 232     elif operator.isMappingType(val):
 233         for perc in percents:
 234             key = perc.group("key")
 235             val[key] = format(perc.group(), val[key], grouping)
 236     else:
 237         # val is a single value
 238         val = format(percents[0].group(), val, grouping)
 239
 240     return new_f % val
 241
 242 def currency(val, symbol=True, grouping=False, international=False):
 243     """Formats val according to the currency settings
 244     in the current locale."""
 245     conv = localeconv()
 246
 247     # check for illegal values
 248     digits = conv[international and 'int_frac_digits' or 'frac_digits']
 249     if digits == 127:
 250         raise ValueError("Currency formatting is not possible using "
 251                          "the 'C' locale.")
 252
 253     s = format('%%.%if' % digits, abs(val), grouping, monetary=True)
 254     # '<' and '>' are markers if the sign must be inserted between symbol and value
 255     s = '<' + s + '>'
 256
 257     if symbol:
 258         smb = conv[international and 'int_curr_symbol' or 'currency_symbol']
 259         precedes = conv[val<0 and 'n_cs_precedes' or 'p_cs_precedes']
 260         separated = conv[val<0 and 'n_sep_by_space' or 'p_sep_by_space']
 261
 262         if precedes:
 263             s = smb + (separated and ' ' or '') + s
 264         else:
 265             s = s + (separated and ' ' or '') + smb
 266
 267     sign_pos = conv[val<0 and 'n_sign_posn' or 'p_sign_posn']
 268     sign = conv[val<0 and 'negative_sign' or 'positive_sign']
 269
 270     if sign_pos == 0:
 271         s = '(' + s + ')'
 272     elif sign_pos == 1:
 273         s = sign + s
 274     elif sign_pos == 2:
 275         s = s + sign
 276     elif sign_pos == 3:
 277         s = s.replace('<', sign)
 278     elif sign_pos == 4:
 279         s = s.replace('>', sign)
 280     else:
 281         # the default if nothing specified;
 282         # this should be the most fitting sign position
 283         s = sign + s
 284
 285     return s.replace('<', '').replace('>', '')
 286
def str(val):
    """Convert float to string, taking the locale into account.

    The value is formatted with the "%.12g" specifier."""
    return format("%.12g", val)
 290
 291 def atof(string, func=float):
 292     "Parses a string as a float according to the locale settings."
 293     #First, get rid of the grouping
 294     ts = localeconv()['thousands_sep']
 295     if ts:
 296         string = string.replace(ts, '')
 297     #next, replace the decimal point with a dot
 298     dd = localeconv()['decimal_point']
 299     if dd:
 300         string = string.replace(dd, '.')
 301     #finally, parse the string
 302     return func(string)
 303
 304 def atoi(str):
 305     "Converts a string to an integer according to the locale settings."
 306     return atof(str, int)
 307
 308 def _test():
 309     setlocale(LC_ALL, "")
 310     #do grouping
 311     s1 = format("%d", 123456789,1)
 312     print s1, "is", atoi(s1)
 313     #standard formatting
 314     s1 = str(3.14)
 315     print s1, "is", atof(s1)
 316
 317 ### Locale name aliasing engine
 318
 319 # Author: Marc-Andre Lemburg, mal@lemburg.com
 320 # Various tweaks by Fredrik Lundh <fredrik@pythonware.com>
 321
# store away the low-level version of setlocale (it's
# overridden below); getlocale(), setlocale() and resetlocale()
# all call the low-level function through this name
_setlocale = setlocale
 325
 326 def normalize(localename):
 327
 328     """ Returns a normalized locale code for the given locale
 329         name.
 330
 331         The returned locale code is formatted for use with
 332         setlocale().
 333
 334         If normalization fails, the original name is returned
 335         unchanged.
 336
 337         If the given encoding is not known, the function defaults to
 338         the default encoding for the locale code just like setlocale()
 339         does.
 340
 341     """
 342     # Normalize the locale name and extract the encoding
 343     fullname = localename.lower()
 344     if ':' in fullname:
 345         # ':' is sometimes used as encoding delimiter.
 346         fullname = fullname.replace(':', '.')
 347     if '.' in fullname:
 348         langname, encoding = fullname.split('.')[:2]
 349         fullname = langname + '.' + encoding
 350     else:
 351         langname = fullname
 352         encoding = ''
 353
 354     # First lookup: fullname (possibly with encoding)
 355     norm_encoding = encoding.replace('-', '')
 356     norm_encoding = norm_encoding.replace('_', '')
 357     lookup_name = langname + '.' + encoding
 358     code = locale_alias.get(lookup_name, None)
 359     if code is not None:
 360         return code
 361     #print 'first lookup failed'
 362
 363     # Second try: langname (without encoding)
 364     code = locale_alias.get(langname, None)
 365     if code is not None:
 366         #print 'langname lookup succeeded'
 367         if '.' in code:
 368             langname, defenc = code.split('.')
 369         else:
 370             langname = code
 371             defenc = ''
 372         if encoding:
 373             # Convert the encoding to a C lib compatible encoding string
 374             norm_encoding = encodings.normalize_encoding(encoding)
 375             #print 'norm encoding: %r' % norm_encoding
 376             norm_encoding = encodings.aliases.aliases.get(norm_encoding,
 377                                                           norm_encoding)
 378             #print 'aliased encoding: %r' % norm_encoding
 379             encoding = locale_encoding_alias.get(norm_encoding,
 380                                                  norm_encoding)
 381         else:
 382             encoding = defenc
 383         #print 'found encoding %r' % encoding
 384         if encoding:
 385             return langname + '.' + encoding
 386         else:
 387             return langname
 388
 389     else:
 390         return localename
 391
 392 def _parse_localename(localename):
 393
 394     """ Parses the locale code for localename and returns the
 395         result as tuple (language code, encoding).
 396
 397         The localename is normalized and passed through the locale
 398         alias engine. A ValueError is raised in case the locale name
 399         cannot be parsed.
 400
 401         The language code corresponds to RFC 1766.  code and encoding
 402         can be None in case the values cannot be determined or are
 403         unknown to this implementation.
 404
 405     """
 406     code = normalize(localename)
 407     if '@' in code:
 408         # Deal with locale modifiers
 409         code, modifier = code.split('@')
 410         if modifier == 'euro' and '.' not in code:
 411             # Assume Latin-9 for @euro locales. This is bogus,
 412             # since some systems may use other encodings for these
 413             # locales. Also, we ignore other modifiers.
 414             return code, 'iso-8859-15'
 415
 416     if '.' in code:
 417         return tuple(code.split('.')[:2])
 418     elif code == 'C':
 419         return None, None
 420     raise ValueError, 'unknown locale: %s' % localename
 421
 422 def _build_localename(localetuple):
 423
 424     """ Builds a locale code from the given tuple (language code,
 425         encoding).
 426
 427         No aliasing or normalizing takes place.
 428
 429     """
 430     language, encoding = localetuple
 431     if language is None:
 432         language = 'C'
 433     if encoding is None:
 434         return language
 435     else:
 436         return language + '.' + encoding
 437
 438 def getdefaultlocale(envvars=('LC_ALL', 'LC_CTYPE', 'LANG', 'LANGUAGE')):
 439
 440     """ Tries to determine the default locale settings and returns
 441         them as tuple (language code, encoding).
 442
 443         According to POSIX, a program which has not called
 444         setlocale(LC_ALL, "") runs using the portable 'C' locale.
 445         Calling setlocale(LC_ALL, "") lets it use the default locale as
 446         defined by the LANG variable. Since we don't want to interfere
 447         with the current locale setting we thus emulate the behavior
 448         in the way described above.
 449
 450         To maintain compatibility with other platforms, not only the
 451         LANG variable is tested, but a list of variables given as
 452         envvars parameter. The first found to be defined will be
 453         used. envvars defaults to the search path used in GNU gettext;
 454         it must always contain the variable name 'LANG'.
 455
 456         Except for the code 'C', the language code corresponds to RFC
 457         1766.  code and encoding can be None in case the values cannot
 458         be determined.
 459
 460     """
 461
 462     try:
 463         # check if it's supported by the _locale module
 464         import _locale
 465         code, encoding = _locale._getdefaultlocale()
 466     except (ImportError, AttributeError):
 467         pass
 468     else:
 469         # make sure the code/encoding values are valid
 470         if sys.platform == "win32" and code and code[:2] == "0x":
 471             # map windows language identifier to language name
 472             code = windows_locale.get(int(code, 0))
 473         # ...add other platform-specific processing here, if
 474         # necessary...
 475         return code, encoding
 476
 477     # fall back on POSIX behaviour
 478     import os
 479     lookup = os.environ.get
 480     for variable in envvars:
 481         localename = lookup(variable,None)
 482         if localename:
 483             if variable == 'LANGUAGE':
 484                 localename = localename.split(':')[0]
 485             break
 486     else:
 487         localename = 'C'
 488     return _parse_localename(localename)
 489
 490
 491 def getlocale(category=LC_CTYPE):
 492
 493     """ Returns the current setting for the given locale category as
 494         tuple (language code, encoding).
 495
 496         category may be one of the LC_* value except LC_ALL. It
 497         defaults to LC_CTYPE.
 498
 499         Except for the code 'C', the language code corresponds to RFC
 500         1766.  code and encoding can be None in case the values cannot
 501         be determined.
 502
 503     """
 504     localename = _setlocale(category)
 505     if category == LC_ALL and ';' in localename:
 506         raise TypeError, 'category LC_ALL is not supported'
 507     return _parse_localename(localename)
 508
 509 def setlocale(category, locale=None):
 510
 511     """ Set the locale for the given category.  The locale can be
 512         a string, a locale tuple (language code, encoding), or None.
 513
 514         Locale tuples are converted to strings the locale aliasing
 515         engine.  Locale strings are passed directly to the C lib.
 516
 517         category may be given as one of the LC_* values.
 518
 519     """
 520     if locale and type(locale) is not type(""):
 521         # convert to string
 522         locale = normalize(_build_localename(locale))
 523     return _setlocale(category, locale)
 524
 525 def resetlocale(category=LC_ALL):
 526
 527     """ Sets the locale for category to the default setting.
 528
 529         The default setting is determined by calling
 530         getdefaultlocale(). category defaults to LC_ALL.
 531
 532     """
 533     _setlocale(category, _build_localename(getdefaultlocale()))
 534
 535 if sys.platform.startswith("win"):
 536     # On Win32, this will return the ANSI code page
 537     def getpreferredencoding(do_setlocale = True):
 538         """Return the charset that the user is likely using."""
 539         import _locale
 540         return _locale._getdefaultlocale()[1]
 541 else:
 542     # On Unix, if CODESET is available, use that.
 543     try:
 544         CODESET
 545     except NameError:
 546         # Fall back to parsing environment variables :-(
 547         def getpreferredencoding(do_setlocale = True):
 548             """Return the charset that the user is likely using,
 549             by looking at environment variables."""
 550             return getdefaultlocale()[1]
 551     else:
 552         def getpreferredencoding(do_setlocale = True):
 553             """Return the charset that the user is likely using,
 554             according to the system configuration."""
 555             if do_setlocale:
 556                 oldloc = setlocale(LC_CTYPE)
 557                 try:
 558                     setlocale(LC_CTYPE, "")
 559                 except Error:
 560                     pass
 561                 result = nl_langinfo(CODESET)
 562                 setlocale(LC_CTYPE, oldloc)
 563                 return result
 564             else:
 565                 return nl_langinfo(CODESET)
 566
 567
 568 ### Database
 569 #
 570 # The following data was extracted from the locale.alias file which
 571 # comes with X11 and then hand edited removing the explicit encoding
 572 # definitions and adding some more aliases. The file is usually
 573 # available as /usr/lib/X11/locale/locale.alias.
 574 #
 575
#
# The locale_encoding_alias table maps lowercase encoding alias names
# to C locale encoding names (case-sensitive). Note that normalize()
# first looks up the encoding in the encodings.aliases dictionary and
# then applies this mapping to find the correct C lib name for the
# encoding.  Names missing from this table are used by normalize() as
# they are.
#
locale_encoding_alias = {

    # Mappings for non-standard encoding names used in locale names
    '437':                          'C',
    'c':                            'C',
    'en':                           'ISO8859-1',
    'jis':                          'JIS7',
    'jis7':                         'JIS7',
    'ajec':                         'eucJP',

    # Mappings from Python codec names to C lib encoding names
    'ascii':                        'ISO8859-1',
    'latin_1':                      'ISO8859-1',
    'iso8859_1':                    'ISO8859-1',
    'iso8859_10':                   'ISO8859-10',
    'iso8859_11':                   'ISO8859-11',
    'iso8859_13':                   'ISO8859-13',
    'iso8859_14':                   'ISO8859-14',
    'iso8859_15':                   'ISO8859-15',
    'iso8859_16':                   'ISO8859-16',
    'iso8859_2':                    'ISO8859-2',
    'iso8859_3':                    'ISO8859-3',
    'iso8859_4':                    'ISO8859-4',
    'iso8859_5':                    'ISO8859-5',
    'iso8859_6':                    'ISO8859-6',
    'iso8859_7':                    'ISO8859-7',
    'iso8859_8':                    'ISO8859-8',
    'iso8859_9':                    'ISO8859-9',
    'iso2022_jp':                   'JIS7',
    'shift_jis':                    'SJIS',
    'tactis':                       'TACTIS',
    'euc_jp':                       'eucJP',
    'euc_kr':                       'eucKR',
    'utf_8':                        'UTF8',
    'koi8_r':                       'KOI8-R',
    'koi8_u':                       'KOI8-U',
    # XXX This list is still incomplete. If you know more
    # mappings, please file a bug report. Thanks.
}
 622
 623 #
 624 # The locale_alias table maps lowercase alias names to C locale names
 625 # (case-sensitive). Encodings are always separated from the locale
 626 # name using a dot ('.'); they should only be given in case the
 627 # language name is needed to interpret the given encoding alias
 628 # correctly (CJK codes often have this need).
 629 #
# Note that the normalize() function, which uses this table,
 631 # removes '_' and '-' characters from the encoding part of the
 632 # locale name before doing the lookup. This saves a lot of
 633 # space in the table.
 634 #
 635 # MAL 2004-12-10:
 636 # Updated alias mapping to most recent locale.alias file
 637 # from X.org distribution using makelocalealias.py.
 638 #
 639 # These are the differences compared to the old mapping (Python 2.4
 640 # and older):
 641 #
 642 #    updated 'bg' -> 'bg_BG.ISO8859-5' to 'bg_BG.CP1251'
 643 #    updated 'bg_bg' -> 'bg_BG.ISO8859-5' to 'bg_BG.CP1251'
 644 #    updated 'bulgarian' -> 'bg_BG.ISO8859-5' to 'bg_BG.CP1251'
 645 #    updated 'cz' -> 'cz_CZ.ISO8859-2' to 'cs_CZ.ISO8859-2'
 646 #    updated 'cz_cz' -> 'cz_CZ.ISO8859-2' to 'cs_CZ.ISO8859-2'
 647 #    updated 'czech' -> 'cs_CS.ISO8859-2' to 'cs_CZ.ISO8859-2'
 648 #    updated 'dutch' -> 'nl_BE.ISO8859-1' to 'nl_NL.ISO8859-1'
 649 #    updated 'et' -> 'et_EE.ISO8859-4' to 'et_EE.ISO8859-15'
 650 #    updated 'et_ee' -> 'et_EE.ISO8859-4' to 'et_EE.ISO8859-15'
 651 #    updated 'fi' -> 'fi_FI.ISO8859-1' to 'fi_FI.ISO8859-15'
 652 #    updated 'fi_fi' -> 'fi_FI.ISO8859-1' to 'fi_FI.ISO8859-15'
 653 #    updated 'iw' -> 'iw_IL.ISO8859-8' to 'he_IL.ISO8859-8'
 654 #    updated 'iw_il' -> 'iw_IL.ISO8859-8' to 'he_IL.ISO8859-8'
 655 #    updated 'japanese' -> 'ja_JP.SJIS' to 'ja_JP.eucJP'
 656 #    updated 'lt' -> 'lt_LT.ISO8859-4' to 'lt_LT.ISO8859-13'
 657 #    updated 'lv' -> 'lv_LV.ISO8859-4' to 'lv_LV.ISO8859-13'
 658 #    updated 'sl' -> 'sl_CS.ISO8859-2' to 'sl_SI.ISO8859-2'
 659 #    updated 'slovene' -> 'sl_CS.ISO8859-2' to 'sl_SI.ISO8859-2'
 660 #    updated 'th_th' -> 'th_TH.TACTIS' to 'th_TH.ISO8859-11'
 661 #    updated 'zh_cn' -> 'zh_CN.eucCN' to 'zh_CN.gb2312'
 662 #    updated 'zh_cn.big5' -> 'zh_TW.eucTW' to 'zh_TW.big5'
 663 #    updated 'zh_tw' -> 'zh_TW.eucTW' to 'zh_TW.big5'
 664 #
 665 # MAL 2008-05-30:
 666 # Updated alias mapping to most recent locale.alias file
 667 # from X.org distribution using makelocalealias.py.
 668 #
 669 # These are the differences compared to the old mapping (Python 2.5
 670 # and older):
 671 #
 672 #    updated 'cs_cs.iso88592' -> 'cs_CZ.ISO8859-2' to 'cs_CS.ISO8859-2'
 673 #    updated 'serbocroatian' -> 'sh_YU.ISO8859-2' to 'sr_CS.ISO8859-2'
 674 #    updated 'sh' -> 'sh_YU.ISO8859-2' to 'sr_CS.ISO8859-2'
 675 #    updated 'sh_hr.iso88592' -> 'sh_HR.ISO8859-2' to 'hr_HR.ISO8859-2'
 676 #    updated 'sh_sp' -> 'sh_YU.ISO8859-2' to 'sr_CS.ISO8859-2'
 677 #    updated 'sh_yu' -> 'sh_YU.ISO8859-2' to 'sr_CS.ISO8859-2'
 678 #    updated 'sp' -> 'sp_YU.ISO8859-5' to 'sr_CS.ISO8859-5'
 679 #    updated 'sp_yu' -> 'sp_YU.ISO8859-5' to 'sr_CS.ISO8859-5'
 680 #    updated 'sr' -> 'sr_YU.ISO8859-5' to 'sr_CS.ISO8859-5'
 681 #    updated 'sr@cyrillic' -> 'sr_YU.ISO8859-5' to 'sr_CS.ISO8859-5'
 682 #    updated 'sr_sp' -> 'sr_SP.ISO8859-2' to 'sr_CS.ISO8859-2'
 683 #    updated 'sr_yu' -> 'sr_YU.ISO8859-5' to 'sr_CS.ISO8859-5'
 684 #    updated 'sr_yu.cp1251@cyrillic' -> 'sr_YU.CP1251' to 'sr_CS.CP1251'
 685 #    updated 'sr_yu.iso88592' -> 'sr_YU.ISO8859-2' to 'sr_CS.ISO8859-2'
 686 #    updated 'sr_yu.iso88595' -> 'sr_YU.ISO8859-5' to 'sr_CS.ISO8859-5'
 687 #    updated 'sr_yu.iso88595@cyrillic' -> 'sr_YU.ISO8859-5' to 'sr_CS.ISO8859-5'
 688 #    updated 'sr_yu.microsoftcp1251@cyrillic' -> 'sr_YU.CP1251' to 'sr_CS.CP1251'
 689 #    updated 'sr_yu.utf8@cyrillic' -> 'sr_YU.UTF-8' to 'sr_CS.UTF-8'
 690 #    updated 'sr_yu@cyrillic' -> 'sr_YU.ISO8859-5' to 'sr_CS.ISO8859-5'
 691
 692 locale_alias = {
 693     'a3':                                   'a3_AZ.KOI8-C',
 694     'a3_az':                                'a3_AZ.KOI8-C',
 695     'a3_az.koi8c':                          'a3_AZ.KOI8-C',
 696     'af':                                   'af_ZA.ISO8859-1',
 697     'af_za':                                'af_ZA.ISO8859-1',
 698     'af_za.iso88591':                       'af_ZA.ISO8859-1',
 699     'am':                                   'am_ET.UTF-8',
 700     'am_et':                                'am_ET.UTF-8',
 701     'american':                             'en_US.ISO8859-1',
 702     'american.iso88591':                    'en_US.ISO8859-1',
 703     'ar':                                   'ar_AA.ISO8859-6',
 704     'ar_aa':                                'ar_AA.ISO8859-6',
 705     'ar_aa.iso88596':                       'ar_AA.ISO8859-6',
 706     'ar_ae':                                'ar_AE.ISO8859-6',
 707     'ar_ae.iso88596':                       'ar_AE.ISO8859-6',
 708     'ar_bh':                                'ar_BH.ISO8859-6',
 709     'ar_bh.iso88596':                       'ar_BH.ISO8859-6',
 710     'ar_dz':                                'ar_DZ.ISO8859-6',
 711     'ar_dz.iso88596':                       'ar_DZ.ISO8859-6',
 712     'ar_eg':                                'ar_EG.ISO8859-6',
 713     'ar_eg.iso88596':                       'ar_EG.ISO8859-6',
 714     'ar_iq':                                'ar_IQ.ISO8859-6',
 715     'ar_iq.iso88596':                       'ar_IQ.ISO8859-6',
 716     'ar_jo':                                'ar_JO.ISO8859-6',
 717     'ar_jo.iso88596':                       'ar_JO.ISO8859-6',
 718     'ar_kw':                                'ar_KW.ISO8859-6',
 719     'ar_kw.iso88596':                       'ar_KW.ISO8859-6',
 720     'ar_lb':                                'ar_LB.ISO8859-6',
 721     'ar_lb.iso88596':                       'ar_LB.ISO8859-6',
 722     'ar_ly':                                'ar_LY.ISO8859-6',
 723     'ar_ly.iso88596':                       'ar_LY.ISO8859-6',
 724     'ar_ma':                                'ar_MA.ISO8859-6',
 725     'ar_ma.iso88596':                       'ar_MA.ISO8859-6',
 726     'ar_om':                                'ar_OM.ISO8859-6',
 727     'ar_om.iso88596':                       'ar_OM.ISO8859-6',
 728     'ar_qa':                                'ar_QA.ISO8859-6',
 729     'ar_qa.iso88596':                       'ar_QA.ISO8859-6',
 730     'ar_sa':                                'ar_SA.ISO8859-6',
 731     'ar_sa.iso88596':                       'ar_SA.ISO8859-6',
 732     'ar_sd':                                'ar_SD.ISO8859-6',
 733     'ar_sd.iso88596':                       'ar_SD.ISO8859-6',
 734     'ar_sy':                                'ar_SY.ISO8859-6',
 735     'ar_sy.iso88596':                       'ar_SY.ISO8859-6',
 736     'ar_tn':                                'ar_TN.ISO8859-6',
 737     'ar_tn.iso88596':                       'ar_TN.ISO8859-6',
 738     'ar_ye':                                'ar_YE.ISO8859-6',
 739     'ar_ye.iso88596':                       'ar_YE.ISO8859-6',
 740     'arabic':                               'ar_AA.ISO8859-6',
 741     'arabic.iso88596':                      'ar_AA.ISO8859-6',
 742     'az':                                   'az_AZ.ISO8859-9E',
 743     'az_az':                                'az_AZ.ISO8859-9E',
 744     'az_az.iso88599e':                      'az_AZ.ISO8859-9E',
 745     'be':                                   'be_BY.CP1251',
 746     'be_by':                                'be_BY.CP1251',
 747     'be_by.cp1251':                         'be_BY.CP1251',
 748     'be_by.microsoftcp1251':                'be_BY.CP1251',
 749     'bg':                                   'bg_BG.CP1251',
 750     'bg_bg':                                'bg_BG.CP1251',
 751     'bg_bg.cp1251':                         'bg_BG.CP1251',
 752     'bg_bg.iso88595':                       'bg_BG.ISO8859-5',
 753     'bg_bg.koi8r':                          'bg_BG.KOI8-R',
 754     'bg_bg.microsoftcp1251':                'bg_BG.CP1251',
 755     'bn_in':                                'bn_IN.UTF-8',
 756     'bokmal':                               'nb_NO.ISO8859-1',
 757     'bokm\xe5l':                            'nb_NO.ISO8859-1',
 758     'br':                                   'br_FR.ISO8859-1',
 759     'br_fr':                                'br_FR.ISO8859-1',
 760     'br_fr.iso88591':                       'br_FR.ISO8859-1',
 761     'br_fr.iso885914':                      'br_FR.ISO8859-14',
 762     'br_fr.iso885915':                      'br_FR.ISO8859-15',
 763     'br_fr.iso885915@euro':                 'br_FR.ISO8859-15',
 764     'br_fr.utf8@euro':                      'br_FR.UTF-8',
 765     'br_fr@euro':                           'br_FR.ISO8859-15',
 766     'bs':                                   'bs_BA.ISO8859-2',
 767     'bs_ba':                                'bs_BA.ISO8859-2',
 768     'bs_ba.iso88592':                       'bs_BA.ISO8859-2',
 769     'bulgarian':                            'bg_BG.CP1251',
 770     'c':                                    'C',
 771     'c-french':                             'fr_CA.ISO8859-1',
 772     'c-french.iso88591':                    'fr_CA.ISO8859-1',
 773     'c.en':                                 'C',
 774     'c.iso88591':                           'en_US.ISO8859-1',
 775     'c_c':                                  'C',
 776     'c_c.c':                                'C',
 777     'ca':                                   'ca_ES.ISO8859-1',
 778     'ca_es':                                'ca_ES.ISO8859-1',
 779     'ca_es.iso88591':                       'ca_ES.ISO8859-1',
 780     'ca_es.iso885915':                      'ca_ES.ISO8859-15',
 781     'ca_es.iso885915@euro':                 'ca_ES.ISO8859-15',
 782     'ca_es.utf8@euro':                      'ca_ES.UTF-8',
 783     'ca_es@euro':                           'ca_ES.ISO8859-15',
 784     'catalan':                              'ca_ES.ISO8859-1',
 785     'cextend':                              'en_US.ISO8859-1',
 786     'cextend.en':                           'en_US.ISO8859-1',
 787     'chinese-s':                            'zh_CN.eucCN',
 788     'chinese-t':                            'zh_TW.eucTW',
 789     'croatian':                             'hr_HR.ISO8859-2',
 790     'cs':                                   'cs_CZ.ISO8859-2',
 791     'cs_cs':                                'cs_CZ.ISO8859-2',
 792     'cs_cs.iso88592':                       'cs_CS.ISO8859-2',
 793     'cs_cz':                                'cs_CZ.ISO8859-2',
 794     'cs_cz.iso88592':                       'cs_CZ.ISO8859-2',
 795     'cy':                                   'cy_GB.ISO8859-1',
 796     'cy_gb':                                'cy_GB.ISO8859-1',
 797     'cy_gb.iso88591':                       'cy_GB.ISO8859-1',
 798     'cy_gb.iso885914':                      'cy_GB.ISO8859-14',
 799     'cy_gb.iso885915':                      'cy_GB.ISO8859-15',
 800     'cy_gb@euro':                           'cy_GB.ISO8859-15',
 801     'cz':                                   'cs_CZ.ISO8859-2',
 802     'cz_cz':                                'cs_CZ.ISO8859-2',
 803     'czech':                                'cs_CZ.ISO8859-2',
 804     'da':                                   'da_DK.ISO8859-1',
 805     'da_dk':                                'da_DK.ISO8859-1',
 806     'da_dk.88591':                          'da_DK.ISO8859-1',
 807     'da_dk.885915':                         'da_DK.ISO8859-15',
 808     'da_dk.iso88591':                       'da_DK.ISO8859-1',
 809     'da_dk.iso885915':                      'da_DK.ISO8859-15',
 810     'da_dk@euro':                           'da_DK.ISO8859-15',
 811     'danish':                               'da_DK.ISO8859-1',
 812     'danish.iso88591':                      'da_DK.ISO8859-1',
 813     'dansk':                                'da_DK.ISO8859-1',
 814     'de':                                   'de_DE.ISO8859-1',
 815     'de_at':                                'de_AT.ISO8859-1',
 816     'de_at.iso88591':                       'de_AT.ISO8859-1',
 817     'de_at.iso885915':                      'de_AT.ISO8859-15',
 818     'de_at.iso885915@euro':                 'de_AT.ISO8859-15',
 819     'de_at.utf8@euro':                      'de_AT.UTF-8',
 820     'de_at@euro':                           'de_AT.ISO8859-15',
 821     'de_be':                                'de_BE.ISO8859-1',
 822     'de_be.iso88591':                       'de_BE.ISO8859-1',
 823     'de_be.iso885915':                      'de_BE.ISO8859-15',
 824     'de_be.iso885915@euro':                 'de_BE.ISO8859-15',
 825     'de_be.utf8@euro':                      'de_BE.UTF-8',
 826     'de_be@euro':                           'de_BE.ISO8859-15',
 827     'de_ch':                                'de_CH.ISO8859-1',
 828     'de_ch.iso88591':                       'de_CH.ISO8859-1',
 829     'de_ch.iso885915':                      'de_CH.ISO8859-15',
 830     'de_ch@euro':                           'de_CH.ISO8859-15',
 831     'de_de':                                'de_DE.ISO8859-1',
 832     'de_de.88591':                          'de_DE.ISO8859-1',
 833     'de_de.885915':                         'de_DE.ISO8859-15',
 834     'de_de.885915@euro':                    'de_DE.ISO8859-15',
 835     'de_de.iso88591':                       'de_DE.ISO8859-1',
 836     'de_de.iso885915':                      'de_DE.ISO8859-15',
 837     'de_de.iso885915@euro':                 'de_DE.ISO8859-15',
 838     'de_de.utf8@euro':                      'de_DE.UTF-8',
 839     'de_de@euro':                           'de_DE.ISO8859-15',
 840     'de_lu':                                'de_LU.ISO8859-1',
 841     'de_lu.iso88591':                       'de_LU.ISO8859-1',
 842     'de_lu.iso885915':                      'de_LU.ISO8859-15',
 843     'de_lu.iso885915@euro':                 'de_LU.ISO8859-15',
 844     'de_lu.utf8@euro':                      'de_LU.UTF-8',
 845     'de_lu@euro':                           'de_LU.ISO8859-15',
 846     'deutsch':                              'de_DE.ISO8859-1',
 847     'dutch':                                'nl_NL.ISO8859-1',
 848     'dutch.iso88591':                       'nl_BE.ISO8859-1',
 849     'ee':                                   'ee_EE.ISO8859-4',
 850     'ee_ee':                                'ee_EE.ISO8859-4',
 851     'ee_ee.iso88594':                       'ee_EE.ISO8859-4',
 852     'eesti':                                'et_EE.ISO8859-1',
 853     'el':                                   'el_GR.ISO8859-7',
 854     'el_gr':                                'el_GR.ISO8859-7',
 855     'el_gr.iso88597':                       'el_GR.ISO8859-7',
 856     'el_gr@euro':                           'el_GR.ISO8859-15',
 857     'en':                                   'en_US.ISO8859-1',
 858     'en.iso88591':                          'en_US.ISO8859-1',
 859     'en_au':                                'en_AU.ISO8859-1',
 860     'en_au.iso88591':                       'en_AU.ISO8859-1',
 861     'en_be':                                'en_BE.ISO8859-1',
 862     'en_be@euro':                           'en_BE.ISO8859-15',
 863     'en_bw':                                'en_BW.ISO8859-1',
 864     'en_bw.iso88591':                       'en_BW.ISO8859-1',
 865     'en_ca':                                'en_CA.ISO8859-1',
 866     'en_ca.iso88591':                       'en_CA.ISO8859-1',
 867     'en_gb':                                'en_GB.ISO8859-1',
 868     'en_gb.88591':                          'en_GB.ISO8859-1',
 869     'en_gb.iso88591':                       'en_GB.ISO8859-1',
 870     'en_gb.iso885915':                      'en_GB.ISO8859-15',
 871     'en_gb@euro':                           'en_GB.ISO8859-15',
 872     'en_hk':                                'en_HK.ISO8859-1',
 873     'en_hk.iso88591':                       'en_HK.ISO8859-1',
 874     'en_ie':                                'en_IE.ISO8859-1',
 875     'en_ie.iso88591':                       'en_IE.ISO8859-1',
 876     'en_ie.iso885915':                      'en_IE.ISO8859-15',
 877     'en_ie.iso885915@euro':                 'en_IE.ISO8859-15',
 878     'en_ie.utf8@euro':                      'en_IE.UTF-8',
 879     'en_ie@euro':                           'en_IE.ISO8859-15',
 880     'en_in':                                'en_IN.ISO8859-1',
 881     'en_nz':                                'en_NZ.ISO8859-1',
 882     'en_nz.iso88591':                       'en_NZ.ISO8859-1',
 883     'en_ph':                                'en_PH.ISO8859-1',
 884     'en_ph.iso88591':                       'en_PH.ISO8859-1',
 885     'en_sg':                                'en_SG.ISO8859-1',
 886     'en_sg.iso88591':                       'en_SG.ISO8859-1',
 887     'en_uk':                                'en_GB.ISO8859-1',
 888     'en_us':                                'en_US.ISO8859-1',
 889     'en_us.88591':                          'en_US.ISO8859-1',
 890     'en_us.885915':                         'en_US.ISO8859-15',
 891     'en_us.iso88591':                       'en_US.ISO8859-1',
 892     'en_us.iso885915':                      'en_US.ISO8859-15',
 893     'en_us.iso885915@euro':                 'en_US.ISO8859-15',
 894     'en_us@euro':                           'en_US.ISO8859-15',
 895     'en_us@euro@euro':                      'en_US.ISO8859-15',
 896     'en_za':                                'en_ZA.ISO8859-1',
 897     'en_za.88591':                          'en_ZA.ISO8859-1',
 898     'en_za.iso88591':                       'en_ZA.ISO8859-1',
 899     'en_za.iso885915':                      'en_ZA.ISO8859-15',
 900     'en_za@euro':                           'en_ZA.ISO8859-15',
 901     'en_zw':                                'en_ZW.ISO8859-1',
 902     'en_zw.iso88591':                       'en_ZW.ISO8859-1',
 903     'eng_gb':                               'en_GB.ISO8859-1',
 904     'eng_gb.8859':                          'en_GB.ISO8859-1',
 905     'english':                              'en_EN.ISO8859-1',
 906     'english.iso88591':                     'en_EN.ISO8859-1',
 907     'english_uk':                           'en_GB.ISO8859-1',
 908     'english_uk.8859':                      'en_GB.ISO8859-1',
 909     'english_united-states':                'en_US.ISO8859-1',
 910     'english_united-states.437':            'C',
 911     'english_us':                           'en_US.ISO8859-1',
 912     'english_us.8859':                      'en_US.ISO8859-1',
 913     'english_us.ascii':                     'en_US.ISO8859-1',
 914     'eo':                                   'eo_XX.ISO8859-3',
 915     'eo_eo':                                'eo_EO.ISO8859-3',
 916     'eo_eo.iso88593':                       'eo_EO.ISO8859-3',
 917     'eo_xx':                                'eo_XX.ISO8859-3',
 918     'eo_xx.iso88593':                       'eo_XX.ISO8859-3',
 919     'es':                                   'es_ES.ISO8859-1',
 920     'es_ar':                                'es_AR.ISO8859-1',
 921     'es_ar.iso88591':                       'es_AR.ISO8859-1',
 922     'es_bo':                                'es_BO.ISO8859-1',
 923     'es_bo.iso88591':                       'es_BO.ISO8859-1',
 924     'es_cl':                                'es_CL.ISO8859-1',
 925     'es_cl.iso88591':                       'es_CL.ISO8859-1',
 926     'es_co':                                'es_CO.ISO8859-1',
 927     'es_co.iso88591':                       'es_CO.ISO8859-1',
 928     'es_cr':                                'es_CR.ISO8859-1',
 929     'es_cr.iso88591':                       'es_CR.ISO8859-1',
 930     'es_do':                                'es_DO.ISO8859-1',
 931     'es_do.iso88591':                       'es_DO.ISO8859-1',
 932     'es_ec':                                'es_EC.ISO8859-1',
 933     'es_ec.iso88591':                       'es_EC.ISO8859-1',
 934     'es_es':                                'es_ES.ISO8859-1',
 935     'es_es.88591':                          'es_ES.ISO8859-1',
 936     'es_es.iso88591':                       'es_ES.ISO8859-1',
 937     'es_es.iso885915':                      'es_ES.ISO8859-15',
 938     'es_es.iso885915@euro':                 'es_ES.ISO8859-15',
 939     'es_es.utf8@euro':                      'es_ES.UTF-8',
 940     'es_es@euro':                           'es_ES.ISO8859-15',
 941     'es_gt':                                'es_GT.ISO8859-1',
 942     'es_gt.iso88591':                       'es_GT.ISO8859-1',
 943     'es_hn':                                'es_HN.ISO8859-1',
 944     'es_hn.iso88591':                       'es_HN.ISO8859-1',
 945     'es_mx':                                'es_MX.ISO8859-1',
 946     'es_mx.iso88591':                       'es_MX.ISO8859-1',
 947     'es_ni':                                'es_NI.ISO8859-1',
 948     'es_ni.iso88591':                       'es_NI.ISO8859-1',
 949     'es_pa':                                'es_PA.ISO8859-1',
 950     'es_pa.iso88591':                       'es_PA.ISO8859-1',
 951     'es_pa.iso885915':                      'es_PA.ISO8859-15',
 952     'es_pa@euro':                           'es_PA.ISO8859-15',
 953     'es_pe':                                'es_PE.ISO8859-1',
 954     'es_pe.iso88591':                       'es_PE.ISO8859-1',
 955     'es_pe.iso885915':                      'es_PE.ISO8859-15',
 956     'es_pe@euro':                           'es_PE.ISO8859-15',
 957     'es_pr':                                'es_PR.ISO8859-1',
 958     'es_pr.iso88591':                       'es_PR.ISO8859-1',
 959     'es_py':                                'es_PY.ISO8859-1',
 960     'es_py.iso88591':                       'es_PY.ISO8859-1',
 961     'es_py.iso885915':                      'es_PY.ISO8859-15',
 962     'es_py@euro':                           'es_PY.ISO8859-15',
 963     'es_sv':                                'es_SV.ISO8859-1',
 964     'es_sv.iso88591':                       'es_SV.ISO8859-1',
 965     'es_sv.iso885915':                      'es_SV.ISO8859-15',
 966     'es_sv@euro':                           'es_SV.ISO8859-15',
 967     'es_us':                                'es_US.ISO8859-1',
 968     'es_us.iso88591':                       'es_US.ISO8859-1',
 969     'es_uy':                                'es_UY.ISO8859-1',
 970     'es_uy.iso88591':                       'es_UY.ISO8859-1',
 971     'es_uy.iso885915':                      'es_UY.ISO8859-15',
 972     'es_uy@euro':                           'es_UY.ISO8859-15',
 973     'es_ve':                                'es_VE.ISO8859-1',
 974     'es_ve.iso88591':                       'es_VE.ISO8859-1',
 975     'es_ve.iso885915':                      'es_VE.ISO8859-15',
 976     'es_ve@euro':                           'es_VE.ISO8859-15',
 977     'estonian':                             'et_EE.ISO8859-1',
 978     'et':                                   'et_EE.ISO8859-15',
 979     'et_ee':                                'et_EE.ISO8859-15',
 980     'et_ee.iso88591':                       'et_EE.ISO8859-1',
 981     'et_ee.iso885913':                      'et_EE.ISO8859-13',
 982     'et_ee.iso885915':                      'et_EE.ISO8859-15',
 983     'et_ee.iso88594':                       'et_EE.ISO8859-4',
 984     'et_ee@euro':                           'et_EE.ISO8859-15',
 985     'eu':                                   'eu_ES.ISO8859-1',
 986     'eu_es':                                'eu_ES.ISO8859-1',
 987     'eu_es.iso88591':                       'eu_ES.ISO8859-1',
 988     'eu_es.iso885915':                      'eu_ES.ISO8859-15',
 989     'eu_es.iso885915@euro':                 'eu_ES.ISO8859-15',
 990     'eu_es.utf8@euro':                      'eu_ES.UTF-8',
 991     'eu_es@euro':                           'eu_ES.ISO8859-15',
 992     'fa':                                   'fa_IR.UTF-8',
 993     'fa_ir':                                'fa_IR.UTF-8',
 994     'fa_ir.isiri3342':                      'fa_IR.ISIRI-3342',
 995     'fi':                                   'fi_FI.ISO8859-15',
 996     'fi_fi':                                'fi_FI.ISO8859-15',
 997     'fi_fi.88591':                          'fi_FI.ISO8859-1',
 998     'fi_fi.iso88591':                       'fi_FI.ISO8859-1',
 999     'fi_fi.iso885915':                      'fi_FI.ISO8859-15',
1000     'fi_fi.iso885915@euro':                 'fi_FI.ISO8859-15',
1001     'fi_fi.utf8@euro':                      'fi_FI.UTF-8',
1002     'fi_fi@euro':                           'fi_FI.ISO8859-15',
1003     'finnish':                              'fi_FI.ISO8859-1',
1004     'finnish.iso88591':                     'fi_FI.ISO8859-1',
1005     'fo':                                   'fo_FO.ISO8859-1',
1006     'fo_fo':                                'fo_FO.ISO8859-1',
1007     'fo_fo.iso88591':                       'fo_FO.ISO8859-1',
1008     'fo_fo.iso885915':                      'fo_FO.ISO8859-15',
1009     'fo_fo@euro':                           'fo_FO.ISO8859-15',
1010     'fr':                                   'fr_FR.ISO8859-1',
1011     'fr_be':                                'fr_BE.ISO8859-1',
1012     'fr_be.88591':                          'fr_BE.ISO8859-1',
1013     'fr_be.iso88591':                       'fr_BE.ISO8859-1',
1014     'fr_be.iso885915':                      'fr_BE.ISO8859-15',
1015     'fr_be.iso885915@euro':                 'fr_BE.ISO8859-15',
1016     'fr_be.utf8@euro':                      'fr_BE.UTF-8',
1017     'fr_be@euro':                           'fr_BE.ISO8859-15',
1018     'fr_ca':                                'fr_CA.ISO8859-1',
1019     'fr_ca.88591':                          'fr_CA.ISO8859-1',
1020     'fr_ca.iso88591':                       'fr_CA.ISO8859-1',
1021     'fr_ca.iso885915':                      'fr_CA.ISO8859-15',
1022     'fr_ca@euro':                           'fr_CA.ISO8859-15',
1023     'fr_ch':                                'fr_CH.ISO8859-1',
1024     'fr_ch.88591':                          'fr_CH.ISO8859-1',
1025     'fr_ch.iso88591':                       'fr_CH.ISO8859-1',
1026     'fr_ch.iso885915':                      'fr_CH.ISO8859-15',
1027     'fr_ch@euro':                           'fr_CH.ISO8859-15',
1028     'fr_fr':                                'fr_FR.ISO8859-1',
1029     'fr_fr.88591':                          'fr_FR.ISO8859-1',
1030     'fr_fr.iso88591':                       'fr_FR.ISO8859-1',
1031     'fr_fr.iso885915':                      'fr_FR.ISO8859-15',
1032     'fr_fr.iso885915@euro':                 'fr_FR.ISO8859-15',
1033     'fr_fr.utf8@euro':                      'fr_FR.UTF-8',
1034     'fr_fr@euro':                           'fr_FR.ISO8859-15',
1035     'fr_lu':                                'fr_LU.ISO8859-1',
1036     'fr_lu.88591':                          'fr_LU.ISO8859-1',
1037     'fr_lu.iso88591':                       'fr_LU.ISO8859-1',
1038     'fr_lu.iso885915':                      'fr_LU.ISO8859-15',
1039     'fr_lu.iso885915@euro':                 'fr_LU.ISO8859-15',
1040     'fr_lu.utf8@euro':                      'fr_LU.UTF-8',
1041     'fr_lu@euro':                           'fr_LU.ISO8859-15',
1042     'fran\xe7ais':                          'fr_FR.ISO8859-1',
1043     'fre_fr':                               'fr_FR.ISO8859-1',
1044     'fre_fr.8859':                          'fr_FR.ISO8859-1',
1045     'french':                               'fr_FR.ISO8859-1',
1046     'french.iso88591':                      'fr_CH.ISO8859-1',
1047     'french_france':                        'fr_FR.ISO8859-1',
1048     'french_france.8859':                   'fr_FR.ISO8859-1',
1049     'ga':                                   'ga_IE.ISO8859-1',
1050     'ga_ie':                                'ga_IE.ISO8859-1',
1051     'ga_ie.iso88591':                       'ga_IE.ISO8859-1',
1052     'ga_ie.iso885914':                      'ga_IE.ISO8859-14',
1053     'ga_ie.iso885915':                      'ga_IE.ISO8859-15',
1054     'ga_ie.iso885915@euro':                 'ga_IE.ISO8859-15',
1055     'ga_ie.utf8@euro':                      'ga_IE.UTF-8',
1056     'ga_ie@euro':                           'ga_IE.ISO8859-15',
1057     'galego':                               'gl_ES.ISO8859-1',
1058     'galician':                             'gl_ES.ISO8859-1',
1059     'gd':                                   'gd_GB.ISO8859-1',
1060     'gd_gb':                                'gd_GB.ISO8859-1',
1061     'gd_gb.iso88591':                       'gd_GB.ISO8859-1',
1062     'gd_gb.iso885914':                      'gd_GB.ISO8859-14',
1063     'gd_gb.iso885915':                      'gd_GB.ISO8859-15',
1064     'gd_gb@euro':                           'gd_GB.ISO8859-15',
1065     'ger_de':                               'de_DE.ISO8859-1',
1066     'ger_de.8859':                          'de_DE.ISO8859-1',
1067     'german':                               'de_DE.ISO8859-1',
1068     'german.iso88591':                      'de_CH.ISO8859-1',
1069     'german_germany':                       'de_DE.ISO8859-1',
1070     'german_germany.8859':                  'de_DE.ISO8859-1',
1071     'gl':                                   'gl_ES.ISO8859-1',
1072     'gl_es':                                'gl_ES.ISO8859-1',
1073     'gl_es.iso88591':                       'gl_ES.ISO8859-1',
1074     'gl_es.iso885915':                      'gl_ES.ISO8859-15',
1075     'gl_es.iso885915@euro':                 'gl_ES.ISO8859-15',
1076     'gl_es.utf8@euro':                      'gl_ES.UTF-8',
1077     'gl_es@euro':                           'gl_ES.ISO8859-15',
1078     'greek':                                'el_GR.ISO8859-7',
1079     'greek.iso88597':                       'el_GR.ISO8859-7',
1080     'gu_in':                                'gu_IN.UTF-8',
1081     'gv':                                   'gv_GB.ISO8859-1',
1082     'gv_gb':                                'gv_GB.ISO8859-1',
1083     'gv_gb.iso88591':                       'gv_GB.ISO8859-1',
1084     'gv_gb.iso885914':                      'gv_GB.ISO8859-14',
1085     'gv_gb.iso885915':                      'gv_GB.ISO8859-15',
1086     'gv_gb@euro':                           'gv_GB.ISO8859-15',
1087     'he':                                   'he_IL.ISO8859-8',
1088     'he_il':                                'he_IL.ISO8859-8',
1089     'he_il.cp1255':                         'he_IL.CP1255',
1090     'he_il.iso88598':                       'he_IL.ISO8859-8',
1091     'he_il.microsoftcp1255':                'he_IL.CP1255',
1092     'hebrew':                               'iw_IL.ISO8859-8',
1093     'hebrew.iso88598':                      'iw_IL.ISO8859-8',
1094     'hi':                                   'hi_IN.ISCII-DEV',
1095     'hi_in':                                'hi_IN.ISCII-DEV',
1096     'hi_in.isciidev':                       'hi_IN.ISCII-DEV',
1097     'hr':                                   'hr_HR.ISO8859-2',
1098     'hr_hr':                                'hr_HR.ISO8859-2',
1099     'hr_hr.iso88592':                       'hr_HR.ISO8859-2',
1100     'hrvatski':                             'hr_HR.ISO8859-2',
1101     'hu':                                   'hu_HU.ISO8859-2',
1102     'hu_hu':                                'hu_HU.ISO8859-2',
1103     'hu_hu.iso88592':                       'hu_HU.ISO8859-2',
1104     'hungarian':                            'hu_HU.ISO8859-2',
1105     'icelandic':                            'is_IS.ISO8859-1',
1106     'icelandic.iso88591':                   'is_IS.ISO8859-1',
1107     'id':                                   'id_ID.ISO8859-1',
1108     'id_id':                                'id_ID.ISO8859-1',
1109     'in':                                   'id_ID.ISO8859-1',
1110     'in_id':                                'id_ID.ISO8859-1',
1111     'is':                                   'is_IS.ISO8859-1',
1112     'is_is':                                'is_IS.ISO8859-1',
1113     'is_is.iso88591':                       'is_IS.ISO8859-1',
1114     'is_is.iso885915':                      'is_IS.ISO8859-15',
1115     'is_is@euro':                           'is_IS.ISO8859-15',
1116     'iso-8859-1':                           'en_US.ISO8859-1',
1117     'iso-8859-15':                          'en_US.ISO8859-15',
1118     'iso8859-1':                            'en_US.ISO8859-1',
1119     'iso8859-15':                           'en_US.ISO8859-15',
1120     'iso_8859_1':                           'en_US.ISO8859-1',
1121     'iso_8859_15':                          'en_US.ISO8859-15',
1122     'it':                                   'it_IT.ISO8859-1',
1123     'it_ch':                                'it_CH.ISO8859-1',
1124     'it_ch.iso88591':                       'it_CH.ISO8859-1',
1125     'it_ch.iso885915':                      'it_CH.ISO8859-15',
1126     'it_ch@euro':                           'it_CH.ISO8859-15',
1127     'it_it':                                'it_IT.ISO8859-1',
1128     'it_it.88591':                          'it_IT.ISO8859-1',
1129     'it_it.iso88591':                       'it_IT.ISO8859-1',
1130     'it_it.iso885915':                      'it_IT.ISO8859-15',
1131     'it_it.iso885915@euro':                 'it_IT.ISO8859-15',
1132     'it_it.utf8@euro':                      'it_IT.UTF-8',
1133     'it_it@euro':                           'it_IT.ISO8859-15',
1134     'italian':                              'it_IT.ISO8859-1',
1135     'italian.iso88591':                     'it_IT.ISO8859-1',
1136     'iu':                                   'iu_CA.NUNACOM-8',
1137     'iu_ca':                                'iu_CA.NUNACOM-8',
1138     'iu_ca.nunacom8':                       'iu_CA.NUNACOM-8',
1139     'iw':                                   'he_IL.ISO8859-8',
1140     'iw_il':                                'he_IL.ISO8859-8',
1141     'iw_il.iso88598':                       'he_IL.ISO8859-8',
1142     'ja':                                   'ja_JP.eucJP',
1143     'ja.jis':                               'ja_JP.JIS7',
1144     'ja.sjis':                              'ja_JP.SJIS',
1145     'ja_jp':                                'ja_JP.eucJP',
1146     'ja_jp.ajec':                           'ja_JP.eucJP',
1147     'ja_jp.euc':                            'ja_JP.eucJP',
1148     'ja_jp.eucjp':                          'ja_JP.eucJP',
1149     'ja_jp.iso-2022-jp':                    'ja_JP.JIS7',
1150     'ja_jp.iso2022jp':                      'ja_JP.JIS7',
1151     'ja_jp.jis':                            'ja_JP.JIS7',
1152     'ja_jp.jis7':                           'ja_JP.JIS7',
1153     'ja_jp.mscode':                         'ja_JP.SJIS',
1154     'ja_jp.sjis':                           'ja_JP.SJIS',
1155     'ja_jp.ujis':                           'ja_JP.eucJP',
1156     'japan':                                'ja_JP.eucJP',
1157     'japanese':                             'ja_JP.eucJP',
1158     'japanese-euc':                         'ja_JP.eucJP',
1159     'japanese.euc':                         'ja_JP.eucJP',
1160     'japanese.sjis':                        'ja_JP.SJIS',
1161     'jp_jp':                                'ja_JP.eucJP',
1162     'ka':                                   'ka_GE.GEORGIAN-ACADEMY',
1163     'ka_ge':                                'ka_GE.GEORGIAN-ACADEMY',
1164     'ka_ge.georgianacademy':                'ka_GE.GEORGIAN-ACADEMY',
1165     'ka_ge.georgianps':                     'ka_GE.GEORGIAN-PS',
1166     'ka_ge.georgianrs':                     'ka_GE.GEORGIAN-ACADEMY',
1167     'kl':                                   'kl_GL.ISO8859-1',
1168     'kl_gl':                                'kl_GL.ISO8859-1',
1169     'kl_gl.iso88591':                       'kl_GL.ISO8859-1',
1170     'kl_gl.iso885915':                      'kl_GL.ISO8859-15',
1171     'kl_gl@euro':                           'kl_GL.ISO8859-15',
1172     'km_kh':                                'km_KH.UTF-8',
1173     'kn_in':                                'kn_IN.UTF-8',
1174     'ko':                                   'ko_KR.eucKR',
1175     'ko_kr':                                'ko_KR.eucKR',
1176     'ko_kr.euc':                            'ko_KR.eucKR',
1177     'ko_kr.euckr':                          'ko_KR.eucKR',
1178     'korean':                               'ko_KR.eucKR',
1179     'korean.euc':                           'ko_KR.eucKR',
1180     'kw':                                   'kw_GB.ISO8859-1',
1181     'kw_gb':                                'kw_GB.ISO8859-1',
1182     'kw_gb.iso88591':                       'kw_GB.ISO8859-1',
1183     'kw_gb.iso885914':                      'kw_GB.ISO8859-14',
1184     'kw_gb.iso885915':                      'kw_GB.ISO8859-15',
1185     'kw_gb@euro':                           'kw_GB.ISO8859-15',
1186     'ky':                                   'ky_KG.UTF-8',
1187     'ky_kg':                                'ky_KG.UTF-8',
1188     'lithuanian':                           'lt_LT.ISO8859-13',
1189     'lo':                                   'lo_LA.MULELAO-1',
1190     'lo_la':                                'lo_LA.MULELAO-1',
1191     'lo_la.cp1133':                         'lo_LA.IBM-CP1133',
1192     'lo_la.ibmcp1133':                      'lo_LA.IBM-CP1133',
1193     'lo_la.mulelao1':                       'lo_LA.MULELAO-1',
1194     'lt':                                   'lt_LT.ISO8859-13',
1195     'lt_lt':                                'lt_LT.ISO8859-13',
1196     'lt_lt.iso885913':                      'lt_LT.ISO8859-13',
1197     'lt_lt.iso88594':                       'lt_LT.ISO8859-4',
1198     'lv':                                   'lv_LV.ISO8859-13',
1199     'lv_lv':                                'lv_LV.ISO8859-13',
1200     'lv_lv.iso885913':                      'lv_LV.ISO8859-13',
1201     'lv_lv.iso88594':                       'lv_LV.ISO8859-4',
1202     'mi':                                   'mi_NZ.ISO8859-1',
1203     'mi_nz':                                'mi_NZ.ISO8859-1',
1204     'mi_nz.iso88591':                       'mi_NZ.ISO8859-1',
1205     'mk':                                   'mk_MK.ISO8859-5',
1206     'mk_mk':                                'mk_MK.ISO8859-5',
1207     'mk_mk.cp1251':                         'mk_MK.CP1251',
1208     'mk_mk.iso88595':                       'mk_MK.ISO8859-5',
1209     'mk_mk.microsoftcp1251':                'mk_MK.CP1251',
1210     'mr_in':                                'mr_IN.UTF-8',
1211     'ms':                                   'ms_MY.ISO8859-1',
1212     'ms_my':                                'ms_MY.ISO8859-1',
1213     'ms_my.iso88591':                       'ms_MY.ISO8859-1',
1214     'mt':                                   'mt_MT.ISO8859-3',
1215     'mt_mt':                                'mt_MT.ISO8859-3',
1216     'mt_mt.iso88593':                       'mt_MT.ISO8859-3',
1217     'nb':                                   'nb_NO.ISO8859-1',
1218     'nb_no':                                'nb_NO.ISO8859-1',
1219     'nb_no.88591':                          'nb_NO.ISO8859-1',
1220     'nb_no.iso88591':                       'nb_NO.ISO8859-1',
1221     'nb_no.iso885915':                      'nb_NO.ISO8859-15',
1222     'nb_no@euro':                           'nb_NO.ISO8859-15',
1223     'nl':                                   'nl_NL.ISO8859-1',
1224     'nl_be':                                'nl_BE.ISO8859-1',
1225     'nl_be.88591':                          'nl_BE.ISO8859-1',
1226     'nl_be.iso88591':                       'nl_BE.ISO8859-1',
1227     'nl_be.iso885915':                      'nl_BE.ISO8859-15',
1228     'nl_be.iso885915@euro':                 'nl_BE.ISO8859-15',
1229     'nl_be.utf8@euro':                      'nl_BE.UTF-8',
1230     'nl_be@euro':                           'nl_BE.ISO8859-15',
1231     'nl_nl':                                'nl_NL.ISO8859-1',
1232     'nl_nl.88591':                          'nl_NL.ISO8859-1',
1233     'nl_nl.iso88591':                       'nl_NL.ISO8859-1',
1234     'nl_nl.iso885915':                      'nl_NL.ISO8859-15',
1235     'nl_nl.iso885915@euro':                 'nl_NL.ISO8859-15',
1236     'nl_nl.utf8@euro':                      'nl_NL.UTF-8',
1237     'nl_nl@euro':                           'nl_NL.ISO8859-15',
1238     'nn':                                   'nn_NO.ISO8859-1',
1239     'nn_no':                                'nn_NO.ISO8859-1',
1240     'nn_no.88591':                          'nn_NO.ISO8859-1',
1241     'nn_no.iso88591':                       'nn_NO.ISO8859-1',
1242     'nn_no.iso885915':                      'nn_NO.ISO8859-15',
1243     'nn_no@euro':                           'nn_NO.ISO8859-15',
1244     'no':                                   'no_NO.ISO8859-1',
1245     'no@nynorsk':                           'ny_NO.ISO8859-1',
1246     'no_no':                                'no_NO.ISO8859-1',
1247     'no_no.88591':                          'no_NO.ISO8859-1',
1248     'no_no.iso88591':                       'no_NO.ISO8859-1',
1249     'no_no.iso885915':                      'no_NO.ISO8859-15',
1250     'no_no@euro':                           'no_NO.ISO8859-15',
1251     'norwegian':                            'no_NO.ISO8859-1',
1252     'norwegian.iso88591':                   'no_NO.ISO8859-1',
1253     'nr':                                   'nr_ZA.ISO8859-1',
1254     'nr_za':                                'nr_ZA.ISO8859-1',
1255     'nr_za.iso88591':                       'nr_ZA.ISO8859-1',
1256     'nso':                                  'nso_ZA.ISO8859-15',
1257     'nso_za':                               'nso_ZA.ISO8859-15',
1258     'nso_za.iso885915':                     'nso_ZA.ISO8859-15',
1259     'ny':                                   'ny_NO.ISO8859-1',
1260     'ny_no':                                'ny_NO.ISO8859-1',
1261     'ny_no.88591':                          'ny_NO.ISO8859-1',
1262     'ny_no.iso88591':                       'ny_NO.ISO8859-1',
1263     'ny_no.iso885915':                      'ny_NO.ISO8859-15',
1264     'ny_no@euro':                           'ny_NO.ISO8859-15',
1265     'nynorsk':                              'nn_NO.ISO8859-1',
1266     'oc':                                   'oc_FR.ISO8859-1',
1267     'oc_fr':                                'oc_FR.ISO8859-1',
1268     'oc_fr.iso88591':                       'oc_FR.ISO8859-1',
1269     'oc_fr.iso885915':                      'oc_FR.ISO8859-15',
1270     'oc_fr@euro':                           'oc_FR.ISO8859-15',
1271     'pa_in':                                'pa_IN.UTF-8',
1272     'pd':                                   'pd_US.ISO8859-1',
1273     'pd_de':                                'pd_DE.ISO8859-1',
1274     'pd_de.iso88591':                       'pd_DE.ISO8859-1',
1275     'pd_de.iso885915':                      'pd_DE.ISO8859-15',
1276     'pd_de@euro':                           'pd_DE.ISO8859-15',
1277     'pd_us':                                'pd_US.ISO8859-1',
1278     'pd_us.iso88591':                       'pd_US.ISO8859-1',
1279     'pd_us.iso885915':                      'pd_US.ISO8859-15',
1280     'pd_us@euro':                           'pd_US.ISO8859-15',
1281     'ph':                                   'ph_PH.ISO8859-1',
1282     'ph_ph':                                'ph_PH.ISO8859-1',
1283     'ph_ph.iso88591':                       'ph_PH.ISO8859-1',
1284     'pl':                                   'pl_PL.ISO8859-2',
1285     'pl_pl':                                'pl_PL.ISO8859-2',
1286     'pl_pl.iso88592':                       'pl_PL.ISO8859-2',
1287     'polish':                               'pl_PL.ISO8859-2',
1288     'portuguese':                           'pt_PT.ISO8859-1',
1289     'portuguese.iso88591':                  'pt_PT.ISO8859-1',
1290     'portuguese_brazil':                    'pt_BR.ISO8859-1',
1291     'portuguese_brazil.8859':               'pt_BR.ISO8859-1',
1292     'posix':                                'C',
1293     'posix-utf2':                           'C',
1294     'pp':                                   'pp_AN.ISO8859-1',
1295     'pp_an':                                'pp_AN.ISO8859-1',
1296     'pp_an.iso88591':                       'pp_AN.ISO8859-1',
1297     'pt':                                   'pt_PT.ISO8859-1',
1298     'pt_br':                                'pt_BR.ISO8859-1',
1299     'pt_br.88591':                          'pt_BR.ISO8859-1',
1300     'pt_br.iso88591':                       'pt_BR.ISO8859-1',
1301     'pt_br.iso885915':                      'pt_BR.ISO8859-15',
1302     'pt_br@euro':                           'pt_BR.ISO8859-15',
1303     'pt_pt':                                'pt_PT.ISO8859-1',
1304     'pt_pt.88591':                          'pt_PT.ISO8859-1',
1305     'pt_pt.iso88591':                       'pt_PT.ISO8859-1',
1306     'pt_pt.iso885915':                      'pt_PT.ISO8859-15',
1307     'pt_pt.iso885915@euro':                 'pt_PT.ISO8859-15',
1308     'pt_pt.utf8@euro':                      'pt_PT.UTF-8',
1309     'pt_pt@euro':                           'pt_PT.ISO8859-15',
1310     'ro':                                   'ro_RO.ISO8859-2',
1311     'ro_ro':                                'ro_RO.ISO8859-2',
1312     'ro_ro.iso88592':                       'ro_RO.ISO8859-2',
1313     'romanian':                             'ro_RO.ISO8859-2',
1314     'ru':                                   'ru_RU.ISO8859-5',
1315     'ru_ru':                                'ru_RU.ISO8859-5',
1316     'ru_ru.cp1251':                         'ru_RU.CP1251',
1317     'ru_ru.iso88595':                       'ru_RU.ISO8859-5',
1318     'ru_ru.koi8r':                          'ru_RU.KOI8-R',
1319     'ru_ru.microsoftcp1251':                'ru_RU.CP1251',
1320     'ru_ua':                                'ru_UA.KOI8-U',
1321     'ru_ua.cp1251':                         'ru_UA.CP1251',
1322     'ru_ua.koi8u':                          'ru_UA.KOI8-U',
1323     'ru_ua.microsoftcp1251':                'ru_UA.CP1251',
1324     'rumanian':                             'ro_RO.ISO8859-2',
1325     'russian':                              'ru_RU.ISO8859-5',
1326     'rw':                                   'rw_RW.ISO8859-1',
1327     'rw_rw':                                'rw_RW.ISO8859-1',
1328     'rw_rw.iso88591':                       'rw_RW.ISO8859-1',
1329     'se_no':                                'se_NO.UTF-8',
1330     'serbocroatian':                        'sr_CS.ISO8859-2',
1331     'sh':                                   'sr_CS.ISO8859-2',
1332     'sh_hr':                                'sh_HR.ISO8859-2',
1333     'sh_hr.iso88592':                       'hr_HR.ISO8859-2',
1334     'sh_sp':                                'sr_CS.ISO8859-2',
1335     'sh_yu':                                'sr_CS.ISO8859-2',
1336     'si':                                   'si_LK.UTF-8',
1337     'si_lk':                                'si_LK.UTF-8',
1338     'sinhala':                              'si_LK.UTF-8',
1339     'sk':                                   'sk_SK.ISO8859-2',
1340     'sk_sk':                                'sk_SK.ISO8859-2',
1341     'sk_sk.iso88592':                       'sk_SK.ISO8859-2',
1342     'sl':                                   'sl_SI.ISO8859-2',
1343     'sl_cs':                                'sl_CS.ISO8859-2',
1344     'sl_si':                                'sl_SI.ISO8859-2',
1345     'sl_si.iso88592':                       'sl_SI.ISO8859-2',
1346     'slovak':                               'sk_SK.ISO8859-2',
1347     'slovene':                              'sl_SI.ISO8859-2',
1348     'slovenian':                            'sl_SI.ISO8859-2',
1349     'sp':                                   'sr_CS.ISO8859-5',
1350     'sp_yu':                                'sr_CS.ISO8859-5',
1351     'spanish':                              'es_ES.ISO8859-1',
1352     'spanish.iso88591':                     'es_ES.ISO8859-1',
1353     'spanish_spain':                        'es_ES.ISO8859-1',
1354     'spanish_spain.8859':                   'es_ES.ISO8859-1',
1355     'sq':                                   'sq_AL.ISO8859-2',
1356     'sq_al':                                'sq_AL.ISO8859-2',
1357     'sq_al.iso88592':                       'sq_AL.ISO8859-2',
1358     'sr':                                   'sr_CS.ISO8859-5',
1359     'sr@cyrillic':                          'sr_CS.ISO8859-5',
1360     'sr@latn':                              'sr_CS.ISO8859-2',
1361     'sr_cs.iso88592':                       'sr_CS.ISO8859-2',
1362     'sr_cs.iso88592@latn':                  'sr_CS.ISO8859-2',
1363     'sr_cs.iso88595':                       'sr_CS.ISO8859-5',
1364     'sr_cs.utf8@latn':                      'sr_CS.UTF-8',
1365     'sr_cs@latn':                           'sr_CS.ISO8859-2',
1366     'sr_sp':                                'sr_CS.ISO8859-2',
1367     'sr_yu':                                'sr_CS.ISO8859-5',
1368     'sr_yu.cp1251@cyrillic':                'sr_CS.CP1251',
1369     'sr_yu.iso88592':                       'sr_CS.ISO8859-2',
1370     'sr_yu.iso88595':                       'sr_CS.ISO8859-5',
1371     'sr_yu.iso88595@cyrillic':              'sr_CS.ISO8859-5',
1372     'sr_yu.microsoftcp1251@cyrillic':       'sr_CS.CP1251',
1373     'sr_yu.utf8@cyrillic':                  'sr_CS.UTF-8',
1374     'sr_yu@cyrillic':                       'sr_CS.ISO8859-5',
1375     'ss':                                   'ss_ZA.ISO8859-1',
1376     'ss_za':                                'ss_ZA.ISO8859-1',
1377     'ss_za.iso88591':                       'ss_ZA.ISO8859-1',
1378     'st':                                   'st_ZA.ISO8859-1',
1379     'st_za':                                'st_ZA.ISO8859-1',
1380     'st_za.iso88591':                       'st_ZA.ISO8859-1',
1381     'sv':                                   'sv_SE.ISO8859-1',
1382     'sv_fi':                                'sv_FI.ISO8859-1',
1383     'sv_fi.iso88591':                       'sv_FI.ISO8859-1',
1384     'sv_fi.iso885915':                      'sv_FI.ISO8859-15',
1385     'sv_fi.iso885915@euro':                 'sv_FI.ISO8859-15',
1386     'sv_fi.utf8@euro':                      'sv_FI.UTF-8',
1387     'sv_fi@euro':                           'sv_FI.ISO8859-15',
1388     'sv_se':                                'sv_SE.ISO8859-1',
1389     'sv_se.88591':                          'sv_SE.ISO8859-1',
1390     'sv_se.iso88591':                       'sv_SE.ISO8859-1',
1391     'sv_se.iso885915':                      'sv_SE.ISO8859-15',
1392     'sv_se@euro':                           'sv_SE.ISO8859-15',
1393     'swedish':                              'sv_SE.ISO8859-1',
1394     'swedish.iso88591':                     'sv_SE.ISO8859-1',
1395     'ta':                                   'ta_IN.TSCII-0',
1396     'ta_in':                                'ta_IN.TSCII-0',
1397     'ta_in.tscii':                          'ta_IN.TSCII-0',
1398     'ta_in.tscii0':                         'ta_IN.TSCII-0',
1399     'tg':                                   'tg_TJ.KOI8-C',
1400     'tg_tj':                                'tg_TJ.KOI8-C',
1401     'tg_tj.koi8c':                          'tg_TJ.KOI8-C',
1402     'th':                                   'th_TH.ISO8859-11',
1403     'th_th':                                'th_TH.ISO8859-11',
1404     'th_th.iso885911':                      'th_TH.ISO8859-11',
1405     'th_th.tactis':                         'th_TH.TIS620',
1406     'th_th.tis620':                         'th_TH.TIS620',
1407     'thai':                                 'th_TH.ISO8859-11',
1408     'tl':                                   'tl_PH.ISO8859-1',
1409     'tl_ph':                                'tl_PH.ISO8859-1',
1410     'tl_ph.iso88591':                       'tl_PH.ISO8859-1',
1411     'tn':                                   'tn_ZA.ISO8859-15',
1412     'tn_za':                                'tn_ZA.ISO8859-15',
1413     'tn_za.iso885915':                      'tn_ZA.ISO8859-15',
1414     'tr':                                   'tr_TR.ISO8859-9',
1415     'tr_tr':                                'tr_TR.ISO8859-9',
1416     'tr_tr.iso88599':                       'tr_TR.ISO8859-9',
1417     'ts':                                   'ts_ZA.ISO8859-1',
1418     'ts_za':                                'ts_ZA.ISO8859-1',
1419     'ts_za.iso88591':                       'ts_ZA.ISO8859-1',
1420     'tt':                                   'tt_RU.TATAR-CYR',
1421     'tt_ru':                                'tt_RU.TATAR-CYR',
1422     'tt_ru.koi8c':                          'tt_RU.KOI8-C',
1423     'tt_ru.tatarcyr':                       'tt_RU.TATAR-CYR',
1424     'turkish':                              'tr_TR.ISO8859-9',
1425     'turkish.iso88599':                     'tr_TR.ISO8859-9',
1426     'uk':                                   'uk_UA.KOI8-U',
1427     'uk_ua':                                'uk_UA.KOI8-U',
1428     'uk_ua.cp1251':                         'uk_UA.CP1251',
1429     'uk_ua.iso88595':                       'uk_UA.ISO8859-5',
1430     'uk_ua.koi8u':                          'uk_UA.KOI8-U',
1431     'uk_ua.microsoftcp1251':                'uk_UA.CP1251',
1432     'univ':                                 'en_US.utf',
1433     'universal':                            'en_US.utf',
1434     'universal.utf8@ucs4':                  'en_US.UTF-8',
1435     'ur':                                   'ur_PK.CP1256',
1436     'ur_pk':                                'ur_PK.CP1256',
1437     'ur_pk.cp1256':                         'ur_PK.CP1256',
1438     'ur_pk.microsoftcp1256':                'ur_PK.CP1256',
1439     'uz':                                   'uz_UZ.UTF-8',
1440     'uz_uz':                                'uz_UZ.UTF-8',
1441     'uz_uz.iso88591':                       'uz_UZ.ISO8859-1',
1442     'uz_uz.utf8@cyrillic':                  'uz_UZ.UTF-8',
1443     'uz_uz@cyrillic':                       'uz_UZ.UTF-8',
1444     've':                                   've_ZA.UTF-8',
1445     've_za':                                've_ZA.UTF-8',
1446     'vi':                                   'vi_VN.TCVN',
1447     'vi_vn':                                'vi_VN.TCVN',
1448     'vi_vn.tcvn':                           'vi_VN.TCVN',
1449     'vi_vn.tcvn5712':                       'vi_VN.TCVN',
1450     'vi_vn.viscii':                         'vi_VN.VISCII',
1451     'vi_vn.viscii111':                      'vi_VN.VISCII',
1452     'wa':                                   'wa_BE.ISO8859-1',
1453     'wa_be':                                'wa_BE.ISO8859-1',
1454     'wa_be.iso88591':                       'wa_BE.ISO8859-1',
1455     'wa_be.iso885915':                      'wa_BE.ISO8859-15',
1456     'wa_be.iso885915@euro':                 'wa_BE.ISO8859-15',
1457     'wa_be@euro':                           'wa_BE.ISO8859-15',
1458     'xh':                                   'xh_ZA.ISO8859-1',
1459     'xh_za':                                'xh_ZA.ISO8859-1',
1460     'xh_za.iso88591':                       'xh_ZA.ISO8859-1',
1461     'yi':                                   'yi_US.CP1255',
1462     'yi_us':                                'yi_US.CP1255',
1463     'yi_us.cp1255':                         'yi_US.CP1255',
1464     'yi_us.microsoftcp1255':                'yi_US.CP1255',
1465     'zh':                                   'zh_CN.eucCN',
1466     'zh_cn':                                'zh_CN.gb2312',
1467     'zh_cn.big5':                           'zh_TW.big5',
1468     'zh_cn.euc':                            'zh_CN.eucCN',
1469     'zh_cn.gb18030':                        'zh_CN.gb18030',
1470     'zh_cn.gb2312':                         'zh_CN.gb2312',
1471     'zh_cn.gbk':                            'zh_CN.gbk',
1472     'zh_hk':                                'zh_HK.big5hkscs',
1473     'zh_hk.big5':                           'zh_HK.big5',
1474     'zh_hk.big5hkscs':                      'zh_HK.big5hkscs',
1475     'zh_tw':                                'zh_TW.big5',
1476     'zh_tw.big5':                           'zh_TW.big5',
1477     'zh_tw.euc':                            'zh_TW.eucTW',
1478     'zh_tw.euctw':                          'zh_TW.eucTW',
1479     'zu':                                   'zu_ZA.ISO8859-1',
1480     'zu_za':                                'zu_ZA.ISO8859-1',
1481     'zu_za.iso88591':                       'zu_ZA.ISO8859-1',
1482 }
1483
#
# This maps Windows language identifiers to locale strings.
#
# This list has been updated from
# http://msdn.microsoft.com/library/default.asp?url=/library/en-us/intl/nls_238z.asp
# to include every locale up to Windows Vista.
#
# NOTE: this mapping is incomplete.  If your language is missing, please
# submit a bug report to the Python bug tracker, which you can find via:
#     http://www.python.org/dev/
# Make sure you include the missing language identifier and the suggested
# locale code.
#
# Keys are the numeric Windows identifiers; values are "language_REGION"
# strings.  Entries that are commented out are known identifiers without
# a supported locale string.
#

windows_locale = {
    0x0436: "af_ZA",  # Afrikaans
    0x041c: "sq_AL",  # Albanian
    0x0484: "gsw_FR", # Alsatian - France
    0x045e: "am_ET",  # Amharic - Ethiopia
    0x0401: "ar_SA",  # Arabic - Saudi Arabia
    0x0801: "ar_IQ",  # Arabic - Iraq
    0x0c01: "ar_EG",  # Arabic - Egypt
    0x1001: "ar_LY",  # Arabic - Libya
    0x1401: "ar_DZ",  # Arabic - Algeria
    0x1801: "ar_MA",  # Arabic - Morocco
    0x1c01: "ar_TN",  # Arabic - Tunisia
    0x2001: "ar_OM",  # Arabic - Oman
    0x2401: "ar_YE",  # Arabic - Yemen
    0x2801: "ar_SY",  # Arabic - Syria
    0x2c01: "ar_JO",  # Arabic - Jordan
    0x3001: "ar_LB",  # Arabic - Lebanon
    0x3401: "ar_KW",  # Arabic - Kuwait
    0x3801: "ar_AE",  # Arabic - United Arab Emirates
    0x3c01: "ar_BH",  # Arabic - Bahrain
    0x4001: "ar_QA",  # Arabic - Qatar
    0x042b: "hy_AM",  # Armenian
    0x044d: "as_IN",  # Assamese - India
    0x042c: "az_AZ",  # Azeri - Latin
    0x082c: "az_AZ",  # Azeri - Cyrillic
    0x046d: "ba_RU",  # Bashkir
    0x042d: "eu_ES",  # Basque - Spain
    0x0423: "be_BY",  # Belarusian
    0x0445: "bn_IN",  # Bengali
    0x201a: "bs_BA",  # Bosnian - Cyrillic
    0x141a: "bs_BA",  # Bosnian - Latin
    0x047e: "br_FR",  # Breton - France
    0x0402: "bg_BG",  # Bulgarian
#    0x0455: "my_MM", # Burmese - Not supported
    0x0403: "ca_ES",  # Catalan
    0x0004: "zh_CHS", # Chinese - Simplified
    0x0404: "zh_TW",  # Chinese - Taiwan
    0x0804: "zh_CN",  # Chinese - PRC
    0x0c04: "zh_HK",  # Chinese - Hong Kong S.A.R.
    0x1004: "zh_SG",  # Chinese - Singapore
    0x1404: "zh_MO",  # Chinese - Macao S.A.R.
    0x7c04: "zh_CHT", # Chinese - Traditional
    0x0483: "co_FR",  # Corsican - France
    0x041a: "hr_HR",  # Croatian
    0x101a: "hr_BA",  # Croatian - Bosnia
    0x0405: "cs_CZ",  # Czech
    0x0406: "da_DK",  # Danish
    0x048c: "gbz_AF", # Dari - Afghanistan
    0x0465: "div_MV", # Divehi - Maldives
    0x0413: "nl_NL",  # Dutch - The Netherlands
    0x0813: "nl_BE",  # Dutch - Belgium
    0x0409: "en_US",  # English - United States
    0x0809: "en_GB",  # English - United Kingdom
    0x0c09: "en_AU",  # English - Australia
    0x1009: "en_CA",  # English - Canada
    0x1409: "en_NZ",  # English - New Zealand
    0x1809: "en_IE",  # English - Ireland
    0x1c09: "en_ZA",  # English - South Africa
    0x2009: "en_JM",  # English - Jamaica
    0x2409: "en_CB",  # English - Caribbean
    0x2809: "en_BZ",  # English - Belize
    0x2c09: "en_TT",  # English - Trinidad
    0x3009: "en_ZW",  # English - Zimbabwe
    0x3409: "en_PH",  # English - Philippines
    0x4009: "en_IN",  # English - India
    0x4409: "en_MY",  # English - Malaysia
    0x4809: "en_SG",  # English - Singapore
    0x0425: "et_EE",  # Estonian
    0x0438: "fo_FO",  # Faroese
    0x0464: "fil_PH", # Filipino
    0x040b: "fi_FI",  # Finnish
    0x040c: "fr_FR",  # French - France
    0x080c: "fr_BE",  # French - Belgium
    0x0c0c: "fr_CA",  # French - Canada
    0x100c: "fr_CH",  # French - Switzerland
    0x140c: "fr_LU",  # French - Luxembourg
    0x180c: "fr_MC",  # French - Monaco
    0x0462: "fy_NL",  # Frisian - Netherlands
    0x0456: "gl_ES",  # Galician
    0x0437: "ka_GE",  # Georgian
    0x0407: "de_DE",  # German - Germany
    0x0807: "de_CH",  # German - Switzerland
    0x0c07: "de_AT",  # German - Austria
    0x1007: "de_LU",  # German - Luxembourg
    0x1407: "de_LI",  # German - Liechtenstein
    0x0408: "el_GR",  # Greek
    0x046f: "kl_GL",  # Greenlandic - Greenland
    0x0447: "gu_IN",  # Gujarati
    0x0468: "ha_NG",  # Hausa - Latin
    0x040d: "he_IL",  # Hebrew
    0x0439: "hi_IN",  # Hindi
    0x040e: "hu_HU",  # Hungarian
    0x040f: "is_IS",  # Icelandic
    0x0421: "id_ID",  # Indonesian
    0x045d: "iu_CA",  # Inuktitut - Syllabics
    0x085d: "iu_CA",  # Inuktitut - Latin
    0x083c: "ga_IE",  # Irish - Ireland
    0x0410: "it_IT",  # Italian - Italy
    0x0810: "it_CH",  # Italian - Switzerland
    0x0411: "ja_JP",  # Japanese
    0x044b: "kn_IN",  # Kannada - India
    0x043f: "kk_KZ",  # Kazakh
    0x0453: "km_KH",  # Khmer - Cambodia
    0x0486: "qut_GT", # K'iche - Guatemala
    0x0487: "rw_RW",  # Kinyarwanda - Rwanda
    0x0457: "kok_IN", # Konkani
    0x0412: "ko_KR",  # Korean
    0x0440: "ky_KG",  # Kyrgyz
    0x0454: "lo_LA",  # Lao - Lao PDR
    0x0426: "lv_LV",  # Latvian
    0x0427: "lt_LT",  # Lithuanian
    0x082e: "dsb_DE", # Lower Sorbian - Germany
    0x046e: "lb_LU",  # Luxembourgish
    0x042f: "mk_MK",  # FYROM Macedonian
    0x043e: "ms_MY",  # Malay - Malaysia
    0x083e: "ms_BN",  # Malay - Brunei Darussalam
    0x044c: "ml_IN",  # Malayalam - India
    0x043a: "mt_MT",  # Maltese
    0x0481: "mi_NZ",  # Maori
    0x047a: "arn_CL", # Mapudungun
    0x044e: "mr_IN",  # Marathi
    0x047c: "moh_CA", # Mohawk - Canada
    0x0450: "mn_MN",  # Mongolian - Cyrillic
    0x0850: "mn_CN",  # Mongolian - PRC
    0x0461: "ne_NP",  # Nepali
    0x0414: "nb_NO",  # Norwegian - Bokmal
    0x0814: "nn_NO",  # Norwegian - Nynorsk
    0x0482: "oc_FR",  # Occitan - France
    0x0448: "or_IN",  # Oriya - India
    0x0463: "ps_AF",  # Pashto - Afghanistan
    0x0429: "fa_IR",  # Persian
    0x0415: "pl_PL",  # Polish
    0x0416: "pt_BR",  # Portuguese - Brazil
    0x0816: "pt_PT",  # Portuguese - Portugal
    0x0446: "pa_IN",  # Punjabi
    0x046b: "quz_BO", # Quechua (Bolivia)
    0x086b: "quz_EC", # Quechua (Ecuador)
    0x0c6b: "quz_PE", # Quechua (Peru)
    0x0418: "ro_RO",  # Romanian - Romania
    0x0417: "rm_CH",  # Romansh
    0x0419: "ru_RU",  # Russian
    0x243b: "smn_FI", # Sami Finland
    0x103b: "smj_NO", # Sami Norway
    0x143b: "smj_SE", # Sami Sweden
    0x043b: "se_NO",  # Sami Northern Norway
    0x083b: "se_SE",  # Sami Northern Sweden
    0x0c3b: "se_FI",  # Sami Northern Finland
    0x203b: "sms_FI", # Sami Skolt
    0x183b: "sma_NO", # Sami Southern Norway
    0x1c3b: "sma_SE", # Sami Southern Sweden
    0x044f: "sa_IN",  # Sanskrit
    0x0c1a: "sr_SP",  # Serbian - Cyrillic
    0x1c1a: "sr_BA",  # Serbian - Bosnia Cyrillic
    0x081a: "sr_SP",  # Serbian - Latin
    0x181a: "sr_BA",  # Serbian - Bosnia Latin
    0x045b: "si_LK",  # Sinhala - Sri Lanka
    0x046c: "ns_ZA",  # Northern Sotho
    0x0432: "tn_ZA",  # Setswana - Southern Africa
    0x041b: "sk_SK",  # Slovak
    0x0424: "sl_SI",  # Slovenian
    0x040a: "es_ES",  # Spanish - Spain
    0x080a: "es_MX",  # Spanish - Mexico
    0x0c0a: "es_ES",  # Spanish - Spain (Modern)
    0x100a: "es_GT",  # Spanish - Guatemala
    0x140a: "es_CR",  # Spanish - Costa Rica
    0x180a: "es_PA",  # Spanish - Panama
    0x1c0a: "es_DO",  # Spanish - Dominican Republic
    0x200a: "es_VE",  # Spanish - Venezuela
    0x240a: "es_CO",  # Spanish - Colombia
    0x280a: "es_PE",  # Spanish - Peru
    0x2c0a: "es_AR",  # Spanish - Argentina
    0x300a: "es_EC",  # Spanish - Ecuador
    0x340a: "es_CL",  # Spanish - Chile
    0x380a: "es_UY",  # Spanish - Uruguay
    0x3c0a: "es_PY",  # Spanish - Paraguay
    0x400a: "es_BO",  # Spanish - Bolivia
    0x440a: "es_SV",  # Spanish - El Salvador
    0x480a: "es_HN",  # Spanish - Honduras
    0x4c0a: "es_NI",  # Spanish - Nicaragua
    0x500a: "es_PR",  # Spanish - Puerto Rico
    0x540a: "es_US",  # Spanish - United States
#    0x0430: "", # Sutu - Not supported
    0x0441: "sw_KE",  # Swahili
    0x041d: "sv_SE",  # Swedish - Sweden
    0x081d: "sv_FI",  # Swedish - Finland
    0x045a: "syr_SY", # Syriac
    0x0428: "tg_TJ",  # Tajik - Cyrillic
    0x085f: "tmz_DZ", # Tamazight - Latin
    0x0449: "ta_IN",  # Tamil
    0x0444: "tt_RU",  # Tatar
    0x044a: "te_IN",  # Telugu
    0x041e: "th_TH",  # Thai
    0x0851: "bo_BT",  # Tibetan - Bhutan
    0x0451: "bo_CN",  # Tibetan - PRC
    0x041f: "tr_TR",  # Turkish
    0x0442: "tk_TM",  # Turkmen - Cyrillic
    0x0480: "ug_CN",  # Uighur - Arabic
    0x0422: "uk_UA",  # Ukrainian
    0x042e: "wen_DE", # Upper Sorbian - Germany
    0x0420: "ur_PK",  # Urdu
    0x0820: "ur_IN",  # Urdu - India
    0x0443: "uz_UZ",  # Uzbek - Latin
    0x0843: "uz_UZ",  # Uzbek - Cyrillic
    0x042a: "vi_VN",  # Vietnamese
    0x0452: "cy_GB",  # Welsh
    0x0488: "wo_SN",  # Wolof - Senegal
    0x0434: "xh_ZA",  # Xhosa - South Africa
    0x0485: "sah_RU", # Yakut - Cyrillic
    0x0478: "ii_CN",  # Yi - PRC
    0x046a: "yo_NG",  # Yoruba - Nigeria
    0x0435: "zu_ZA",  # Zulu
}
1710
def _print_locale():

    """ Test function.

        Prints the language and encoding reported by getdefaultlocale(),
        then the getlocale() result for every LC_* category except LC_ALL
        three times: as found on entry, after resetlocale(), and after
        setlocale(LC_ALL, "") if that call succeeds.
    """
    # Gather every module-level LC_* constant.  LC_ALL is removed, so only
    # the individual categories are passed to getlocale() below.
    categories = dict((name, value) for name, value in globals().items()
                      if name[:3] == 'LC_')
    del categories['LC_ALL']

    def _report_categories():
        # One "name ... / Language / Encoding" paragraph per category.
        for name, category in categories.items():
            print('%s ...' % name)
            lang, enc = getlocale(category)
            print('   Language:  %s' % (lang or '(undefined)'))
            print('   Encoding:  %s' % (enc or '(undefined)'))
            print('')

    # NOTE: every print() below takes exactly one argument, so the output is
    # the same whether print is a statement (Python 2) or a function.
    print('Locale defaults as determined by getdefaultlocale():')
    print('-' * 72)
    lang, enc = getdefaultlocale()
    print('Language:  %s' % (lang or '(undefined)'))
    print('Encoding:  %s' % (enc or '(undefined)'))
    print('')

    print('Locale settings on startup:')
    print('-' * 72)
    _report_categories()

    print('')
    print('Locale settings after calling resetlocale():')
    print('-' * 72)
    resetlocale()
    _report_categories()

    try:
        setlocale(LC_ALL, "")
    except Error:
        # Only the module's own locale error is reported here;
        # KeyboardInterrupt, SystemExit and programming errors propagate.
        print('NOTE:')
        print('setlocale(LC_ALL, "") does not support the default locale')
        print('given in the OS environment variables.')
    else:
        print('')
        print('Locale settings after calling setlocale(LC_ALL, ""):')
        print('-' * 72)
        _report_categories()
1766
1767 ###
1768
# LC_MESSAGES is non-standard: export it only when the name was actually
# defined by the import (or the emulation) at the top of the module.
if 'LC_MESSAGES' in globals():
    __all__.append("LC_MESSAGES")
1775
if __name__ == '__main__':
    # Script entry point: run the locale report, then the number formatting
    # test.  Each print() takes a single argument so the output is the same
    # whether print is a statement (Python 2) or a function.
    print('Locale aliasing:')
    print('')
    _print_locale()
    print('')
    print('Number formatting:')
    print('')
    _test()