Lib/locale.py

   1 """ Locale support.
   2
   3     The module provides low-level access to the C lib's locale APIs
   4     and adds high level number formatting APIs as well as a locale
   5     aliasing engine to complement these.
   6
   7     The aliasing engine includes support for many commonly used locale
   8     names and maps them to values suitable for passing to the C lib's
   9     setlocale() function. It also includes default encodings for all
  10     supported locale names.
  11
  12 """
  13
  14 import sys
  15 import encodings
  16 import encodings.aliases
  17 import re
  18 import operator
  19 import functools
  20
  21 # Try importing the _locale module.
  22 #
  23 # If this fails, fall back on a basic 'C' locale emulation.
  24
  25 # Yuck:  LC_MESSAGES is non-standard:  can't tell whether it exists before
  26 # trying the import.  So __all__ is also fiddled at the end of the file.
  27 __all__ = ["getlocale", "getdefaultlocale", "getpreferredencoding", "Error",
  28            "setlocale", "resetlocale", "localeconv", "strcoll", "strxfrm",
  29            "str", "atof", "atoi", "format", "format_string", "currency",
  30            "normalize", "LC_CTYPE", "LC_COLLATE", "LC_TIME", "LC_MONETARY",
  31            "LC_NUMERIC", "LC_ALL", "CHAR_MAX"]
  32
  33 try:
  34
  35     from _locale import *
  36
  37 except ImportError:
  38
  39     # Locale emulation
  40
  41     CHAR_MAX = 127
  42     LC_ALL = 6
  43     LC_COLLATE = 3
  44     LC_CTYPE = 0
  45     LC_MESSAGES = 5
  46     LC_MONETARY = 4
  47     LC_NUMERIC = 1
  48     LC_TIME = 2
  49     Error = ValueError
  50
  51     def localeconv():
  52         """ localeconv() -> dict.
  53             Returns numeric and monetary locale-specific parameters.
  54         """
  55         # 'C' locale default values
  56         return {'grouping': [127],
  57                 'currency_symbol': '',
  58                 'n_sign_posn': 127,
  59                 'p_cs_precedes': 127,
  60                 'n_cs_precedes': 127,
  61                 'mon_grouping': [],
  62                 'n_sep_by_space': 127,
  63                 'decimal_point': '.',
  64                 'negative_sign': '',
  65                 'positive_sign': '',
  66                 'p_sep_by_space': 127,
  67                 'int_curr_symbol': '',
  68                 'p_sign_posn': 127,
  69                 'thousands_sep': '',
  70                 'mon_thousands_sep': '',
  71                 'frac_digits': 127,
  72                 'mon_decimal_point': '',
  73                 'int_frac_digits': 127}
  74
  75     def setlocale(category, value=None):
  76         """ setlocale(integer,string=None) -> string.
  77             Activates/queries locale processing.
  78         """
  79         if value not in (None, '', 'C'):
  80             raise Error, '_locale emulation only supports "C" locale'
  81         return 'C'
  82
  83     def strcoll(a,b):
  84         """ strcoll(string,string) -> int.
  85             Compares two strings according to the locale.
  86         """
  87         return cmp(a,b)
  88
  89     def strxfrm(s):
  90         """ strxfrm(string) -> string.
  91             Returns a string that behaves for cmp locale-aware.
  92         """
  93         return s
  94
  95
  96 _localeconv = localeconv
  97
  98 # With this dict, you can override some items of localeconv's return value.
  99 # This is useful for testing purposes.
 100 _override_localeconv = {}
 101
 102 @functools.wraps(_localeconv)
 103 def localeconv():
 104     d = _localeconv()
 105     if _override_localeconv:
 106         d.update(_override_localeconv)
 107     return d
 108
 109
 110 ### Number formatting APIs
 111
 112 # Author: Martin von Loewis
 113 # improved by Georg Brandl
 114
 115 # Iterate over grouping intervals
 116 def _grouping_intervals(grouping):
 117     for interval in grouping:
 118         # if grouping is -1, we are done
 119         if interval == CHAR_MAX:
 120             return
 121         # 0: re-use last group ad infinitum
 122         if interval == 0:
 123             while True:
 124                 yield last_interval
 125         yield interval
 126         last_interval = interval
 127
 128 #perform the grouping from right to left
 129 def _group(s, monetary=False):
 130     conv = localeconv()
 131     thousands_sep = conv[monetary and 'mon_thousands_sep' or 'thousands_sep']
 132     grouping = conv[monetary and 'mon_grouping' or 'grouping']
 133     if not grouping:
 134         return (s, 0)
 135     result = ""
 136     seps = 0
 137     if s[-1] == ' ':
 138         stripped = s.rstrip()
 139         right_spaces = s[len(stripped):]
 140         s = stripped
 141     else:
 142         right_spaces = ''
 143     left_spaces = ''
 144     groups = []
 145     for interval in _grouping_intervals(grouping):
 146         if not s or s[-1] not in "0123456789":
 147             # only non-digit characters remain (sign, spaces)
 148             left_spaces = s
 149             s = ''
 150             break
 151         groups.append(s[-interval:])
 152         s = s[:-interval]
 153     if s:
 154         groups.append(s)
 155     groups.reverse()
 156     return (
 157         left_spaces + thousands_sep.join(groups) + right_spaces,
 158         len(thousands_sep) * (len(groups) - 1)
 159     )
 160
 161 # Strip a given amount of excess padding from the given string
 162 def _strip_padding(s, amount):
 163     lpos = 0
 164     while amount and s[lpos] == ' ':
 165         lpos += 1
 166         amount -= 1
 167     rpos = len(s) - 1
 168     while amount and s[rpos] == ' ':
 169         rpos -= 1
 170         amount -= 1
 171     return s[lpos:rpos+1]
 172
 173 _percent_re = re.compile(r'%(?:\((?P<key>.*?)\))?'
 174                          r'(?P<modifiers>[-#0-9 +*.hlL]*?)[eEfFgGdiouxXcrs%]')
 175
 176 def format(percent, value, grouping=False, monetary=False, *additional):
 177     """Returns the locale-aware substitution of a %? specifier
 178     (percent).
 179
 180     additional is for format strings which contain one or more
 181     '*' modifiers."""
 182     # this is only for one-percent-specifier strings and this should be checked
 183     match = _percent_re.match(percent)
 184     if not match or len(match.group())!= len(percent):
 185         raise ValueError(("format() must be given exactly one %%char "
 186                          "format specifier, %s not valid") % repr(percent))
 187     return _format(percent, value, grouping, monetary, *additional)
 188
 189 def _format(percent, value, grouping=False, monetary=False, *additional):
 190     if additional:
 191         formatted = percent % ((value,) + additional)
 192     else:
 193         formatted = percent % value
 194     # floats and decimal ints need special action!
 195     if percent[-1] in 'eEfFgG':
 196         seps = 0
 197         parts = formatted.split('.')
 198         if grouping:
 199             parts[0], seps = _group(parts[0], monetary=monetary)
 200         decimal_point = localeconv()[monetary and 'mon_decimal_point'
 201                                               or 'decimal_point']
 202         formatted = decimal_point.join(parts)
 203         if seps:
 204             formatted = _strip_padding(formatted, seps)
 205     elif percent[-1] in 'diu':
 206         seps = 0
 207         if grouping:
 208             formatted, seps = _group(formatted, monetary=monetary)
 209         if seps:
 210             formatted = _strip_padding(formatted, seps)
 211     return formatted
 212
 213 def format_string(f, val, grouping=False):
 214     """Formats a string in the same way that the % formatting would use,
 215     but takes the current locale into account.
 216     Grouping is applied if the third parameter is true."""
 217     percents = list(_percent_re.finditer(f))
 218     new_f = _percent_re.sub('%s', f)
 219
 220     if isinstance(val, tuple):
 221         new_val = list(val)
 222         i = 0
 223         for perc in percents:
 224             starcount = perc.group('modifiers').count('*')
 225             new_val[i] = format(perc.group(), new_val[i], grouping, False, *new_val[i+1:i+1+starcount])
 226             del new_val[i+1:i+1+starcount]
 227             i += (1 + starcount)
 228         val = tuple(new_val)
 229     elif operator.isMappingType(val):
 230         for perc in percents:
 231             key = perc.group("key")
 232             val[key] = format(perc.group(), val[key], grouping)
 233     else:
 234         # val is a single value
 235         val = format(percents[0].group(), val, grouping)
 236
 237     return new_f % val
 238
 239 def currency(val, symbol=True, grouping=False, international=False):
 240     """Formats val according to the currency settings
 241     in the current locale."""
 242     conv = localeconv()
 243
 244     # check for illegal values
 245     digits = conv[international and 'int_frac_digits' or 'frac_digits']
 246     if digits == 127:
 247         raise ValueError("Currency formatting is not possible using "
 248                          "the 'C' locale.")
 249
 250     s = format('%%.%if' % digits, abs(val), grouping, monetary=True)
 251     # '<' and '>' are markers if the sign must be inserted between symbol and value
 252     s = '<' + s + '>'
 253
 254     if symbol:
 255         smb = conv[international and 'int_curr_symbol' or 'currency_symbol']
 256         precedes = conv[val<0 and 'n_cs_precedes' or 'p_cs_precedes']
 257         separated = conv[val<0 and 'n_sep_by_space' or 'p_sep_by_space']
 258
 259         if precedes:
 260             s = smb + (separated and ' ' or '') + s
 261         else:
 262             s = s + (separated and ' ' or '') + smb
 263
 264     sign_pos = conv[val<0 and 'n_sign_posn' or 'p_sign_posn']
 265     sign = conv[val<0 and 'negative_sign' or 'positive_sign']
 266
 267     if sign_pos == 0:
 268         s = '(' + s + ')'
 269     elif sign_pos == 1:
 270         s = sign + s
 271     elif sign_pos == 2:
 272         s = s + sign
 273     elif sign_pos == 3:
 274         s = s.replace('<', sign)
 275     elif sign_pos == 4:
 276         s = s.replace('>', sign)
 277     else:
 278         # the default if nothing specified;
 279         # this should be the most fitting sign position
 280         s = sign + s
 281
 282     return s.replace('<', '').replace('>', '')
 283
 284 def str(val):
 285     """Convert float to integer, taking the locale into account."""
 286     return format("%.12g", val)
 287
 288 def atof(string, func=float):
 289     "Parses a string as a float according to the locale settings."
 290     #First, get rid of the grouping
 291     ts = localeconv()['thousands_sep']
 292     if ts:
 293         string = string.replace(ts, '')
 294     #next, replace the decimal point with a dot
 295     dd = localeconv()['decimal_point']
 296     if dd:
 297         string = string.replace(dd, '.')
 298     #finally, parse the string
 299     return func(string)
 300
 301 def atoi(str):
 302     "Converts a string to an integer according to the locale settings."
 303     return atof(str, int)
 304
 305 def _test():
 306     setlocale(LC_ALL, "")
 307     #do grouping
 308     s1 = format("%d", 123456789,1)
 309     print s1, "is", atoi(s1)
 310     #standard formatting
 311     s1 = str(3.14)
 312     print s1, "is", atof(s1)
 313
 314 ### Locale name aliasing engine
 315
 316 # Author: Marc-Andre Lemburg, mal@lemburg.com
 317 # Various tweaks by Fredrik Lundh <fredrik@pythonware.com>
 318
 319 # Keep a reference to the low-level setlocale(); the public name is
 320 # rebound further below to a wrapper that also accepts locale tuples.
 321 _setlocale = setlocale
 322
 323 def normalize(localename):
 324
 325     """ Returns a normalized locale code for the given locale
 326         name.
 327
 328         The returned locale code is formatted for use with
 329         setlocale().
 330
 331         If normalization fails, the original name is returned
 332         unchanged.
 333
 334         If the given encoding is not known, the function defaults to
 335         the default encoding for the locale code just like setlocale()
 336         does.
 337
 338     """
 339     # Normalize the locale name and extract the encoding
 340     fullname = localename.lower()
 341     if ':' in fullname:
 342         # ':' is sometimes used as encoding delimiter.
 343         fullname = fullname.replace(':', '.')
 344     if '.' in fullname:
 345         langname, encoding = fullname.split('.')[:2]
 346         fullname = langname + '.' + encoding
 347     else:
 348         langname = fullname
 349         encoding = ''
 350
 351     # First lookup: fullname (possibly with encoding)
 352     norm_encoding = encoding.replace('-', '')
 353     norm_encoding = norm_encoding.replace('_', '')
 354     lookup_name = langname + '.' + encoding
 355     code = locale_alias.get(lookup_name, None)
 356     if code is not None:
 357         return code
 358     #print 'first lookup failed'
 359
 360     # Second try: langname (without encoding)
 361     code = locale_alias.get(langname, None)
 362     if code is not None:
 363         #print 'langname lookup succeeded'
 364         if '.' in code:
 365             langname, defenc = code.split('.')
 366         else:
 367             langname = code
 368             defenc = ''
 369         if encoding:
 370             # Convert the encoding to a C lib compatible encoding string
 371             norm_encoding = encodings.normalize_encoding(encoding)
 372             #print 'norm encoding: %r' % norm_encoding
 373             norm_encoding = encodings.aliases.aliases.get(norm_encoding,
 374                                                           norm_encoding)
 375             #print 'aliased encoding: %r' % norm_encoding
 376             encoding = locale_encoding_alias.get(norm_encoding,
 377                                                  norm_encoding)
 378         else:
 379             encoding = defenc
 380         #print 'found encoding %r' % encoding
 381         if encoding:
 382             return langname + '.' + encoding
 383         else:
 384             return langname
 385
 386     else:
 387         return localename
 388
 389 def _parse_localename(localename):
 390
 391     """ Parses the locale code for localename and returns the
 392         result as tuple (language code, encoding).
 393
 394         The localename is normalized and passed through the locale
 395         alias engine. A ValueError is raised in case the locale name
 396         cannot be parsed.
 397
 398         The language code corresponds to RFC 1766.  code and encoding
 399         can be None in case the values cannot be determined or are
 400         unknown to this implementation.
 401
 402     """
 403     code = normalize(localename)
 404     if '@' in code:
 405         # Deal with locale modifiers
 406         code, modifier = code.split('@')
 407         if modifier == 'euro' and '.' not in code:
 408             # Assume Latin-9 for @euro locales. This is bogus,
 409             # since some systems may use other encodings for these
 410             # locales. Also, we ignore other modifiers.
 411             return code, 'iso-8859-15'
 412
 413     if '.' in code:
 414         return tuple(code.split('.')[:2])
 415     elif code == 'C':
 416         return None, None
 417     raise ValueError, 'unknown locale: %s' % localename
 418
 419 def _build_localename(localetuple):
 420
 421     """ Builds a locale code from the given tuple (language code,
 422         encoding).
 423
 424         No aliasing or normalizing takes place.
 425
 426     """
 427     language, encoding = localetuple
 428     if language is None:
 429         language = 'C'
 430     if encoding is None:
 431         return language
 432     else:
 433         return language + '.' + encoding
 434
 435 def getdefaultlocale(envvars=('LC_ALL', 'LC_CTYPE', 'LANG', 'LANGUAGE')):
 436
 437     """ Tries to determine the default locale settings and returns
 438         them as tuple (language code, encoding).
 439
 440         According to POSIX, a program which has not called
 441         setlocale(LC_ALL, "") runs using the portable 'C' locale.
 442         Calling setlocale(LC_ALL, "") lets it use the default locale as
 443         defined by the LANG variable. Since we don't want to interfere
 444         with the current locale setting we thus emulate the behavior
 445         in the way described above.
 446
 447         To maintain compatibility with other platforms, not only the
 448         LANG variable is tested, but a list of variables given as
 449         envvars parameter. The first found to be defined will be
 450         used. envvars defaults to the search path used in GNU gettext;
 451         it must always contain the variable name 'LANG'.
 452
 453         Except for the code 'C', the language code corresponds to RFC
 454         1766.  code and encoding can be None in case the values cannot
 455         be determined.
 456
 457     """
 458
 459     try:
 460         # check if it's supported by the _locale module
 461         import _locale
 462         code, encoding = _locale._getdefaultlocale()
 463     except (ImportError, AttributeError):
 464         pass
 465     else:
 466         # make sure the code/encoding values are valid
 467         if sys.platform == "win32" and code and code[:2] == "0x":
 468             # map windows language identifier to language name
 469             code = windows_locale.get(int(code, 0))
 470         # ...add other platform-specific processing here, if
 471         # necessary...
 472         return code, encoding
 473
 474     # fall back on POSIX behaviour
 475     import os
 476     lookup = os.environ.get
 477     for variable in envvars:
 478         localename = lookup(variable,None)
 479         if localename:
 480             if variable == 'LANGUAGE':
 481                 localename = localename.split(':')[0]
 482             break
 483     else:
 484         localename = 'C'
 485     return _parse_localename(localename)
 486
 487
 488 def getlocale(category=LC_CTYPE):
 489
 490     """ Returns the current setting for the given locale category as
 491         tuple (language code, encoding).
 492
 493         category may be one of the LC_* value except LC_ALL. It
 494         defaults to LC_CTYPE.
 495
 496         Except for the code 'C', the language code corresponds to RFC
 497         1766.  code and encoding can be None in case the values cannot
 498         be determined.
 499
 500     """
 501     localename = _setlocale(category)
 502     if category == LC_ALL and ';' in localename:
 503         raise TypeError, 'category LC_ALL is not supported'
 504     return _parse_localename(localename)
 505
 506 def setlocale(category, locale=None):
 507
 508     """ Set the locale for the given category.  The locale can be
 509         a string, a locale tuple (language code, encoding), or None.
 510
 511         Locale tuples are converted to strings the locale aliasing
 512         engine.  Locale strings are passed directly to the C lib.
 513
 514         category may be given as one of the LC_* values.
 515
 516     """
 517     if locale and type(locale) is not type(""):
 518         # convert to string
 519         locale = normalize(_build_localename(locale))
 520     return _setlocale(category, locale)
 521
 522 def resetlocale(category=LC_ALL):
 523
 524     """ Sets the locale for category to the default setting.
 525
 526         The default setting is determined by calling
 527         getdefaultlocale(). category defaults to LC_ALL.
 528
 529     """
 530     _setlocale(category, _build_localename(getdefaultlocale()))
 531
 532 if sys.platform.startswith("win"):
 533     # On Win32, this will return the ANSI code page
 534     def getpreferredencoding(do_setlocale = True):
 535         """Return the charset that the user is likely using."""
 536         import _locale
 537         return _locale._getdefaultlocale()[1]
 538 else:
 539     # On Unix, if CODESET is available, use that.
 540     try:
 541         CODESET
 542     except NameError:
 543         # Fall back to parsing environment variables :-(
 544         def getpreferredencoding(do_setlocale = True):
 545             """Return the charset that the user is likely using,
 546             by looking at environment variables."""
 547             return getdefaultlocale()[1]
 548     else:
 549         def getpreferredencoding(do_setlocale = True):
 550             """Return the charset that the user is likely using,
 551             according to the system configuration."""
 552             if do_setlocale:
 553                 oldloc = setlocale(LC_CTYPE)
 554                 try:
 555                     setlocale(LC_CTYPE, "")
 556                 except Error:
 557                     pass
 558                 result = nl_langinfo(CODESET)
 559                 setlocale(LC_CTYPE, oldloc)
 560                 return result
 561             else:
 562                 return nl_langinfo(CODESET)
 563
 564
 565 ### Database
 566 #
 567 # The following data was extracted from the locale.alias file which
 568 # comes with X11 and then hand edited removing the explicit encoding
 569 # definitions and adding some more aliases. The file is usually
 570 # available as /usr/lib/X11/locale/locale.alias.
 571 #
 572
 573 #
 574 # The locale_encoding_alias table maps lowercase encoding alias names
 575 # to C locale encoding names (case-sensitive). Note that normalize()
 576 # first looks up the encoding in the encodings.aliases dictionary and
 577 # then applies this mapping to find the correct C lib name for the
 578 # encoding.
 579 #
 580 locale_encoding_alias = {
 581
 582     # Mappings for non-standard encoding names used in locale names
 583     '437':                          'C',
 584     'c':                            'C',
 585     'en':                           'ISO8859-1',
 586     'jis':                          'JIS7',
 587     'jis7':                         'JIS7',
 588     'ajec':                         'eucJP',
 589
 590     # Mappings from Python codec names to C lib encoding names
 591     'ascii':                        'ISO8859-1',
 592     'latin_1':                      'ISO8859-1',
 593     'iso8859_1':                    'ISO8859-1',
 594     'iso8859_10':                   'ISO8859-10',
 595     'iso8859_11':                   'ISO8859-11',
 596     'iso8859_13':                   'ISO8859-13',
 597     'iso8859_14':                   'ISO8859-14',
 598     'iso8859_15':                   'ISO8859-15',
 599     'iso8859_16':                   'ISO8859-16',
 600     'iso8859_2':                    'ISO8859-2',
 601     'iso8859_3':                    'ISO8859-3',
 602     'iso8859_4':                    'ISO8859-4',
 603     'iso8859_5':                    'ISO8859-5',
 604     'iso8859_6':                    'ISO8859-6',
 605     'iso8859_7':                    'ISO8859-7',
 606     'iso8859_8':                    'ISO8859-8',
 607     'iso8859_9':                    'ISO8859-9',
 608     'iso2022_jp':                   'JIS7',
 609     'shift_jis':                    'SJIS',
 610     'tactis':                       'TACTIS',
 611     'euc_jp':                       'eucJP',
 612     'euc_kr':                       'eucKR',
 613     'utf_8':                        'UTF8',
 614     'koi8_r':                       'KOI8-R',
 615     'koi8_u':                       'KOI8-U',
 616     # XXX This list is still incomplete. If you know more
 617     # mappings, please file a bug report. Thanks.
 618 }
 619
 620 #
 621 # The locale_alias table maps lowercase alias names to C locale names
 622 # (case-sensitive). Encodings are always separated from the locale
 623 # name using a dot ('.'); they should only be given in case the
 624 # language name is needed to interpret the given encoding alias
 625 # correctly (CJK codes often have this need).
 626 #
 627 # Note that the normalize() function which uses this table
 628 # removes '_' and '-' characters from the encoding part of the
 629 # locale name before doing the lookup. This saves a lot of
 630 # space in the table.
 631 #
 632 # MAL 2004-12-10:
 633 # Updated alias mapping to most recent locale.alias file
 634 # from X.org distribution using makelocalealias.py.
 635 #
 636 # These are the differences compared to the old mapping (Python 2.4
 637 # and older):
 638 #
 639 #    updated 'bg' -> 'bg_BG.ISO8859-5' to 'bg_BG.CP1251'
 640 #    updated 'bg_bg' -> 'bg_BG.ISO8859-5' to 'bg_BG.CP1251'
 641 #    updated 'bulgarian' -> 'bg_BG.ISO8859-5' to 'bg_BG.CP1251'
 642 #    updated 'cz' -> 'cz_CZ.ISO8859-2' to 'cs_CZ.ISO8859-2'
 643 #    updated 'cz_cz' -> 'cz_CZ.ISO8859-2' to 'cs_CZ.ISO8859-2'
 644 #    updated 'czech' -> 'cs_CS.ISO8859-2' to 'cs_CZ.ISO8859-2'
 645 #    updated 'dutch' -> 'nl_BE.ISO8859-1' to 'nl_NL.ISO8859-1'
 646 #    updated 'et' -> 'et_EE.ISO8859-4' to 'et_EE.ISO8859-15'
 647 #    updated 'et_ee' -> 'et_EE.ISO8859-4' to 'et_EE.ISO8859-15'
 648 #    updated 'fi' -> 'fi_FI.ISO8859-1' to 'fi_FI.ISO8859-15'
 649 #    updated 'fi_fi' -> 'fi_FI.ISO8859-1' to 'fi_FI.ISO8859-15'
 650 #    updated 'iw' -> 'iw_IL.ISO8859-8' to 'he_IL.ISO8859-8'
 651 #    updated 'iw_il' -> 'iw_IL.ISO8859-8' to 'he_IL.ISO8859-8'
 652 #    updated 'japanese' -> 'ja_JP.SJIS' to 'ja_JP.eucJP'
 653 #    updated 'lt' -> 'lt_LT.ISO8859-4' to 'lt_LT.ISO8859-13'
 654 #    updated 'lv' -> 'lv_LV.ISO8859-4' to 'lv_LV.ISO8859-13'
 655 #    updated 'sl' -> 'sl_CS.ISO8859-2' to 'sl_SI.ISO8859-2'
 656 #    updated 'slovene' -> 'sl_CS.ISO8859-2' to 'sl_SI.ISO8859-2'
 657 #    updated 'th_th' -> 'th_TH.TACTIS' to 'th_TH.ISO8859-11'
 658 #    updated 'zh_cn' -> 'zh_CN.eucCN' to 'zh_CN.gb2312'
 659 #    updated 'zh_cn.big5' -> 'zh_TW.eucTW' to 'zh_TW.big5'
 660 #    updated 'zh_tw' -> 'zh_TW.eucTW' to 'zh_TW.big5'
 661 #
 662 # MAL 2008-05-30:
 663 # Updated alias mapping to most recent locale.alias file
 664 # from X.org distribution using makelocalealias.py.
 665 #
 666 # These are the differences compared to the old mapping (Python 2.5
 667 # and older):
 668 #
 669 #    updated 'cs_cs.iso88592' -> 'cs_CZ.ISO8859-2' to 'cs_CS.ISO8859-2'
 670 #    updated 'serbocroatian' -> 'sh_YU.ISO8859-2' to 'sr_CS.ISO8859-2'
 671 #    updated 'sh' -> 'sh_YU.ISO8859-2' to 'sr_CS.ISO8859-2'
 672 #    updated 'sh_hr.iso88592' -> 'sh_HR.ISO8859-2' to 'hr_HR.ISO8859-2'
 673 #    updated 'sh_sp' -> 'sh_YU.ISO8859-2' to 'sr_CS.ISO8859-2'
 674 #    updated 'sh_yu' -> 'sh_YU.ISO8859-2' to 'sr_CS.ISO8859-2'
 675 #    updated 'sp' -> 'sp_YU.ISO8859-5' to 'sr_CS.ISO8859-5'
 676 #    updated 'sp_yu' -> 'sp_YU.ISO8859-5' to 'sr_CS.ISO8859-5'
 677 #    updated 'sr' -> 'sr_YU.ISO8859-5' to 'sr_CS.ISO8859-5'
 678 #    updated 'sr@cyrillic' -> 'sr_YU.ISO8859-5' to 'sr_CS.ISO8859-5'
 679 #    updated 'sr_sp' -> 'sr_SP.ISO8859-2' to 'sr_CS.ISO8859-2'
 680 #    updated 'sr_yu' -> 'sr_YU.ISO8859-5' to 'sr_CS.ISO8859-5'
 681 #    updated 'sr_yu.cp1251@cyrillic' -> 'sr_YU.CP1251' to 'sr_CS.CP1251'
 682 #    updated 'sr_yu.iso88592' -> 'sr_YU.ISO8859-2' to 'sr_CS.ISO8859-2'
 683 #    updated 'sr_yu.iso88595' -> 'sr_YU.ISO8859-5' to 'sr_CS.ISO8859-5'
 684 #    updated 'sr_yu.iso88595@cyrillic' -> 'sr_YU.ISO8859-5' to 'sr_CS.ISO8859-5'
 685 #    updated 'sr_yu.microsoftcp1251@cyrillic' -> 'sr_YU.CP1251' to 'sr_CS.CP1251'
 686 #    updated 'sr_yu.utf8@cyrillic' -> 'sr_YU.UTF-8' to 'sr_CS.UTF-8'
 687 #    updated 'sr_yu@cyrillic' -> 'sr_YU.ISO8859-5' to 'sr_CS.ISO8859-5'
 688
 689 locale_alias = {
 690     'a3':                                   'a3_AZ.KOI8-C',
 691     'a3_az':                                'a3_AZ.KOI8-C',
 692     'a3_az.koi8c':                          'a3_AZ.KOI8-C',
 693     'af':                                   'af_ZA.ISO8859-1',
 694     'af_za':                                'af_ZA.ISO8859-1',
 695     'af_za.iso88591':                       'af_ZA.ISO8859-1',
 696     'am':                                   'am_ET.UTF-8',
 697     'am_et':                                'am_ET.UTF-8',
 698     'american':                             'en_US.ISO8859-1',
 699     'american.iso88591':                    'en_US.ISO8859-1',
 700     'ar':                                   'ar_AA.ISO8859-6',
 701     'ar_aa':                                'ar_AA.ISO8859-6',
 702     'ar_aa.iso88596':                       'ar_AA.ISO8859-6',
 703     'ar_ae':                                'ar_AE.ISO8859-6',
 704     'ar_ae.iso88596':                       'ar_AE.ISO8859-6',
 705     'ar_bh':                                'ar_BH.ISO8859-6',
 706     'ar_bh.iso88596':                       'ar_BH.ISO8859-6',
 707     'ar_dz':                                'ar_DZ.ISO8859-6',
 708     'ar_dz.iso88596':                       'ar_DZ.ISO8859-6',
 709     'ar_eg':                                'ar_EG.ISO8859-6',
 710     'ar_eg.iso88596':                       'ar_EG.ISO8859-6',
 711     'ar_iq':                                'ar_IQ.ISO8859-6',
 712     'ar_iq.iso88596':                       'ar_IQ.ISO8859-6',
 713     'ar_jo':                                'ar_JO.ISO8859-6',
 714     'ar_jo.iso88596':                       'ar_JO.ISO8859-6',
 715     'ar_kw':                                'ar_KW.ISO8859-6',
 716     'ar_kw.iso88596':                       'ar_KW.ISO8859-6',
 717     'ar_lb':                                'ar_LB.ISO8859-6',
 718     'ar_lb.iso88596':                       'ar_LB.ISO8859-6',
 719     'ar_ly':                                'ar_LY.ISO8859-6',
 720     'ar_ly.iso88596':                       'ar_LY.ISO8859-6',
 721     'ar_ma':                                'ar_MA.ISO8859-6',
 722     'ar_ma.iso88596':                       'ar_MA.ISO8859-6',
 723     'ar_om':                                'ar_OM.ISO8859-6',
 724     'ar_om.iso88596':                       'ar_OM.ISO8859-6',
 725     'ar_qa':                                'ar_QA.ISO8859-6',
 726     'ar_qa.iso88596':                       'ar_QA.ISO8859-6',
 727     'ar_sa':                                'ar_SA.ISO8859-6',
 728     'ar_sa.iso88596':                       'ar_SA.ISO8859-6',
 729     'ar_sd':                                'ar_SD.ISO8859-6',
 730     'ar_sd.iso88596':                       'ar_SD.ISO8859-6',
 731     'ar_sy':                                'ar_SY.ISO8859-6',
 732     'ar_sy.iso88596':                       'ar_SY.ISO8859-6',
 733     'ar_tn':                                'ar_TN.ISO8859-6',
 734     'ar_tn.iso88596':                       'ar_TN.ISO8859-6',
 735     'ar_ye':                                'ar_YE.ISO8859-6',
 736     'ar_ye.iso88596':                       'ar_YE.ISO8859-6',
 737     'arabic':                               'ar_AA.ISO8859-6',
 738     'arabic.iso88596':                      'ar_AA.ISO8859-6',
 739     'az':                                   'az_AZ.ISO8859-9E',
 740     'az_az':                                'az_AZ.ISO8859-9E',
 741     'az_az.iso88599e':                      'az_AZ.ISO8859-9E',
 742     'be':                                   'be_BY.CP1251',
 743     'be_by':                                'be_BY.CP1251',
 744     'be_by.cp1251':                         'be_BY.CP1251',
 745     'be_by.microsoftcp1251':                'be_BY.CP1251',
 746     'bg':                                   'bg_BG.CP1251',
 747     'bg_bg':                                'bg_BG.CP1251',
 748     'bg_bg.cp1251':                         'bg_BG.CP1251',
 749     'bg_bg.iso88595':                       'bg_BG.ISO8859-5',
 750     'bg_bg.koi8r':                          'bg_BG.KOI8-R',
 751     'bg_bg.microsoftcp1251':                'bg_BG.CP1251',
 752     'bn_in':                                'bn_IN.UTF-8',
 753     'bokmal':                               'nb_NO.ISO8859-1',
 754     'bokm\xe5l':                            'nb_NO.ISO8859-1',
 755     'br':                                   'br_FR.ISO8859-1',
 756     'br_fr':                                'br_FR.ISO8859-1',
 757     'br_fr.iso88591':                       'br_FR.ISO8859-1',
 758     'br_fr.iso885914':                      'br_FR.ISO8859-14',
 759     'br_fr.iso885915':                      'br_FR.ISO8859-15',
 760     'br_fr.iso885915@euro':                 'br_FR.ISO8859-15',
 761     'br_fr.utf8@euro':                      'br_FR.UTF-8',
 762     'br_fr@euro':                           'br_FR.ISO8859-15',
 763     'bs':                                   'bs_BA.ISO8859-2',
 764     'bs_ba':                                'bs_BA.ISO8859-2',
 765     'bs_ba.iso88592':                       'bs_BA.ISO8859-2',
 766     'bulgarian':                            'bg_BG.CP1251',
 767     'c':                                    'C',
 768     'c-french':                             'fr_CA.ISO8859-1',
 769     'c-french.iso88591':                    'fr_CA.ISO8859-1',
 770     'c.en':                                 'C',
 771     'c.iso88591':                           'en_US.ISO8859-1',
 772     'c_c':                                  'C',
 773     'c_c.c':                                'C',
 774     'ca':                                   'ca_ES.ISO8859-1',
 775     'ca_es':                                'ca_ES.ISO8859-1',
 776     'ca_es.iso88591':                       'ca_ES.ISO8859-1',
 777     'ca_es.iso885915':                      'ca_ES.ISO8859-15',
 778     'ca_es.iso885915@euro':                 'ca_ES.ISO8859-15',
 779     'ca_es.utf8@euro':                      'ca_ES.UTF-8',
 780     'ca_es@euro':                           'ca_ES.ISO8859-15',
 781     'catalan':                              'ca_ES.ISO8859-1',
 782     'cextend':                              'en_US.ISO8859-1',
 783     'cextend.en':                           'en_US.ISO8859-1',
 784     'chinese-s':                            'zh_CN.eucCN',
 785     'chinese-t':                            'zh_TW.eucTW',
 786     'croatian':                             'hr_HR.ISO8859-2',
 787     'cs':                                   'cs_CZ.ISO8859-2',
 788     'cs_cs':                                'cs_CZ.ISO8859-2',
 789     'cs_cs.iso88592':                       'cs_CS.ISO8859-2',
 790     'cs_cz':                                'cs_CZ.ISO8859-2',
 791     'cs_cz.iso88592':                       'cs_CZ.ISO8859-2',
 792     'cy':                                   'cy_GB.ISO8859-1',
 793     'cy_gb':                                'cy_GB.ISO8859-1',
 794     'cy_gb.iso88591':                       'cy_GB.ISO8859-1',
 795     'cy_gb.iso885914':                      'cy_GB.ISO8859-14',
 796     'cy_gb.iso885915':                      'cy_GB.ISO8859-15',
 797     'cy_gb@euro':                           'cy_GB.ISO8859-15',
 798     'cz':                                   'cs_CZ.ISO8859-2',
 799     'cz_cz':                                'cs_CZ.ISO8859-2',
 800     'czech':                                'cs_CZ.ISO8859-2',
 801     'da':                                   'da_DK.ISO8859-1',
 802     'da_dk':                                'da_DK.ISO8859-1',
 803     'da_dk.88591':                          'da_DK.ISO8859-1',
 804     'da_dk.885915':                         'da_DK.ISO8859-15',
 805     'da_dk.iso88591':                       'da_DK.ISO8859-1',
 806     'da_dk.iso885915':                      'da_DK.ISO8859-15',
 807     'da_dk@euro':                           'da_DK.ISO8859-15',
 808     'danish':                               'da_DK.ISO8859-1',
 809     'danish.iso88591':                      'da_DK.ISO8859-1',
 810     'dansk':                                'da_DK.ISO8859-1',
 811     'de':                                   'de_DE.ISO8859-1',
 812     'de_at':                                'de_AT.ISO8859-1',
 813     'de_at.iso88591':                       'de_AT.ISO8859-1',
 814     'de_at.iso885915':                      'de_AT.ISO8859-15',
 815     'de_at.iso885915@euro':                 'de_AT.ISO8859-15',
 816     'de_at.utf8@euro':                      'de_AT.UTF-8',
 817     'de_at@euro':                           'de_AT.ISO8859-15',
 818     'de_be':                                'de_BE.ISO8859-1',
 819     'de_be.iso88591':                       'de_BE.ISO8859-1',
 820     'de_be.iso885915':                      'de_BE.ISO8859-15',
 821     'de_be.iso885915@euro':                 'de_BE.ISO8859-15',
 822     'de_be.utf8@euro':                      'de_BE.UTF-8',
 823     'de_be@euro':                           'de_BE.ISO8859-15',
 824     'de_ch':                                'de_CH.ISO8859-1',
 825     'de_ch.iso88591':                       'de_CH.ISO8859-1',
 826     'de_ch.iso885915':                      'de_CH.ISO8859-15',
 827     'de_ch@euro':                           'de_CH.ISO8859-15',
 828     'de_de':                                'de_DE.ISO8859-1',
 829     'de_de.88591':                          'de_DE.ISO8859-1',
 830     'de_de.885915':                         'de_DE.ISO8859-15',
 831     'de_de.885915@euro':                    'de_DE.ISO8859-15',
 832     'de_de.iso88591':                       'de_DE.ISO8859-1',
 833     'de_de.iso885915':                      'de_DE.ISO8859-15',
 834     'de_de.iso885915@euro':                 'de_DE.ISO8859-15',
 835     'de_de.utf8@euro':                      'de_DE.UTF-8',
 836     'de_de@euro':                           'de_DE.ISO8859-15',
 837     'de_lu':                                'de_LU.ISO8859-1',
 838     'de_lu.iso88591':                       'de_LU.ISO8859-1',
 839     'de_lu.iso885915':                      'de_LU.ISO8859-15',
 840     'de_lu.iso885915@euro':                 'de_LU.ISO8859-15',
 841     'de_lu.utf8@euro':                      'de_LU.UTF-8',
 842     'de_lu@euro':                           'de_LU.ISO8859-15',
 843     'deutsch':                              'de_DE.ISO8859-1',
 844     'dutch':                                'nl_NL.ISO8859-1',
 845     'dutch.iso88591':                       'nl_BE.ISO8859-1',
 846     'ee':                                   'ee_EE.ISO8859-4',
 847     'ee_ee':                                'ee_EE.ISO8859-4',
 848     'ee_ee.iso88594':                       'ee_EE.ISO8859-4',
 849     'eesti':                                'et_EE.ISO8859-1',
 850     'el':                                   'el_GR.ISO8859-7',
 851     'el_gr':                                'el_GR.ISO8859-7',
 852     'el_gr.iso88597':                       'el_GR.ISO8859-7',
 853     'el_gr@euro':                           'el_GR.ISO8859-15',
 854     'en':                                   'en_US.ISO8859-1',
 855     'en.iso88591':                          'en_US.ISO8859-1',
 856     'en_au':                                'en_AU.ISO8859-1',
 857     'en_au.iso88591':                       'en_AU.ISO8859-1',
 858     'en_be':                                'en_BE.ISO8859-1',
 859     'en_be@euro':                           'en_BE.ISO8859-15',
 860     'en_bw':                                'en_BW.ISO8859-1',
 861     'en_bw.iso88591':                       'en_BW.ISO8859-1',
 862     'en_ca':                                'en_CA.ISO8859-1',
 863     'en_ca.iso88591':                       'en_CA.ISO8859-1',
 864     'en_gb':                                'en_GB.ISO8859-1',
 865     'en_gb.88591':                          'en_GB.ISO8859-1',
 866     'en_gb.iso88591':                       'en_GB.ISO8859-1',
 867     'en_gb.iso885915':                      'en_GB.ISO8859-15',
 868     'en_gb@euro':                           'en_GB.ISO8859-15',
 869     'en_hk':                                'en_HK.ISO8859-1',
 870     'en_hk.iso88591':                       'en_HK.ISO8859-1',
 871     'en_ie':                                'en_IE.ISO8859-1',
 872     'en_ie.iso88591':                       'en_IE.ISO8859-1',
 873     'en_ie.iso885915':                      'en_IE.ISO8859-15',
 874     'en_ie.iso885915@euro':                 'en_IE.ISO8859-15',
 875     'en_ie.utf8@euro':                      'en_IE.UTF-8',
 876     'en_ie@euro':                           'en_IE.ISO8859-15',
 877     'en_in':                                'en_IN.ISO8859-1',
 878     'en_nz':                                'en_NZ.ISO8859-1',
 879     'en_nz.iso88591':                       'en_NZ.ISO8859-1',
 880     'en_ph':                                'en_PH.ISO8859-1',
 881     'en_ph.iso88591':                       'en_PH.ISO8859-1',
 882     'en_sg':                                'en_SG.ISO8859-1',
 883     'en_sg.iso88591':                       'en_SG.ISO8859-1',
 884     'en_uk':                                'en_GB.ISO8859-1',
 885     'en_us':                                'en_US.ISO8859-1',
 886     'en_us.88591':                          'en_US.ISO8859-1',
 887     'en_us.885915':                         'en_US.ISO8859-15',
 888     'en_us.iso88591':                       'en_US.ISO8859-1',
 889     'en_us.iso885915':                      'en_US.ISO8859-15',
 890     'en_us.iso885915@euro':                 'en_US.ISO8859-15',
 891     'en_us@euro':                           'en_US.ISO8859-15',
 892     'en_us@euro@euro':                      'en_US.ISO8859-15',
 893     'en_za':                                'en_ZA.ISO8859-1',
 894     'en_za.88591':                          'en_ZA.ISO8859-1',
 895     'en_za.iso88591':                       'en_ZA.ISO8859-1',
 896     'en_za.iso885915':                      'en_ZA.ISO8859-15',
 897     'en_za@euro':                           'en_ZA.ISO8859-15',
 898     'en_zw':                                'en_ZW.ISO8859-1',
 899     'en_zw.iso88591':                       'en_ZW.ISO8859-1',
 900     'eng_gb':                               'en_GB.ISO8859-1',
 901     'eng_gb.8859':                          'en_GB.ISO8859-1',
 902     'english':                              'en_EN.ISO8859-1',
 903     'english.iso88591':                     'en_EN.ISO8859-1',
 904     'english_uk':                           'en_GB.ISO8859-1',
 905     'english_uk.8859':                      'en_GB.ISO8859-1',
 906     'english_united-states':                'en_US.ISO8859-1',
 907     'english_united-states.437':            'C',
 908     'english_us':                           'en_US.ISO8859-1',
 909     'english_us.8859':                      'en_US.ISO8859-1',
 910     'english_us.ascii':                     'en_US.ISO8859-1',
 911     'eo':                                   'eo_XX.ISO8859-3',
 912     'eo_eo':                                'eo_EO.ISO8859-3',
 913     'eo_eo.iso88593':                       'eo_EO.ISO8859-3',
 914     'eo_xx':                                'eo_XX.ISO8859-3',
 915     'eo_xx.iso88593':                       'eo_XX.ISO8859-3',
 916     'es':                                   'es_ES.ISO8859-1',
 917     'es_ar':                                'es_AR.ISO8859-1',
 918     'es_ar.iso88591':                       'es_AR.ISO8859-1',
 919     'es_bo':                                'es_BO.ISO8859-1',
 920     'es_bo.iso88591':                       'es_BO.ISO8859-1',
 921     'es_cl':                                'es_CL.ISO8859-1',
 922     'es_cl.iso88591':                       'es_CL.ISO8859-1',
 923     'es_co':                                'es_CO.ISO8859-1',
 924     'es_co.iso88591':                       'es_CO.ISO8859-1',
 925     'es_cr':                                'es_CR.ISO8859-1',
 926     'es_cr.iso88591':                       'es_CR.ISO8859-1',
 927     'es_do':                                'es_DO.ISO8859-1',
 928     'es_do.iso88591':                       'es_DO.ISO8859-1',
 929     'es_ec':                                'es_EC.ISO8859-1',
 930     'es_ec.iso88591':                       'es_EC.ISO8859-1',
 931     'es_es':                                'es_ES.ISO8859-1',
 932     'es_es.88591':                          'es_ES.ISO8859-1',
 933     'es_es.iso88591':                       'es_ES.ISO8859-1',
 934     'es_es.iso885915':                      'es_ES.ISO8859-15',
 935     'es_es.iso885915@euro':                 'es_ES.ISO8859-15',
 936     'es_es.utf8@euro':                      'es_ES.UTF-8',
 937     'es_es@euro':                           'es_ES.ISO8859-15',
 938     'es_gt':                                'es_GT.ISO8859-1',
 939     'es_gt.iso88591':                       'es_GT.ISO8859-1',
 940     'es_hn':                                'es_HN.ISO8859-1',
 941     'es_hn.iso88591':                       'es_HN.ISO8859-1',
 942     'es_mx':                                'es_MX.ISO8859-1',
 943     'es_mx.iso88591':                       'es_MX.ISO8859-1',
 944     'es_ni':                                'es_NI.ISO8859-1',
 945     'es_ni.iso88591':                       'es_NI.ISO8859-1',
 946     'es_pa':                                'es_PA.ISO8859-1',
 947     'es_pa.iso88591':                       'es_PA.ISO8859-1',
 948     'es_pa.iso885915':                      'es_PA.ISO8859-15',
 949     'es_pa@euro':                           'es_PA.ISO8859-15',
 950     'es_pe':                                'es_PE.ISO8859-1',
 951     'es_pe.iso88591':                       'es_PE.ISO8859-1',
 952     'es_pe.iso885915':                      'es_PE.ISO8859-15',
 953     'es_pe@euro':                           'es_PE.ISO8859-15',
 954     'es_pr':                                'es_PR.ISO8859-1',
 955     'es_pr.iso88591':                       'es_PR.ISO8859-1',
 956     'es_py':                                'es_PY.ISO8859-1',
 957     'es_py.iso88591':                       'es_PY.ISO8859-1',
 958     'es_py.iso885915':                      'es_PY.ISO8859-15',
 959     'es_py@euro':                           'es_PY.ISO8859-15',
 960     'es_sv':                                'es_SV.ISO8859-1',
 961     'es_sv.iso88591':                       'es_SV.ISO8859-1',
 962     'es_sv.iso885915':                      'es_SV.ISO8859-15',
 963     'es_sv@euro':                           'es_SV.ISO8859-15',
 964     'es_us':                                'es_US.ISO8859-1',
 965     'es_us.iso88591':                       'es_US.ISO8859-1',
 966     'es_uy':                                'es_UY.ISO8859-1',
 967     'es_uy.iso88591':                       'es_UY.ISO8859-1',
 968     'es_uy.iso885915':                      'es_UY.ISO8859-15',
 969     'es_uy@euro':                           'es_UY.ISO8859-15',
 970     'es_ve':                                'es_VE.ISO8859-1',
 971     'es_ve.iso88591':                       'es_VE.ISO8859-1',
 972     'es_ve.iso885915':                      'es_VE.ISO8859-15',
 973     'es_ve@euro':                           'es_VE.ISO8859-15',
 974     'estonian':                             'et_EE.ISO8859-1',
 975     'et':                                   'et_EE.ISO8859-15',
 976     'et_ee':                                'et_EE.ISO8859-15',
 977     'et_ee.iso88591':                       'et_EE.ISO8859-1',
 978     'et_ee.iso885913':                      'et_EE.ISO8859-13',
 979     'et_ee.iso885915':                      'et_EE.ISO8859-15',
 980     'et_ee.iso88594':                       'et_EE.ISO8859-4',
 981     'et_ee@euro':                           'et_EE.ISO8859-15',
 982     'eu':                                   'eu_ES.ISO8859-1',
 983     'eu_es':                                'eu_ES.ISO8859-1',
 984     'eu_es.iso88591':                       'eu_ES.ISO8859-1',
 985     'eu_es.iso885915':                      'eu_ES.ISO8859-15',
 986     'eu_es.iso885915@euro':                 'eu_ES.ISO8859-15',
 987     'eu_es.utf8@euro':                      'eu_ES.UTF-8',
 988     'eu_es@euro':                           'eu_ES.ISO8859-15',
 989     'fa':                                   'fa_IR.UTF-8',
 990     'fa_ir':                                'fa_IR.UTF-8',
 991     'fa_ir.isiri3342':                      'fa_IR.ISIRI-3342',
 992     'fi':                                   'fi_FI.ISO8859-15',
 993     'fi_fi':                                'fi_FI.ISO8859-15',
 994     'fi_fi.88591':                          'fi_FI.ISO8859-1',
 995     'fi_fi.iso88591':                       'fi_FI.ISO8859-1',
 996     'fi_fi.iso885915':                      'fi_FI.ISO8859-15',
 997     'fi_fi.iso885915@euro':                 'fi_FI.ISO8859-15',
 998     'fi_fi.utf8@euro':                      'fi_FI.UTF-8',
 999     'fi_fi@euro':                           'fi_FI.ISO8859-15',
1000     'finnish':                              'fi_FI.ISO8859-1',
1001     'finnish.iso88591':                     'fi_FI.ISO8859-1',
1002     'fo':                                   'fo_FO.ISO8859-1',
1003     'fo_fo':                                'fo_FO.ISO8859-1',
1004     'fo_fo.iso88591':                       'fo_FO.ISO8859-1',
1005     'fo_fo.iso885915':                      'fo_FO.ISO8859-15',
1006     'fo_fo@euro':                           'fo_FO.ISO8859-15',
1007     'fr':                                   'fr_FR.ISO8859-1',
1008     'fr_be':                                'fr_BE.ISO8859-1',
1009     'fr_be.88591':                          'fr_BE.ISO8859-1',
1010     'fr_be.iso88591':                       'fr_BE.ISO8859-1',
1011     'fr_be.iso885915':                      'fr_BE.ISO8859-15',
1012     'fr_be.iso885915@euro':                 'fr_BE.ISO8859-15',
1013     'fr_be.utf8@euro':                      'fr_BE.UTF-8',
1014     'fr_be@euro':                           'fr_BE.ISO8859-15',
1015     'fr_ca':                                'fr_CA.ISO8859-1',
1016     'fr_ca.88591':                          'fr_CA.ISO8859-1',
1017     'fr_ca.iso88591':                       'fr_CA.ISO8859-1',
1018     'fr_ca.iso885915':                      'fr_CA.ISO8859-15',
1019     'fr_ca@euro':                           'fr_CA.ISO8859-15',
1020     'fr_ch':                                'fr_CH.ISO8859-1',
1021     'fr_ch.88591':                          'fr_CH.ISO8859-1',
1022     'fr_ch.iso88591':                       'fr_CH.ISO8859-1',
1023     'fr_ch.iso885915':                      'fr_CH.ISO8859-15',
1024     'fr_ch@euro':                           'fr_CH.ISO8859-15',
1025     'fr_fr':                                'fr_FR.ISO8859-1',
1026     'fr_fr.88591':                          'fr_FR.ISO8859-1',
1027     'fr_fr.iso88591':                       'fr_FR.ISO8859-1',
1028     'fr_fr.iso885915':                      'fr_FR.ISO8859-15',
1029     'fr_fr.iso885915@euro':                 'fr_FR.ISO8859-15',
1030     'fr_fr.utf8@euro':                      'fr_FR.UTF-8',
1031     'fr_fr@euro':                           'fr_FR.ISO8859-15',
1032     'fr_lu':                                'fr_LU.ISO8859-1',
1033     'fr_lu.88591':                          'fr_LU.ISO8859-1',
1034     'fr_lu.iso88591':                       'fr_LU.ISO8859-1',
1035     'fr_lu.iso885915':                      'fr_LU.ISO8859-15',
1036     'fr_lu.iso885915@euro':                 'fr_LU.ISO8859-15',
1037     'fr_lu.utf8@euro':                      'fr_LU.UTF-8',
1038     'fr_lu@euro':                           'fr_LU.ISO8859-15',
1039     'fran\xe7ais':                          'fr_FR.ISO8859-1',
1040     'fre_fr':                               'fr_FR.ISO8859-1',
1041     'fre_fr.8859':                          'fr_FR.ISO8859-1',
1042     'french':                               'fr_FR.ISO8859-1',
1043     'french.iso88591':                      'fr_CH.ISO8859-1',
1044     'french_france':                        'fr_FR.ISO8859-1',
1045     'french_france.8859':                   'fr_FR.ISO8859-1',
1046     'ga':                                   'ga_IE.ISO8859-1',
1047     'ga_ie':                                'ga_IE.ISO8859-1',
1048     'ga_ie.iso88591':                       'ga_IE.ISO8859-1',
1049     'ga_ie.iso885914':                      'ga_IE.ISO8859-14',
1050     'ga_ie.iso885915':                      'ga_IE.ISO8859-15',
1051     'ga_ie.iso885915@euro':                 'ga_IE.ISO8859-15',
1052     'ga_ie.utf8@euro':                      'ga_IE.UTF-8',
1053     'ga_ie@euro':                           'ga_IE.ISO8859-15',
1054     'galego':                               'gl_ES.ISO8859-1',
1055     'galician':                             'gl_ES.ISO8859-1',
1056     'gd':                                   'gd_GB.ISO8859-1',
1057     'gd_gb':                                'gd_GB.ISO8859-1',
1058     'gd_gb.iso88591':                       'gd_GB.ISO8859-1',
1059     'gd_gb.iso885914':                      'gd_GB.ISO8859-14',
1060     'gd_gb.iso885915':                      'gd_GB.ISO8859-15',
1061     'gd_gb@euro':                           'gd_GB.ISO8859-15',
1062     'ger_de':                               'de_DE.ISO8859-1',
1063     'ger_de.8859':                          'de_DE.ISO8859-1',
1064     'german':                               'de_DE.ISO8859-1',
1065     'german.iso88591':                      'de_CH.ISO8859-1',
1066     'german_germany':                       'de_DE.ISO8859-1',
1067     'german_germany.8859':                  'de_DE.ISO8859-1',
1068     'gl':                                   'gl_ES.ISO8859-1',
1069     'gl_es':                                'gl_ES.ISO8859-1',
1070     'gl_es.iso88591':                       'gl_ES.ISO8859-1',
1071     'gl_es.iso885915':                      'gl_ES.ISO8859-15',
1072     'gl_es.iso885915@euro':                 'gl_ES.ISO8859-15',
1073     'gl_es.utf8@euro':                      'gl_ES.UTF-8',
1074     'gl_es@euro':                           'gl_ES.ISO8859-15',
1075     'greek':                                'el_GR.ISO8859-7',
1076     'greek.iso88597':                       'el_GR.ISO8859-7',
1077     'gu_in':                                'gu_IN.UTF-8',
1078     'gv':                                   'gv_GB.ISO8859-1',
1079     'gv_gb':                                'gv_GB.ISO8859-1',
1080     'gv_gb.iso88591':                       'gv_GB.ISO8859-1',
1081     'gv_gb.iso885914':                      'gv_GB.ISO8859-14',
1082     'gv_gb.iso885915':                      'gv_GB.ISO8859-15',
1083     'gv_gb@euro':                           'gv_GB.ISO8859-15',
1084     'he':                                   'he_IL.ISO8859-8',
1085     'he_il':                                'he_IL.ISO8859-8',
1086     'he_il.cp1255':                         'he_IL.CP1255',
1087     'he_il.iso88598':                       'he_IL.ISO8859-8',
1088     'he_il.microsoftcp1255':                'he_IL.CP1255',
1089     'hebrew':                               'iw_IL.ISO8859-8',
1090     'hebrew.iso88598':                      'iw_IL.ISO8859-8',
1091     'hi':                                   'hi_IN.ISCII-DEV',
1092     'hi_in':                                'hi_IN.ISCII-DEV',
1093     'hi_in.isciidev':                       'hi_IN.ISCII-DEV',
1094     'hr':                                   'hr_HR.ISO8859-2',
1095     'hr_hr':                                'hr_HR.ISO8859-2',
1096     'hr_hr.iso88592':                       'hr_HR.ISO8859-2',
1097     'hrvatski':                             'hr_HR.ISO8859-2',
1098     'hu':                                   'hu_HU.ISO8859-2',
1099     'hu_hu':                                'hu_HU.ISO8859-2',
1100     'hu_hu.iso88592':                       'hu_HU.ISO8859-2',
1101     'hungarian':                            'hu_HU.ISO8859-2',
1102     'icelandic':                            'is_IS.ISO8859-1',
1103     'icelandic.iso88591':                   'is_IS.ISO8859-1',
1104     'id':                                   'id_ID.ISO8859-1',
1105     'id_id':                                'id_ID.ISO8859-1',
1106     'in':                                   'id_ID.ISO8859-1',
1107     'in_id':                                'id_ID.ISO8859-1',
1108     'is':                                   'is_IS.ISO8859-1',
1109     'is_is':                                'is_IS.ISO8859-1',
1110     'is_is.iso88591':                       'is_IS.ISO8859-1',
1111     'is_is.iso885915':                      'is_IS.ISO8859-15',
1112     'is_is@euro':                           'is_IS.ISO8859-15',
1113     'iso-8859-1':                           'en_US.ISO8859-1',
1114     'iso-8859-15':                          'en_US.ISO8859-15',
1115     'iso8859-1':                            'en_US.ISO8859-1',
1116     'iso8859-15':                           'en_US.ISO8859-15',
1117     'iso_8859_1':                           'en_US.ISO8859-1',
1118     'iso_8859_15':                          'en_US.ISO8859-15',
1119     'it':                                   'it_IT.ISO8859-1',
1120     'it_ch':                                'it_CH.ISO8859-1',
1121     'it_ch.iso88591':                       'it_CH.ISO8859-1',
1122     'it_ch.iso885915':                      'it_CH.ISO8859-15',
1123     'it_ch@euro':                           'it_CH.ISO8859-15',
1124     'it_it':                                'it_IT.ISO8859-1',
1125     'it_it.88591':                          'it_IT.ISO8859-1',
1126     'it_it.iso88591':                       'it_IT.ISO8859-1',
1127     'it_it.iso885915':                      'it_IT.ISO8859-15',
1128     'it_it.iso885915@euro':                 'it_IT.ISO8859-15',
1129     'it_it.utf8@euro':                      'it_IT.UTF-8',
1130     'it_it@euro':                           'it_IT.ISO8859-15',
1131     'italian':                              'it_IT.ISO8859-1',
1132     'italian.iso88591':                     'it_IT.ISO8859-1',
1133     'iu':                                   'iu_CA.NUNACOM-8',
1134     'iu_ca':                                'iu_CA.NUNACOM-8',
1135     'iu_ca.nunacom8':                       'iu_CA.NUNACOM-8',
1136     'iw':                                   'he_IL.ISO8859-8',
1137     'iw_il':                                'he_IL.ISO8859-8',
1138     'iw_il.iso88598':                       'he_IL.ISO8859-8',
1139     'ja':                                   'ja_JP.eucJP',
1140     'ja.jis':                               'ja_JP.JIS7',
1141     'ja.sjis':                              'ja_JP.SJIS',
1142     'ja_jp':                                'ja_JP.eucJP',
1143     'ja_jp.ajec':                           'ja_JP.eucJP',
1144     'ja_jp.euc':                            'ja_JP.eucJP',
1145     'ja_jp.eucjp':                          'ja_JP.eucJP',
1146     'ja_jp.iso-2022-jp':                    'ja_JP.JIS7',
1147     'ja_jp.iso2022jp':                      'ja_JP.JIS7',
1148     'ja_jp.jis':                            'ja_JP.JIS7',
1149     'ja_jp.jis7':                           'ja_JP.JIS7',
1150     'ja_jp.mscode':                         'ja_JP.SJIS',
1151     'ja_jp.sjis':                           'ja_JP.SJIS',
1152     'ja_jp.ujis':                           'ja_JP.eucJP',
1153     'japan':                                'ja_JP.eucJP',
1154     'japanese':                             'ja_JP.eucJP',
1155     'japanese-euc':                         'ja_JP.eucJP',
1156     'japanese.euc':                         'ja_JP.eucJP',
1157     'japanese.sjis':                        'ja_JP.SJIS',
1158     'jp_jp':                                'ja_JP.eucJP',
1159     'ka':                                   'ka_GE.GEORGIAN-ACADEMY',
1160     'ka_ge':                                'ka_GE.GEORGIAN-ACADEMY',
1161     'ka_ge.georgianacademy':                'ka_GE.GEORGIAN-ACADEMY',
1162     'ka_ge.georgianps':                     'ka_GE.GEORGIAN-PS',
1163     'ka_ge.georgianrs':                     'ka_GE.GEORGIAN-ACADEMY',
1164     'kl':                                   'kl_GL.ISO8859-1',
1165     'kl_gl':                                'kl_GL.ISO8859-1',
1166     'kl_gl.iso88591':                       'kl_GL.ISO8859-1',
1167     'kl_gl.iso885915':                      'kl_GL.ISO8859-15',
1168     'kl_gl@euro':                           'kl_GL.ISO8859-15',
1169     'km_kh':                                'km_KH.UTF-8',
1170     'kn_in':                                'kn_IN.UTF-8',
1171     'ko':                                   'ko_KR.eucKR',
1172     'ko_kr':                                'ko_KR.eucKR',
1173     'ko_kr.euc':                            'ko_KR.eucKR',
1174     'ko_kr.euckr':                          'ko_KR.eucKR',
1175     'korean':                               'ko_KR.eucKR',
1176     'korean.euc':                           'ko_KR.eucKR',
1177     'kw':                                   'kw_GB.ISO8859-1',
1178     'kw_gb':                                'kw_GB.ISO8859-1',
1179     'kw_gb.iso88591':                       'kw_GB.ISO8859-1',
1180     'kw_gb.iso885914':                      'kw_GB.ISO8859-14',
1181     'kw_gb.iso885915':                      'kw_GB.ISO8859-15',
1182     'kw_gb@euro':                           'kw_GB.ISO8859-15',
1183     'ky':                                   'ky_KG.UTF-8',
1184     'ky_kg':                                'ky_KG.UTF-8',
1185     'lithuanian':                           'lt_LT.ISO8859-13',
1186     'lo':                                   'lo_LA.MULELAO-1',
1187     'lo_la':                                'lo_LA.MULELAO-1',
1188     'lo_la.cp1133':                         'lo_LA.IBM-CP1133',
1189     'lo_la.ibmcp1133':                      'lo_LA.IBM-CP1133',
1190     'lo_la.mulelao1':                       'lo_LA.MULELAO-1',
1191     'lt':                                   'lt_LT.ISO8859-13',
1192     'lt_lt':                                'lt_LT.ISO8859-13',
1193     'lt_lt.iso885913':                      'lt_LT.ISO8859-13',
1194     'lt_lt.iso88594':                       'lt_LT.ISO8859-4',
1195     'lv':                                   'lv_LV.ISO8859-13',
1196     'lv_lv':                                'lv_LV.ISO8859-13',
1197     'lv_lv.iso885913':                      'lv_LV.ISO8859-13',
1198     'lv_lv.iso88594':                       'lv_LV.ISO8859-4',
1199     'mi':                                   'mi_NZ.ISO8859-1',
1200     'mi_nz':                                'mi_NZ.ISO8859-1',
1201     'mi_nz.iso88591':                       'mi_NZ.ISO8859-1',
1202     'mk':                                   'mk_MK.ISO8859-5',
1203     'mk_mk':                                'mk_MK.ISO8859-5',
1204     'mk_mk.cp1251':                         'mk_MK.CP1251',
1205     'mk_mk.iso88595':                       'mk_MK.ISO8859-5',
1206     'mk_mk.microsoftcp1251':                'mk_MK.CP1251',
1207     'mr_in':                                'mr_IN.UTF-8',
1208     'ms':                                   'ms_MY.ISO8859-1',
1209     'ms_my':                                'ms_MY.ISO8859-1',
1210     'ms_my.iso88591':                       'ms_MY.ISO8859-1',
1211     'mt':                                   'mt_MT.ISO8859-3',
1212     'mt_mt':                                'mt_MT.ISO8859-3',
1213     'mt_mt.iso88593':                       'mt_MT.ISO8859-3',
1214     'nb':                                   'nb_NO.ISO8859-1',
1215     'nb_no':                                'nb_NO.ISO8859-1',
1216     'nb_no.88591':                          'nb_NO.ISO8859-1',
1217     'nb_no.iso88591':                       'nb_NO.ISO8859-1',
1218     'nb_no.iso885915':                      'nb_NO.ISO8859-15',
1219     'nb_no@euro':                           'nb_NO.ISO8859-15',
1220     'nl':                                   'nl_NL.ISO8859-1',
1221     'nl_be':                                'nl_BE.ISO8859-1',
1222     'nl_be.88591':                          'nl_BE.ISO8859-1',
1223     'nl_be.iso88591':                       'nl_BE.ISO8859-1',
1224     'nl_be.iso885915':                      'nl_BE.ISO8859-15',
1225     'nl_be.iso885915@euro':                 'nl_BE.ISO8859-15',
1226     'nl_be.utf8@euro':                      'nl_BE.UTF-8',
1227     'nl_be@euro':                           'nl_BE.ISO8859-15',
1228     'nl_nl':                                'nl_NL.ISO8859-1',
1229     'nl_nl.88591':                          'nl_NL.ISO8859-1',
1230     'nl_nl.iso88591':                       'nl_NL.ISO8859-1',
1231     'nl_nl.iso885915':                      'nl_NL.ISO8859-15',
1232     'nl_nl.iso885915@euro':                 'nl_NL.ISO8859-15',
1233     'nl_nl.utf8@euro':                      'nl_NL.UTF-8',
1234     'nl_nl@euro':                           'nl_NL.ISO8859-15',
1235     'nn':                                   'nn_NO.ISO8859-1',
1236     'nn_no':                                'nn_NO.ISO8859-1',
1237     'nn_no.88591':                          'nn_NO.ISO8859-1',
1238     'nn_no.iso88591':                       'nn_NO.ISO8859-1',
1239     'nn_no.iso885915':                      'nn_NO.ISO8859-15',
1240     'nn_no@euro':                           'nn_NO.ISO8859-15',
1241     'no':                                   'no_NO.ISO8859-1',
1242     'no@nynorsk':                           'ny_NO.ISO8859-1',
1243     'no_no':                                'no_NO.ISO8859-1',
1244     'no_no.88591':                          'no_NO.ISO8859-1',
1245     'no_no.iso88591':                       'no_NO.ISO8859-1',
1246     'no_no.iso885915':                      'no_NO.ISO8859-15',
1247     'no_no@euro':                           'no_NO.ISO8859-15',
1248     'norwegian':                            'no_NO.ISO8859-1',
1249     'norwegian.iso88591':                   'no_NO.ISO8859-1',
1250     'nr':                                   'nr_ZA.ISO8859-1',
1251     'nr_za':                                'nr_ZA.ISO8859-1',
1252     'nr_za.iso88591':                       'nr_ZA.ISO8859-1',
1253     'nso':                                  'nso_ZA.ISO8859-15',
1254     'nso_za':                               'nso_ZA.ISO8859-15',
1255     'nso_za.iso885915':                     'nso_ZA.ISO8859-15',
1256     'ny':                                   'ny_NO.ISO8859-1',
1257     'ny_no':                                'ny_NO.ISO8859-1',
1258     'ny_no.88591':                          'ny_NO.ISO8859-1',
1259     'ny_no.iso88591':                       'ny_NO.ISO8859-1',
1260     'ny_no.iso885915':                      'ny_NO.ISO8859-15',
1261     'ny_no@euro':                           'ny_NO.ISO8859-15',
1262     'nynorsk':                              'nn_NO.ISO8859-1',
1263     'oc':                                   'oc_FR.ISO8859-1',
1264     'oc_fr':                                'oc_FR.ISO8859-1',
1265     'oc_fr.iso88591':                       'oc_FR.ISO8859-1',
1266     'oc_fr.iso885915':                      'oc_FR.ISO8859-15',
1267     'oc_fr@euro':                           'oc_FR.ISO8859-15',
1268     'pa_in':                                'pa_IN.UTF-8',
1269     'pd':                                   'pd_US.ISO8859-1',
1270     'pd_de':                                'pd_DE.ISO8859-1',
1271     'pd_de.iso88591':                       'pd_DE.ISO8859-1',
1272     'pd_de.iso885915':                      'pd_DE.ISO8859-15',
1273     'pd_de@euro':                           'pd_DE.ISO8859-15',
1274     'pd_us':                                'pd_US.ISO8859-1',
1275     'pd_us.iso88591':                       'pd_US.ISO8859-1',
1276     'pd_us.iso885915':                      'pd_US.ISO8859-15',
1277     'pd_us@euro':                           'pd_US.ISO8859-15',
1278     'ph':                                   'ph_PH.ISO8859-1',
1279     'ph_ph':                                'ph_PH.ISO8859-1',
1280     'ph_ph.iso88591':                       'ph_PH.ISO8859-1',
1281     'pl':                                   'pl_PL.ISO8859-2',
1282     'pl_pl':                                'pl_PL.ISO8859-2',
1283     'pl_pl.iso88592':                       'pl_PL.ISO8859-2',
1284     'polish':                               'pl_PL.ISO8859-2',
1285     'portuguese':                           'pt_PT.ISO8859-1',
1286     'portuguese.iso88591':                  'pt_PT.ISO8859-1',
1287     'portuguese_brazil':                    'pt_BR.ISO8859-1',
1288     'portuguese_brazil.8859':               'pt_BR.ISO8859-1',
1289     'posix':                                'C',
1290     'posix-utf2':                           'C',
1291     'pp':                                   'pp_AN.ISO8859-1',
1292     'pp_an':                                'pp_AN.ISO8859-1',
1293     'pp_an.iso88591':                       'pp_AN.ISO8859-1',
1294     'pt':                                   'pt_PT.ISO8859-1',
1295     'pt_br':                                'pt_BR.ISO8859-1',
1296     'pt_br.88591':                          'pt_BR.ISO8859-1',
1297     'pt_br.iso88591':                       'pt_BR.ISO8859-1',
1298     'pt_br.iso885915':                      'pt_BR.ISO8859-15',
1299     'pt_br@euro':                           'pt_BR.ISO8859-15',
1300     'pt_pt':                                'pt_PT.ISO8859-1',
1301     'pt_pt.88591':                          'pt_PT.ISO8859-1',
1302     'pt_pt.iso88591':                       'pt_PT.ISO8859-1',
1303     'pt_pt.iso885915':                      'pt_PT.ISO8859-15',
1304     'pt_pt.iso885915@euro':                 'pt_PT.ISO8859-15',
1305     'pt_pt.utf8@euro':                      'pt_PT.UTF-8',
1306     'pt_pt@euro':                           'pt_PT.ISO8859-15',
1307     'ro':                                   'ro_RO.ISO8859-2',
1308     'ro_ro':                                'ro_RO.ISO8859-2',
1309     'ro_ro.iso88592':                       'ro_RO.ISO8859-2',
1310     'romanian':                             'ro_RO.ISO8859-2',
1311     'ru':                                   'ru_RU.ISO8859-5',
1312     'ru_ru':                                'ru_RU.ISO8859-5',
1313     'ru_ru.cp1251':                         'ru_RU.CP1251',
1314     'ru_ru.iso88595':                       'ru_RU.ISO8859-5',
1315     'ru_ru.koi8r':                          'ru_RU.KOI8-R',
1316     'ru_ru.microsoftcp1251':                'ru_RU.CP1251',
1317     'ru_ua':                                'ru_UA.KOI8-U',
1318     'ru_ua.cp1251':                         'ru_UA.CP1251',
1319     'ru_ua.koi8u':                          'ru_UA.KOI8-U',
1320     'ru_ua.microsoftcp1251':                'ru_UA.CP1251',
1321     'rumanian':                             'ro_RO.ISO8859-2',
1322     'russian':                              'ru_RU.ISO8859-5',
1323     'rw':                                   'rw_RW.ISO8859-1',
1324     'rw_rw':                                'rw_RW.ISO8859-1',
1325     'rw_rw.iso88591':                       'rw_RW.ISO8859-1',
1326     'se_no':                                'se_NO.UTF-8',
1327     'serbocroatian':                        'sr_CS.ISO8859-2',
1328     'sh':                                   'sr_CS.ISO8859-2',
1329     'sh_hr':                                'sh_HR.ISO8859-2',
1330     'sh_hr.iso88592':                       'hr_HR.ISO8859-2',
1331     'sh_sp':                                'sr_CS.ISO8859-2',
1332     'sh_yu':                                'sr_CS.ISO8859-2',
1333     'si':                                   'si_LK.UTF-8',
1334     'si_lk':                                'si_LK.UTF-8',
1335     'sinhala':                              'si_LK.UTF-8',
1336     'sk':                                   'sk_SK.ISO8859-2',
1337     'sk_sk':                                'sk_SK.ISO8859-2',
1338     'sk_sk.iso88592':                       'sk_SK.ISO8859-2',
1339     'sl':                                   'sl_SI.ISO8859-2',
1340     'sl_cs':                                'sl_CS.ISO8859-2',
1341     'sl_si':                                'sl_SI.ISO8859-2',
1342     'sl_si.iso88592':                       'sl_SI.ISO8859-2',
1343     'slovak':                               'sk_SK.ISO8859-2',
1344     'slovene':                              'sl_SI.ISO8859-2',
1345     'slovenian':                            'sl_SI.ISO8859-2',
1346     'sp':                                   'sr_CS.ISO8859-5',
1347     'sp_yu':                                'sr_CS.ISO8859-5',
1348     'spanish':                              'es_ES.ISO8859-1',
1349     'spanish.iso88591':                     'es_ES.ISO8859-1',
1350     'spanish_spain':                        'es_ES.ISO8859-1',
1351     'spanish_spain.8859':                   'es_ES.ISO8859-1',
1352     'sq':                                   'sq_AL.ISO8859-2',
1353     'sq_al':                                'sq_AL.ISO8859-2',
1354     'sq_al.iso88592':                       'sq_AL.ISO8859-2',
1355     'sr':                                   'sr_CS.ISO8859-5',
1356     'sr@cyrillic':                          'sr_CS.ISO8859-5',
1357     'sr@latn':                              'sr_CS.ISO8859-2',
1358     'sr_cs.iso88592':                       'sr_CS.ISO8859-2',
1359     'sr_cs.iso88592@latn':                  'sr_CS.ISO8859-2',
1360     'sr_cs.iso88595':                       'sr_CS.ISO8859-5',
1361     'sr_cs.utf8@latn':                      'sr_CS.UTF-8',
1362     'sr_cs@latn':                           'sr_CS.ISO8859-2',
1363     'sr_sp':                                'sr_CS.ISO8859-2',
1364     'sr_yu':                                'sr_CS.ISO8859-5',
1365     'sr_yu.cp1251@cyrillic':                'sr_CS.CP1251',
1366     'sr_yu.iso88592':                       'sr_CS.ISO8859-2',
1367     'sr_yu.iso88595':                       'sr_CS.ISO8859-5',
1368     'sr_yu.iso88595@cyrillic':              'sr_CS.ISO8859-5',
1369     'sr_yu.microsoftcp1251@cyrillic':       'sr_CS.CP1251',
1370     'sr_yu.utf8@cyrillic':                  'sr_CS.UTF-8',
1371     'sr_yu@cyrillic':                       'sr_CS.ISO8859-5',
1372     'ss':                                   'ss_ZA.ISO8859-1',
1373     'ss_za':                                'ss_ZA.ISO8859-1',
1374     'ss_za.iso88591':                       'ss_ZA.ISO8859-1',
1375     'st':                                   'st_ZA.ISO8859-1',
1376     'st_za':                                'st_ZA.ISO8859-1',
1377     'st_za.iso88591':                       'st_ZA.ISO8859-1',
1378     'sv':                                   'sv_SE.ISO8859-1',
1379     'sv_fi':                                'sv_FI.ISO8859-1',
1380     'sv_fi.iso88591':                       'sv_FI.ISO8859-1',
1381     'sv_fi.iso885915':                      'sv_FI.ISO8859-15',
1382     'sv_fi.iso885915@euro':                 'sv_FI.ISO8859-15',
1383     'sv_fi.utf8@euro':                      'sv_FI.UTF-8',
1384     'sv_fi@euro':                           'sv_FI.ISO8859-15',
1385     'sv_se':                                'sv_SE.ISO8859-1',
1386     'sv_se.88591':                          'sv_SE.ISO8859-1',
1387     'sv_se.iso88591':                       'sv_SE.ISO8859-1',
1388     'sv_se.iso885915':                      'sv_SE.ISO8859-15',
1389     'sv_se@euro':                           'sv_SE.ISO8859-15',
1390     'swedish':                              'sv_SE.ISO8859-1',
1391     'swedish.iso88591':                     'sv_SE.ISO8859-1',
1392     'ta':                                   'ta_IN.TSCII-0',
1393     'ta_in':                                'ta_IN.TSCII-0',
1394     'ta_in.tscii':                          'ta_IN.TSCII-0',
1395     'ta_in.tscii0':                         'ta_IN.TSCII-0',
1396     'tg':                                   'tg_TJ.KOI8-C',
1397     'tg_tj':                                'tg_TJ.KOI8-C',
1398     'tg_tj.koi8c':                          'tg_TJ.KOI8-C',
1399     'th':                                   'th_TH.ISO8859-11',
1400     'th_th':                                'th_TH.ISO8859-11',
1401     'th_th.iso885911':                      'th_TH.ISO8859-11',
1402     'th_th.tactis':                         'th_TH.TIS620',
1403     'th_th.tis620':                         'th_TH.TIS620',
1404     'thai':                                 'th_TH.ISO8859-11',
1405     'tl':                                   'tl_PH.ISO8859-1',
1406     'tl_ph':                                'tl_PH.ISO8859-1',
1407     'tl_ph.iso88591':                       'tl_PH.ISO8859-1',
1408     'tn':                                   'tn_ZA.ISO8859-15',
1409     'tn_za':                                'tn_ZA.ISO8859-15',
1410     'tn_za.iso885915':                      'tn_ZA.ISO8859-15',
1411     'tr':                                   'tr_TR.ISO8859-9',
1412     'tr_tr':                                'tr_TR.ISO8859-9',
1413     'tr_tr.iso88599':                       'tr_TR.ISO8859-9',
1414     'ts':                                   'ts_ZA.ISO8859-1',
1415     'ts_za':                                'ts_ZA.ISO8859-1',
1416     'ts_za.iso88591':                       'ts_ZA.ISO8859-1',
1417     'tt':                                   'tt_RU.TATAR-CYR',
1418     'tt_ru':                                'tt_RU.TATAR-CYR',
1419     'tt_ru.koi8c':                          'tt_RU.KOI8-C',
1420     'tt_ru.tatarcyr':                       'tt_RU.TATAR-CYR',
1421     'turkish':                              'tr_TR.ISO8859-9',
1422     'turkish.iso88599':                     'tr_TR.ISO8859-9',
1423     'uk':                                   'uk_UA.KOI8-U',
1424     'uk_ua':                                'uk_UA.KOI8-U',
1425     'uk_ua.cp1251':                         'uk_UA.CP1251',
1426     'uk_ua.iso88595':                       'uk_UA.ISO8859-5',
1427     'uk_ua.koi8u':                          'uk_UA.KOI8-U',
1428     'uk_ua.microsoftcp1251':                'uk_UA.CP1251',
1429     'univ':                                 'en_US.utf',
1430     'universal':                            'en_US.utf',
1431     'universal.utf8@ucs4':                  'en_US.UTF-8',
1432     'ur':                                   'ur_PK.CP1256',
1433     'ur_pk':                                'ur_PK.CP1256',
1434     'ur_pk.cp1256':                         'ur_PK.CP1256',
1435     'ur_pk.microsoftcp1256':                'ur_PK.CP1256',
1436     'uz':                                   'uz_UZ.UTF-8',
1437     'uz_uz':                                'uz_UZ.UTF-8',
1438     'uz_uz.iso88591':                       'uz_UZ.ISO8859-1',
1439     'uz_uz.utf8@cyrillic':                  'uz_UZ.UTF-8',
1440     'uz_uz@cyrillic':                       'uz_UZ.UTF-8',
1441     've':                                   've_ZA.UTF-8',
1442     've_za':                                've_ZA.UTF-8',
1443     'vi':                                   'vi_VN.TCVN',
1444     'vi_vn':                                'vi_VN.TCVN',
1445     'vi_vn.tcvn':                           'vi_VN.TCVN',
1446     'vi_vn.tcvn5712':                       'vi_VN.TCVN',
1447     'vi_vn.viscii':                         'vi_VN.VISCII',
1448     'vi_vn.viscii111':                      'vi_VN.VISCII',
1449     'wa':                                   'wa_BE.ISO8859-1',
1450     'wa_be':                                'wa_BE.ISO8859-1',
1451     'wa_be.iso88591':                       'wa_BE.ISO8859-1',
1452     'wa_be.iso885915':                      'wa_BE.ISO8859-15',
1453     'wa_be.iso885915@euro':                 'wa_BE.ISO8859-15',
1454     'wa_be@euro':                           'wa_BE.ISO8859-15',
1455     'xh':                                   'xh_ZA.ISO8859-1',
1456     'xh_za':                                'xh_ZA.ISO8859-1',
1457     'xh_za.iso88591':                       'xh_ZA.ISO8859-1',
1458     'yi':                                   'yi_US.CP1255',
1459     'yi_us':                                'yi_US.CP1255',
1460     'yi_us.cp1255':                         'yi_US.CP1255',
1461     'yi_us.microsoftcp1255':                'yi_US.CP1255',
1462     'zh':                                   'zh_CN.eucCN',
1463     'zh_cn':                                'zh_CN.gb2312',
1464     'zh_cn.big5':                           'zh_TW.big5',
1465     'zh_cn.euc':                            'zh_CN.eucCN',
1466     'zh_cn.gb18030':                        'zh_CN.gb18030',
1467     'zh_cn.gb2312':                         'zh_CN.gb2312',
1468     'zh_cn.gbk':                            'zh_CN.gbk',
1469     'zh_hk':                                'zh_HK.big5hkscs',
1470     'zh_hk.big5':                           'zh_HK.big5',
1471     'zh_hk.big5hkscs':                      'zh_HK.big5hkscs',
1472     'zh_tw':                                'zh_TW.big5',
1473     'zh_tw.big5':                           'zh_TW.big5',
1474     'zh_tw.euc':                            'zh_TW.eucTW',
1475     'zh_tw.euctw':                          'zh_TW.eucTW',
1476     'zu':                                   'zu_ZA.ISO8859-1',
1477     'zu_za':                                'zu_ZA.ISO8859-1',
1478     'zu_za.iso88591':                       'zu_ZA.ISO8859-1',
1479 }
1480
1481 #
1482 # This maps Windows language identifiers to locale strings.
1483 #
1484 # This list has been updated from
1485 # http://msdn.microsoft.com/library/default.asp?url=/library/en-us/intl/nls_238z.asp
1486 # to include every locale up to Windows Vista.
1487 #
# NOTE: this mapping is incomplete.  If your language is missing, please
# submit a bug report to the Python bug tracker, which you can find via:
#     http://www.python.org/dev/
1491 # Make sure you include the missing language identifier and the suggested
1492 # locale code.
1493 #
1494
# Keys are Windows language identifiers (as integers); values are
# "language_TERRITORY" locale strings.  Several identifiers may share one
# locale string when they differ only by script (see the Latin/Cyrillic
# pairs below).
windows_locale = {
    0x0436: "af_ZA", # Afrikaans
    0x041c: "sq_AL", # Albanian
    0x0484: "gsw_FR",# Alsatian - France
    0x045e: "am_ET", # Amharic - Ethiopia
    0x0401: "ar_SA", # Arabic - Saudi Arabia
    0x0801: "ar_IQ", # Arabic - Iraq
    0x0c01: "ar_EG", # Arabic - Egypt
    0x1001: "ar_LY", # Arabic - Libya
    0x1401: "ar_DZ", # Arabic - Algeria
    0x1801: "ar_MA", # Arabic - Morocco
    0x1c01: "ar_TN", # Arabic - Tunisia
    0x2001: "ar_OM", # Arabic - Oman
    0x2401: "ar_YE", # Arabic - Yemen
    0x2801: "ar_SY", # Arabic - Syria
    0x2c01: "ar_JO", # Arabic - Jordan
    0x3001: "ar_LB", # Arabic - Lebanon
    0x3401: "ar_KW", # Arabic - Kuwait
    0x3801: "ar_AE", # Arabic - United Arab Emirates
    0x3c01: "ar_BH", # Arabic - Bahrain
    0x4001: "ar_QA", # Arabic - Qatar
    0x042b: "hy_AM", # Armenian
    0x044d: "as_IN", # Assamese - India
    0x042c: "az_AZ", # Azeri - Latin
    0x082c: "az_AZ", # Azeri - Cyrillic
    0x046d: "ba_RU", # Bashkir
    0x042d: "eu_ES", # Basque - Spain
    0x0423: "be_BY", # Belarusian
    0x0445: "bn_IN", # Bengali
    0x201a: "bs_BA", # Bosnian - Cyrillic
    0x141a: "bs_BA", # Bosnian - Latin
    0x047e: "br_FR", # Breton - France
    0x0402: "bg_BG", # Bulgarian
#    0x0455: "my_MM", # Burmese - Not supported
    0x0403: "ca_ES", # Catalan
    0x0004: "zh_CHS",# Chinese - Simplified
    0x0404: "zh_TW", # Chinese - Taiwan
    0x0804: "zh_CN", # Chinese - PRC
    0x0c04: "zh_HK", # Chinese - Hong Kong S.A.R.
    0x1004: "zh_SG", # Chinese - Singapore
    0x1404: "zh_MO", # Chinese - Macao S.A.R.
    0x7c04: "zh_CHT",# Chinese - Traditional
    0x0483: "co_FR", # Corsican - France
    0x041a: "hr_HR", # Croatian
    0x101a: "hr_BA", # Croatian - Bosnia
    0x0405: "cs_CZ", # Czech
    0x0406: "da_DK", # Danish
    0x048c: "gbz_AF",# Dari - Afghanistan
    0x0465: "div_MV",# Divehi - Maldives
    0x0413: "nl_NL", # Dutch - The Netherlands
    0x0813: "nl_BE", # Dutch - Belgium
    0x0409: "en_US", # English - United States
    0x0809: "en_GB", # English - United Kingdom
    0x0c09: "en_AU", # English - Australia
    0x1009: "en_CA", # English - Canada
    0x1409: "en_NZ", # English - New Zealand
    0x1809: "en_IE", # English - Ireland
    0x1c09: "en_ZA", # English - South Africa
    0x2009: "en_JM", # English - Jamaica
    0x2409: "en_CB", # English - Caribbean
    0x2809: "en_BZ", # English - Belize
    0x2c09: "en_TT", # English - Trinidad
    0x3009: "en_ZW", # English - Zimbabwe
    0x3409: "en_PH", # English - Philippines
    0x4009: "en_IN", # English - India
    0x4409: "en_MY", # English - Malaysia
    0x4809: "en_SG", # English - Singapore
    0x0425: "et_EE", # Estonian
    0x0438: "fo_FO", # Faroese
    0x0464: "fil_PH",# Filipino
    0x040b: "fi_FI", # Finnish
    0x040c: "fr_FR", # French - France
    0x080c: "fr_BE", # French - Belgium
    0x0c0c: "fr_CA", # French - Canada
    0x100c: "fr_CH", # French - Switzerland
    0x140c: "fr_LU", # French - Luxembourg
    0x180c: "fr_MC", # French - Monaco
    0x0462: "fy_NL", # Frisian - Netherlands
    0x0456: "gl_ES", # Galician
    0x0437: "ka_GE", # Georgian
    0x0407: "de_DE", # German - Germany
    0x0807: "de_CH", # German - Switzerland
    0x0c07: "de_AT", # German - Austria
    0x1007: "de_LU", # German - Luxembourg
    0x1407: "de_LI", # German - Liechtenstein
    0x0408: "el_GR", # Greek
    0x046f: "kl_GL", # Greenlandic - Greenland
    0x0447: "gu_IN", # Gujarati
    0x0468: "ha_NG", # Hausa - Latin
    0x040d: "he_IL", # Hebrew
    0x0439: "hi_IN", # Hindi
    0x040e: "hu_HU", # Hungarian
    0x040f: "is_IS", # Icelandic
    0x0421: "id_ID", # Indonesian
    0x045d: "iu_CA", # Inuktitut - Syllabics
    0x085d: "iu_CA", # Inuktitut - Latin
    0x083c: "ga_IE", # Irish - Ireland
    0x0410: "it_IT", # Italian - Italy
    0x0810: "it_CH", # Italian - Switzerland
    0x0411: "ja_JP", # Japanese
    0x044b: "kn_IN", # Kannada - India
    0x043f: "kk_KZ", # Kazakh
    0x0453: "km_KH", # Khmer - Cambodia
    0x0486: "qut_GT",# K'iche - Guatemala
    0x0487: "rw_RW", # Kinyarwanda - Rwanda
    0x0457: "kok_IN",# Konkani
    0x0412: "ko_KR", # Korean
    0x0440: "ky_KG", # Kyrgyz
    0x0454: "lo_LA", # Lao - Lao PDR
    0x0426: "lv_LV", # Latvian
    0x0427: "lt_LT", # Lithuanian
    0x082e: "dsb_DE",# Lower Sorbian - Germany
    0x046e: "lb_LU", # Luxembourgish
    0x042f: "mk_MK", # FYROM Macedonian
    0x043e: "ms_MY", # Malay - Malaysia
    0x083e: "ms_BN", # Malay - Brunei Darussalam
    0x044c: "ml_IN", # Malayalam - India
    0x043a: "mt_MT", # Maltese
    0x0481: "mi_NZ", # Maori
    0x047a: "arn_CL",# Mapudungun
    0x044e: "mr_IN", # Marathi
    0x047c: "moh_CA",# Mohawk - Canada
    0x0450: "mn_MN", # Mongolian - Cyrillic
    0x0850: "mn_CN", # Mongolian - PRC
    0x0461: "ne_NP", # Nepali
    0x0414: "nb_NO", # Norwegian - Bokmal
    0x0814: "nn_NO", # Norwegian - Nynorsk
    0x0482: "oc_FR", # Occitan - France
    0x0448: "or_IN", # Oriya - India
    0x0463: "ps_AF", # Pashto - Afghanistan
    0x0429: "fa_IR", # Persian
    0x0415: "pl_PL", # Polish
    0x0416: "pt_BR", # Portuguese - Brazil
    0x0816: "pt_PT", # Portuguese - Portugal
    0x0446: "pa_IN", # Punjabi
    0x046b: "quz_BO",# Quechua (Bolivia)
    0x086b: "quz_EC",# Quechua (Ecuador)
    0x0c6b: "quz_PE",# Quechua (Peru)
    0x0418: "ro_RO", # Romanian - Romania
    0x0417: "rm_CH", # Romansh
    0x0419: "ru_RU", # Russian
    0x243b: "smn_FI",# Sami Finland
    0x103b: "smj_NO",# Sami Norway
    0x143b: "smj_SE",# Sami Sweden
    0x043b: "se_NO", # Sami Northern Norway
    0x083b: "se_SE", # Sami Northern Sweden
    0x0c3b: "se_FI", # Sami Northern Finland
    0x203b: "sms_FI",# Sami Skolt
    0x183b: "sma_NO",# Sami Southern Norway
    0x1c3b: "sma_SE",# Sami Southern Sweden
    0x044f: "sa_IN", # Sanskrit
    0x0c1a: "sr_SP", # Serbian - Cyrillic
    0x1c1a: "sr_BA", # Serbian - Bosnia Cyrillic
    0x081a: "sr_SP", # Serbian - Latin
    0x181a: "sr_BA", # Serbian - Bosnia Latin
    0x045b: "si_LK", # Sinhala - Sri Lanka
    0x046c: "nso_ZA",# Northern Sotho
    0x0432: "tn_ZA", # Setswana - Southern Africa
    0x041b: "sk_SK", # Slovak
    0x0424: "sl_SI", # Slovenian
    0x040a: "es_ES", # Spanish - Spain
    0x080a: "es_MX", # Spanish - Mexico
    0x0c0a: "es_ES", # Spanish - Spain (Modern)
    0x100a: "es_GT", # Spanish - Guatemala
    0x140a: "es_CR", # Spanish - Costa Rica
    0x180a: "es_PA", # Spanish - Panama
    0x1c0a: "es_DO", # Spanish - Dominican Republic
    0x200a: "es_VE", # Spanish - Venezuela
    0x240a: "es_CO", # Spanish - Colombia
    0x280a: "es_PE", # Spanish - Peru
    0x2c0a: "es_AR", # Spanish - Argentina
    0x300a: "es_EC", # Spanish - Ecuador
    0x340a: "es_CL", # Spanish - Chile
    0x380a: "es_UY", # Spanish - Uruguay
    0x3c0a: "es_PY", # Spanish - Paraguay
    0x400a: "es_BO", # Spanish - Bolivia
    0x440a: "es_SV", # Spanish - El Salvador
    0x480a: "es_HN", # Spanish - Honduras
    0x4c0a: "es_NI", # Spanish - Nicaragua
    0x500a: "es_PR", # Spanish - Puerto Rico
    0x540a: "es_US", # Spanish - United States
#    0x0430: "", # Sutu - Not supported
    0x0441: "sw_KE", # Swahili
    0x041d: "sv_SE", # Swedish - Sweden
    0x081d: "sv_FI", # Swedish - Finland
    0x045a: "syr_SY",# Syriac
    0x0428: "tg_TJ", # Tajik - Cyrillic
    0x085f: "tmz_DZ",# Tamazight - Latin
    0x0449: "ta_IN", # Tamil
    0x0444: "tt_RU", # Tatar
    0x044a: "te_IN", # Telugu
    0x041e: "th_TH", # Thai
    0x0851: "bo_BT", # Tibetan - Bhutan
    0x0451: "bo_CN", # Tibetan - PRC
    0x041f: "tr_TR", # Turkish
    0x0442: "tk_TM", # Turkmen - Cyrillic
    0x0480: "ug_CN", # Uighur - Arabic
    0x0422: "uk_UA", # Ukrainian
    0x042e: "wen_DE",# Upper Sorbian - Germany
    0x0420: "ur_PK", # Urdu
    0x0820: "ur_IN", # Urdu - India
    0x0443: "uz_UZ", # Uzbek - Latin
    0x0843: "uz_UZ", # Uzbek - Cyrillic
    0x042a: "vi_VN", # Vietnamese
    0x0452: "cy_GB", # Welsh
    0x0488: "wo_SN", # Wolof - Senegal
    0x0434: "xh_ZA", # Xhosa - South Africa
    0x0485: "sah_RU",# Yakut - Cyrillic
    0x0478: "ii_CN", # Yi - PRC
    0x046a: "yo_NG", # Yoruba - Nigeria
    0x0435: "zu_ZA", # Zulu
}
1707
def _print_locale():

    """ Test function.

        Prints the (language, encoding) pair returned by
        getdefaultlocale(), then the pair returned by getlocale() for
        every module-level LC_* category except LC_ALL at three points:
        as found on entry, after calling resetlocale(), and after
        calling setlocale(LC_ALL, "").  If that last call raises Error,
        a note is printed instead of the final report.

        resetlocale() and setlocale() are really called, so the locale
        of the running process is changed; nothing is restored.
    """
    # Collect every LC_* constant defined in this module, leaving out LC_ALL.
    categories = dict((name, value) for name, value in globals().items()
                      if name[:3] == 'LC_' and name != 'LC_ALL')
    rule = '-'*72

    # Every print below receives a single pre-formatted string, so the
    # parenthesised form produces the same text whether it is parsed as a
    # print statement or as a call to the print function.
    def _report_categories():
        # Sorted by name so that the report order is deterministic.
        for name, category in sorted(categories.items()):
            print('%s ...' % name)
            lang, enc = getlocale(category)
            print('   Language:  %s' % (lang or '(undefined)'))
            print('   Encoding:  %s' % (enc or '(undefined)'))
            print('')

    print('Locale defaults as determined by getdefaultlocale():')
    print(rule)
    lang, enc = getdefaultlocale()
    print('Language:  %s' % (lang or '(undefined)'))
    print('Encoding:  %s' % (enc or '(undefined)'))
    print('')

    print('Locale settings on startup:')
    print(rule)
    _report_categories()

    print('')
    print('Locale settings after calling resetlocale():')
    print(rule)
    resetlocale()
    _report_categories()

    try:
        setlocale(LC_ALL, "")
    except Error:
        # Only the locale module's own error is treated as "default locale
        # not supported"; anything else (KeyboardInterrupt included) is
        # allowed to propagate.
        print('NOTE:')
        print('setlocale(LC_ALL, "") does not support the default locale')
        print('given in the OS environment variables.')
    else:
        print('')
        print('Locale settings after calling setlocale(LC_ALL, ""):')
        print(rule)
        _report_categories()
1764 ###
1765
# LC_MESSAGES is non-standard, so it is only exported when the name
# actually ended up defined in this module's namespace.
if 'LC_MESSAGES' in globals():
    __all__.append("LC_MESSAGES")
1772
# Script entry point: run the locale report, then the number formatting demo.
if __name__ == '__main__':
    print('Locale aliasing:')
    print('')
    _print_locale()
    print('')
    print('Number formatting:')
    print('')
    _test()