blob: 51909f81e734b59c4926e79fd7ef631236af0543 [file] [log] [blame]
"""Locale support module.

The module provides low-level access to the C lib's locale APIs and adds high
level number formatting APIs as well as a locale aliasing engine to complement
these.

The aliasing engine includes support for many commonly used locale names and
maps them to values suitable for passing to the C lib's setlocale() function. It
also includes default encodings for all supported locale names.
"""
11
R. David Murraya83da352009-04-01 03:21:43 +000012import sys
13import encodings
14import encodings.aliases
15import re
16import operator
Antoine Pitrouba54eda2008-07-25 20:40:19 +000017import functools
Marc-André Lemburg5431bc32000-06-07 09:11:40 +000018
# Remember the builtin string type under a private name: a module-level
# function called 'str' is defined further down and hides the builtin.
_str = str

try:
    unicode
except NameError:
    # This interpreter has no 'unicode' builtin.  Provide a placeholder
    # class so that isinstance() checks against _unicode still work (and
    # are simply never true).
    class _unicode(object):
        pass
else:
    _unicode = unicode
30
Fredrik Lundh6c86b992000-07-09 17:12:58 +000031# Try importing the _locale module.
32#
33# If this fails, fall back on a basic 'C' locale emulation.
Guido van Rossumeef1d4e1997-11-19 19:01:43 +000034
# LC_MESSAGES is non-standard, so whether it exists is only known once the
# _locale import has been attempted.  __all__ is therefore adjusted again at
# the end of the file.
__all__ = [
    # querying and changing the locale
    "getlocale", "getdefaultlocale", "getpreferredencoding", "Error",
    "setlocale", "resetlocale", "localeconv", "strcoll", "strxfrm",
    # number formatting and parsing
    "str", "atof", "atoi", "format", "format_string", "currency",
    # aliasing engine and constants
    "normalize", "LC_CTYPE", "LC_COLLATE", "LC_TIME", "LC_MONETARY",
    "LC_NUMERIC", "LC_ALL", "CHAR_MAX",
]
Skip Montanaro17ab1232001-01-24 06:27:27 +000042
try:
    from _locale import *
except ImportError:
    # The C extension is not available: emulate just enough of it to offer
    # the portable 'C' locale.

    CHAR_MAX = 127

    # Locale categories, listed in numeric order.
    LC_CTYPE = 0
    LC_NUMERIC = 1
    LC_TIME = 2
    LC_COLLATE = 3
    LC_MONETARY = 4
    LC_MESSAGES = 5
    LC_ALL = 6

    Error = ValueError

    def localeconv():
        """ localeconv() -> dict.
            Returns numeric and monetary locale-specific parameters.
        """
        # 'C' locale default values; a fresh dict (with fresh lists) is
        # built on every call so callers may modify the result freely.
        return dict(
            # plain numbers
            decimal_point='.',
            thousands_sep='',
            grouping=[127],
            # monetary amounts
            mon_decimal_point='',
            mon_thousands_sep='',
            mon_grouping=[],
            currency_symbol='',
            int_curr_symbol='',
            frac_digits=127,
            int_frac_digits=127,
            # sign and currency symbol placement
            positive_sign='',
            negative_sign='',
            p_sign_posn=127,
            n_sign_posn=127,
            p_cs_precedes=127,
            n_cs_precedes=127,
            p_sep_by_space=127,
            n_sep_by_space=127,
        )

    def setlocale(category, value=None):
        """ setlocale(integer,string=None) -> string.
            Activates/queries locale processing.
        """
        # Only a query (None), the default ('') or 'C' itself is accepted.
        if value in (None, '', 'C'):
            return 'C'
        raise Error('_locale emulation only supports "C" locale')

    def strcoll(a, b):
        """ strcoll(string,string) -> int.
            Compares two strings according to the locale.
        """
        # In the 'C' locale collation is the ordinary comparison.
        return cmp(a, b)

    def strxfrm(s):
        """ strxfrm(string) -> string.
            Returns a string that behaves for cmp locale-aware.
        """
        # No transformation is needed in the 'C' locale.
        return s
Marc-André Lemburg5431bc32000-06-07 09:11:40 +0000104
Antoine Pitrouba54eda2008-07-25 20:40:19 +0000105
# Keep a handle on the underlying localeconv(); the public name is rebound
# to the wrapper below.
_localeconv = localeconv

# Entries placed in this dict replace the corresponding items of
# localeconv()'s return value.  This is useful for testing purposes.
_override_localeconv = {}

@functools.wraps(_localeconv)
def localeconv():
    # Start from the real settings, then layer the overrides (if any) on top.
    conv = _localeconv()
    if not _override_localeconv:
        return conv
    conv.update(_override_localeconv)
    return conv
118
119
Marc-André Lemburg5431bc32000-06-07 09:11:40 +0000120### Number formatting APIs
121
122# Author: Martin von Loewis
Georg Brandlb89316f2006-05-17 15:51:16 +0000123# improved by Georg Brandl
Guido van Rossumeef1d4e1997-11-19 19:01:43 +0000124
# Generate the successive group sizes described by a localeconv() grouping
# list.
def _grouping_intervals(grouping):
    previous = None
    for size in grouping:
        # CHAR_MAX ends the list: no further grouping is performed
        if size == CHAR_MAX:
            return
        if size != 0:
            yield size
            previous = size
            continue
        # 0: re-use the last group size ad infinitum
        if previous is None:
            raise ValueError("invalid grouping")
        while True:
            yield previous
140
# Insert the locale's thousands separator into the formatted number s,
# working from the rightmost digit towards the left.  Returns a tuple of the
# grouped string and the number of characters the separators added.
def _group(s, monetary=False):
    conv = localeconv()
    if monetary:
        separator = conv['mon_thousands_sep']
        grouping = conv['mon_grouping']
    else:
        separator = conv['thousands_sep']
        grouping = conv['grouping']
    if not grouping:
        return (s, 0)
    # Set trailing blanks aside; they are re-attached untouched at the end.
    if s[-1] == ' ':
        body = s.rstrip()
        trailing = s[len(body):]
        s = body
    else:
        trailing = ''
    leading = ''
    chunks = []
    for width in _grouping_intervals(grouping):
        if not s or s[-1] not in "0123456789":
            # only non-digit characters remain (sign, spaces)
            leading = s
            s = ''
            break
        chunks.append(s[-width:])
        s = s[:-width]
    # The grouping list ran out before the digits did: whatever is left
    # forms the leftmost group.
    if s:
        chunks.append(s)
    chunks.reverse()
    grouped = leading + separator.join(chunks) + trailing
    added = len(separator) * (len(chunks) - 1)
    return (grouped, added)
171
# Strip a given amount of excess padding from the given string.
#
# Up to 'amount' blanks are removed, taken from the left end first and then
# from the right end.  Fewer are removed when the string does not carry that
# much padding; the scan never runs past either end of the string and the
# two ends never cross, so an empty or all-blank string is handled without
# raising IndexError.
def _strip_padding(s, amount):
    end = len(s)
    lpos = 0
    while amount and lpos < end and s[lpos] == ' ':
        lpos += 1
        amount -= 1
    rpos = end - 1
    # Stop at lpos so blanks already dropped on the left are not counted twice.
    while amount and rpos >= lpos and s[rpos] == ' ':
        rpos -= 1
        amount -= 1
    return s[lpos:rpos+1]
Guido van Rossumeef1d4e1997-11-19 19:01:43 +0000183
# Matches one %-format specifier.
_percent_re = re.compile(
    r'%'
    r'(?:\((?P<key>.*?)\))?'              # optional "(name)" mapping key
    r'(?P<modifiers>[-#0-9 +*.hlL]*?)'    # flags, width, precision, length
    r'[eEfFgGdiouxXcrs%]'                 # conversion character
)
186
def format(percent, value, grouping=False, monetary=False, *additional):
    """Returns the locale-aware substitution of a %? specifier
    (percent).

    value is the object to format; grouping and monetary select whether
    thousands separators are inserted and whether the monetary settings
    are used.

    additional is for format strings which contain one or more
    '*' modifiers.

    Raises ValueError unless percent consists of exactly one format
    specifier."""
    spec = _percent_re.match(percent)
    # The specifier has to start at the first character (match() anchors
    # there) and extend to the very end of the string.
    if spec is None or spec.end() != len(percent):
        raise ValueError(("format() must be given exactly one %%char "
                         "format specifier, %s not valid") % repr(percent))
    return _format(percent, value, grouping, monetary, *additional)
199
# Worker behind format(): applies a single %-specifier without validating it,
# then localizes the decimal point and, on request, groups the digits.
def _format(percent, value, grouping=False, monetary=False, *additional):
    # Extra arguments feed '*' width/precision modifiers.
    args = ((value,) + additional) if additional else value
    formatted = percent % args
    conversion = percent[-1]
    # floats and decimal ints need special action!
    if conversion in 'eEfFgG':
        parts = formatted.split('.')
        seps = 0
        if grouping:
            parts[0], seps = _group(parts[0], monetary=monetary)
        if monetary:
            point_key = 'mon_decimal_point'
        else:
            point_key = 'decimal_point'
        formatted = localeconv()[point_key].join(parts)
        # Inserted separators widen the field; give back that much padding.
        if seps:
            formatted = _strip_padding(formatted, seps)
    elif conversion in 'diu':
        if grouping:
            formatted, seps = _group(formatted, monetary=monetary)
            if seps:
                formatted = _strip_padding(formatted, seps)
    return formatted
223
def format_string(f, val, grouping=False):
    """Formats a string in the same way that the % formatting would use,
    but takes the current locale into account.

    val is a single value, a tuple of values or a mapping, exactly as on
    the right-hand side of the % operator.
    Grouping is applied if the third parameter is true."""
    specs = list(_percent_re.finditer(f))
    # Every specifier becomes a plain '%s'; the individually localized
    # pieces are substituted back in at the end.
    template = _percent_re.sub('%s', f)

    pieces = []
    if operator.isMappingType(val):
        # Each specifier carries its own "(key)", so the whole mapping is
        # handed to format() every time.
        for spec in specs:
            text = spec.group()
            if text[-1] == '%':
                pieces.append('%')
            else:
                pieces.append(format(text, val, grouping))
    else:
        if not isinstance(val, tuple):
            val = (val,)
        pos = 0
        for spec in specs:
            text = spec.group()
            if text[-1] == '%':
                pieces.append('%')
                continue
            # A specifier consumes one value plus one for each '*' modifier.
            consumed = 1 + spec.group('modifiers').count('*')
            pieces.append(_format(text,
                                  val[pos],
                                  grouping,
                                  False,
                                  *val[pos + 1:pos + consumed]))
            pos += consumed

    return template % tuple(pieces)
Martin v. Löwis88ad12a2001-04-13 08:09:50 +0000257
def currency(val, symbol=True, grouping=False, international=False):
    """Formats val according to the currency settings
    in the current locale.

    symbol controls whether the currency symbol is included, grouping
    whether thousands separators are inserted, and international whether
    the international currency symbol and digit count are used.

    Raises ValueError when the locale defines no currency format (as is
    the case for the 'C' locale)."""
    conv = localeconv()

    # check for illegal values
    digits = conv['int_frac_digits' if international else 'frac_digits']
    if digits == 127:
        raise ValueError("Currency formatting is not possible using "
                         "the 'C' locale.")

    amount = format('%%.%if' % digits, abs(val), grouping, monetary=True)
    # '<' and '>' are markers if the sign must be inserted between symbol and value
    s = '<' + amount + '>'
    negative = val < 0

    if symbol:
        smb = conv['int_curr_symbol' if international else 'currency_symbol']
        precedes = conv['n_cs_precedes' if negative else 'p_cs_precedes']
        separated = conv['n_sep_by_space' if negative else 'p_sep_by_space']
        gap = ' ' if separated else ''

        if precedes:
            s = smb + gap + s
        else:
            s = s + gap + smb

    sign_pos = conv['n_sign_posn' if negative else 'p_sign_posn']
    sign = conv['negative_sign' if negative else 'positive_sign']

    if sign_pos == 0:
        # parentheses around the whole quantity
        s = '(' + s + ')'
    elif sign_pos == 2:
        s = s + sign
    elif sign_pos == 3:
        s = s.replace('<', sign)
    elif sign_pos == 4:
        s = s.replace('>', sign)
    else:
        # sign_pos == 1, and also the default if nothing is specified;
        # this should be the most fitting sign position
        s = sign + s

    # drop whichever markers were not used for the sign
    return s.replace('<', '').replace('>', '')
Martin v. Löwisdb786872001-01-21 18:52:33 +0000302
def str(val):
    """Convert float to string, taking the locale into account.

    The value is rendered with the '%.12g' specifier."""
    text = format("%.12g", val)
    return text
Guido van Rossumeef1d4e1997-11-19 19:01:43 +0000306
def atof(string, func=float):
    """Parses a string as a float according to the locale settings.

    func is the converter applied to the de-localized string."""
    # First get rid of the grouping, then turn the locale's decimal point
    # into a dot.  A setting that is empty is left alone.
    for key, replacement in (('thousands_sep', ''), ('decimal_point', '.')):
        mark = localeconv()[key]
        if mark:
            string = string.replace(mark, replacement)
    # finally, parse the string
    return func(string)
Guido van Rossumeef1d4e1997-11-19 19:01:43 +0000319
def atoi(str):
    """Converts a string to an integer according to the locale settings."""
    # Same de-localization as atof(), with int as the final converter.
    return atof(str, func=int)
Guido van Rossumeef1d4e1997-11-19 19:01:43 +0000323
# Small manual self-test: switches to the user's default locale and prints a
# grouped integer and a float together with the values parsed back from them.
def _test():
    setlocale(LC_ALL, "")
    # do grouping
    grouped = format("%d", 123456789, 1)
    print("%s is %s" % (grouped, atoi(grouped)))
    # standard formatting
    plain = str(3.14)
    print("%s is %s" % (plain, atof(plain)))
Marc-André Lemburg5431bc32000-06-07 09:11:40 +0000332
333### Locale name aliasing engine
334
335# Author: Marc-Andre Lemburg, mal@lemburg.com
Fredrik Lundh37a09822002-10-19 20:19:10 +0000336# Various tweaks by Fredrik Lundh <fredrik@pythonware.com>
Fredrik Lundh6c86b992000-07-09 17:12:58 +0000337
# Store away the low-level version of setlocale (the one imported from
# _locale, or its 'C'-only emulation).  The public name is overridden
# below by a wrapper that also accepts (language code, encoding) iterables.
_setlocale = setlocale
Marc-André Lemburg5431bc32000-06-07 09:11:40 +0000341
# Translation table that lower-cases the ASCII letters A-Z and leaves every
# other character code alone.  It is used instead of the locale-dependent
# .lower() method (see issue #1813).
_ascii_lower_map = ''.join(
    chr(code + 32) if ord('A') <= code <= ord('Z') else chr(code)
    for code in range(256)
)
348
# Return the locale code 'code' with its encoding part (if any) replaced by
# the C lib name for 'encoding'.
def _replace_encoding(code, encoding):
    # Keep only the language part, i.e. everything before the first '.'.
    langname = code.split('.', 1)[0]
    # Convert the encoding to a C lib compatible encoding string:
    # normalize the spelling, resolve Python codec aliases, then map the
    # codec name to the C lib name.  Unknown names pass through unchanged.
    codec = encodings.normalize_encoding(encoding)
    codec = encodings.aliases.aliases.get(codec, codec)
    c_lib_name = locale_encoding_alias.get(codec, codec)
    return langname + '.' + c_lib_name
364
def normalize(localename):

    """ Returns a normalized locale code for the given locale
        name.

        The returned locale code is formatted for use with
        setlocale().

        If normalization fails, the original name is returned
        unchanged.

        If the given encoding is not known, the function defaults to
        the default encoding for the locale code just like setlocale()
        does.

    """
    # Lower-case the locale name and take it apart into language,
    # encoding and modifier.
    if isinstance(localename, _unicode):
        localename = localename.encode('ascii')
    code = localename.translate(_ascii_lower_map)
    # ':' is sometimes used as encoding delimiter.
    code = code.replace(':', '.')
    code, _, modifier = code.partition('@')
    if '.' in code:
        langname, encoding = code.split('.')[:2]
    else:
        langname, encoding = code, ''

    # First lookup: fullname (possibly with encoding and modifier).
    # The alias table stores encodings without '-' and '_'.
    lang_enc = langname
    if encoding:
        lang_enc += '.' + encoding.replace('-', '').replace('_', '')
    if modifier:
        lookup_name = lang_enc + '@' + modifier
    else:
        lookup_name = lang_enc
    found = locale_alias.get(lookup_name)
    if found is not None:
        return found

    if modifier:
        # Second try: fullname without modifier (possibly with encoding)
        found = locale_alias.get(lang_enc)
        if found is not None:
            if '@' not in found:
                return found + '@' + modifier
            # The alias already carries a modifier; accept it only if it
            # is the one that was asked for.
            if found.split('@', 1)[1].translate(_ascii_lower_map) == modifier:
                return found

    if encoding:
        # Third try: langname (without encoding, possibly with modifier)
        if modifier:
            lookup_name = langname + '@' + modifier
        else:
            lookup_name = langname
        found = locale_alias.get(lookup_name)
        if found is not None:
            if '@' not in found:
                return _replace_encoding(found, encoding)
            base, found_modifier = found.split('@', 1)
            return _replace_encoding(base, encoding) + '@' + found_modifier

    if modifier:
        # Fourth try: langname (without encoding and modifier)
        found = locale_alias.get(langname)
        if found is not None:
            if '@' not in found:
                return _replace_encoding(found, encoding) + '@' + modifier
            base, defmod = found.split('@', 1)
            if defmod.translate(_ascii_lower_map) == modifier:
                return _replace_encoding(base, encoding) + '@' + defmod

    # Nothing matched: hand the name back as it was given.
    return localename
Marc-André Lemburg5431bc32000-06-07 09:11:40 +0000448
def _parse_localename(localename):

    """ Parses the locale code for localename and returns the
        result as tuple (language code, encoding).

        The localename is normalized and passed through the locale
        alias engine. A ValueError is raised in case the locale name
        cannot be parsed.

        The language code corresponds to RFC 1766.  code and encoding
        can be None in case the values cannot be determined or are
        unknown to this implementation.

    """
    # Split off a locale modifier, if there is one.
    code, _, modifier = normalize(localename).partition('@')
    if modifier == 'euro' and '.' not in code:
        # Assume Latin-9 for @euro locales. This is bogus,
        # since some systems may use other encodings for these
        # locales. Also, we ignore other modifiers.
        return code, 'iso-8859-15'

    if '.' in code:
        return tuple(code.split('.')[:2])
    if code == 'C':
        return None, None
    raise ValueError('unknown locale: %s' % localename)
Marc-André Lemburg5431bc32000-06-07 09:11:40 +0000478
def _build_localename(localetuple):

    """ Builds a locale code from the given tuple (language code,
        encoding).

        A language code of None stands for 'C'; an encoding of None
        leaves the encoding part out altogether.

        No aliasing or normalizing takes place.

    """
    language, encoding = localetuple
    language = 'C' if language is None else language
    if encoding is None:
        return language
    return language + '.' + encoding
Fredrik Lundh6c86b992000-07-09 17:12:58 +0000494
def getdefaultlocale(envvars=('LC_ALL', 'LC_CTYPE', 'LANG', 'LANGUAGE')):

    """ Tries to determine the default locale settings and returns
        them as tuple (language code, encoding).

        According to POSIX, a program which has not called
        setlocale(LC_ALL, "") runs using the portable 'C' locale.
        Calling setlocale(LC_ALL, "") lets it use the default locale as
        defined by the LANG variable. Since we don't want to interfere
        with the current locale setting we thus emulate the behavior
        in the way described above.

        To maintain compatibility with other platforms, not only the
        LANG variable is tested, but a list of variables given as
        envvars parameter. The first found to be defined will be
        used. envvars defaults to the search path used in GNU gettext;
        it must always contain the variable name 'LANG'.

        Except for the code 'C', the language code corresponds to RFC
        1766.  code and encoding can be None in case the values cannot
        be determined.

    """

    try:
        # check if it's supported by the _locale module
        import _locale
        code, encoding = _locale._getdefaultlocale()
    except (ImportError, AttributeError):
        pass
    else:
        # make sure the code/encoding values are valid
        if sys.platform == "win32" and code and code.startswith("0x"):
            # map windows language identifier to language name
            code = windows_locale.get(int(code, 0))
        # ...add other platform-specific processing here, if
        # necessary...
        return code, encoding

    # fall back on POSIX behaviour: use the first variable in envvars that
    # is set to a non-empty value, or 'C' when there is none
    import os
    getenv = os.environ.get
    localename = 'C'
    for variable in envvars:
        candidate = getenv(variable, None)
        if not candidate:
            continue
        if variable == 'LANGUAGE':
            # LANGUAGE holds a ':'-separated list; only the first entry
            # is used
            candidate = candidate.split(':')[0]
        localename = candidate
        break
    return _parse_localename(localename)
546
Fredrik Lundh6c86b992000-07-09 17:12:58 +0000547
def getlocale(category=LC_CTYPE):

    """ Returns the current setting for the given locale category as
        tuple (language code, encoding).

        category may be one of the LC_* value except LC_ALL. It
        defaults to LC_CTYPE.

        Except for the code 'C', the language code corresponds to RFC
        1766.  code and encoding can be None in case the values cannot
        be determined.

    """
    # Calling the low-level setlocale() without a locale only queries.
    current = _setlocale(category)
    # A ';' in the LC_ALL answer is rejected: such a value cannot be
    # returned as a single (language code, encoding) tuple.
    if category == LC_ALL and ';' in current:
        raise TypeError('category LC_ALL is not supported')
    return _parse_localename(current)
565
def setlocale(category, locale=None):

    """ Set the locale for the given category.  The locale can be
        a string, an iterable of two strings (language code and encoding),
        or None.

        Iterables are converted to strings using the locale aliasing
        engine.  Locale strings are passed directly to the C lib.

        category may be given as one of the LC_* values.

    """
    if not locale or isinstance(locale, (_str, _unicode)):
        # None, empty values and strings go to the C lib as they are
        target = locale
    else:
        # convert to string
        target = normalize(_build_localename(locale))
    return _setlocale(category, target)
Marc-André Lemburg5431bc32000-06-07 09:11:40 +0000582
def resetlocale(category=LC_ALL):

    """ Sets the locale for category to the default setting.

        The default setting is determined by calling
        getdefaultlocale(). category defaults to LC_ALL.

    """
    default_name = _build_localename(getdefaultlocale())
    _setlocale(category, default_name)
Marc-André Lemburg5431bc32000-06-07 09:11:40 +0000592
if sys.platform.startswith("win"):
    # On Win32, this will return the ANSI code page
    def getpreferredencoding(do_setlocale = True):
        """Return the charset that the user is likely using."""
        import _locale
        return _locale._getdefaultlocale()[1]
else:
    # On Unix, if CODESET is available, use that.
    try:
        CODESET
    except NameError:
        # Fall back to parsing environment variables :-(
        def getpreferredencoding(do_setlocale = True):
            """Return the charset that the user is likely using,
            by looking at environment variables."""
            return getdefaultlocale()[1]
    else:
        def getpreferredencoding(do_setlocale = True):
            """Return the charset that the user is likely using,
            according to the system configuration.

            If do_setlocale is true, LC_CTYPE is temporarily switched to
            the user's default locale for the query and switched back
            afterwards; otherwise the current LC_CTYPE setting is used."""
            if do_setlocale:
                oldloc = setlocale(LC_CTYPE)
                try:
                    try:
                        setlocale(LC_CTYPE, "")
                    except Error:
                        # Best effort: if the default locale cannot be
                        # activated, query under the current one instead.
                        pass
                    result = nl_langinfo(CODESET)
                finally:
                    # Put the previous setting back even when the query
                    # raised, so a temporary switch never leaks out.
                    setlocale(LC_CTYPE, oldloc)
            else:
                result = nl_langinfo(CODESET)

            if not result and sys.platform == 'darwin':
                # nl_langinfo can return an empty string
                # when the setting has an invalid value.
                # Default to UTF-8 in that case because
                # UTF-8 is the default charset on OSX and
                # returning nothing will crash the
                # interpreter.
                result = 'UTF-8'
            return result
Tim Peters230a60c2002-11-09 05:08:07 +0000633
Martin v. Löwisf0a46682002-11-03 17:20:12 +0000634
Marc-André Lemburg5431bc32000-06-07 09:11:40 +0000635### Database
636#
637# The following data was extracted from the locale.alias file which
638# comes with X11 and then hand edited removing the explicit encoding
639# definitions and adding some more aliases. The file is usually
640# available as /usr/lib/X11/locale/locale.alias.
Fredrik Lundh6c86b992000-07-09 17:12:58 +0000641#
Marc-André Lemburg5431bc32000-06-07 09:11:40 +0000642
#
# The locale_encoding_alias table maps lowercase encoding alias names
# to C locale encoding names (case-sensitive).  Note that
# _replace_encoding(), which normalize() relies on, first looks up the
# encoding in the encodings.aliases dictionary and then applies this
# mapping to find the correct C lib name for the encoding.
#
locale_encoding_alias = {

    # Mappings for non-standard encoding names used in locale names
    '437':                          'C',
    'c':                            'C',
    'en':                           'ISO8859-1',
    'jis':                          'JIS7',
    'jis7':                         'JIS7',
    'ajec':                         'eucJP',

    # Mappings from Python codec names to C lib encoding names:
    # the ISO 8859 family, in numeric order
    'ascii':                        'ISO8859-1',
    'latin_1':                      'ISO8859-1',
    'iso8859_1':                    'ISO8859-1',
    'iso8859_2':                    'ISO8859-2',
    'iso8859_3':                    'ISO8859-3',
    'iso8859_4':                    'ISO8859-4',
    'iso8859_5':                    'ISO8859-5',
    'iso8859_6':                    'ISO8859-6',
    'iso8859_7':                    'ISO8859-7',
    'iso8859_8':                    'ISO8859-8',
    'iso8859_9':                    'ISO8859-9',
    'iso8859_10':                   'ISO8859-10',
    'iso8859_11':                   'ISO8859-11',
    'iso8859_13':                   'ISO8859-13',
    'iso8859_14':                   'ISO8859-14',
    'iso8859_15':                   'ISO8859-15',
    'iso8859_16':                   'ISO8859-16',

    # ... and the remaining codecs
    'iso2022_jp':                   'JIS7',
    'shift_jis':                    'SJIS',
    'tactis':                       'TACTIS',
    'euc_jp':                       'eucJP',
    'euc_kr':                       'eucKR',
    'utf_8':                        'UTF-8',
    'koi8_r':                       'KOI8-R',
    'koi8_u':                       'KOI8-U',
    # XXX This list is still incomplete. If you know more
    # mappings, please file a bug report. Thanks.
}
689
Fredrik Lundh6c86b992000-07-09 17:12:58 +0000690#
Marc-André Lemburg5431bc32000-06-07 09:11:40 +0000691# The locale_alias table maps lowercase alias names to C locale names
692# (case-sensitive). Encodings are always separated from the locale
693# name using a dot ('.'); they should only be given in case the
694# language name is needed to interpret the given encoding alias
695# correctly (CJK codes often have this need).
696#
# Note that the normalize() function, which uses this table,
# removes '_' and '-' characters from the encoding part of the
# locale name before doing the lookup. This saves a lot of
# space in the table.
701#
702# MAL 2004-12-10:
703# Updated alias mapping to most recent locale.alias file
704# from X.org distribution using makelocalealias.py.
705#
706# These are the differences compared to the old mapping (Python 2.4
707# and older):
708#
709# updated 'bg' -> 'bg_BG.ISO8859-5' to 'bg_BG.CP1251'
710# updated 'bg_bg' -> 'bg_BG.ISO8859-5' to 'bg_BG.CP1251'
711# updated 'bulgarian' -> 'bg_BG.ISO8859-5' to 'bg_BG.CP1251'
712# updated 'cz' -> 'cz_CZ.ISO8859-2' to 'cs_CZ.ISO8859-2'
713# updated 'cz_cz' -> 'cz_CZ.ISO8859-2' to 'cs_CZ.ISO8859-2'
714# updated 'czech' -> 'cs_CS.ISO8859-2' to 'cs_CZ.ISO8859-2'
715# updated 'dutch' -> 'nl_BE.ISO8859-1' to 'nl_NL.ISO8859-1'
716# updated 'et' -> 'et_EE.ISO8859-4' to 'et_EE.ISO8859-15'
717# updated 'et_ee' -> 'et_EE.ISO8859-4' to 'et_EE.ISO8859-15'
718# updated 'fi' -> 'fi_FI.ISO8859-1' to 'fi_FI.ISO8859-15'
719# updated 'fi_fi' -> 'fi_FI.ISO8859-1' to 'fi_FI.ISO8859-15'
720# updated 'iw' -> 'iw_IL.ISO8859-8' to 'he_IL.ISO8859-8'
721# updated 'iw_il' -> 'iw_IL.ISO8859-8' to 'he_IL.ISO8859-8'
722# updated 'japanese' -> 'ja_JP.SJIS' to 'ja_JP.eucJP'
723# updated 'lt' -> 'lt_LT.ISO8859-4' to 'lt_LT.ISO8859-13'
724# updated 'lv' -> 'lv_LV.ISO8859-4' to 'lv_LV.ISO8859-13'
725# updated 'sl' -> 'sl_CS.ISO8859-2' to 'sl_SI.ISO8859-2'
726# updated 'slovene' -> 'sl_CS.ISO8859-2' to 'sl_SI.ISO8859-2'
727# updated 'th_th' -> 'th_TH.TACTIS' to 'th_TH.ISO8859-11'
728# updated 'zh_cn' -> 'zh_CN.eucCN' to 'zh_CN.gb2312'
729# updated 'zh_cn.big5' -> 'zh_TW.eucTW' to 'zh_TW.big5'
730# updated 'zh_tw' -> 'zh_TW.eucTW' to 'zh_TW.big5'
731#
Marc-André Lemburgadff65b2008-05-30 20:52:18 +0000732# MAL 2008-05-30:
733# Updated alias mapping to most recent locale.alias file
734# from X.org distribution using makelocalealias.py.
735#
736# These are the differences compared to the old mapping (Python 2.5
737# and older):
738#
739# updated 'cs_cs.iso88592' -> 'cs_CZ.ISO8859-2' to 'cs_CS.ISO8859-2'
740# updated 'serbocroatian' -> 'sh_YU.ISO8859-2' to 'sr_CS.ISO8859-2'
741# updated 'sh' -> 'sh_YU.ISO8859-2' to 'sr_CS.ISO8859-2'
742# updated 'sh_hr.iso88592' -> 'sh_HR.ISO8859-2' to 'hr_HR.ISO8859-2'
743# updated 'sh_sp' -> 'sh_YU.ISO8859-2' to 'sr_CS.ISO8859-2'
744# updated 'sh_yu' -> 'sh_YU.ISO8859-2' to 'sr_CS.ISO8859-2'
745# updated 'sp' -> 'sp_YU.ISO8859-5' to 'sr_CS.ISO8859-5'
746# updated 'sp_yu' -> 'sp_YU.ISO8859-5' to 'sr_CS.ISO8859-5'
747# updated 'sr' -> 'sr_YU.ISO8859-5' to 'sr_CS.ISO8859-5'
748# updated 'sr@cyrillic' -> 'sr_YU.ISO8859-5' to 'sr_CS.ISO8859-5'
749# updated 'sr_sp' -> 'sr_SP.ISO8859-2' to 'sr_CS.ISO8859-2'
750# updated 'sr_yu' -> 'sr_YU.ISO8859-5' to 'sr_CS.ISO8859-5'
751# updated 'sr_yu.cp1251@cyrillic' -> 'sr_YU.CP1251' to 'sr_CS.CP1251'
752# updated 'sr_yu.iso88592' -> 'sr_YU.ISO8859-2' to 'sr_CS.ISO8859-2'
753# updated 'sr_yu.iso88595' -> 'sr_YU.ISO8859-5' to 'sr_CS.ISO8859-5'
754# updated 'sr_yu.iso88595@cyrillic' -> 'sr_YU.ISO8859-5' to 'sr_CS.ISO8859-5'
755# updated 'sr_yu.microsoftcp1251@cyrillic' -> 'sr_YU.CP1251' to 'sr_CS.CP1251'
756# updated 'sr_yu.utf8@cyrillic' -> 'sr_YU.UTF-8' to 'sr_CS.UTF-8'
757# updated 'sr_yu@cyrillic' -> 'sr_YU.ISO8859-5' to 'sr_CS.ISO8859-5'
Antoine Pitroufc531532010-04-11 22:32:39 +0000758#
759# AP 2010-04-12:
760# Updated alias mapping to most recent locale.alias file
761# from X.org distribution using makelocalealias.py.
762#
763# These are the differences compared to the old mapping (Python 2.6.5
764# and older):
765#
766# updated 'ru' -> 'ru_RU.ISO8859-5' to 'ru_RU.UTF-8'
767# updated 'ru_ru' -> 'ru_RU.ISO8859-5' to 'ru_RU.UTF-8'
768# updated 'serbocroatian' -> 'sr_CS.ISO8859-2' to 'sr_RS.UTF-8@latin'
769# updated 'sh' -> 'sr_CS.ISO8859-2' to 'sr_RS.UTF-8@latin'
770# updated 'sh_yu' -> 'sr_CS.ISO8859-2' to 'sr_RS.UTF-8@latin'
771# updated 'sr' -> 'sr_CS.ISO8859-5' to 'sr_RS.UTF-8'
772# updated 'sr@cyrillic' -> 'sr_CS.ISO8859-5' to 'sr_RS.UTF-8'
773# updated 'sr@latn' -> 'sr_CS.ISO8859-2' to 'sr_RS.UTF-8@latin'
774# updated 'sr_cs.utf8@latn' -> 'sr_CS.UTF-8' to 'sr_RS.UTF-8@latin'
775# updated 'sr_cs@latn' -> 'sr_CS.ISO8859-2' to 'sr_RS.UTF-8@latin'
776# updated 'sr_yu' -> 'sr_CS.ISO8859-5' to 'sr_RS.UTF-8@latin'
777# updated 'sr_yu.utf8@cyrillic' -> 'sr_CS.UTF-8' to 'sr_RS.UTF-8'
778# updated 'sr_yu@cyrillic' -> 'sr_CS.ISO8859-5' to 'sr_RS.UTF-8'
779#
Serhiy Storchaka0e4d8522013-12-20 18:22:38 +0200780# SS 2013-12-20:
781# Updated alias mapping to most recent locale.alias file
782# from X.org distribution using makelocalealias.py.
783#
784# These are the differences compared to the old mapping (Python 2.7.6
785# and older):
786#
787# updated 'a3' -> 'a3_AZ.KOI8-C' to 'az_AZ.KOI8-C'
788# updated 'a3_az' -> 'a3_AZ.KOI8-C' to 'az_AZ.KOI8-C'
789# updated 'a3_az.koi8c' -> 'a3_AZ.KOI8-C' to 'az_AZ.KOI8-C'
790# updated 'cs_cs.iso88592' -> 'cs_CS.ISO8859-2' to 'cs_CZ.ISO8859-2'
791# updated 'hebrew' -> 'iw_IL.ISO8859-8' to 'he_IL.ISO8859-8'
792# updated 'hebrew.iso88598' -> 'iw_IL.ISO8859-8' to 'he_IL.ISO8859-8'
793# updated 'sd' -> 'sd_IN@devanagari.UTF-8' to 'sd_IN.UTF-8'
794# updated 'sr@latn' -> 'sr_RS.UTF-8@latin' to 'sr_CS.UTF-8@latin'
795# updated 'sr_cs' -> 'sr_RS.UTF-8' to 'sr_CS.UTF-8'
796# updated 'sr_cs.utf8@latn' -> 'sr_RS.UTF-8@latin' to 'sr_CS.UTF-8@latin'
797# updated 'sr_cs@latn' -> 'sr_RS.UTF-8@latin' to 'sr_CS.UTF-8@latin'
Serhiy Storchaka5f4e55c2014-10-02 10:49:04 +0300798#
799# SS 2014-10-01:
800# Updated alias mapping with glibc 2.19 supported locales.
Serhiy Storchakaa55ac802018-05-06 10:51:49 +0300801#
802# SS 2018-05-05:
803# Updated alias mapping with glibc 2.27 supported locales.
804#
805# These are the differences compared to the old mapping (Python 2.7.15
806# and older):
807#
808# updated 'ca_es@valencia' -> 'ca_ES.ISO8859-15@valencia' to 'ca_ES.UTF-8@valencia'
809# updated 'english.iso88591' -> 'en_EN.ISO8859-1' to 'en_US.ISO8859-1'
810# updated 'kk_kz' -> 'kk_KZ.RK1048' to 'kk_KZ.ptcp154'
811# updated 'russian' -> 'ru_RU.ISO8859-5' to 'ru_RU.KOI8-R'
Marc-André Lemburgadff65b2008-05-30 20:52:18 +0000812
Marc-André Lemburg5431bc32000-06-07 09:11:40 +0000813locale_alias = {
Serhiy Storchaka0e4d8522013-12-20 18:22:38 +0200814 'a3': 'az_AZ.KOI8-C',
815 'a3_az': 'az_AZ.KOI8-C',
816 'a3_az.koi8c': 'az_AZ.KOI8-C',
817 'a3_az.koic': 'az_AZ.KOI8-C',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +0300818 'aa_dj': 'aa_DJ.ISO8859-1',
819 'aa_er': 'aa_ER.UTF-8',
820 'aa_et': 'aa_ET.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000821 'af': 'af_ZA.ISO8859-1',
822 'af_za': 'af_ZA.ISO8859-1',
823 'af_za.iso88591': 'af_ZA.ISO8859-1',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +0300824 'agr_pe': 'agr_PE.UTF-8',
825 'ak_gh': 'ak_GH.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000826 'am': 'am_ET.UTF-8',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +0000827 'am_et': 'am_ET.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000828 'american': 'en_US.ISO8859-1',
829 'american.iso88591': 'en_US.ISO8859-1',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +0300830 'an_es': 'an_ES.ISO8859-15',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +0300831 'anp_in': 'anp_IN.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000832 'ar': 'ar_AA.ISO8859-6',
833 'ar_aa': 'ar_AA.ISO8859-6',
834 'ar_aa.iso88596': 'ar_AA.ISO8859-6',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000835 'ar_ae': 'ar_AE.ISO8859-6',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +0000836 'ar_ae.iso88596': 'ar_AE.ISO8859-6',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000837 'ar_bh': 'ar_BH.ISO8859-6',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +0000838 'ar_bh.iso88596': 'ar_BH.ISO8859-6',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000839 'ar_dz': 'ar_DZ.ISO8859-6',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +0000840 'ar_dz.iso88596': 'ar_DZ.ISO8859-6',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000841 'ar_eg': 'ar_EG.ISO8859-6',
842 'ar_eg.iso88596': 'ar_EG.ISO8859-6',
Serhiy Storchaka0e4d8522013-12-20 18:22:38 +0200843 'ar_in': 'ar_IN.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000844 'ar_iq': 'ar_IQ.ISO8859-6',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +0000845 'ar_iq.iso88596': 'ar_IQ.ISO8859-6',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000846 'ar_jo': 'ar_JO.ISO8859-6',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +0000847 'ar_jo.iso88596': 'ar_JO.ISO8859-6',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000848 'ar_kw': 'ar_KW.ISO8859-6',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +0000849 'ar_kw.iso88596': 'ar_KW.ISO8859-6',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000850 'ar_lb': 'ar_LB.ISO8859-6',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +0000851 'ar_lb.iso88596': 'ar_LB.ISO8859-6',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000852 'ar_ly': 'ar_LY.ISO8859-6',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +0000853 'ar_ly.iso88596': 'ar_LY.ISO8859-6',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000854 'ar_ma': 'ar_MA.ISO8859-6',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +0000855 'ar_ma.iso88596': 'ar_MA.ISO8859-6',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000856 'ar_om': 'ar_OM.ISO8859-6',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +0000857 'ar_om.iso88596': 'ar_OM.ISO8859-6',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000858 'ar_qa': 'ar_QA.ISO8859-6',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +0000859 'ar_qa.iso88596': 'ar_QA.ISO8859-6',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000860 'ar_sa': 'ar_SA.ISO8859-6',
861 'ar_sa.iso88596': 'ar_SA.ISO8859-6',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000862 'ar_sd': 'ar_SD.ISO8859-6',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +0000863 'ar_sd.iso88596': 'ar_SD.ISO8859-6',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +0300864 'ar_ss': 'ar_SS.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000865 'ar_sy': 'ar_SY.ISO8859-6',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +0000866 'ar_sy.iso88596': 'ar_SY.ISO8859-6',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000867 'ar_tn': 'ar_TN.ISO8859-6',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +0000868 'ar_tn.iso88596': 'ar_TN.ISO8859-6',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000869 'ar_ye': 'ar_YE.ISO8859-6',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +0000870 'ar_ye.iso88596': 'ar_YE.ISO8859-6',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000871 'arabic': 'ar_AA.ISO8859-6',
872 'arabic.iso88596': 'ar_AA.ISO8859-6',
Antoine Pitroufc531532010-04-11 22:32:39 +0000873 'as': 'as_IN.UTF-8',
Serhiy Storchaka0e4d8522013-12-20 18:22:38 +0200874 'as_in': 'as_IN.UTF-8',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +0300875 'ast_es': 'ast_ES.ISO8859-15',
876 'ayc_pe': 'ayc_PE.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000877 'az': 'az_AZ.ISO8859-9E',
878 'az_az': 'az_AZ.ISO8859-9E',
879 'az_az.iso88599e': 'az_AZ.ISO8859-9E',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +0300880 'az_ir': 'az_IR.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000881 'be': 'be_BY.CP1251',
Antoine Pitroufc531532010-04-11 22:32:39 +0000882 'be@latin': 'be_BY.UTF-8@latin',
Serhiy Storchakab3d80a22014-10-02 00:09:17 +0300883 'be_bg.utf8': 'bg_BG.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000884 'be_by': 'be_BY.CP1251',
885 'be_by.cp1251': 'be_BY.CP1251',
886 'be_by.microsoftcp1251': 'be_BY.CP1251',
Antoine Pitroufc531532010-04-11 22:32:39 +0000887 'be_by.utf8@latin': 'be_BY.UTF-8@latin',
888 'be_by@latin': 'be_BY.UTF-8@latin',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +0300889 'bem_zm': 'bem_ZM.UTF-8',
890 'ber_dz': 'ber_DZ.UTF-8',
891 'ber_ma': 'ber_MA.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000892 'bg': 'bg_BG.CP1251',
893 'bg_bg': 'bg_BG.CP1251',
894 'bg_bg.cp1251': 'bg_BG.CP1251',
895 'bg_bg.iso88595': 'bg_BG.ISO8859-5',
896 'bg_bg.koi8r': 'bg_BG.KOI8-R',
897 'bg_bg.microsoftcp1251': 'bg_BG.CP1251',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +0300898 'bhb_in.utf8': 'bhb_IN.UTF-8',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +0300899 'bho_in': 'bho_IN.UTF-8',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +0300900 'bho_np': 'bho_NP.UTF-8',
901 'bi_vu': 'bi_VU.UTF-8',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +0300902 'bn_bd': 'bn_BD.UTF-8',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +0000903 'bn_in': 'bn_IN.UTF-8',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +0300904 'bo_cn': 'bo_CN.UTF-8',
Serhiy Storchaka0e4d8522013-12-20 18:22:38 +0200905 'bo_in': 'bo_IN.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000906 'bokmal': 'nb_NO.ISO8859-1',
907 'bokm\xe5l': 'nb_NO.ISO8859-1',
908 'br': 'br_FR.ISO8859-1',
909 'br_fr': 'br_FR.ISO8859-1',
910 'br_fr.iso88591': 'br_FR.ISO8859-1',
911 'br_fr.iso885914': 'br_FR.ISO8859-14',
912 'br_fr.iso885915': 'br_FR.ISO8859-15',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +0000913 'br_fr.iso885915@euro': 'br_FR.ISO8859-15',
914 'br_fr.utf8@euro': 'br_FR.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000915 'br_fr@euro': 'br_FR.ISO8859-15',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +0300916 'brx_in': 'brx_IN.UTF-8',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +0000917 'bs': 'bs_BA.ISO8859-2',
918 'bs_ba': 'bs_BA.ISO8859-2',
919 'bs_ba.iso88592': 'bs_BA.ISO8859-2',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000920 'bulgarian': 'bg_BG.CP1251',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +0300921 'byn_er': 'byn_ER.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000922 'c': 'C',
923 'c-french': 'fr_CA.ISO8859-1',
924 'c-french.iso88591': 'fr_CA.ISO8859-1',
Serhiy Storchaka0e4d8522013-12-20 18:22:38 +0200925 'c.ascii': 'C',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000926 'c.en': 'C',
927 'c.iso88591': 'en_US.ISO8859-1',
Serhiy Storchakab3d80a22014-10-02 00:09:17 +0300928 'c.utf8': 'en_US.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000929 'c_c': 'C',
930 'c_c.c': 'C',
931 'ca': 'ca_ES.ISO8859-1',
Antoine Pitroufc531532010-04-11 22:32:39 +0000932 'ca_ad': 'ca_AD.ISO8859-1',
933 'ca_ad.iso88591': 'ca_AD.ISO8859-1',
934 'ca_ad.iso885915': 'ca_AD.ISO8859-15',
935 'ca_ad.iso885915@euro': 'ca_AD.ISO8859-15',
936 'ca_ad.utf8@euro': 'ca_AD.UTF-8',
937 'ca_ad@euro': 'ca_AD.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000938 'ca_es': 'ca_ES.ISO8859-1',
939 'ca_es.iso88591': 'ca_ES.ISO8859-1',
940 'ca_es.iso885915': 'ca_ES.ISO8859-15',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +0000941 'ca_es.iso885915@euro': 'ca_ES.ISO8859-15',
942 'ca_es.utf8@euro': 'ca_ES.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000943 'ca_es@euro': 'ca_ES.ISO8859-15',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +0300944 'ca_es@valencia': 'ca_ES.UTF-8@valencia',
Antoine Pitroufc531532010-04-11 22:32:39 +0000945 'ca_fr': 'ca_FR.ISO8859-1',
946 'ca_fr.iso88591': 'ca_FR.ISO8859-1',
947 'ca_fr.iso885915': 'ca_FR.ISO8859-15',
948 'ca_fr.iso885915@euro': 'ca_FR.ISO8859-15',
949 'ca_fr.utf8@euro': 'ca_FR.UTF-8',
950 'ca_fr@euro': 'ca_FR.ISO8859-15',
951 'ca_it': 'ca_IT.ISO8859-1',
952 'ca_it.iso88591': 'ca_IT.ISO8859-1',
953 'ca_it.iso885915': 'ca_IT.ISO8859-15',
954 'ca_it.iso885915@euro': 'ca_IT.ISO8859-15',
955 'ca_it.utf8@euro': 'ca_IT.UTF-8',
956 'ca_it@euro': 'ca_IT.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000957 'catalan': 'ca_ES.ISO8859-1',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +0300958 'ce_ru': 'ce_RU.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000959 'cextend': 'en_US.ISO8859-1',
960 'cextend.en': 'en_US.ISO8859-1',
961 'chinese-s': 'zh_CN.eucCN',
962 'chinese-t': 'zh_TW.eucTW',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +0300963 'chr_us': 'chr_US.UTF-8',
964 'ckb_iq': 'ckb_IQ.UTF-8',
965 'cmn_tw': 'cmn_TW.UTF-8',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +0300966 'crh_ua': 'crh_UA.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000967 'croatian': 'hr_HR.ISO8859-2',
968 'cs': 'cs_CZ.ISO8859-2',
969 'cs_cs': 'cs_CZ.ISO8859-2',
Serhiy Storchaka0e4d8522013-12-20 18:22:38 +0200970 'cs_cs.iso88592': 'cs_CZ.ISO8859-2',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000971 'cs_cz': 'cs_CZ.ISO8859-2',
972 'cs_cz.iso88592': 'cs_CZ.ISO8859-2',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +0300973 'csb_pl': 'csb_PL.UTF-8',
974 'cv_ru': 'cv_RU.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000975 'cy': 'cy_GB.ISO8859-1',
976 'cy_gb': 'cy_GB.ISO8859-1',
977 'cy_gb.iso88591': 'cy_GB.ISO8859-1',
978 'cy_gb.iso885914': 'cy_GB.ISO8859-14',
979 'cy_gb.iso885915': 'cy_GB.ISO8859-15',
980 'cy_gb@euro': 'cy_GB.ISO8859-15',
981 'cz': 'cs_CZ.ISO8859-2',
982 'cz_cz': 'cs_CZ.ISO8859-2',
983 'czech': 'cs_CZ.ISO8859-2',
984 'da': 'da_DK.ISO8859-1',
Antoine Pitroufc531532010-04-11 22:32:39 +0000985 'da.iso885915': 'da_DK.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000986 'da_dk': 'da_DK.ISO8859-1',
987 'da_dk.88591': 'da_DK.ISO8859-1',
988 'da_dk.885915': 'da_DK.ISO8859-15',
989 'da_dk.iso88591': 'da_DK.ISO8859-1',
990 'da_dk.iso885915': 'da_DK.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000991 'da_dk@euro': 'da_DK.ISO8859-15',
992 'danish': 'da_DK.ISO8859-1',
993 'danish.iso88591': 'da_DK.ISO8859-1',
994 'dansk': 'da_DK.ISO8859-1',
995 'de': 'de_DE.ISO8859-1',
Antoine Pitroufc531532010-04-11 22:32:39 +0000996 'de.iso885915': 'de_DE.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +0000997 'de_at': 'de_AT.ISO8859-1',
998 'de_at.iso88591': 'de_AT.ISO8859-1',
999 'de_at.iso885915': 'de_AT.ISO8859-15',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001000 'de_at.iso885915@euro': 'de_AT.ISO8859-15',
1001 'de_at.utf8@euro': 'de_AT.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001002 'de_at@euro': 'de_AT.ISO8859-15',
1003 'de_be': 'de_BE.ISO8859-1',
1004 'de_be.iso88591': 'de_BE.ISO8859-1',
1005 'de_be.iso885915': 'de_BE.ISO8859-15',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001006 'de_be.iso885915@euro': 'de_BE.ISO8859-15',
1007 'de_be.utf8@euro': 'de_BE.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001008 'de_be@euro': 'de_BE.ISO8859-15',
1009 'de_ch': 'de_CH.ISO8859-1',
1010 'de_ch.iso88591': 'de_CH.ISO8859-1',
1011 'de_ch.iso885915': 'de_CH.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001012 'de_ch@euro': 'de_CH.ISO8859-15',
1013 'de_de': 'de_DE.ISO8859-1',
1014 'de_de.88591': 'de_DE.ISO8859-1',
1015 'de_de.885915': 'de_DE.ISO8859-15',
1016 'de_de.885915@euro': 'de_DE.ISO8859-15',
1017 'de_de.iso88591': 'de_DE.ISO8859-1',
1018 'de_de.iso885915': 'de_DE.ISO8859-15',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001019 'de_de.iso885915@euro': 'de_DE.ISO8859-15',
1020 'de_de.utf8@euro': 'de_DE.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001021 'de_de@euro': 'de_DE.ISO8859-15',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +03001022 'de_it': 'de_IT.ISO8859-1',
Serhiy Storchaka5f4e55c2014-10-02 10:49:04 +03001023 'de_li.utf8': 'de_LI.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001024 'de_lu': 'de_LU.ISO8859-1',
1025 'de_lu.iso88591': 'de_LU.ISO8859-1',
1026 'de_lu.iso885915': 'de_LU.ISO8859-15',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001027 'de_lu.iso885915@euro': 'de_LU.ISO8859-15',
1028 'de_lu.utf8@euro': 'de_LU.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001029 'de_lu@euro': 'de_LU.ISO8859-15',
1030 'deutsch': 'de_DE.ISO8859-1',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001031 'doi_in': 'doi_IN.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001032 'dutch': 'nl_NL.ISO8859-1',
1033 'dutch.iso88591': 'nl_BE.ISO8859-1',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001034 'dv_mv': 'dv_MV.UTF-8',
1035 'dz_bt': 'dz_BT.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001036 'ee': 'ee_EE.ISO8859-4',
1037 'ee_ee': 'ee_EE.ISO8859-4',
1038 'ee_ee.iso88594': 'ee_EE.ISO8859-4',
1039 'eesti': 'et_EE.ISO8859-1',
1040 'el': 'el_GR.ISO8859-7',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001041 'el_cy': 'el_CY.ISO8859-7',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001042 'el_gr': 'el_GR.ISO8859-7',
1043 'el_gr.iso88597': 'el_GR.ISO8859-7',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001044 'el_gr@euro': 'el_GR.ISO8859-15',
1045 'en': 'en_US.ISO8859-1',
1046 'en.iso88591': 'en_US.ISO8859-1',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001047 'en_ag': 'en_AG.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001048 'en_au': 'en_AU.ISO8859-1',
1049 'en_au.iso88591': 'en_AU.ISO8859-1',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001050 'en_be': 'en_BE.ISO8859-1',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001051 'en_be@euro': 'en_BE.ISO8859-15',
1052 'en_bw': 'en_BW.ISO8859-1',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001053 'en_bw.iso88591': 'en_BW.ISO8859-1',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001054 'en_ca': 'en_CA.ISO8859-1',
1055 'en_ca.iso88591': 'en_CA.ISO8859-1',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001056 'en_dk': 'en_DK.ISO8859-1',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +03001057 'en_dk.iso88591': 'en_DK.ISO8859-1',
1058 'en_dk.iso885915': 'en_DK.ISO8859-15',
Serhiy Storchakab3d80a22014-10-02 00:09:17 +03001059 'en_dl.utf8': 'en_DL.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001060 'en_gb': 'en_GB.ISO8859-1',
1061 'en_gb.88591': 'en_GB.ISO8859-1',
1062 'en_gb.iso88591': 'en_GB.ISO8859-1',
1063 'en_gb.iso885915': 'en_GB.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001064 'en_gb@euro': 'en_GB.ISO8859-15',
1065 'en_hk': 'en_HK.ISO8859-1',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001066 'en_hk.iso88591': 'en_HK.ISO8859-1',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001067 'en_ie': 'en_IE.ISO8859-1',
1068 'en_ie.iso88591': 'en_IE.ISO8859-1',
1069 'en_ie.iso885915': 'en_IE.ISO8859-15',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001070 'en_ie.iso885915@euro': 'en_IE.ISO8859-15',
1071 'en_ie.utf8@euro': 'en_IE.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001072 'en_ie@euro': 'en_IE.ISO8859-15',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +03001073 'en_il': 'en_IL.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001074 'en_in': 'en_IN.ISO8859-1',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001075 'en_ng': 'en_NG.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001076 'en_nz': 'en_NZ.ISO8859-1',
1077 'en_nz.iso88591': 'en_NZ.ISO8859-1',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001078 'en_ph': 'en_PH.ISO8859-1',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001079 'en_ph.iso88591': 'en_PH.ISO8859-1',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +03001080 'en_sc.utf8': 'en_SC.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001081 'en_sg': 'en_SG.ISO8859-1',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001082 'en_sg.iso88591': 'en_SG.ISO8859-1',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001083 'en_uk': 'en_GB.ISO8859-1',
1084 'en_us': 'en_US.ISO8859-1',
1085 'en_us.88591': 'en_US.ISO8859-1',
1086 'en_us.885915': 'en_US.ISO8859-15',
1087 'en_us.iso88591': 'en_US.ISO8859-1',
1088 'en_us.iso885915': 'en_US.ISO8859-15',
1089 'en_us.iso885915@euro': 'en_US.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001090 'en_us@euro': 'en_US.ISO8859-15',
1091 'en_us@euro@euro': 'en_US.ISO8859-15',
1092 'en_za': 'en_ZA.ISO8859-1',
1093 'en_za.88591': 'en_ZA.ISO8859-1',
1094 'en_za.iso88591': 'en_ZA.ISO8859-1',
1095 'en_za.iso885915': 'en_ZA.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001096 'en_za@euro': 'en_ZA.ISO8859-15',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001097 'en_zm': 'en_ZM.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001098 'en_zw': 'en_ZW.ISO8859-1',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001099 'en_zw.iso88591': 'en_ZW.ISO8859-1',
Serhiy Storchakab3d80a22014-10-02 00:09:17 +03001100 'en_zw.utf8': 'en_ZS.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001101 'eng_gb': 'en_GB.ISO8859-1',
1102 'eng_gb.8859': 'en_GB.ISO8859-1',
1103 'english': 'en_EN.ISO8859-1',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +03001104 'english.iso88591': 'en_US.ISO8859-1',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001105 'english_uk': 'en_GB.ISO8859-1',
1106 'english_uk.8859': 'en_GB.ISO8859-1',
1107 'english_united-states': 'en_US.ISO8859-1',
1108 'english_united-states.437': 'C',
1109 'english_us': 'en_US.ISO8859-1',
1110 'english_us.8859': 'en_US.ISO8859-1',
1111 'english_us.ascii': 'en_US.ISO8859-1',
1112 'eo': 'eo_XX.ISO8859-3',
Serhiy Storchaka5f4e55c2014-10-02 10:49:04 +03001113 'eo.utf8': 'eo.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001114 'eo_eo': 'eo_EO.ISO8859-3',
1115 'eo_eo.iso88593': 'eo_EO.ISO8859-3',
Serhiy Storchaka5f4e55c2014-10-02 10:49:04 +03001116 'eo_us.utf8': 'eo_US.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001117 'eo_xx': 'eo_XX.ISO8859-3',
1118 'eo_xx.iso88593': 'eo_XX.ISO8859-3',
1119 'es': 'es_ES.ISO8859-1',
1120 'es_ar': 'es_AR.ISO8859-1',
1121 'es_ar.iso88591': 'es_AR.ISO8859-1',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001122 'es_bo': 'es_BO.ISO8859-1',
1123 'es_bo.iso88591': 'es_BO.ISO8859-1',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001124 'es_cl': 'es_CL.ISO8859-1',
1125 'es_cl.iso88591': 'es_CL.ISO8859-1',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001126 'es_co': 'es_CO.ISO8859-1',
1127 'es_co.iso88591': 'es_CO.ISO8859-1',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001128 'es_cr': 'es_CR.ISO8859-1',
1129 'es_cr.iso88591': 'es_CR.ISO8859-1',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001130 'es_cu': 'es_CU.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001131 'es_do': 'es_DO.ISO8859-1',
1132 'es_do.iso88591': 'es_DO.ISO8859-1',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001133 'es_ec': 'es_EC.ISO8859-1',
1134 'es_ec.iso88591': 'es_EC.ISO8859-1',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001135 'es_es': 'es_ES.ISO8859-1',
1136 'es_es.88591': 'es_ES.ISO8859-1',
1137 'es_es.iso88591': 'es_ES.ISO8859-1',
1138 'es_es.iso885915': 'es_ES.ISO8859-15',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001139 'es_es.iso885915@euro': 'es_ES.ISO8859-15',
1140 'es_es.utf8@euro': 'es_ES.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001141 'es_es@euro': 'es_ES.ISO8859-15',
1142 'es_gt': 'es_GT.ISO8859-1',
1143 'es_gt.iso88591': 'es_GT.ISO8859-1',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001144 'es_hn': 'es_HN.ISO8859-1',
1145 'es_hn.iso88591': 'es_HN.ISO8859-1',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001146 'es_mx': 'es_MX.ISO8859-1',
1147 'es_mx.iso88591': 'es_MX.ISO8859-1',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001148 'es_ni': 'es_NI.ISO8859-1',
1149 'es_ni.iso88591': 'es_NI.ISO8859-1',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001150 'es_pa': 'es_PA.ISO8859-1',
1151 'es_pa.iso88591': 'es_PA.ISO8859-1',
1152 'es_pa.iso885915': 'es_PA.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001153 'es_pa@euro': 'es_PA.ISO8859-15',
1154 'es_pe': 'es_PE.ISO8859-1',
1155 'es_pe.iso88591': 'es_PE.ISO8859-1',
1156 'es_pe.iso885915': 'es_PE.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001157 'es_pe@euro': 'es_PE.ISO8859-15',
1158 'es_pr': 'es_PR.ISO8859-1',
1159 'es_pr.iso88591': 'es_PR.ISO8859-1',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001160 'es_py': 'es_PY.ISO8859-1',
1161 'es_py.iso88591': 'es_PY.ISO8859-1',
1162 'es_py.iso885915': 'es_PY.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001163 'es_py@euro': 'es_PY.ISO8859-15',
1164 'es_sv': 'es_SV.ISO8859-1',
1165 'es_sv.iso88591': 'es_SV.ISO8859-1',
1166 'es_sv.iso885915': 'es_SV.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001167 'es_sv@euro': 'es_SV.ISO8859-15',
1168 'es_us': 'es_US.ISO8859-1',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001169 'es_us.iso88591': 'es_US.ISO8859-1',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001170 'es_uy': 'es_UY.ISO8859-1',
1171 'es_uy.iso88591': 'es_UY.ISO8859-1',
1172 'es_uy.iso885915': 'es_UY.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001173 'es_uy@euro': 'es_UY.ISO8859-15',
1174 'es_ve': 'es_VE.ISO8859-1',
1175 'es_ve.iso88591': 'es_VE.ISO8859-1',
1176 'es_ve.iso885915': 'es_VE.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001177 'es_ve@euro': 'es_VE.ISO8859-15',
1178 'estonian': 'et_EE.ISO8859-1',
1179 'et': 'et_EE.ISO8859-15',
1180 'et_ee': 'et_EE.ISO8859-15',
1181 'et_ee.iso88591': 'et_EE.ISO8859-1',
1182 'et_ee.iso885913': 'et_EE.ISO8859-13',
1183 'et_ee.iso885915': 'et_EE.ISO8859-15',
1184 'et_ee.iso88594': 'et_EE.ISO8859-4',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001185 'et_ee@euro': 'et_EE.ISO8859-15',
1186 'eu': 'eu_ES.ISO8859-1',
1187 'eu_es': 'eu_ES.ISO8859-1',
1188 'eu_es.iso88591': 'eu_ES.ISO8859-1',
1189 'eu_es.iso885915': 'eu_ES.ISO8859-15',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001190 'eu_es.iso885915@euro': 'eu_ES.ISO8859-15',
1191 'eu_es.utf8@euro': 'eu_ES.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001192 'eu_es@euro': 'eu_ES.ISO8859-15',
Serhiy Storchaka5f4e55c2014-10-02 10:49:04 +03001193 'eu_fr': 'eu_FR.ISO8859-1',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001194 'fa': 'fa_IR.UTF-8',
1195 'fa_ir': 'fa_IR.UTF-8',
1196 'fa_ir.isiri3342': 'fa_IR.ISIRI-3342',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001197 'ff_sn': 'ff_SN.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001198 'fi': 'fi_FI.ISO8859-15',
Antoine Pitroufc531532010-04-11 22:32:39 +00001199 'fi.iso885915': 'fi_FI.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001200 'fi_fi': 'fi_FI.ISO8859-15',
1201 'fi_fi.88591': 'fi_FI.ISO8859-1',
1202 'fi_fi.iso88591': 'fi_FI.ISO8859-1',
1203 'fi_fi.iso885915': 'fi_FI.ISO8859-15',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001204 'fi_fi.iso885915@euro': 'fi_FI.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001205 'fi_fi.utf8@euro': 'fi_FI.UTF-8',
1206 'fi_fi@euro': 'fi_FI.ISO8859-15',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001207 'fil_ph': 'fil_PH.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001208 'finnish': 'fi_FI.ISO8859-1',
1209 'finnish.iso88591': 'fi_FI.ISO8859-1',
1210 'fo': 'fo_FO.ISO8859-1',
1211 'fo_fo': 'fo_FO.ISO8859-1',
1212 'fo_fo.iso88591': 'fo_FO.ISO8859-1',
1213 'fo_fo.iso885915': 'fo_FO.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001214 'fo_fo@euro': 'fo_FO.ISO8859-15',
1215 'fr': 'fr_FR.ISO8859-1',
Antoine Pitroufc531532010-04-11 22:32:39 +00001216 'fr.iso885915': 'fr_FR.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001217 'fr_be': 'fr_BE.ISO8859-1',
1218 'fr_be.88591': 'fr_BE.ISO8859-1',
1219 'fr_be.iso88591': 'fr_BE.ISO8859-1',
1220 'fr_be.iso885915': 'fr_BE.ISO8859-15',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001221 'fr_be.iso885915@euro': 'fr_BE.ISO8859-15',
1222 'fr_be.utf8@euro': 'fr_BE.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001223 'fr_be@euro': 'fr_BE.ISO8859-15',
1224 'fr_ca': 'fr_CA.ISO8859-1',
1225 'fr_ca.88591': 'fr_CA.ISO8859-1',
1226 'fr_ca.iso88591': 'fr_CA.ISO8859-1',
1227 'fr_ca.iso885915': 'fr_CA.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001228 'fr_ca@euro': 'fr_CA.ISO8859-15',
1229 'fr_ch': 'fr_CH.ISO8859-1',
1230 'fr_ch.88591': 'fr_CH.ISO8859-1',
1231 'fr_ch.iso88591': 'fr_CH.ISO8859-1',
1232 'fr_ch.iso885915': 'fr_CH.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001233 'fr_ch@euro': 'fr_CH.ISO8859-15',
1234 'fr_fr': 'fr_FR.ISO8859-1',
1235 'fr_fr.88591': 'fr_FR.ISO8859-1',
1236 'fr_fr.iso88591': 'fr_FR.ISO8859-1',
1237 'fr_fr.iso885915': 'fr_FR.ISO8859-15',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001238 'fr_fr.iso885915@euro': 'fr_FR.ISO8859-15',
1239 'fr_fr.utf8@euro': 'fr_FR.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001240 'fr_fr@euro': 'fr_FR.ISO8859-15',
1241 'fr_lu': 'fr_LU.ISO8859-1',
1242 'fr_lu.88591': 'fr_LU.ISO8859-1',
1243 'fr_lu.iso88591': 'fr_LU.ISO8859-1',
1244 'fr_lu.iso885915': 'fr_LU.ISO8859-15',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001245 'fr_lu.iso885915@euro': 'fr_LU.ISO8859-15',
1246 'fr_lu.utf8@euro': 'fr_LU.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001247 'fr_lu@euro': 'fr_LU.ISO8859-15',
1248 'fran\xe7ais': 'fr_FR.ISO8859-1',
1249 'fre_fr': 'fr_FR.ISO8859-1',
1250 'fre_fr.8859': 'fr_FR.ISO8859-1',
1251 'french': 'fr_FR.ISO8859-1',
1252 'french.iso88591': 'fr_CH.ISO8859-1',
1253 'french_france': 'fr_FR.ISO8859-1',
1254 'french_france.8859': 'fr_FR.ISO8859-1',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001255 'fur_it': 'fur_IT.UTF-8',
1256 'fy_de': 'fy_DE.UTF-8',
1257 'fy_nl': 'fy_NL.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001258 'ga': 'ga_IE.ISO8859-1',
1259 'ga_ie': 'ga_IE.ISO8859-1',
1260 'ga_ie.iso88591': 'ga_IE.ISO8859-1',
1261 'ga_ie.iso885914': 'ga_IE.ISO8859-14',
1262 'ga_ie.iso885915': 'ga_IE.ISO8859-15',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001263 'ga_ie.iso885915@euro': 'ga_IE.ISO8859-15',
1264 'ga_ie.utf8@euro': 'ga_IE.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001265 'ga_ie@euro': 'ga_IE.ISO8859-15',
1266 'galego': 'gl_ES.ISO8859-1',
1267 'galician': 'gl_ES.ISO8859-1',
1268 'gd': 'gd_GB.ISO8859-1',
1269 'gd_gb': 'gd_GB.ISO8859-1',
1270 'gd_gb.iso88591': 'gd_GB.ISO8859-1',
1271 'gd_gb.iso885914': 'gd_GB.ISO8859-14',
1272 'gd_gb.iso885915': 'gd_GB.ISO8859-15',
1273 'gd_gb@euro': 'gd_GB.ISO8859-15',
1274 'ger_de': 'de_DE.ISO8859-1',
1275 'ger_de.8859': 'de_DE.ISO8859-1',
1276 'german': 'de_DE.ISO8859-1',
1277 'german.iso88591': 'de_CH.ISO8859-1',
1278 'german_germany': 'de_DE.ISO8859-1',
1279 'german_germany.8859': 'de_DE.ISO8859-1',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001280 'gez_er': 'gez_ER.UTF-8',
1281 'gez_et': 'gez_ET.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001282 'gl': 'gl_ES.ISO8859-1',
1283 'gl_es': 'gl_ES.ISO8859-1',
1284 'gl_es.iso88591': 'gl_ES.ISO8859-1',
1285 'gl_es.iso885915': 'gl_ES.ISO8859-15',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001286 'gl_es.iso885915@euro': 'gl_ES.ISO8859-15',
1287 'gl_es.utf8@euro': 'gl_ES.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001288 'gl_es@euro': 'gl_ES.ISO8859-15',
1289 'greek': 'el_GR.ISO8859-7',
1290 'greek.iso88597': 'el_GR.ISO8859-7',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001291 'gu_in': 'gu_IN.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001292 'gv': 'gv_GB.ISO8859-1',
1293 'gv_gb': 'gv_GB.ISO8859-1',
1294 'gv_gb.iso88591': 'gv_GB.ISO8859-1',
1295 'gv_gb.iso885914': 'gv_GB.ISO8859-14',
1296 'gv_gb.iso885915': 'gv_GB.ISO8859-15',
1297 'gv_gb@euro': 'gv_GB.ISO8859-15',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001298 'ha_ng': 'ha_NG.UTF-8',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +03001299 'hak_tw': 'hak_TW.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001300 'he': 'he_IL.ISO8859-8',
1301 'he_il': 'he_IL.ISO8859-8',
1302 'he_il.cp1255': 'he_IL.CP1255',
1303 'he_il.iso88598': 'he_IL.ISO8859-8',
1304 'he_il.microsoftcp1255': 'he_IL.CP1255',
Serhiy Storchaka0e4d8522013-12-20 18:22:38 +02001305 'hebrew': 'he_IL.ISO8859-8',
1306 'hebrew.iso88598': 'he_IL.ISO8859-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001307 'hi': 'hi_IN.ISCII-DEV',
1308 'hi_in': 'hi_IN.ISCII-DEV',
1309 'hi_in.isciidev': 'hi_IN.ISCII-DEV',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +03001310 'hif_fj': 'hif_FJ.UTF-8',
Antoine Pitroufc531532010-04-11 22:32:39 +00001311 'hne': 'hne_IN.UTF-8',
Serhiy Storchaka0e4d8522013-12-20 18:22:38 +02001312 'hne_in': 'hne_IN.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001313 'hr': 'hr_HR.ISO8859-2',
1314 'hr_hr': 'hr_HR.ISO8859-2',
1315 'hr_hr.iso88592': 'hr_HR.ISO8859-2',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001316 'hrvatski': 'hr_HR.ISO8859-2',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001317 'hsb_de': 'hsb_DE.ISO8859-2',
1318 'ht_ht': 'ht_HT.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001319 'hu': 'hu_HU.ISO8859-2',
1320 'hu_hu': 'hu_HU.ISO8859-2',
1321 'hu_hu.iso88592': 'hu_HU.ISO8859-2',
1322 'hungarian': 'hu_HU.ISO8859-2',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001323 'hy_am': 'hy_AM.UTF-8',
1324 'hy_am.armscii8': 'hy_AM.ARMSCII_8',
Serhiy Storchaka5f4e55c2014-10-02 10:49:04 +03001325 'ia': 'ia.UTF-8',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001326 'ia_fr': 'ia_FR.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001327 'icelandic': 'is_IS.ISO8859-1',
1328 'icelandic.iso88591': 'is_IS.ISO8859-1',
1329 'id': 'id_ID.ISO8859-1',
1330 'id_id': 'id_ID.ISO8859-1',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001331 'ig_ng': 'ig_NG.UTF-8',
1332 'ik_ca': 'ik_CA.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001333 'in': 'id_ID.ISO8859-1',
1334 'in_id': 'id_ID.ISO8859-1',
1335 'is': 'is_IS.ISO8859-1',
1336 'is_is': 'is_IS.ISO8859-1',
1337 'is_is.iso88591': 'is_IS.ISO8859-1',
1338 'is_is.iso885915': 'is_IS.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001339 'is_is@euro': 'is_IS.ISO8859-15',
1340 'iso-8859-1': 'en_US.ISO8859-1',
1341 'iso-8859-15': 'en_US.ISO8859-15',
1342 'iso8859-1': 'en_US.ISO8859-1',
1343 'iso8859-15': 'en_US.ISO8859-15',
1344 'iso_8859_1': 'en_US.ISO8859-1',
1345 'iso_8859_15': 'en_US.ISO8859-15',
1346 'it': 'it_IT.ISO8859-1',
Antoine Pitroufc531532010-04-11 22:32:39 +00001347 'it.iso885915': 'it_IT.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001348 'it_ch': 'it_CH.ISO8859-1',
1349 'it_ch.iso88591': 'it_CH.ISO8859-1',
1350 'it_ch.iso885915': 'it_CH.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001351 'it_ch@euro': 'it_CH.ISO8859-15',
1352 'it_it': 'it_IT.ISO8859-1',
1353 'it_it.88591': 'it_IT.ISO8859-1',
1354 'it_it.iso88591': 'it_IT.ISO8859-1',
1355 'it_it.iso885915': 'it_IT.ISO8859-15',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001356 'it_it.iso885915@euro': 'it_IT.ISO8859-15',
1357 'it_it.utf8@euro': 'it_IT.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001358 'it_it@euro': 'it_IT.ISO8859-15',
1359 'italian': 'it_IT.ISO8859-1',
1360 'italian.iso88591': 'it_IT.ISO8859-1',
1361 'iu': 'iu_CA.NUNACOM-8',
1362 'iu_ca': 'iu_CA.NUNACOM-8',
1363 'iu_ca.nunacom8': 'iu_CA.NUNACOM-8',
1364 'iw': 'he_IL.ISO8859-8',
1365 'iw_il': 'he_IL.ISO8859-8',
1366 'iw_il.iso88598': 'he_IL.ISO8859-8',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001367 'iw_il.utf8': 'iw_IL.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001368 'ja': 'ja_JP.eucJP',
1369 'ja.jis': 'ja_JP.JIS7',
1370 'ja.sjis': 'ja_JP.SJIS',
1371 'ja_jp': 'ja_JP.eucJP',
1372 'ja_jp.ajec': 'ja_JP.eucJP',
1373 'ja_jp.euc': 'ja_JP.eucJP',
1374 'ja_jp.eucjp': 'ja_JP.eucJP',
1375 'ja_jp.iso-2022-jp': 'ja_JP.JIS7',
1376 'ja_jp.iso2022jp': 'ja_JP.JIS7',
1377 'ja_jp.jis': 'ja_JP.JIS7',
1378 'ja_jp.jis7': 'ja_JP.JIS7',
1379 'ja_jp.mscode': 'ja_JP.SJIS',
Antoine Pitroufc531532010-04-11 22:32:39 +00001380 'ja_jp.pck': 'ja_JP.SJIS',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001381 'ja_jp.sjis': 'ja_JP.SJIS',
1382 'ja_jp.ujis': 'ja_JP.eucJP',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001383 'japan': 'ja_JP.eucJP',
1384 'japanese': 'ja_JP.eucJP',
1385 'japanese-euc': 'ja_JP.eucJP',
1386 'japanese.euc': 'ja_JP.eucJP',
1387 'japanese.sjis': 'ja_JP.SJIS',
1388 'jp_jp': 'ja_JP.eucJP',
1389 'ka': 'ka_GE.GEORGIAN-ACADEMY',
1390 'ka_ge': 'ka_GE.GEORGIAN-ACADEMY',
1391 'ka_ge.georgianacademy': 'ka_GE.GEORGIAN-ACADEMY',
1392 'ka_ge.georgianps': 'ka_GE.GEORGIAN-PS',
1393 'ka_ge.georgianrs': 'ka_GE.GEORGIAN-ACADEMY',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +03001394 'kab_dz': 'kab_DZ.UTF-8',
1395 'kk_kz': 'kk_KZ.ptcp154',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001396 'kl': 'kl_GL.ISO8859-1',
1397 'kl_gl': 'kl_GL.ISO8859-1',
1398 'kl_gl.iso88591': 'kl_GL.ISO8859-1',
1399 'kl_gl.iso885915': 'kl_GL.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001400 'kl_gl@euro': 'kl_GL.ISO8859-15',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001401 'km_kh': 'km_KH.UTF-8',
Antoine Pitroufc531532010-04-11 22:32:39 +00001402 'kn': 'kn_IN.UTF-8',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001403 'kn_in': 'kn_IN.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001404 'ko': 'ko_KR.eucKR',
1405 'ko_kr': 'ko_KR.eucKR',
1406 'ko_kr.euc': 'ko_KR.eucKR',
1407 'ko_kr.euckr': 'ko_KR.eucKR',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001408 'kok_in': 'kok_IN.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001409 'korean': 'ko_KR.eucKR',
1410 'korean.euc': 'ko_KR.eucKR',
Antoine Pitroufc531532010-04-11 22:32:39 +00001411 'ks': 'ks_IN.UTF-8',
Serhiy Storchaka0e4d8522013-12-20 18:22:38 +02001412 'ks_in': 'ks_IN.UTF-8',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +03001413 'ks_in.utf8@devanagari': 'ks_IN.UTF-8@devanagari',
Serhiy Storchakad551b282013-12-26 21:20:46 +02001414 'ks_in@devanagari': 'ks_IN.UTF-8@devanagari',
Serhiy Storchakab3d80a22014-10-02 00:09:17 +03001415 'ks_in@devanagari.utf8': 'ks_IN.UTF-8@devanagari',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001416 'ku_tr': 'ku_TR.ISO8859-9',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001417 'kw': 'kw_GB.ISO8859-1',
1418 'kw_gb': 'kw_GB.ISO8859-1',
1419 'kw_gb.iso88591': 'kw_GB.ISO8859-1',
1420 'kw_gb.iso885914': 'kw_GB.ISO8859-14',
1421 'kw_gb.iso885915': 'kw_GB.ISO8859-15',
1422 'kw_gb@euro': 'kw_GB.ISO8859-15',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001423 'ky': 'ky_KG.UTF-8',
1424 'ky_kg': 'ky_KG.UTF-8',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001425 'lb_lu': 'lb_LU.UTF-8',
1426 'lg_ug': 'lg_UG.ISO8859-10',
1427 'li_be': 'li_BE.UTF-8',
1428 'li_nl': 'li_NL.UTF-8',
1429 'lij_it': 'lij_IT.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001430 'lithuanian': 'lt_LT.ISO8859-13',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +03001431 'ln_cd': 'ln_CD.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001432 'lo': 'lo_LA.MULELAO-1',
1433 'lo_la': 'lo_LA.MULELAO-1',
1434 'lo_la.cp1133': 'lo_LA.IBM-CP1133',
1435 'lo_la.ibmcp1133': 'lo_LA.IBM-CP1133',
1436 'lo_la.mulelao1': 'lo_LA.MULELAO-1',
1437 'lt': 'lt_LT.ISO8859-13',
1438 'lt_lt': 'lt_LT.ISO8859-13',
1439 'lt_lt.iso885913': 'lt_LT.ISO8859-13',
1440 'lt_lt.iso88594': 'lt_LT.ISO8859-4',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001441 'lv': 'lv_LV.ISO8859-13',
1442 'lv_lv': 'lv_LV.ISO8859-13',
1443 'lv_lv.iso885913': 'lv_LV.ISO8859-13',
1444 'lv_lv.iso88594': 'lv_LV.ISO8859-4',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +03001445 'lzh_tw': 'lzh_TW.UTF-8',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001446 'mag_in': 'mag_IN.UTF-8',
Antoine Pitroufc531532010-04-11 22:32:39 +00001447 'mai': 'mai_IN.UTF-8',
Serhiy Storchaka0e4d8522013-12-20 18:22:38 +02001448 'mai_in': 'mai_IN.UTF-8',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +03001449 'mai_np': 'mai_NP.UTF-8',
1450 'mfe_mu': 'mfe_MU.UTF-8',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001451 'mg_mg': 'mg_MG.ISO8859-15',
1452 'mhr_ru': 'mhr_RU.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001453 'mi': 'mi_NZ.ISO8859-1',
1454 'mi_nz': 'mi_NZ.ISO8859-1',
1455 'mi_nz.iso88591': 'mi_NZ.ISO8859-1',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +03001456 'miq_ni': 'miq_NI.UTF-8',
1457 'mjw_in': 'mjw_IN.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001458 'mk': 'mk_MK.ISO8859-5',
1459 'mk_mk': 'mk_MK.ISO8859-5',
1460 'mk_mk.cp1251': 'mk_MK.CP1251',
1461 'mk_mk.iso88595': 'mk_MK.ISO8859-5',
1462 'mk_mk.microsoftcp1251': 'mk_MK.CP1251',
Antoine Pitroufc531532010-04-11 22:32:39 +00001463 'ml': 'ml_IN.UTF-8',
Serhiy Storchaka0e4d8522013-12-20 18:22:38 +02001464 'ml_in': 'ml_IN.UTF-8',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001465 'mn_mn': 'mn_MN.UTF-8',
1466 'mni_in': 'mni_IN.UTF-8',
Antoine Pitroufc531532010-04-11 22:32:39 +00001467 'mr': 'mr_IN.UTF-8',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001468 'mr_in': 'mr_IN.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001469 'ms': 'ms_MY.ISO8859-1',
1470 'ms_my': 'ms_MY.ISO8859-1',
1471 'ms_my.iso88591': 'ms_MY.ISO8859-1',
1472 'mt': 'mt_MT.ISO8859-3',
1473 'mt_mt': 'mt_MT.ISO8859-3',
1474 'mt_mt.iso88593': 'mt_MT.ISO8859-3',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001475 'my_mm': 'my_MM.UTF-8',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +03001476 'nan_tw': 'nan_TW.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001477 'nb': 'nb_NO.ISO8859-1',
1478 'nb_no': 'nb_NO.ISO8859-1',
1479 'nb_no.88591': 'nb_NO.ISO8859-1',
1480 'nb_no.iso88591': 'nb_NO.ISO8859-1',
1481 'nb_no.iso885915': 'nb_NO.ISO8859-15',
1482 'nb_no@euro': 'nb_NO.ISO8859-15',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001483 'nds_de': 'nds_DE.UTF-8',
1484 'nds_nl': 'nds_NL.UTF-8',
Serhiy Storchaka0e4d8522013-12-20 18:22:38 +02001485 'ne_np': 'ne_NP.UTF-8',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001486 'nhn_mx': 'nhn_MX.UTF-8',
1487 'niu_nu': 'niu_NU.UTF-8',
1488 'niu_nz': 'niu_NZ.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001489 'nl': 'nl_NL.ISO8859-1',
Antoine Pitroufc531532010-04-11 22:32:39 +00001490 'nl.iso885915': 'nl_NL.ISO8859-15',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001491 'nl_aw': 'nl_AW.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001492 'nl_be': 'nl_BE.ISO8859-1',
1493 'nl_be.88591': 'nl_BE.ISO8859-1',
1494 'nl_be.iso88591': 'nl_BE.ISO8859-1',
1495 'nl_be.iso885915': 'nl_BE.ISO8859-15',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001496 'nl_be.iso885915@euro': 'nl_BE.ISO8859-15',
1497 'nl_be.utf8@euro': 'nl_BE.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001498 'nl_be@euro': 'nl_BE.ISO8859-15',
1499 'nl_nl': 'nl_NL.ISO8859-1',
1500 'nl_nl.88591': 'nl_NL.ISO8859-1',
1501 'nl_nl.iso88591': 'nl_NL.ISO8859-1',
1502 'nl_nl.iso885915': 'nl_NL.ISO8859-15',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001503 'nl_nl.iso885915@euro': 'nl_NL.ISO8859-15',
1504 'nl_nl.utf8@euro': 'nl_NL.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001505 'nl_nl@euro': 'nl_NL.ISO8859-15',
1506 'nn': 'nn_NO.ISO8859-1',
1507 'nn_no': 'nn_NO.ISO8859-1',
1508 'nn_no.88591': 'nn_NO.ISO8859-1',
1509 'nn_no.iso88591': 'nn_NO.ISO8859-1',
1510 'nn_no.iso885915': 'nn_NO.ISO8859-15',
1511 'nn_no@euro': 'nn_NO.ISO8859-15',
1512 'no': 'no_NO.ISO8859-1',
1513 'no@nynorsk': 'ny_NO.ISO8859-1',
1514 'no_no': 'no_NO.ISO8859-1',
1515 'no_no.88591': 'no_NO.ISO8859-1',
1516 'no_no.iso88591': 'no_NO.ISO8859-1',
1517 'no_no.iso885915': 'no_NO.ISO8859-15',
Antoine Pitroufc531532010-04-11 22:32:39 +00001518 'no_no.iso88591@bokmal': 'no_NO.ISO8859-1',
1519 'no_no.iso88591@nynorsk': 'no_NO.ISO8859-1',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001520 'no_no@euro': 'no_NO.ISO8859-15',
1521 'norwegian': 'no_NO.ISO8859-1',
1522 'norwegian.iso88591': 'no_NO.ISO8859-1',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001523 'nr': 'nr_ZA.ISO8859-1',
1524 'nr_za': 'nr_ZA.ISO8859-1',
1525 'nr_za.iso88591': 'nr_ZA.ISO8859-1',
1526 'nso': 'nso_ZA.ISO8859-15',
1527 'nso_za': 'nso_ZA.ISO8859-15',
1528 'nso_za.iso885915': 'nso_ZA.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001529 'ny': 'ny_NO.ISO8859-1',
1530 'ny_no': 'ny_NO.ISO8859-1',
1531 'ny_no.88591': 'ny_NO.ISO8859-1',
1532 'ny_no.iso88591': 'ny_NO.ISO8859-1',
1533 'ny_no.iso885915': 'ny_NO.ISO8859-15',
1534 'ny_no@euro': 'ny_NO.ISO8859-15',
1535 'nynorsk': 'nn_NO.ISO8859-1',
1536 'oc': 'oc_FR.ISO8859-1',
1537 'oc_fr': 'oc_FR.ISO8859-1',
1538 'oc_fr.iso88591': 'oc_FR.ISO8859-1',
1539 'oc_fr.iso885915': 'oc_FR.ISO8859-15',
1540 'oc_fr@euro': 'oc_FR.ISO8859-15',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001541 'om_et': 'om_ET.UTF-8',
1542 'om_ke': 'om_KE.ISO8859-1',
Antoine Pitroufc531532010-04-11 22:32:39 +00001543 'or': 'or_IN.UTF-8',
Serhiy Storchaka0e4d8522013-12-20 18:22:38 +02001544 'or_in': 'or_IN.UTF-8',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001545 'os_ru': 'os_RU.UTF-8',
Antoine Pitroufc531532010-04-11 22:32:39 +00001546 'pa': 'pa_IN.UTF-8',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001547 'pa_in': 'pa_IN.UTF-8',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001548 'pa_pk': 'pa_PK.UTF-8',
1549 'pap_an': 'pap_AN.UTF-8',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +03001550 'pap_aw': 'pap_AW.UTF-8',
1551 'pap_cw': 'pap_CW.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001552 'pd': 'pd_US.ISO8859-1',
1553 'pd_de': 'pd_DE.ISO8859-1',
1554 'pd_de.iso88591': 'pd_DE.ISO8859-1',
1555 'pd_de.iso885915': 'pd_DE.ISO8859-15',
1556 'pd_de@euro': 'pd_DE.ISO8859-15',
1557 'pd_us': 'pd_US.ISO8859-1',
1558 'pd_us.iso88591': 'pd_US.ISO8859-1',
1559 'pd_us.iso885915': 'pd_US.ISO8859-15',
1560 'pd_us@euro': 'pd_US.ISO8859-15',
1561 'ph': 'ph_PH.ISO8859-1',
1562 'ph_ph': 'ph_PH.ISO8859-1',
1563 'ph_ph.iso88591': 'ph_PH.ISO8859-1',
1564 'pl': 'pl_PL.ISO8859-2',
1565 'pl_pl': 'pl_PL.ISO8859-2',
1566 'pl_pl.iso88592': 'pl_PL.ISO8859-2',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001567 'polish': 'pl_PL.ISO8859-2',
1568 'portuguese': 'pt_PT.ISO8859-1',
1569 'portuguese.iso88591': 'pt_PT.ISO8859-1',
1570 'portuguese_brazil': 'pt_BR.ISO8859-1',
1571 'portuguese_brazil.8859': 'pt_BR.ISO8859-1',
1572 'posix': 'C',
1573 'posix-utf2': 'C',
1574 'pp': 'pp_AN.ISO8859-1',
1575 'pp_an': 'pp_AN.ISO8859-1',
1576 'pp_an.iso88591': 'pp_AN.ISO8859-1',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001577 'ps_af': 'ps_AF.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001578 'pt': 'pt_PT.ISO8859-1',
Antoine Pitroufc531532010-04-11 22:32:39 +00001579 'pt.iso885915': 'pt_PT.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001580 'pt_br': 'pt_BR.ISO8859-1',
1581 'pt_br.88591': 'pt_BR.ISO8859-1',
1582 'pt_br.iso88591': 'pt_BR.ISO8859-1',
1583 'pt_br.iso885915': 'pt_BR.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001584 'pt_br@euro': 'pt_BR.ISO8859-15',
1585 'pt_pt': 'pt_PT.ISO8859-1',
1586 'pt_pt.88591': 'pt_PT.ISO8859-1',
1587 'pt_pt.iso88591': 'pt_PT.ISO8859-1',
1588 'pt_pt.iso885915': 'pt_PT.ISO8859-15',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001589 'pt_pt.iso885915@euro': 'pt_PT.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001590 'pt_pt.utf8@euro': 'pt_PT.UTF-8',
1591 'pt_pt@euro': 'pt_PT.ISO8859-15',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +03001592 'quz_pe': 'quz_PE.UTF-8',
1593 'raj_in': 'raj_IN.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001594 'ro': 'ro_RO.ISO8859-2',
1595 'ro_ro': 'ro_RO.ISO8859-2',
1596 'ro_ro.iso88592': 'ro_RO.ISO8859-2',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001597 'romanian': 'ro_RO.ISO8859-2',
Antoine Pitroufc531532010-04-11 22:32:39 +00001598 'ru': 'ru_RU.UTF-8',
1599 'ru.koi8r': 'ru_RU.KOI8-R',
1600 'ru_ru': 'ru_RU.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001601 'ru_ru.cp1251': 'ru_RU.CP1251',
1602 'ru_ru.iso88595': 'ru_RU.ISO8859-5',
1603 'ru_ru.koi8r': 'ru_RU.KOI8-R',
1604 'ru_ru.microsoftcp1251': 'ru_RU.CP1251',
1605 'ru_ua': 'ru_UA.KOI8-U',
1606 'ru_ua.cp1251': 'ru_UA.CP1251',
1607 'ru_ua.koi8u': 'ru_UA.KOI8-U',
1608 'ru_ua.microsoftcp1251': 'ru_UA.CP1251',
1609 'rumanian': 'ro_RO.ISO8859-2',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +03001610 'russian': 'ru_RU.KOI8-R',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001611 'rw': 'rw_RW.ISO8859-1',
1612 'rw_rw': 'rw_RW.ISO8859-1',
1613 'rw_rw.iso88591': 'rw_RW.ISO8859-1',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001614 'sa_in': 'sa_IN.UTF-8',
1615 'sat_in': 'sat_IN.UTF-8',
1616 'sc_it': 'sc_IT.UTF-8',
Serhiy Storchaka0e4d8522013-12-20 18:22:38 +02001617 'sd': 'sd_IN.UTF-8',
Serhiy Storchakad551b282013-12-26 21:20:46 +02001618 'sd@devanagari': 'sd_IN.UTF-8@devanagari',
1619 'sd_in': 'sd_IN.UTF-8',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +03001620 'sd_in.utf8@devanagari': 'sd_IN.UTF-8@devanagari',
Serhiy Storchakad551b282013-12-26 21:20:46 +02001621 'sd_in@devanagari': 'sd_IN.UTF-8@devanagari',
Serhiy Storchakab3d80a22014-10-02 00:09:17 +03001622 'sd_in@devanagari.utf8': 'sd_IN.UTF-8@devanagari',
Serhiy Storchaka5f4e55c2014-10-02 10:49:04 +03001623 'sd_pk': 'sd_PK.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001624 'se_no': 'se_NO.UTF-8',
Antoine Pitroufc531532010-04-11 22:32:39 +00001625 'serbocroatian': 'sr_RS.UTF-8@latin',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +03001626 'sgs_lt': 'sgs_LT.UTF-8',
Antoine Pitroufc531532010-04-11 22:32:39 +00001627 'sh': 'sr_RS.UTF-8@latin',
1628 'sh_ba.iso88592@bosnia': 'sr_CS.ISO8859-2',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001629 'sh_hr': 'sh_HR.ISO8859-2',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001630 'sh_hr.iso88592': 'hr_HR.ISO8859-2',
1631 'sh_sp': 'sr_CS.ISO8859-2',
Antoine Pitroufc531532010-04-11 22:32:39 +00001632 'sh_yu': 'sr_RS.UTF-8@latin',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +03001633 'shn_mm': 'shn_MM.UTF-8',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001634 'shs_ca': 'shs_CA.UTF-8',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001635 'si': 'si_LK.UTF-8',
1636 'si_lk': 'si_LK.UTF-8',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001637 'sid_et': 'sid_ET.UTF-8',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001638 'sinhala': 'si_LK.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001639 'sk': 'sk_SK.ISO8859-2',
1640 'sk_sk': 'sk_SK.ISO8859-2',
1641 'sk_sk.iso88592': 'sk_SK.ISO8859-2',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001642 'sl': 'sl_SI.ISO8859-2',
1643 'sl_cs': 'sl_CS.ISO8859-2',
1644 'sl_si': 'sl_SI.ISO8859-2',
1645 'sl_si.iso88592': 'sl_SI.ISO8859-2',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001646 'slovak': 'sk_SK.ISO8859-2',
1647 'slovene': 'sl_SI.ISO8859-2',
1648 'slovenian': 'sl_SI.ISO8859-2',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +03001649 'sm_ws': 'sm_WS.UTF-8',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001650 'so_dj': 'so_DJ.ISO8859-1',
1651 'so_et': 'so_ET.UTF-8',
1652 'so_ke': 'so_KE.ISO8859-1',
1653 'so_so': 'so_SO.ISO8859-1',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001654 'sp': 'sr_CS.ISO8859-5',
1655 'sp_yu': 'sr_CS.ISO8859-5',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001656 'spanish': 'es_ES.ISO8859-1',
1657 'spanish.iso88591': 'es_ES.ISO8859-1',
1658 'spanish_spain': 'es_ES.ISO8859-1',
1659 'spanish_spain.8859': 'es_ES.ISO8859-1',
1660 'sq': 'sq_AL.ISO8859-2',
1661 'sq_al': 'sq_AL.ISO8859-2',
1662 'sq_al.iso88592': 'sq_AL.ISO8859-2',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001663 'sq_mk': 'sq_MK.UTF-8',
Antoine Pitroufc531532010-04-11 22:32:39 +00001664 'sr': 'sr_RS.UTF-8',
1665 'sr@cyrillic': 'sr_RS.UTF-8',
1666 'sr@latin': 'sr_RS.UTF-8@latin',
Serhiy Storchaka0e4d8522013-12-20 18:22:38 +02001667 'sr@latn': 'sr_CS.UTF-8@latin',
1668 'sr_cs': 'sr_CS.UTF-8',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001669 'sr_cs.iso88592': 'sr_CS.ISO8859-2',
1670 'sr_cs.iso88592@latn': 'sr_CS.ISO8859-2',
1671 'sr_cs.iso88595': 'sr_CS.ISO8859-5',
Serhiy Storchaka0e4d8522013-12-20 18:22:38 +02001672 'sr_cs.utf8@latn': 'sr_CS.UTF-8@latin',
1673 'sr_cs@latn': 'sr_CS.UTF-8@latin',
Antoine Pitroufc531532010-04-11 22:32:39 +00001674 'sr_me': 'sr_ME.UTF-8',
1675 'sr_rs': 'sr_RS.UTF-8',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +03001676 'sr_rs.utf8@latn': 'sr_RS.UTF-8@latin',
Antoine Pitroufc531532010-04-11 22:32:39 +00001677 'sr_rs@latin': 'sr_RS.UTF-8@latin',
1678 'sr_rs@latn': 'sr_RS.UTF-8@latin',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001679 'sr_sp': 'sr_CS.ISO8859-2',
Antoine Pitroufc531532010-04-11 22:32:39 +00001680 'sr_yu': 'sr_RS.UTF-8@latin',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001681 'sr_yu.cp1251@cyrillic': 'sr_CS.CP1251',
1682 'sr_yu.iso88592': 'sr_CS.ISO8859-2',
1683 'sr_yu.iso88595': 'sr_CS.ISO8859-5',
1684 'sr_yu.iso88595@cyrillic': 'sr_CS.ISO8859-5',
1685 'sr_yu.microsoftcp1251@cyrillic': 'sr_CS.CP1251',
Serhiy Storchakab3d80a22014-10-02 00:09:17 +03001686 'sr_yu.utf8': 'sr_RS.UTF-8',
Antoine Pitroufc531532010-04-11 22:32:39 +00001687 'sr_yu.utf8@cyrillic': 'sr_RS.UTF-8',
1688 'sr_yu@cyrillic': 'sr_RS.UTF-8',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001689 'ss': 'ss_ZA.ISO8859-1',
1690 'ss_za': 'ss_ZA.ISO8859-1',
1691 'ss_za.iso88591': 'ss_ZA.ISO8859-1',
1692 'st': 'st_ZA.ISO8859-1',
1693 'st_za': 'st_ZA.ISO8859-1',
1694 'st_za.iso88591': 'st_ZA.ISO8859-1',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001695 'sv': 'sv_SE.ISO8859-1',
Antoine Pitroufc531532010-04-11 22:32:39 +00001696 'sv.iso885915': 'sv_SE.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001697 'sv_fi': 'sv_FI.ISO8859-1',
1698 'sv_fi.iso88591': 'sv_FI.ISO8859-1',
1699 'sv_fi.iso885915': 'sv_FI.ISO8859-15',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001700 'sv_fi.iso885915@euro': 'sv_FI.ISO8859-15',
1701 'sv_fi.utf8@euro': 'sv_FI.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001702 'sv_fi@euro': 'sv_FI.ISO8859-15',
1703 'sv_se': 'sv_SE.ISO8859-1',
1704 'sv_se.88591': 'sv_SE.ISO8859-1',
1705 'sv_se.iso88591': 'sv_SE.ISO8859-1',
1706 'sv_se.iso885915': 'sv_SE.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001707 'sv_se@euro': 'sv_SE.ISO8859-15',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001708 'sw_ke': 'sw_KE.UTF-8',
1709 'sw_tz': 'sw_TZ.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001710 'swedish': 'sv_SE.ISO8859-1',
1711 'swedish.iso88591': 'sv_SE.ISO8859-1',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001712 'szl_pl': 'szl_PL.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001713 'ta': 'ta_IN.TSCII-0',
1714 'ta_in': 'ta_IN.TSCII-0',
1715 'ta_in.tscii': 'ta_IN.TSCII-0',
1716 'ta_in.tscii0': 'ta_IN.TSCII-0',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001717 'ta_lk': 'ta_LK.UTF-8',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +03001718 'tcy_in.utf8': 'tcy_IN.UTF-8',
Antoine Pitroufc531532010-04-11 22:32:39 +00001719 'te': 'te_IN.UTF-8',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001720 'te_in': 'te_IN.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001721 'tg': 'tg_TJ.KOI8-C',
1722 'tg_tj': 'tg_TJ.KOI8-C',
1723 'tg_tj.koi8c': 'tg_TJ.KOI8-C',
1724 'th': 'th_TH.ISO8859-11',
1725 'th_th': 'th_TH.ISO8859-11',
1726 'th_th.iso885911': 'th_TH.ISO8859-11',
1727 'th_th.tactis': 'th_TH.TIS620',
1728 'th_th.tis620': 'th_TH.TIS620',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001729 'thai': 'th_TH.ISO8859-11',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +03001730 'the_np': 'the_NP.UTF-8',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001731 'ti_er': 'ti_ER.UTF-8',
1732 'ti_et': 'ti_ET.UTF-8',
1733 'tig_er': 'tig_ER.UTF-8',
1734 'tk_tm': 'tk_TM.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001735 'tl': 'tl_PH.ISO8859-1',
1736 'tl_ph': 'tl_PH.ISO8859-1',
1737 'tl_ph.iso88591': 'tl_PH.ISO8859-1',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001738 'tn': 'tn_ZA.ISO8859-15',
1739 'tn_za': 'tn_ZA.ISO8859-15',
1740 'tn_za.iso885915': 'tn_ZA.ISO8859-15',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +03001741 'to_to': 'to_TO.UTF-8',
1742 'tpi_pg': 'tpi_PG.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001743 'tr': 'tr_TR.ISO8859-9',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001744 'tr_cy': 'tr_CY.ISO8859-9',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001745 'tr_tr': 'tr_TR.ISO8859-9',
1746 'tr_tr.iso88599': 'tr_TR.ISO8859-9',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001747 'ts': 'ts_ZA.ISO8859-1',
1748 'ts_za': 'ts_ZA.ISO8859-1',
1749 'ts_za.iso88591': 'ts_ZA.ISO8859-1',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001750 'tt': 'tt_RU.TATAR-CYR',
1751 'tt_ru': 'tt_RU.TATAR-CYR',
1752 'tt_ru.koi8c': 'tt_RU.KOI8-C',
1753 'tt_ru.tatarcyr': 'tt_RU.TATAR-CYR',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001754 'tt_ru@iqtelif': 'tt_RU.UTF-8@iqtelif',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001755 'turkish': 'tr_TR.ISO8859-9',
1756 'turkish.iso88599': 'tr_TR.ISO8859-9',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001757 'ug_cn': 'ug_CN.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001758 'uk': 'uk_UA.KOI8-U',
1759 'uk_ua': 'uk_UA.KOI8-U',
1760 'uk_ua.cp1251': 'uk_UA.CP1251',
1761 'uk_ua.iso88595': 'uk_UA.ISO8859-5',
1762 'uk_ua.koi8u': 'uk_UA.KOI8-U',
1763 'uk_ua.microsoftcp1251': 'uk_UA.CP1251',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001764 'univ': 'en_US.utf',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001765 'universal': 'en_US.utf',
1766 'universal.utf8@ucs4': 'en_US.UTF-8',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001767 'unm_us': 'unm_US.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001768 'ur': 'ur_PK.CP1256',
Serhiy Storchaka0e4d8522013-12-20 18:22:38 +02001769 'ur_in': 'ur_IN.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001770 'ur_pk': 'ur_PK.CP1256',
1771 'ur_pk.cp1256': 'ur_PK.CP1256',
1772 'ur_pk.microsoftcp1256': 'ur_PK.CP1256',
1773 'uz': 'uz_UZ.UTF-8',
1774 'uz_uz': 'uz_UZ.UTF-8',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001775 'uz_uz.iso88591': 'uz_UZ.ISO8859-1',
1776 'uz_uz.utf8@cyrillic': 'uz_UZ.UTF-8',
1777 'uz_uz@cyrillic': 'uz_UZ.UTF-8',
1778 've': 've_ZA.UTF-8',
1779 've_za': 've_ZA.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001780 'vi': 'vi_VN.TCVN',
1781 'vi_vn': 'vi_VN.TCVN',
1782 'vi_vn.tcvn': 'vi_VN.TCVN',
1783 'vi_vn.tcvn5712': 'vi_VN.TCVN',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001784 'vi_vn.viscii': 'vi_VN.VISCII',
1785 'vi_vn.viscii111': 'vi_VN.VISCII',
1786 'wa': 'wa_BE.ISO8859-1',
1787 'wa_be': 'wa_BE.ISO8859-1',
1788 'wa_be.iso88591': 'wa_BE.ISO8859-1',
1789 'wa_be.iso885915': 'wa_BE.ISO8859-15',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001790 'wa_be.iso885915@euro': 'wa_BE.ISO8859-15',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001791 'wa_be@euro': 'wa_BE.ISO8859-15',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001792 'wae_ch': 'wae_CH.UTF-8',
1793 'wal_et': 'wal_ET.UTF-8',
1794 'wo_sn': 'wo_SN.UTF-8',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001795 'xh': 'xh_ZA.ISO8859-1',
1796 'xh_za': 'xh_ZA.ISO8859-1',
1797 'xh_za.iso88591': 'xh_ZA.ISO8859-1',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001798 'yi': 'yi_US.CP1255',
1799 'yi_us': 'yi_US.CP1255',
1800 'yi_us.cp1255': 'yi_US.CP1255',
1801 'yi_us.microsoftcp1255': 'yi_US.CP1255',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001802 'yo_ng': 'yo_NG.UTF-8',
1803 'yue_hk': 'yue_HK.UTF-8',
Serhiy Storchakaa55ac802018-05-06 10:51:49 +03001804 'yuw_pg': 'yuw_PG.UTF-8',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001805 'zh': 'zh_CN.eucCN',
1806 'zh_cn': 'zh_CN.gb2312',
1807 'zh_cn.big5': 'zh_TW.big5',
1808 'zh_cn.euc': 'zh_CN.eucCN',
1809 'zh_cn.gb18030': 'zh_CN.gb18030',
1810 'zh_cn.gb2312': 'zh_CN.gb2312',
1811 'zh_cn.gbk': 'zh_CN.gbk',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001812 'zh_hk': 'zh_HK.big5hkscs',
1813 'zh_hk.big5': 'zh_HK.big5',
Antoine Pitroufc531532010-04-11 22:32:39 +00001814 'zh_hk.big5hk': 'zh_HK.big5hkscs',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001815 'zh_hk.big5hkscs': 'zh_HK.big5hkscs',
Serhiy Storchaka4e286eb2014-10-01 23:44:20 +03001816 'zh_sg': 'zh_SG.GB2312',
1817 'zh_sg.gbk': 'zh_SG.GBK',
Marc-André Lemburgbb4f1bd2004-12-10 21:58:14 +00001818 'zh_tw': 'zh_TW.big5',
1819 'zh_tw.big5': 'zh_TW.big5',
1820 'zh_tw.euc': 'zh_TW.eucTW',
Marc-André Lemburgadff65b2008-05-30 20:52:18 +00001821 'zh_tw.euctw': 'zh_TW.eucTW',
1822 'zu': 'zu_ZA.ISO8859-1',
1823 'zu_za': 'zu_ZA.ISO8859-1',
1824 'zu_za.iso88591': 'zu_ZA.ISO8859-1',
Marc-André Lemburg5431bc32000-06-07 09:11:40 +00001825}
1826
Fredrik Lundh6c86b992000-07-09 17:12:58 +00001827#
Georg Brandlb709c2c2006-01-20 09:07:35 +00001828# This maps Windows language identifiers to locale strings.
Fredrik Lundh6c86b992000-07-09 17:12:58 +00001829#
Tim Peters777f1082006-01-20 20:03:24 +00001830# This list has been updated from
Georg Brandlb709c2c2006-01-20 09:07:35 +00001831# http://msdn.microsoft.com/library/default.asp?url=/library/en-us/intl/nls_238z.asp
Jeroen Ruigrok van der Wervenb87b3342009-05-08 14:11:23 +00001832# to include every locale up to Windows Vista.
Fredrik Lundh37a09822002-10-19 20:19:10 +00001833#
# NOTE: this mapping is incomplete. If your language is missing, please
# submit a bug report to the Python bug tracker at http://bugs.python.org/.
# Make sure you include the missing language identifier and the suggested
# locale code.
1838#
Fredrik Lundh6c86b992000-07-09 17:12:58 +00001839
# Keys are Windows language identifiers (LCIDs, written in hex); values are
# "language_TERRITORY" locale strings.  Commented-out rows record identifiers
# for which no locale string is provided.
windows_locale = {
    0x0436: "af_ZA", # Afrikaans
    0x041c: "sq_AL", # Albanian
    0x0484: "gsw_FR",# Alsatian - France
    0x045e: "am_ET", # Amharic - Ethiopia
    0x0401: "ar_SA", # Arabic - Saudi Arabia
    0x0801: "ar_IQ", # Arabic - Iraq
    0x0c01: "ar_EG", # Arabic - Egypt
    0x1001: "ar_LY", # Arabic - Libya
    0x1401: "ar_DZ", # Arabic - Algeria
    0x1801: "ar_MA", # Arabic - Morocco
    0x1c01: "ar_TN", # Arabic - Tunisia
    0x2001: "ar_OM", # Arabic - Oman
    0x2401: "ar_YE", # Arabic - Yemen
    0x2801: "ar_SY", # Arabic - Syria
    0x2c01: "ar_JO", # Arabic - Jordan
    0x3001: "ar_LB", # Arabic - Lebanon
    0x3401: "ar_KW", # Arabic - Kuwait
    0x3801: "ar_AE", # Arabic - United Arab Emirates
    0x3c01: "ar_BH", # Arabic - Bahrain
    0x4001: "ar_QA", # Arabic - Qatar
    0x042b: "hy_AM", # Armenian
    0x044d: "as_IN", # Assamese - India
    0x042c: "az_AZ", # Azeri - Latin
    0x082c: "az_AZ", # Azeri - Cyrillic
    0x046d: "ba_RU", # Bashkir - Russia
    0x042d: "eu_ES", # Basque
    0x0423: "be_BY", # Belarusian
    0x0445: "bn_IN", # Bengali - India
    0x201a: "bs_BA", # Bosnian - Cyrillic
    0x141a: "bs_BA", # Bosnian - Latin
    0x047e: "br_FR", # Breton - France
    0x0402: "bg_BG", # Bulgarian
#    0x0455: "my_MM", # Burmese - Not supported
    0x0403: "ca_ES", # Catalan
    0x0004: "zh_CHS",# Chinese - Simplified
    0x0404: "zh_TW", # Chinese - Taiwan
    0x0804: "zh_CN", # Chinese - PRC
    0x0c04: "zh_HK", # Chinese - Hong Kong S.A.R.
    0x1004: "zh_SG", # Chinese - Singapore
    0x1404: "zh_MO", # Chinese - Macao S.A.R.
    0x7c04: "zh_CHT",# Chinese - Traditional
    0x0483: "co_FR", # Corsican - France
    0x041a: "hr_HR", # Croatian
    0x101a: "hr_BA", # Croatian - Bosnia
    0x0405: "cs_CZ", # Czech
    0x0406: "da_DK", # Danish
    0x048c: "gbz_AF",# Dari - Afghanistan
    0x0465: "div_MV",# Divehi - Maldives
    0x0413: "nl_NL", # Dutch - The Netherlands
    0x0813: "nl_BE", # Dutch - Belgium
    0x0409: "en_US", # English - United States
    0x0809: "en_GB", # English - United Kingdom
    0x0c09: "en_AU", # English - Australia
    0x1009: "en_CA", # English - Canada
    0x1409: "en_NZ", # English - New Zealand
    0x1809: "en_IE", # English - Ireland
    0x1c09: "en_ZA", # English - South Africa
    0x2009: "en_JM", # English - Jamaica (ISO 3166 code is JM, not JA)
    0x2409: "en_CB", # English - Caribbean
    0x2809: "en_BZ", # English - Belize
    0x2c09: "en_TT", # English - Trinidad
    0x3009: "en_ZW", # English - Zimbabwe
    0x3409: "en_PH", # English - Philippines
    0x4009: "en_IN", # English - India
    0x4409: "en_MY", # English - Malaysia
    0x4809: "en_SG", # English - Singapore
    0x0425: "et_EE", # Estonian
    0x0438: "fo_FO", # Faroese
    0x0464: "fil_PH",# Filipino
    0x040b: "fi_FI", # Finnish
    0x040c: "fr_FR", # French - France
    0x080c: "fr_BE", # French - Belgium
    0x0c0c: "fr_CA", # French - Canada
    0x100c: "fr_CH", # French - Switzerland
    0x140c: "fr_LU", # French - Luxembourg
    0x180c: "fr_MC", # French - Monaco
    0x0462: "fy_NL", # Frisian - Netherlands
    0x0456: "gl_ES", # Galician
    0x0437: "ka_GE", # Georgian
    0x0407: "de_DE", # German - Germany
    0x0807: "de_CH", # German - Switzerland
    0x0c07: "de_AT", # German - Austria
    0x1007: "de_LU", # German - Luxembourg
    0x1407: "de_LI", # German - Liechtenstein
    0x0408: "el_GR", # Greek
    0x046f: "kl_GL", # Greenlandic - Greenland
    0x0447: "gu_IN", # Gujarati
    0x0468: "ha_NG", # Hausa - Latin
    0x040d: "he_IL", # Hebrew
    0x0439: "hi_IN", # Hindi
    0x040e: "hu_HU", # Hungarian
    0x040f: "is_IS", # Icelandic
    0x0421: "id_ID", # Indonesian
    0x045d: "iu_CA", # Inuktitut - Syllabics
    0x085d: "iu_CA", # Inuktitut - Latin
    0x083c: "ga_IE", # Irish - Ireland
    0x0410: "it_IT", # Italian - Italy
    0x0810: "it_CH", # Italian - Switzerland
    0x0411: "ja_JP", # Japanese
    0x044b: "kn_IN", # Kannada - India
    0x043f: "kk_KZ", # Kazakh
    0x0453: "km_KH", # Khmer - Cambodia (ISO 639 code is km, not kh)
    0x0486: "qut_GT",# K'iche - Guatemala
    0x0487: "rw_RW", # Kinyarwanda - Rwanda
    0x0457: "kok_IN",# Konkani
    0x0412: "ko_KR", # Korean
    0x0440: "ky_KG", # Kyrgyz
    0x0454: "lo_LA", # Lao - Lao PDR
    0x0426: "lv_LV", # Latvian
    0x0427: "lt_LT", # Lithuanian
    0x082e: "dsb_DE",# Lower Sorbian - Germany
    0x046e: "lb_LU", # Luxembourgish
    0x042f: "mk_MK", # FYROM Macedonian
    0x043e: "ms_MY", # Malay - Malaysia
    0x083e: "ms_BN", # Malay - Brunei Darussalam
    0x044c: "ml_IN", # Malayalam - India
    0x043a: "mt_MT", # Maltese
    0x0481: "mi_NZ", # Maori
    0x047a: "arn_CL",# Mapudungun
    0x044e: "mr_IN", # Marathi
    0x047c: "moh_CA",# Mohawk - Canada
    0x0450: "mn_MN", # Mongolian - Cyrillic
    0x0850: "mn_CN", # Mongolian - PRC
    0x0461: "ne_NP", # Nepali
    0x0414: "nb_NO", # Norwegian - Bokmal
    0x0814: "nn_NO", # Norwegian - Nynorsk
    0x0482: "oc_FR", # Occitan - France
    0x0448: "or_IN", # Oriya - India
    0x0463: "ps_AF", # Pashto - Afghanistan
    0x0429: "fa_IR", # Persian
    0x0415: "pl_PL", # Polish
    0x0416: "pt_BR", # Portuguese - Brazil
    0x0816: "pt_PT", # Portuguese - Portugal
    0x0446: "pa_IN", # Punjabi
    0x046b: "quz_BO",# Quechua (Bolivia)
    0x086b: "quz_EC",# Quechua (Ecuador)
    0x0c6b: "quz_PE",# Quechua (Peru)
    0x0418: "ro_RO", # Romanian - Romania
    0x0417: "rm_CH", # Romansh
    0x0419: "ru_RU", # Russian
    0x243b: "smn_FI",# Sami Finland
    0x103b: "smj_NO",# Sami Norway
    0x143b: "smj_SE",# Sami Sweden
    0x043b: "se_NO", # Sami Northern Norway
    0x083b: "se_SE", # Sami Northern Sweden
    0x0c3b: "se_FI", # Sami Northern Finland
    0x203b: "sms_FI",# Sami Skolt
    0x183b: "sma_NO",# Sami Southern Norway
    0x1c3b: "sma_SE",# Sami Southern Sweden
    0x044f: "sa_IN", # Sanskrit
    0x0c1a: "sr_SP", # Serbian - Cyrillic
    0x1c1a: "sr_BA", # Serbian - Bosnia Cyrillic
    0x081a: "sr_SP", # Serbian - Latin
    0x181a: "sr_BA", # Serbian - Bosnia Latin
    0x045b: "si_LK", # Sinhala - Sri Lanka
    0x046c: "ns_ZA", # Northern Sotho
    0x0432: "tn_ZA", # Setswana - Southern Africa
    0x041b: "sk_SK", # Slovak
    0x0424: "sl_SI", # Slovenian
    0x040a: "es_ES", # Spanish - Spain
    0x080a: "es_MX", # Spanish - Mexico
    0x0c0a: "es_ES", # Spanish - Spain (Modern)
    0x100a: "es_GT", # Spanish - Guatemala
    0x140a: "es_CR", # Spanish - Costa Rica
    0x180a: "es_PA", # Spanish - Panama
    0x1c0a: "es_DO", # Spanish - Dominican Republic
    0x200a: "es_VE", # Spanish - Venezuela
    0x240a: "es_CO", # Spanish - Colombia
    0x280a: "es_PE", # Spanish - Peru
    0x2c0a: "es_AR", # Spanish - Argentina
    0x300a: "es_EC", # Spanish - Ecuador
    0x340a: "es_CL", # Spanish - Chile
    0x380a: "es_UY", # Spanish - Uruguay (ISO 3166 code is UY, not UR)
    0x3c0a: "es_PY", # Spanish - Paraguay
    0x400a: "es_BO", # Spanish - Bolivia
    0x440a: "es_SV", # Spanish - El Salvador
    0x480a: "es_HN", # Spanish - Honduras
    0x4c0a: "es_NI", # Spanish - Nicaragua
    0x500a: "es_PR", # Spanish - Puerto Rico
    0x540a: "es_US", # Spanish - United States
#    0x0430: "", # Sutu - Not supported
    0x0441: "sw_KE", # Swahili
    0x041d: "sv_SE", # Swedish - Sweden
    0x081d: "sv_FI", # Swedish - Finland
    0x045a: "syr_SY",# Syriac
    0x0428: "tg_TJ", # Tajik - Cyrillic
    0x085f: "tmz_DZ",# Tamazight - Latin
    0x0449: "ta_IN", # Tamil
    0x0444: "tt_RU", # Tatar
    0x044a: "te_IN", # Telugu
    0x041e: "th_TH", # Thai
    0x0851: "bo_BT", # Tibetan - Bhutan
    0x0451: "bo_CN", # Tibetan - PRC
    0x041f: "tr_TR", # Turkish
    0x0442: "tk_TM", # Turkmen - Cyrillic
    0x0480: "ug_CN", # Uighur - Arabic
    0x0422: "uk_UA", # Ukrainian
    0x042e: "wen_DE",# Upper Sorbian - Germany
    0x0420: "ur_PK", # Urdu
    0x0820: "ur_IN", # Urdu - India
    0x0443: "uz_UZ", # Uzbek - Latin
    0x0843: "uz_UZ", # Uzbek - Cyrillic
    0x042a: "vi_VN", # Vietnamese
    0x0452: "cy_GB", # Welsh
    0x0488: "wo_SN", # Wolof - Senegal
    0x0434: "xh_ZA", # Xhosa - South Africa
    0x0485: "sah_RU",# Yakut - Cyrillic
    0x0478: "ii_CN", # Yi - PRC
    0x046a: "yo_NG", # Yoruba - Nigeria
    0x0435: "zu_ZA", # Zulu
}
2052
def _print_locale():

    """ Test function: print the locale settings visible to this module.

        Writes to stdout, in order: the language/encoding returned by
        getdefaultlocale(), the getlocale() result for every LC_*
        category on entry, the same listing after resetlocale(), and --
        if setlocale(LC_ALL, "") succeeds -- the listing after that
        call.  If it fails with Error, a short note is printed instead.

        The function calls resetlocale() and setlocale(), so the locale
        of the running process is changed as a side effect.
    """
    # Every print below uses the single-argument print(...) form, which
    # produces the same output as a Python 2 statement and as a function.

    # Gather all LC_* constants defined at module level; LC_ALL is removed
    # so that only the individual categories are listed.
    categories = dict((key, value) for key, value in globals().items()
                      if key[:3] == 'LC_')
    del categories['LC_ALL']

    def _dump(title, prepare=None):
        # Print one section: heading, rule, then language/encoding for
        # each category.  'prepare', if given, runs after the heading so
        # the heading is already visible should it raise.
        print(title)
        print('-'*72)
        if prepare is not None:
            prepare()
        for name, category in categories.items():
            print('%s ...' % name)
            lang, enc = getlocale(category)
            print(' Language:  %s' % (lang or '(undefined)'))
            print(' Encoding:  %s' % (enc or '(undefined)'))
            print('')

    print('Locale defaults as determined by getdefaultlocale():')
    print('-'*72)
    lang, enc = getdefaultlocale()
    print('Language:  %s' % (lang or '(undefined)'))
    print('Encoding:  %s' % (enc or '(undefined)'))
    print('')

    _dump('Locale settings on startup:')

    print('')
    _dump('Locale settings after calling resetlocale():', resetlocale)

    try:
        setlocale(LC_ALL, "")
    except Error:
        # Only the module's own Error is treated as "unsupported locale";
        # KeyboardInterrupt, SystemExit and programming errors propagate.
        print('NOTE:')
        print('setlocale(LC_ALL, "") does not support the default locale')
        print('given in the OS environment variables.')
    else:
        print('')
        _dump('Locale settings after calling setlocale(LC_ALL, ""):')
Fredrik Lundh6c86b992000-07-09 17:12:58 +00002108
Marc-André Lemburg5431bc32000-06-07 09:11:40 +00002109###
Guido van Rossumeef1d4e1997-11-19 19:01:43 +00002110
# LC_MESSAGES is non-standard, so it may or may not have been defined above.
# Export it through __all__ only when this module actually has it.
if 'LC_MESSAGES' in globals():
    __all__.append("LC_MESSAGES")
2117
if __name__ == '__main__':
    # Script entry point: run _print_locale() and then _test(), each under
    # its own heading.  print('') emits the same blank line as a bare
    # Python 2 print statement.
    print('Locale aliasing:')
    print('')
    _print_locale()
    print('')
    print('Number formatting:')
    print('')
    _test()
2125 _test()