Lib/locale.py - platform/external/python/cpython2 - Gitiles

 """ Locale support.

     The module provides low-level access to the C lib's locale APIs
     and adds high level number formatting APIs as well as a locale
     aliasing engine to complement these.

     The aliasing engine includes support for many commonly used locale
     names and maps them to values suitable for passing to the C lib's
     setlocale() function. It also includes default encodings for all
     supported locale names.

 """

 import string

 ### Load C lib locale APIs or use an emulation

 try:
     from _locale import *

 except ImportError:

     CHAR_MAX = 127
     LC_ALL = 6
     LC_COLLATE = 3
     LC_CTYPE = 0
     LC_MESSAGES = 5
     LC_MONETARY = 4
     LC_NUMERIC = 1
     LC_TIME = 2
     Error = ValueError

     def localeconv():
         """ localeconv() -> dict.
             Returns numeric and monetary locale-specific parameters.
         """
         # 'C' locale default values
         return {'grouping': [127],
                 'currency_symbol': '',
                 'n_sign_posn': 127,
                 'p_cs_precedes': 127,
                 'n_cs_precedes': 127,
                 'mon_grouping': [],
                 'n_sep_by_space': 127,
                 'decimal_point': '.',
                 'negative_sign': '',
                 'positive_sign': '',
                 'p_sep_by_space': 127,
                 'int_curr_symbol': '',
                 'p_sign_posn': 127,
                 'thousands_sep': '',
                 'mon_thousands_sep': '',
                 'frac_digits': 127,
                 'mon_decimal_point': '',
                 'int_frac_digits': 127}

     def setlocale(category, value=None):
         """ setlocale(integer,string=None) -> string.
             Activates/queries locale processing.
         """
         if value is not None and \
            value is not 'C':
             raise Error,'_locale emulation only supports "C" locale'
         return 'C'

     def strcoll(a,b):
         """ strcoll(string,string) -> int.
             Compares two strings according to the locale.
         """
         return cmp(a,b)

     def strxfrm(s):
         """ strxfrm(string) -> string.
             Returns a string that behaves for cmp locale-aware.
         """
         return s

 ### Number formatting APIs

 # Author: Martin von Loewis

 #perform the grouping from right to left
 def _group(s):
     conv=localeconv()
     grouping=conv['grouping']
     if not grouping:return s
     result=""
     while s and grouping:
         # if grouping is -1, we are done
         if grouping[0]==CHAR_MAX:
             break
         # 0: re-use last group ad infinitum
         elif grouping[0]!=0:
             #process last group
             group=grouping[0]
             grouping=grouping[1:]
         if result:
             result=s[-group:]+conv['thousands_sep']+result
         else:
             result=s[-group:]
         s=s[:-group]
     if not result:
         return s
     if s:
         result=s+conv['thousands_sep']+result
     return result

 def format(f,val,grouping=0):
     """Formats a value in the same way that the % formatting would use,
     but takes the current locale into account.
     Grouping is applied if the third parameter is true."""
     result = f % val
     fields = string.split(result, ".")
     if grouping:
         fields[0]=_group(fields[0])
     if len(fields)==2:
         return fields[0]+localeconv()['decimal_point']+fields[1]
     elif len(fields)==1:
         return fields[0]
     else:
         raise Error,"Too many decimal points in result string"

 def str(val):
     """Convert float to integer, taking the locale into account."""
     return format("%.12g",val)

 def atof(str,func=string.atof):
     "Parses a string as a float according to the locale settings."
     #First, get rid of the grouping
     ts = localeconv()['thousands_sep']
     if ts:
         s=string.split(str,ts)
         str=string.join(s, "")
     #next, replace the decimal point with a dot
     dd = localeconv()['decimal_point']
     if dd:
         s=string.split(str,dd)
         str=string.join(s,'.')
     #finally, parse the string
     return func(str)

 def atoi(str):
     "Converts a string to an integer according to the locale settings."
     return atof(str,string.atoi)

 def _test():
     setlocale(LC_ALL,"")
     #do grouping
     s1=format("%d",123456789,1)
     print s1,"is",atoi(s1)
     #standard formatting
     s1=str(3.14)
     print s1,"is",atof(s1)

 ### Locale name aliasing engine

 # Author: Marc-Andre Lemburg, mal@lemburg.com

 def normalize(localename):

     """ Returns a normalized locale code for the given locale
         name.

         The returned locale code is formatted for use with
         setlocale().

         If normalization fails, the original name is returned
         unchanged.

         If the given encoding is not known, the function defaults to
         the default encoding for the locale code just like setlocale()
         does.

     """
     # Normalize the locale name and extract the encoding
     fullname = string.lower(localename)
     if ':' in fullname:
         # ':' is sometimes used as encoding delimiter.
         fullname = string.replace(fullname, ':', '.')
     if '.' in fullname:
         langname, encoding = string.split(fullname, '.')[:2]
         fullname = langname + '.' + encoding
     else:
         langname = fullname
         encoding = ''

     # First lookup: fullname (possibly with encoding)
     code = locale_alias.get(fullname, None)
     if code is not None:
         return code

     # Second try: langname (without encoding)
     code = locale_alias.get(langname, None)
     if code is not None:
         if '.' in code:
             langname, defenc = string.split(code, '.')
         else:
             langname = code
             defenc = ''
         if encoding:
             encoding = encoding_alias.get(encoding, encoding)
         else:
             encoding = defenc
         if encoding:
             return langname + '.' + encoding
         else:
             return langname

     else:
         return localename

 def _parse_localename(localename):

     """ Parses the locale code for localename and returns the
         result as tuple (language code, encoding).

         The localename is normalized and passed through the locale
         alias engine. A ValueError is raised in case the locale name
         cannot be parsed.

         The language code corresponds to RFC 1766.  code and encoding
         can be None in case the values cannot be determined or are
         unkown to this implementation.

     """
     code = normalize(localename)
     if '.' in code:
         return string.split(code, '.')[:2]
     elif code == 'C':
         return None, None
     else:
         raise ValueError,'unkown locale: %s' % localename
     return l

 def _build_localename(localetuple):

     """ Builds a locale code from the given tuple (language code,
         encoding).

         No aliasing or normalizing takes place.

     """
     language, encoding = localetuple
     if language is None:
         language = 'C'
     if encoding is None:
         return language
     else:
         return language + '.' + encoding

 def get_default(envvars=('LANGUAGE', 'LC_ALL', 'LC_CTYPE', 'LANG')):

     """ Tries to determine the default locale settings and returns
         them as tuple (language code, encoding).

         According to POSIX, a program which has not called
         setlocale(LC_ALL,"") runs using the portable 'C' locale.
         Calling setlocale(LC_ALL,"") lets it use the default locale as
         defined by the LANG variable. Since we don't want to interfere
         with the current locale setting we thus emulate the behaviour
         in the way described above.

         To maintain compatibility with other platforms, not only the
         LANG variable is tested, but a list of variables given as
         envvars parameter. The first found to be defined will be
         used. envvars defaults to the search path used in GNU gettext;
         it must always contain the variable name 'LANG'.

         Except for the code 'C', the language code corresponds to RFC
         1766.  code and encoding can be None in case the values cannot
         be determined.

     """
     import os
     lookup = os.environ.get
     for variable in envvars:
         localename = lookup(variable,None)
         if localename is not None:
             break
     else:
         localename = 'C'
     return _parse_localename(localename)

 def get_locale(category=LC_CTYPE):

     """ Returns the current setting for the given locale category as
         tuple (language code, encoding).

         category may be one of the LC_* value except LC_ALL. It
         defaults to LC_CTYPE.

         Except for the code 'C', the language code corresponds to RFC
         1766.  code and encoding can be None in case the values cannot
         be determined.

     """
     localename = setlocale(category)
     if category == LC_ALL and ';' in localename:
         raise TypeError,'category LC_ALL is not supported'
     return _parse_localename(localename)

 def set_locale(localetuple, category=LC_ALL):

     """ Set the locale according to the localetuple (language code,
         encoding) as returned by get_locale() and get_default().

         The given codes are passed through the locale aliasing engine
         before being given to setlocale() for processing.

         category may be given as one of the LC_* values. It defaults
         to LC_ALL.

     """
     setlocale(category, normalize(_build_localename(localetuple)))

 def set_to_default(category=LC_ALL):

     """ Sets the locale for category to the default setting.

         The default setting is determined by calling
         get_default(). category defaults to LC_ALL.

     """
     setlocale(category, _build_localename(get_default()))

 ### Database
 #
 # The following data was extracted from the locale.alias file which
 # comes with X11 and then hand edited removing the explicit encoding
 # definitions and adding some more aliases. The file is usually
 # available as /usr/lib/X11/locale/locale.alias.
 #

 #
 # The encoding_alias table maps lowercase encoding alias names to C
 # locale encoding names (case-sensitive).
 #
 encoding_alias = {
         '437': 				'C',
         'c': 				'C',
         'iso8859': 			'ISO8859-1',
         '8859': 			'ISO8859-1',
         '88591': 			'ISO8859-1',
         'ascii': 			'ISO8859-1',
         'en': 				'ISO8859-1',
         'iso88591': 			'ISO8859-1',
         'iso_8859-1': 			'ISO8859-1',
         '885915': 			'ISO8859-15',
         'iso885915': 			'ISO8859-15',
         'iso_8859-15': 			'ISO8859-15',
         'iso8859-2': 			'ISO8859-2',
         'iso88592': 			'ISO8859-2',
         'iso_8859-2': 			'ISO8859-2',
         'iso88595': 			'ISO8859-5',
         'iso88596': 			'ISO8859-6',
         'iso88597': 			'ISO8859-7',
         'iso88598': 			'ISO8859-8',
         'iso88599': 			'ISO8859-9',
         'iso-2022-jp': 			'JIS7',
         'jis': 				'JIS7',
         'jis7': 			'JIS7',
         'sjis': 			'SJIS',
         'tis620': 			'TACTIS',
         'ajec': 			'eucJP',
         'eucjp': 			'eucJP',
         'ujis': 			'eucJP',
         'utf-8': 			'utf',
         'utf8': 			'utf',
         'utf8@ucs4': 			'utf',
 }

 #
 # The locale_alias table maps lowercase alias names to C locale names
 # (case-sensitive). Encodings are always separated from the locale
 # name using a dot ('.'); they should only be given in case the
 # language name is needed to interpret the given encoding alias
 # correctly (CJK codes often have this need).
 #
 locale_alias = {
         'american':                      'en_US.ISO8859-1',
         'ar':                            'ar_AA.ISO8859-6',
         'ar_aa':                         'ar_AA.ISO8859-6',
         'ar_sa':                         'ar_SA.ISO8859-6',
         'arabic':                        'ar_AA.ISO8859-6',
         'bg':                            'bg_BG.ISO8859-5',
         'bg_bg':                         'bg_BG.ISO8859-5',
         'bulgarian':                     'bg_BG.ISO8859-5',
         'c-french':                      'fr_CA.ISO8859-1',
         'c':                             'C',
         'c_c':                           'C',
         'cextend':                       'en_US.ISO8859-1',
         'chinese-s':                     'zh_CN.eucCN',
         'chinese-t':                     'zh_TW.eucTW',
         'croatian':                      'hr_HR.ISO8859-2',
         'cs':                            'cs_CZ.ISO8859-2',
         'cs_cs':                         'cs_CZ.ISO8859-2',
         'cs_cz':                         'cs_CZ.ISO8859-2',
         'cz':                            'cz_CZ.ISO8859-2',
         'cz_cz':                         'cz_CZ.ISO8859-2',
         'czech':                         'cs_CS.ISO8859-2',
         'da':                            'da_DK.ISO8859-1',
         'da_dk':                         'da_DK.ISO8859-1',
         'danish':                        'da_DK.ISO8859-1',
         'de':                            'de_DE.ISO8859-1',
         'de_at':                         'de_AT.ISO8859-1',
         'de_ch':                         'de_CH.ISO8859-1',
         'de_de':                         'de_DE.ISO8859-1',
         'dutch':                         'nl_BE.ISO8859-1',
         'ee':                            'ee_EE.ISO8859-4',
         'el':                            'el_GR.ISO8859-7',
         'el_gr':                         'el_GR.ISO8859-7',
         'en':                            'en_US.ISO8859-1',
         'en_au':                         'en_AU.ISO8859-1',
         'en_ca':                         'en_CA.ISO8859-1',
         'en_gb':                         'en_GB.ISO8859-1',
         'en_ie':                         'en_IE.ISO8859-1',
         'en_nz':                         'en_NZ.ISO8859-1',
         'en_uk':                         'en_GB.ISO8859-1',
         'en_us':                         'en_US.ISO8859-1',
         'eng_gb':                        'en_GB.ISO8859-1',
         'english':                       'en_EN.ISO8859-1',
         'english_uk':                    'en_GB.ISO8859-1',
         'english_united-states':         'en_US.ISO8859-1',
         'english_us':                    'en_US.ISO8859-1',
         'es':                            'es_ES.ISO8859-1',
         'es_ar':                         'es_AR.ISO8859-1',
         'es_bo':                         'es_BO.ISO8859-1',
         'es_cl':                         'es_CL.ISO8859-1',
         'es_co':                         'es_CO.ISO8859-1',
         'es_cr':                         'es_CR.ISO8859-1',
         'es_ec':                         'es_EC.ISO8859-1',
         'es_es':                         'es_ES.ISO8859-1',
         'es_gt':                         'es_GT.ISO8859-1',
         'es_mx':                         'es_MX.ISO8859-1',
         'es_ni':                         'es_NI.ISO8859-1',
         'es_pa':                         'es_PA.ISO8859-1',
         'es_pe':                         'es_PE.ISO8859-1',
         'es_py':                         'es_PY.ISO8859-1',
         'es_sv':                         'es_SV.ISO8859-1',
         'es_uy':                         'es_UY.ISO8859-1',
         'es_ve':                         'es_VE.ISO8859-1',
         'et':                            'et_EE.ISO8859-4',
         'et_ee':                         'et_EE.ISO8859-4',
         'fi':                            'fi_FI.ISO8859-1',
         'fi_fi':                         'fi_FI.ISO8859-1',
         'finnish':                       'fi_FI.ISO8859-1',
         'fr':                            'fr_FR.ISO8859-1',
         'fr_be':                         'fr_BE.ISO8859-1',
         'fr_ca':                         'fr_CA.ISO8859-1',
         'fr_ch':                         'fr_CH.ISO8859-1',
         'fr_fr':                         'fr_FR.ISO8859-1',
         'fre_fr':                        'fr_FR.ISO8859-1',
         'french':                        'fr_FR.ISO8859-1',
         'french_france':                 'fr_FR.ISO8859-1',
         'ger_de':                        'de_DE.ISO8859-1',
         'german':                        'de_DE.ISO8859-1',
         'german_germany':                'de_DE.ISO8859-1',
         'greek':                         'el_GR.ISO8859-7',
         'hebrew':                        'iw_IL.ISO8859-8',
         'hr':                            'hr_HR.ISO8859-2',
         'hr_hr':                         'hr_HR.ISO8859-2',
         'hu':                            'hu_HU.ISO8859-2',
         'hu_hu':                         'hu_HU.ISO8859-2',
         'hungarian':                     'hu_HU.ISO8859-2',
         'icelandic':                     'is_IS.ISO8859-1',
         'id':                            'id_ID.ISO8859-1',
         'id_id':                         'id_ID.ISO8859-1',
         'is':                            'is_IS.ISO8859-1',
         'is_is':                         'is_IS.ISO8859-1',
         'iso-8859-1':                    'en_US.ISO8859-1',
         'iso-8859-15':                   'en_US.ISO8859-15',
         'iso8859-1':                     'en_US.ISO8859-1',
         'iso8859-15':                    'en_US.ISO8859-15',
         'iso_8859_1':                    'en_US.ISO8859-1',
         'iso_8859_15':                   'en_US.ISO8859-15',
         'it':                            'it_IT.ISO8859-1',
         'it_ch':                         'it_CH.ISO8859-1',
         'it_it':                         'it_IT.ISO8859-1',
         'italian':                       'it_IT.ISO8859-1',
         'iw':                            'iw_IL.ISO8859-8',
         'iw_il':                         'iw_IL.ISO8859-8',
         'ja':                            'ja_JP.eucJP',
         'ja.jis':                        'ja_JP.JIS7',
         'ja.sjis':                       'ja_JP.SJIS',
         'ja_jp':                         'ja_JP.eucJP',
         'ja_jp.ajec':                    'ja_JP.eucJP',
         'ja_jp.euc':                     'ja_JP.eucJP',
         'ja_jp.eucjp':                   'ja_JP.eucJP',
         'ja_jp.iso-2022-jp':             'ja_JP.JIS7',
         'ja_jp.jis':                     'ja_JP.JIS7',
         'ja_jp.jis7':                    'ja_JP.JIS7',
         'ja_jp.mscode':                  'ja_JP.SJIS',
         'ja_jp.sjis':                    'ja_JP.SJIS',
         'ja_jp.ujis':                    'ja_JP.eucJP',
         'japan':                         'ja_JP.eucJP',
         'japanese':                      'ja_JP.SJIS',
         'japanese-euc':                  'ja_JP.eucJP',
         'japanese.euc':                  'ja_JP.eucJP',
         'jp_jp':                         'ja_JP.eucJP',
         'ko':                            'ko_KR.eucKR',
         'ko_kr':                         'ko_KR.eucKR',
         'ko_kr.euc':                     'ko_KR.eucKR',
         'korean':                        'ko_KR.eucKR',
         'lt':                            'lt_LT.ISO8859-4',
         'lv':                            'lv_LV.ISO8859-4',
         'mk':                            'mk_MK.ISO8859-5',
         'mk_mk':                         'mk_MK.ISO8859-5',
         'nl':                            'nl_NL.ISO8859-1',
         'nl_be':                         'nl_BE.ISO8859-1',
         'nl_nl':                         'nl_NL.ISO8859-1',
         'no':                            'no_NO.ISO8859-1',
         'no_no':                         'no_NO.ISO8859-1',
         'norwegian':                     'no_NO.ISO8859-1',
         'pl':                            'pl_PL.ISO8859-2',
         'pl_pl':                         'pl_PL.ISO8859-2',
         'polish':                        'pl_PL.ISO8859-2',
         'portuguese':                    'pt_PT.ISO8859-1',
         'portuguese_brazil':             'pt_BR.ISO8859-1',
         'posix':                         'C',
         'posix-utf2':                    'C',
         'pt':                            'pt_PT.ISO8859-1',
         'pt_br':                         'pt_BR.ISO8859-1',
         'pt_pt':                         'pt_PT.ISO8859-1',
         'ro':                            'ro_RO.ISO8859-2',
         'ro_ro':                         'ro_RO.ISO8859-2',
         'ru':                            'ru_RU.ISO8859-5',
         'ru_ru':                         'ru_RU.ISO8859-5',
         'rumanian':                      'ro_RO.ISO8859-2',
         'russian':                       'ru_RU.ISO8859-5',
         'serbocroatian':                 'sh_YU.ISO8859-2',
         'sh':                            'sh_YU.ISO8859-2',
         'sh_hr':                         'sh_HR.ISO8859-2',
         'sh_sp':                         'sh_YU.ISO8859-2',
         'sh_yu':                         'sh_YU.ISO8859-2',
         'sk':                            'sk_SK.ISO8859-2',
         'sk_sk':                         'sk_SK.ISO8859-2',
         'sl':                            'sl_CS.ISO8859-2',
         'sl_cs':                         'sl_CS.ISO8859-2',
         'sl_si':                         'sl_SI.ISO8859-2',
         'slovak':                        'sk_SK.ISO8859-2',
         'slovene':                       'sl_CS.ISO8859-2',
         'sp':                            'sp_YU.ISO8859-5',
         'sp_yu':                         'sp_YU.ISO8859-5',
         'spanish':                       'es_ES.ISO8859-1',
         'spanish_spain':                 'es_ES.ISO8859-1',
         'sr_sp':                         'sr_SP.ISO8859-2',
         'sv':                            'sv_SE.ISO8859-1',
         'sv_se':                         'sv_SE.ISO8859-1',
         'swedish':                       'sv_SE.ISO8859-1',
         'th_th':                         'th_TH.TACTIS',
         'tr':                            'tr_TR.ISO8859-9',
         'tr_tr':                         'tr_TR.ISO8859-9',
         'turkish':                       'tr_TR.ISO8859-9',
         'univ':                          'en_US.utf',
         'universal':                     'en_US.utf',
         'zh':                            'zh_CN.eucCN',
         'zh_cn':                         'zh_CN.eucCN',
         'zh_cn.big5':                    'zh_TW.eucTW',
         'zh_cn.euc':                     'zh_CN.eucCN',
         'zh_tw':                         'zh_TW.eucTW',
         'zh_tw.euc':                     'zh_TW.eucTW',
 }

 def _print_locale():

     """ Test function.
     """
     categories = {}
     def _init_categories(categories=categories):
         for k,v in globals().items():
             if k[:3] == 'LC_':
                 categories[k] = v
     _init_categories()
     del categories['LC_ALL']

     print 'Locale defaults as determined by get_default():'
     print '-'*72
     lang, enc = get_default()
     print 'Language: ', lang or '(undefined)'
     print 'Encoding: ', enc or '(undefined)'
     print

     print 'Locale settings on startup:'
     print '-'*72
     for name,category in categories.items():
         print name,'...'
         lang, enc = get_locale(category)
         print '   Language: ', lang or '(undefined)'
         print '   Encoding: ', enc or '(undefined)'
         print

     set_to_default()
     print
     print 'Locale settings after calling set_to_default():'
     print '-'*72
     for name,category in categories.items():
         print name,'...'
         lang, enc = get_locale(category)
         print '   Language: ', lang or '(undefined)'
         print '   Encoding: ', enc or '(undefined)'
         print

     try:
         setlocale(LC_ALL,"")
     except:
         print 'NOTE:'
         print 'setlocale(LC_ALL,"") does not support the default locale'
         print 'given in the OS environment variables.'
     else:
         print
         print 'Locale settings after calling setlocale(LC_ALL,""):'
         print '-'*72
         for name,category in categories.items():
             print name,'...'
             lang, enc = get_locale(category)
             print '   Language: ', lang or '(undefined)'
             print '   Encoding: ', enc or '(undefined)'
             print

 ###

 if __name__=='__main__':
     print 'Locale aliasing:'
     print
     _print_locale()
     print
     print 'Number formatting:'
     print
     _test()
	""" Locale support.

	The module provides low-level access to the C lib's locale APIs
	and adds high level number formatting APIs as well as a locale
	aliasing engine to complement these.

	The aliasing engine includes support for many commonly used locale
	names and maps them to values suitable for passing to the C lib's
	setlocale() function. It also includes default encodings for all
	supported locale names.

	"""

	import string

	### Load C lib locale APIs or use an emulation

	try:
	from _locale import *

	except ImportError:

	CHAR_MAX = 127
	LC_ALL = 6
	LC_COLLATE = 3
	LC_CTYPE = 0
	LC_MESSAGES = 5
	LC_MONETARY = 4
	LC_NUMERIC = 1
	LC_TIME = 2
	Error = ValueError

	def localeconv():
	""" localeconv() -> dict.
	Returns numeric and monetary locale-specific parameters.
	"""
	# 'C' locale default values
	return {'grouping': [127],
	'currency_symbol': '',
	'n_sign_posn': 127,
	'p_cs_precedes': 127,
	'n_cs_precedes': 127,
	'mon_grouping': [],
	'n_sep_by_space': 127,
	'decimal_point': '.',
	'negative_sign': '',
	'positive_sign': '',
	'p_sep_by_space': 127,
	'int_curr_symbol': '',
	'p_sign_posn': 127,
	'thousands_sep': '',
	'mon_thousands_sep': '',
	'frac_digits': 127,
	'mon_decimal_point': '',
	'int_frac_digits': 127}

	def setlocale(category, value=None):
	""" setlocale(integer,string=None) -> string.
	Activates/queries locale processing.
	"""
	if value is not None and \
	value is not 'C':
	raise Error,'_locale emulation only supports "C" locale'
	return 'C'

	def strcoll(a,b):
	""" strcoll(string,string) -> int.
	Compares two strings according to the locale.
	"""
	return cmp(a,b)

	def strxfrm(s):
	""" strxfrm(string) -> string.
	Returns a string that behaves for cmp locale-aware.
	"""
	return s

	### Number formatting APIs

	# Author: Martin von Loewis

	#perform the grouping from right to left
	def _group(s):
	conv=localeconv()
	grouping=conv['grouping']
	if not grouping:return s
	result=""
	while s and grouping:
	# if grouping is -1, we are done
	if grouping[0]==CHAR_MAX:
	break
	# 0: re-use last group ad infinitum
	elif grouping[0]!=0:
	#process last group
	group=grouping[0]
	grouping=grouping[1:]
	if result:
	result=s[-group:]+conv['thousands_sep']+result
	else:
	result=s[-group:]
	s=s[:-group]
	if not result:
	return s
	if s:
	result=s+conv['thousands_sep']+result
	return result

	def format(f,val,grouping=0):
	"""Formats a value in the same way that the % formatting would use,
	but takes the current locale into account.
	Grouping is applied if the third parameter is true."""
	result = f % val
	fields = string.split(result, ".")
	if grouping:
	fields[0]=_group(fields[0])
	if len(fields)==2:
	return fields[0]+localeconv()['decimal_point']+fields[1]
	elif len(fields)==1:
	return fields[0]
	else:
	raise Error,"Too many decimal points in result string"

	def str(val):
	"""Convert float to integer, taking the locale into account."""
	return format("%.12g",val)

	def atof(str,func=string.atof):
	"Parses a string as a float according to the locale settings."
	#First, get rid of the grouping
	ts = localeconv()['thousands_sep']
	if ts:
	s=string.split(str,ts)
	str=string.join(s, "")
	#next, replace the decimal point with a dot
	dd = localeconv()['decimal_point']
	if dd:
	s=string.split(str,dd)
	str=string.join(s,'.')
	#finally, parse the string
	return func(str)

	def atoi(str):
	"Converts a string to an integer according to the locale settings."
	return atof(str,string.atoi)

	def _test():
	setlocale(LC_ALL,"")
	#do grouping
	s1=format("%d",123456789,1)
	print s1,"is",atoi(s1)
	#standard formatting
	s1=str(3.14)
	print s1,"is",atof(s1)

	### Locale name aliasing engine

	# Author: Marc-Andre Lemburg, mal@lemburg.com

	def normalize(localename):

	""" Returns a normalized locale code for the given locale
	name.

	The returned locale code is formatted for use with
	setlocale().

	If normalization fails, the original name is returned
	unchanged.

	If the given encoding is not known, the function defaults to
	the default encoding for the locale code just like setlocale()
	does.

	"""
	# Normalize the locale name and extract the encoding
	fullname = string.lower(localename)
	if ':' in fullname:
	# ':' is sometimes used as encoding delimiter.
	fullname = string.replace(fullname, ':', '.')
	if '.' in fullname:
	langname, encoding = string.split(fullname, '.')[:2]
	fullname = langname + '.' + encoding
	else:
	langname = fullname
	encoding = ''

	# First lookup: fullname (possibly with encoding)
	code = locale_alias.get(fullname, None)
	if code is not None:
	return code

	# Second try: langname (without encoding)
	code = locale_alias.get(langname, None)
	if code is not None:
	if '.' in code:
	langname, defenc = string.split(code, '.')
	else:
	langname = code
	defenc = ''
	if encoding:
	encoding = encoding_alias.get(encoding, encoding)
	else:
	encoding = defenc
	if encoding:
	return langname + '.' + encoding
	else:
	return langname

	else:
	return localename

	def _parse_localename(localename):

	""" Parses the locale code for localename and returns the
	result as tuple (language code, encoding).

	The localename is normalized and passed through the locale
	alias engine. A ValueError is raised in case the locale name
	cannot be parsed.

	The language code corresponds to RFC 1766. code and encoding
	can be None in case the values cannot be determined or are
	unkown to this implementation.

	"""
	code = normalize(localename)
	if '.' in code:
	return string.split(code, '.')[:2]
	elif code == 'C':
	return None, None
	else:
	raise ValueError,'unkown locale: %s' % localename
	return l

	def _build_localename(localetuple):

	""" Builds a locale code from the given tuple (language code,
	encoding).

	No aliasing or normalizing takes place.

	"""
	language, encoding = localetuple
	if language is None:
	language = 'C'
	if encoding is None:
	return language
	else:
	return language + '.' + encoding

	def get_default(envvars=('LANGUAGE', 'LC_ALL', 'LC_CTYPE', 'LANG')):

	""" Tries to determine the default locale settings and returns
	them as tuple (language code, encoding).

	According to POSIX, a program which has not called
	setlocale(LC_ALL,"") runs using the portable 'C' locale.
	Calling setlocale(LC_ALL,"") lets it use the default locale as
	defined by the LANG variable. Since we don't want to interfere
	with the current locale setting we thus emulate the behaviour
	in the way described above.

	To maintain compatibility with other platforms, not only the
	LANG variable is tested, but a list of variables given as
	envvars parameter. The first found to be defined will be
	used. envvars defaults to the search path used in GNU gettext;
	it must always contain the variable name 'LANG'.

	Except for the code 'C', the language code corresponds to RFC
	1766. code and encoding can be None in case the values cannot
	be determined.

	"""
	import os
	lookup = os.environ.get
	for variable in envvars:
	localename = lookup(variable,None)
	if localename is not None:
	break
	else:
	localename = 'C'
	return _parse_localename(localename)

	def get_locale(category=LC_CTYPE):

	""" Returns the current setting for the given locale category as
	tuple (language code, encoding).

	category may be one of the LC_* value except LC_ALL. It
	defaults to LC_CTYPE.

	Except for the code 'C', the language code corresponds to RFC
	1766. code and encoding can be None in case the values cannot
	be determined.

	"""
	localename = setlocale(category)
	if category == LC_ALL and ';' in localename:
	raise TypeError,'category LC_ALL is not supported'
	return _parse_localename(localename)

	def set_locale(localetuple, category=LC_ALL):

	""" Set the locale according to the localetuple (language code,
	encoding) as returned by get_locale() and get_default().

	The given codes are passed through the locale aliasing engine
	before being given to setlocale() for processing.

	category may be given as one of the LC_* values. It defaults
	to LC_ALL.

	"""
	setlocale(category, normalize(_build_localename(localetuple)))

	def set_to_default(category=LC_ALL):

	""" Sets the locale for category to the default setting.

	The default setting is determined by calling
	get_default(). category defaults to LC_ALL.

	"""
	setlocale(category, _build_localename(get_default()))

	### Database
	#
	# The following data was extracted from the locale.alias file which
	# comes with X11 and then hand edited removing the explicit encoding
	# definitions and adding some more aliases. The file is usually
	# available as /usr/lib/X11/locale/locale.alias.
	#

	#
	# The encoding_alias table maps lowercase encoding alias names to C
	# locale encoding names (case-sensitive).
	#
	encoding_alias = {
	'437': 'C',
	'c': 'C',
	'iso8859': 'ISO8859-1',
	'8859': 'ISO8859-1',
	'88591': 'ISO8859-1',
	'ascii': 'ISO8859-1',
	'en': 'ISO8859-1',
	'iso88591': 'ISO8859-1',
	'iso_8859-1': 'ISO8859-1',
	'885915': 'ISO8859-15',
	'iso885915': 'ISO8859-15',
	'iso_8859-15': 'ISO8859-15',
	'iso8859-2': 'ISO8859-2',
	'iso88592': 'ISO8859-2',
	'iso_8859-2': 'ISO8859-2',
	'iso88595': 'ISO8859-5',
	'iso88596': 'ISO8859-6',
	'iso88597': 'ISO8859-7',
	'iso88598': 'ISO8859-8',
	'iso88599': 'ISO8859-9',
	'iso-2022-jp': 'JIS7',
	'jis': 'JIS7',
	'jis7': 'JIS7',
	'sjis': 'SJIS',
	'tis620': 'TACTIS',
	'ajec': 'eucJP',
	'eucjp': 'eucJP',
	'ujis': 'eucJP',
	'utf-8': 'utf',
	'utf8': 'utf',
	'utf8@ucs4': 'utf',
	}

	#
	# The locale_alias table maps lowercase alias names to C locale names
	# (case-sensitive). Encodings are always separated from the locale
	# name using a dot ('.'); they should only be given in case the
	# language name is needed to interpret the given encoding alias
	# correctly (CJK codes often have this need).
	#
	locale_alias = {
	'american': 'en_US.ISO8859-1',
	'ar': 'ar_AA.ISO8859-6',
	'ar_aa': 'ar_AA.ISO8859-6',
	'ar_sa': 'ar_SA.ISO8859-6',
	'arabic': 'ar_AA.ISO8859-6',
	'bg': 'bg_BG.ISO8859-5',
	'bg_bg': 'bg_BG.ISO8859-5',
	'bulgarian': 'bg_BG.ISO8859-5',
	'c-french': 'fr_CA.ISO8859-1',
	'c': 'C',
	'c_c': 'C',
	'cextend': 'en_US.ISO8859-1',
	'chinese-s': 'zh_CN.eucCN',
	'chinese-t': 'zh_TW.eucTW',
	'croatian': 'hr_HR.ISO8859-2',
	'cs': 'cs_CZ.ISO8859-2',
	'cs_cs': 'cs_CZ.ISO8859-2',
	'cs_cz': 'cs_CZ.ISO8859-2',
	'cz': 'cz_CZ.ISO8859-2',
	'cz_cz': 'cz_CZ.ISO8859-2',
	'czech': 'cs_CS.ISO8859-2',
	'da': 'da_DK.ISO8859-1',
	'da_dk': 'da_DK.ISO8859-1',
	'danish': 'da_DK.ISO8859-1',
	'de': 'de_DE.ISO8859-1',
	'de_at': 'de_AT.ISO8859-1',
	'de_ch': 'de_CH.ISO8859-1',
	'de_de': 'de_DE.ISO8859-1',
	'dutch': 'nl_BE.ISO8859-1',
	'ee': 'ee_EE.ISO8859-4',
	'el': 'el_GR.ISO8859-7',
	'el_gr': 'el_GR.ISO8859-7',
	'en': 'en_US.ISO8859-1',
	'en_au': 'en_AU.ISO8859-1',
	'en_ca': 'en_CA.ISO8859-1',
	'en_gb': 'en_GB.ISO8859-1',
	'en_ie': 'en_IE.ISO8859-1',
	'en_nz': 'en_NZ.ISO8859-1',
	'en_uk': 'en_GB.ISO8859-1',
	'en_us': 'en_US.ISO8859-1',
	'eng_gb': 'en_GB.ISO8859-1',
	'english': 'en_EN.ISO8859-1',
	'english_uk': 'en_GB.ISO8859-1',
	'english_united-states': 'en_US.ISO8859-1',
	'english_us': 'en_US.ISO8859-1',
	'es': 'es_ES.ISO8859-1',
	'es_ar': 'es_AR.ISO8859-1',
	'es_bo': 'es_BO.ISO8859-1',
	'es_cl': 'es_CL.ISO8859-1',
	'es_co': 'es_CO.ISO8859-1',
	'es_cr': 'es_CR.ISO8859-1',
	'es_ec': 'es_EC.ISO8859-1',
	'es_es': 'es_ES.ISO8859-1',
	'es_gt': 'es_GT.ISO8859-1',
	'es_mx': 'es_MX.ISO8859-1',
	'es_ni': 'es_NI.ISO8859-1',
	'es_pa': 'es_PA.ISO8859-1',
	'es_pe': 'es_PE.ISO8859-1',
	'es_py': 'es_PY.ISO8859-1',
	'es_sv': 'es_SV.ISO8859-1',
	'es_uy': 'es_UY.ISO8859-1',
	'es_ve': 'es_VE.ISO8859-1',
	'et': 'et_EE.ISO8859-4',
	'et_ee': 'et_EE.ISO8859-4',
	'fi': 'fi_FI.ISO8859-1',
	'fi_fi': 'fi_FI.ISO8859-1',
	'finnish': 'fi_FI.ISO8859-1',
	'fr': 'fr_FR.ISO8859-1',
	'fr_be': 'fr_BE.ISO8859-1',
	'fr_ca': 'fr_CA.ISO8859-1',
	'fr_ch': 'fr_CH.ISO8859-1',
	'fr_fr': 'fr_FR.ISO8859-1',
	'fre_fr': 'fr_FR.ISO8859-1',
	'french': 'fr_FR.ISO8859-1',
	'french_france': 'fr_FR.ISO8859-1',
	'ger_de': 'de_DE.ISO8859-1',
	'german': 'de_DE.ISO8859-1',
	'german_germany': 'de_DE.ISO8859-1',
	'greek': 'el_GR.ISO8859-7',
	'hebrew': 'iw_IL.ISO8859-8',
	'hr': 'hr_HR.ISO8859-2',
	'hr_hr': 'hr_HR.ISO8859-2',
	'hu': 'hu_HU.ISO8859-2',
	'hu_hu': 'hu_HU.ISO8859-2',
	'hungarian': 'hu_HU.ISO8859-2',
	'icelandic': 'is_IS.ISO8859-1',
	'id': 'id_ID.ISO8859-1',
	'id_id': 'id_ID.ISO8859-1',
	'is': 'is_IS.ISO8859-1',
	'is_is': 'is_IS.ISO8859-1',
	'iso-8859-1': 'en_US.ISO8859-1',
	'iso-8859-15': 'en_US.ISO8859-15',
	'iso8859-1': 'en_US.ISO8859-1',
	'iso8859-15': 'en_US.ISO8859-15',
	'iso_8859_1': 'en_US.ISO8859-1',
	'iso_8859_15': 'en_US.ISO8859-15',
	'it': 'it_IT.ISO8859-1',
	'it_ch': 'it_CH.ISO8859-1',
	'it_it': 'it_IT.ISO8859-1',
	'italian': 'it_IT.ISO8859-1',
	'iw': 'iw_IL.ISO8859-8',
	'iw_il': 'iw_IL.ISO8859-8',
	'ja': 'ja_JP.eucJP',
	'ja.jis': 'ja_JP.JIS7',
	'ja.sjis': 'ja_JP.SJIS',
	'ja_jp': 'ja_JP.eucJP',
	'ja_jp.ajec': 'ja_JP.eucJP',
	'ja_jp.euc': 'ja_JP.eucJP',
	'ja_jp.eucjp': 'ja_JP.eucJP',
	'ja_jp.iso-2022-jp': 'ja_JP.JIS7',
	'ja_jp.jis': 'ja_JP.JIS7',
	'ja_jp.jis7': 'ja_JP.JIS7',
	'ja_jp.mscode': 'ja_JP.SJIS',
	'ja_jp.sjis': 'ja_JP.SJIS',
	'ja_jp.ujis': 'ja_JP.eucJP',
	'japan': 'ja_JP.eucJP',
	'japanese': 'ja_JP.SJIS',
	'japanese-euc': 'ja_JP.eucJP',
	'japanese.euc': 'ja_JP.eucJP',
	'jp_jp': 'ja_JP.eucJP',
	'ko': 'ko_KR.eucKR',
	'ko_kr': 'ko_KR.eucKR',
	'ko_kr.euc': 'ko_KR.eucKR',
	'korean': 'ko_KR.eucKR',
	'lt': 'lt_LT.ISO8859-4',
	'lv': 'lv_LV.ISO8859-4',
	'mk': 'mk_MK.ISO8859-5',
	'mk_mk': 'mk_MK.ISO8859-5',
	'nl': 'nl_NL.ISO8859-1',
	'nl_be': 'nl_BE.ISO8859-1',
	'nl_nl': 'nl_NL.ISO8859-1',
	'no': 'no_NO.ISO8859-1',
	'no_no': 'no_NO.ISO8859-1',
	'norwegian': 'no_NO.ISO8859-1',
	'pl': 'pl_PL.ISO8859-2',
	'pl_pl': 'pl_PL.ISO8859-2',
	'polish': 'pl_PL.ISO8859-2',
	'portuguese': 'pt_PT.ISO8859-1',
	'portuguese_brazil': 'pt_BR.ISO8859-1',
	'posix': 'C',
	'posix-utf2': 'C',
	'pt': 'pt_PT.ISO8859-1',
	'pt_br': 'pt_BR.ISO8859-1',
	'pt_pt': 'pt_PT.ISO8859-1',
	'ro': 'ro_RO.ISO8859-2',
	'ro_ro': 'ro_RO.ISO8859-2',
	'ru': 'ru_RU.ISO8859-5',
	'ru_ru': 'ru_RU.ISO8859-5',
	'rumanian': 'ro_RO.ISO8859-2',
	'russian': 'ru_RU.ISO8859-5',
	'serbocroatian': 'sh_YU.ISO8859-2',
	'sh': 'sh_YU.ISO8859-2',
	'sh_hr': 'sh_HR.ISO8859-2',
	'sh_sp': 'sh_YU.ISO8859-2',
	'sh_yu': 'sh_YU.ISO8859-2',
	'sk': 'sk_SK.ISO8859-2',
	'sk_sk': 'sk_SK.ISO8859-2',
	'sl': 'sl_CS.ISO8859-2',
	'sl_cs': 'sl_CS.ISO8859-2',
	'sl_si': 'sl_SI.ISO8859-2',
	'slovak': 'sk_SK.ISO8859-2',
	'slovene': 'sl_CS.ISO8859-2',
	'sp': 'sp_YU.ISO8859-5',
	'sp_yu': 'sp_YU.ISO8859-5',
	'spanish': 'es_ES.ISO8859-1',
	'spanish_spain': 'es_ES.ISO8859-1',
	'sr_sp': 'sr_SP.ISO8859-2',
	'sv': 'sv_SE.ISO8859-1',
	'sv_se': 'sv_SE.ISO8859-1',
	'swedish': 'sv_SE.ISO8859-1',
	'th_th': 'th_TH.TACTIS',
	'tr': 'tr_TR.ISO8859-9',
	'tr_tr': 'tr_TR.ISO8859-9',
	'turkish': 'tr_TR.ISO8859-9',
	'univ': 'en_US.utf',
	'universal': 'en_US.utf',
	'zh': 'zh_CN.eucCN',
	'zh_cn': 'zh_CN.eucCN',
	'zh_cn.big5': 'zh_TW.eucTW',
	'zh_cn.euc': 'zh_CN.eucCN',
	'zh_tw': 'zh_TW.eucTW',
	'zh_tw.euc': 'zh_TW.eucTW',
	}

	def _print_locale():

	""" Test function.
	"""
	categories = {}
	def _init_categories(categories=categories):
	for k,v in globals().items():
	if k[:3] == 'LC_':
	categories[k] = v
	_init_categories()
	del categories['LC_ALL']

	print 'Locale defaults as determined by get_default():'
	print '-'*72
	lang, enc = get_default()
	print 'Language: ', lang or '(undefined)'
	print 'Encoding: ', enc or '(undefined)'
	print

	print 'Locale settings on startup:'
	print '-'*72
	for name,category in categories.items():
	print name,'...'
	lang, enc = get_locale(category)
	print ' Language: ', lang or '(undefined)'
	print ' Encoding: ', enc or '(undefined)'
	print

	set_to_default()
	print
	print 'Locale settings after calling set_to_default():'
	print '-'*72
	for name,category in categories.items():
	print name,'...'
	lang, enc = get_locale(category)
	print ' Language: ', lang or '(undefined)'
	print ' Encoding: ', enc or '(undefined)'
	print

	try:
	setlocale(LC_ALL,"")
	except:
	print 'NOTE:'
	print 'setlocale(LC_ALL,"") does not support the default locale'
	print 'given in the OS environment variables.'
	else:
	print
	print 'Locale settings after calling setlocale(LC_ALL,""):'
	print '-'*72
	for name,category in categories.items():
	print name,'...'
	lang, enc = get_locale(category)
	print ' Language: ', lang or '(undefined)'
	print ' Encoding: ', enc or '(undefined)'
	print

	###

	if __name__=='__main__':
	print 'Locale aliasing:'
	print
	_print_locale()
	print
	print 'Number formatting:'
	print
	_test()