Home | History | Annotate | Download | only in test
      1 from test.test_support import run_unittest, verbose
      2 import unittest
      3 import locale
      4 import sys
      5 import codecs
      6 
      7 
      8 enUS_locale = None
      9 
     10 def get_enUS_locale():
     11     global enUS_locale
     12     if sys.platform == 'darwin':
     13         import os
     14         tlocs = ("en_US.UTF-8", "en_US.ISO8859-1", "en_US")
     15         if int(os.uname()[2].split('.')[0]) < 10:
     16             # The locale test work fine on OSX 10.6, I (ronaldoussoren)
     17             # haven't had time yet to verify if tests work on OSX 10.5
     18             # (10.4 is known to be bad)
     19             raise unittest.SkipTest("Locale support on MacOSX is minimal")
     20     if sys.platform.startswith("win"):
     21         tlocs = ("En", "English")
     22     else:
     23         tlocs = ("en_US.UTF-8", "en_US.US-ASCII", "en_US")
     24     oldlocale = locale.setlocale(locale.LC_NUMERIC)
     25     for tloc in tlocs:
     26         try:
     27             locale.setlocale(locale.LC_NUMERIC, tloc)
     28         except locale.Error:
     29             continue
     30         break
     31     else:
     32         raise unittest.SkipTest(
     33             "Test locale not supported (tried %s)" % (', '.join(tlocs)))
     34     enUS_locale = tloc
     35     locale.setlocale(locale.LC_NUMERIC, oldlocale)
     36 
     37 
     38 class BaseLocalizedTest(unittest.TestCase):
     39     #
     40     # Base class for tests using a real locale
     41     #
     42 
     43     def setUp(self):
     44         self.oldlocale = locale.setlocale(self.locale_type)
     45         locale.setlocale(self.locale_type, enUS_locale)
     46         if verbose:
     47             print "testing with \"%s\"..." % enUS_locale,
     48 
     49     def tearDown(self):
     50         locale.setlocale(self.locale_type, self.oldlocale)
     51 
     52 
     53 class BaseCookedTest(unittest.TestCase):
     54     #
     55     # Base class for tests using cooked localeconv() values
     56     #
     57 
     58     def setUp(self):
     59         locale._override_localeconv = self.cooked_values
     60 
     61     def tearDown(self):
     62         locale._override_localeconv = {}
     63 
     64 
     65 class CCookedTest(BaseCookedTest):
     66     # A cooked "C" locale
     67 
     68     cooked_values = {
     69         'currency_symbol': '',
     70         'decimal_point': '.',
     71         'frac_digits': 127,
     72         'grouping': [],
     73         'int_curr_symbol': '',
     74         'int_frac_digits': 127,
     75         'mon_decimal_point': '',
     76         'mon_grouping': [],
     77         'mon_thousands_sep': '',
     78         'n_cs_precedes': 127,
     79         'n_sep_by_space': 127,
     80         'n_sign_posn': 127,
     81         'negative_sign': '',
     82         'p_cs_precedes': 127,
     83         'p_sep_by_space': 127,
     84         'p_sign_posn': 127,
     85         'positive_sign': '',
     86         'thousands_sep': ''
     87     }
     88 
     89 class EnUSCookedTest(BaseCookedTest):
     90     # A cooked "en_US" locale
     91 
     92     cooked_values = {
     93         'currency_symbol': '$',
     94         'decimal_point': '.',
     95         'frac_digits': 2,
     96         'grouping': [3, 3, 0],
     97         'int_curr_symbol': 'USD ',
     98         'int_frac_digits': 2,
     99         'mon_decimal_point': '.',
    100         'mon_grouping': [3, 3, 0],
    101         'mon_thousands_sep': ',',
    102         'n_cs_precedes': 1,
    103         'n_sep_by_space': 0,
    104         'n_sign_posn': 1,
    105         'negative_sign': '-',
    106         'p_cs_precedes': 1,
    107         'p_sep_by_space': 0,
    108         'p_sign_posn': 1,
    109         'positive_sign': '',
    110         'thousands_sep': ','
    111     }
    112 
    113 
    114 class FrFRCookedTest(BaseCookedTest):
    115     # A cooked "fr_FR" locale with a space character as decimal separator
    116     # and a non-ASCII currency symbol.
    117 
    118     cooked_values = {
    119         'currency_symbol': '\xe2\x82\xac',
    120         'decimal_point': ',',
    121         'frac_digits': 2,
    122         'grouping': [3, 3, 0],
    123         'int_curr_symbol': 'EUR ',
    124         'int_frac_digits': 2,
    125         'mon_decimal_point': ',',
    126         'mon_grouping': [3, 3, 0],
    127         'mon_thousands_sep': ' ',
    128         'n_cs_precedes': 0,
    129         'n_sep_by_space': 1,
    130         'n_sign_posn': 1,
    131         'negative_sign': '-',
    132         'p_cs_precedes': 0,
    133         'p_sep_by_space': 1,
    134         'p_sign_posn': 1,
    135         'positive_sign': '',
    136         'thousands_sep': ' '
    137     }
    138 
    139 
    140 class BaseFormattingTest(object):
    141     #
    142     # Utility functions for formatting tests
    143     #
    144 
    145     def _test_formatfunc(self, format, value, out, func, **format_opts):
    146         self.assertEqual(
    147             func(format, value, **format_opts), out)
    148 
    149     def _test_format(self, format, value, out, **format_opts):
    150         self._test_formatfunc(format, value, out,
    151             func=locale.format, **format_opts)
    152 
    153     def _test_format_string(self, format, value, out, **format_opts):
    154         self._test_formatfunc(format, value, out,
    155             func=locale.format_string, **format_opts)
    156 
    157     def _test_currency(self, value, out, **format_opts):
    158         self.assertEqual(locale.currency(value, **format_opts), out)
    159 
    160 
    161 class EnUSNumberFormatting(BaseFormattingTest):
    162     # XXX there is a grouping + padding bug when the thousands separator
    163     # is empty but the grouping array contains values (e.g. Solaris 10)
    164 
    165     def setUp(self):
    166         self.sep = locale.localeconv()['thousands_sep']
    167 
    168     def test_grouping(self):
    169         self._test_format("%f", 1024, grouping=1, out='1%s024.000000' % self.sep)
    170         self._test_format("%f", 102, grouping=1, out='102.000000')
    171         self._test_format("%f", -42, grouping=1, out='-42.000000')
    172         self._test_format("%+f", -42, grouping=1, out='-42.000000')
    173 
    174     def test_grouping_and_padding(self):
    175         self._test_format("%20.f", -42, grouping=1, out='-42'.rjust(20))
    176         if self.sep:
    177             self._test_format("%+10.f", -4200, grouping=1,
    178                 out=('-4%s200' % self.sep).rjust(10))
    179             self._test_format("%-10.f", -4200, grouping=1,
    180                 out=('-4%s200' % self.sep).ljust(10))
    181 
    182     def test_integer_grouping(self):
    183         self._test_format("%d", 4200, grouping=True, out='4%s200' % self.sep)
    184         self._test_format("%+d", 4200, grouping=True, out='+4%s200' % self.sep)
    185         self._test_format("%+d", -4200, grouping=True, out='-4%s200' % self.sep)
    186 
    187     def test_integer_grouping_and_padding(self):
    188         self._test_format("%10d", 4200, grouping=True,
    189             out=('4%s200' % self.sep).rjust(10))
    190         self._test_format("%-10d", -4200, grouping=True,
    191             out=('-4%s200' % self.sep).ljust(10))
    192 
    193     def test_simple(self):
    194         self._test_format("%f", 1024, grouping=0, out='1024.000000')
    195         self._test_format("%f", 102, grouping=0, out='102.000000')
    196         self._test_format("%f", -42, grouping=0, out='-42.000000')
    197         self._test_format("%+f", -42, grouping=0, out='-42.000000')
    198 
    199     def test_padding(self):
    200         self._test_format("%20.f", -42, grouping=0, out='-42'.rjust(20))
    201         self._test_format("%+10.f", -4200, grouping=0, out='-4200'.rjust(10))
    202         self._test_format("%-10.f", 4200, grouping=0, out='4200'.ljust(10))
    203 
    204     def test_complex_formatting(self):
    205         # Spaces in formatting string
    206         self._test_format_string("One million is %i", 1000000, grouping=1,
    207             out='One million is 1%s000%s000' % (self.sep, self.sep))
    208         self._test_format_string("One  million is %i", 1000000, grouping=1,
    209             out='One  million is 1%s000%s000' % (self.sep, self.sep))
    210         # Dots in formatting string
    211         self._test_format_string(".%f.", 1000.0, out='.1000.000000.')
    212         # Padding
    213         if self.sep:
    214             self._test_format_string("-->  %10.2f", 4200, grouping=1,
    215                 out='-->  ' + ('4%s200.00' % self.sep).rjust(10))
    216         # Asterisk formats
    217         self._test_format_string("%10.*f", (2, 1000), grouping=0,
    218             out='1000.00'.rjust(10))
    219         if self.sep:
    220             self._test_format_string("%*.*f", (10, 2, 1000), grouping=1,
    221                 out=('1%s000.00' % self.sep).rjust(10))
    222         # Test more-in-one
    223         if self.sep:
    224             self._test_format_string("int %i float %.2f str %s",
    225                 (1000, 1000.0, 'str'), grouping=1,
    226                 out='int 1%s000 float 1%s000.00 str str' %
    227                 (self.sep, self.sep))
    228 
    229 
    230 class TestFormatPatternArg(unittest.TestCase):
    231     # Test handling of pattern argument of format
    232 
    233     def test_onlyOnePattern(self):
    234         # Issue 2522: accept exactly one % pattern, and no extra chars.
    235         self.assertRaises(ValueError, locale.format, "%f\n", 'foo')
    236         self.assertRaises(ValueError, locale.format, "%f\r", 'foo')
    237         self.assertRaises(ValueError, locale.format, "%f\r\n", 'foo')
    238         self.assertRaises(ValueError, locale.format, " %f", 'foo')
    239         self.assertRaises(ValueError, locale.format, "%fg", 'foo')
    240         self.assertRaises(ValueError, locale.format, "%^g", 'foo')
    241         self.assertRaises(ValueError, locale.format, "%f%%", 'foo')
    242 
    243 
    244 class TestLocaleFormatString(unittest.TestCase):
    245     """General tests on locale.format_string"""
    246 
    247     def test_percent_escape(self):
    248         self.assertEqual(locale.format_string('%f%%', 1.0), '%f%%' % 1.0)
    249         self.assertEqual(locale.format_string('%d %f%%d', (1, 1.0)),
    250             '%d %f%%d' % (1, 1.0))
    251         self.assertEqual(locale.format_string('%(foo)s %%d', {'foo': 'bar'}),
    252             ('%(foo)s %%d' % {'foo': 'bar'}))
    253 
    254     def test_mapping(self):
    255         self.assertEqual(locale.format_string('%(foo)s bing.', {'foo': 'bar'}),
    256             ('%(foo)s bing.' % {'foo': 'bar'}))
    257         self.assertEqual(locale.format_string('%(foo)s', {'foo': 'bar'}),
    258             ('%(foo)s' % {'foo': 'bar'}))
    259 
    260 
    261 
    262 class TestNumberFormatting(BaseLocalizedTest, EnUSNumberFormatting):
    263     # Test number formatting with a real English locale.
    264 
    265     locale_type = locale.LC_NUMERIC
    266 
    267     def setUp(self):
    268         BaseLocalizedTest.setUp(self)
    269         EnUSNumberFormatting.setUp(self)
    270 
    271 
    272 class TestEnUSNumberFormatting(EnUSCookedTest, EnUSNumberFormatting):
    273     # Test number formatting with a cooked "en_US" locale.
    274 
    275     def setUp(self):
    276         EnUSCookedTest.setUp(self)
    277         EnUSNumberFormatting.setUp(self)
    278 
    279     def test_currency(self):
    280         self._test_currency(50000, "$50000.00")
    281         self._test_currency(50000, "$50,000.00", grouping=True)
    282         self._test_currency(50000, "USD 50,000.00",
    283             grouping=True, international=True)
    284 
    285 
    286 class TestCNumberFormatting(CCookedTest, BaseFormattingTest):
    287     # Test number formatting with a cooked "C" locale.
    288 
    289     def test_grouping(self):
    290         self._test_format("%.2f", 12345.67, grouping=True, out='12345.67')
    291 
    292     def test_grouping_and_padding(self):
    293         self._test_format("%9.2f", 12345.67, grouping=True, out=' 12345.67')
    294 
    295 
    296 class TestFrFRNumberFormatting(FrFRCookedTest, BaseFormattingTest):
    297     # Test number formatting with a cooked "fr_FR" locale.
    298 
    299     def test_decimal_point(self):
    300         self._test_format("%.2f", 12345.67, out='12345,67')
    301 
    302     def test_grouping(self):
    303         self._test_format("%.2f", 345.67, grouping=True, out='345,67')
    304         self._test_format("%.2f", 12345.67, grouping=True, out='12 345,67')
    305 
    306     def test_grouping_and_padding(self):
    307         self._test_format("%6.2f", 345.67, grouping=True, out='345,67')
    308         self._test_format("%7.2f", 345.67, grouping=True, out=' 345,67')
    309         self._test_format("%8.2f", 12345.67, grouping=True, out='12 345,67')
    310         self._test_format("%9.2f", 12345.67, grouping=True, out='12 345,67')
    311         self._test_format("%10.2f", 12345.67, grouping=True, out=' 12 345,67')
    312         self._test_format("%-6.2f", 345.67, grouping=True, out='345,67')
    313         self._test_format("%-7.2f", 345.67, grouping=True, out='345,67 ')
    314         self._test_format("%-8.2f", 12345.67, grouping=True, out='12 345,67')
    315         self._test_format("%-9.2f", 12345.67, grouping=True, out='12 345,67')
    316         self._test_format("%-10.2f", 12345.67, grouping=True, out='12 345,67 ')
    317 
    318     def test_integer_grouping(self):
    319         self._test_format("%d", 200, grouping=True, out='200')
    320         self._test_format("%d", 4200, grouping=True, out='4 200')
    321 
    322     def test_integer_grouping_and_padding(self):
    323         self._test_format("%4d", 4200, grouping=True, out='4 200')
    324         self._test_format("%5d", 4200, grouping=True, out='4 200')
    325         self._test_format("%10d", 4200, grouping=True, out='4 200'.rjust(10))
    326         self._test_format("%-4d", 4200, grouping=True, out='4 200')
    327         self._test_format("%-5d", 4200, grouping=True, out='4 200')
    328         self._test_format("%-10d", 4200, grouping=True, out='4 200'.ljust(10))
    329 
    330     def test_currency(self):
    331         euro = u'\u20ac'.encode('utf-8')
    332         self._test_currency(50000, "50000,00 " + euro)
    333         self._test_currency(50000, "50 000,00 " + euro, grouping=True)
    334         # XXX is the trailing space a bug?
    335         self._test_currency(50000, "50 000,00 EUR ",
    336             grouping=True, international=True)
    337 
    338 
    339 class TestStringMethods(BaseLocalizedTest):
    340     locale_type = locale.LC_CTYPE
    341 
    342     if sys.platform != 'sunos5' and not sys.platform.startswith("win"):
    343         # Test BSD Rune locale's bug for isctype functions.
    344 
    345         def test_isspace(self):
    346             self.assertEqual('\x20'.isspace(), True)
    347             self.assertEqual('\xa0'.isspace(), False)
    348             self.assertEqual('\xa1'.isspace(), False)
    349 
    350         def test_isalpha(self):
    351             self.assertEqual('\xc0'.isalpha(), False)
    352 
    353         def test_isalnum(self):
    354             self.assertEqual('\xc0'.isalnum(), False)
    355 
    356         def test_isupper(self):
    357             self.assertEqual('\xc0'.isupper(), False)
    358 
    359         def test_islower(self):
    360             self.assertEqual('\xc0'.islower(), False)
    361 
    362         def test_lower(self):
    363             self.assertEqual('\xcc\x85'.lower(), '\xcc\x85')
    364 
    365         def test_upper(self):
    366             self.assertEqual('\xed\x95\xa0'.upper(), '\xed\x95\xa0')
    367 
    368         def test_strip(self):
    369             self.assertEqual('\xed\x95\xa0'.strip(), '\xed\x95\xa0')
    370 
    371         def test_split(self):
    372             self.assertEqual('\xec\xa0\xbc'.split(), ['\xec\xa0\xbc'])
    373 
    374 
    375 class NormalizeTest(unittest.TestCase):
    376     def check(self, localename, expected):
    377         self.assertEqual(locale.normalize(localename), expected, msg=localename)
    378 
    379     def test_locale_alias(self):
    380         for localename, alias in locale.locale_alias.items():
    381             self.check(localename, alias)
    382 
    383     def test_empty(self):
    384         self.check('', '')
    385 
    386     def test_c(self):
    387         self.check('c', 'C')
    388         self.check('posix', 'C')
    389 
    390     def test_english(self):
    391         self.check('en', 'en_US.ISO8859-1')
    392         self.check('EN', 'en_US.ISO8859-1')
    393         self.check('en_US', 'en_US.ISO8859-1')
    394         self.check('en_us', 'en_US.ISO8859-1')
    395         self.check('en_GB', 'en_GB.ISO8859-1')
    396         self.check('en_US.UTF-8', 'en_US.UTF-8')
    397         self.check('en_US.utf8', 'en_US.UTF-8')
    398         self.check('en_US:UTF-8', 'en_US.UTF-8')
    399         self.check('en_US.ISO8859-1', 'en_US.ISO8859-1')
    400         self.check('en_US.US-ASCII', 'en_US.ISO8859-1')
    401         self.check('english', 'en_EN.ISO8859-1')
    402 
    403     def test_hyphenated_encoding(self):
    404         self.check('az_AZ.iso88599e', 'az_AZ.ISO8859-9E')
    405         self.check('az_AZ.ISO8859-9E', 'az_AZ.ISO8859-9E')
    406         self.check('tt_RU.koi8c', 'tt_RU.KOI8-C')
    407         self.check('tt_RU.KOI8-C', 'tt_RU.KOI8-C')
    408         self.check('lo_LA.cp1133', 'lo_LA.IBM-CP1133')
    409         self.check('lo_LA.ibmcp1133', 'lo_LA.IBM-CP1133')
    410         self.check('lo_LA.IBM-CP1133', 'lo_LA.IBM-CP1133')
    411         self.check('uk_ua.microsoftcp1251', 'uk_UA.CP1251')
    412         self.check('uk_ua.microsoft-cp1251', 'uk_UA.CP1251')
    413         self.check('ka_ge.georgianacademy', 'ka_GE.GEORGIAN-ACADEMY')
    414         self.check('ka_GE.GEORGIAN-ACADEMY', 'ka_GE.GEORGIAN-ACADEMY')
    415         self.check('cs_CZ.iso88592', 'cs_CZ.ISO8859-2')
    416         self.check('cs_CZ.ISO8859-2', 'cs_CZ.ISO8859-2')
    417 
    418     def test_euro_modifier(self):
    419         self.check('de_DE@euro', 'de_DE.ISO8859-15')
    420         self.check('en_US.ISO8859-15@euro', 'en_US.ISO8859-15')
    421 
    422     def test_latin_modifier(self):
    423         self.check('be_BY.UTF-8@latin', 'be_BY.UTF-8@latin')
    424         self.check('sr_RS.UTF-8@latin', 'sr_RS.UTF-8@latin')
    425 
    426     def test_valencia_modifier(self):
    427         self.check('ca_ES.UTF-8@valencia', 'ca_ES.UTF-8@valencia')
    428         self.check('ca_ES@valencia', 'ca_ES.ISO8859-15@valencia')
    429         self.check('ca@valencia', 'ca_ES.ISO8859-1@valencia')
    430 
    431     def test_devanagari_modifier(self):
    432         self.check('ks_IN.UTF-8@devanagari', 'ks_IN.UTF-8@devanagari')
    433         self.check('ks_IN@devanagari', 'ks_IN.UTF-8@devanagari')
    434         self.check('ks@devanagari', 'ks_IN.UTF-8@devanagari')
    435         self.check('ks_IN.UTF-8', 'ks_IN.UTF-8')
    436         self.check('ks_IN', 'ks_IN.UTF-8')
    437         self.check('ks', 'ks_IN.UTF-8')
    438         self.check('sd_IN.UTF-8@devanagari', 'sd_IN.UTF-8@devanagari')
    439         self.check('sd_IN@devanagari', 'sd_IN.UTF-8@devanagari')
    440         self.check('sd@devanagari', 'sd_IN.UTF-8@devanagari')
    441         self.check('sd_IN.UTF-8', 'sd_IN.UTF-8')
    442         self.check('sd_IN', 'sd_IN.UTF-8')
    443         self.check('sd', 'sd_IN.UTF-8')
    444 
    445 
    446 class TestMiscellaneous(unittest.TestCase):
    447     def test_getpreferredencoding(self):
    448         # Invoke getpreferredencoding to make sure it does not cause exceptions.
    449         enc = locale.getpreferredencoding()
    450         if enc:
    451             # If encoding non-empty, make sure it is valid
    452             codecs.lookup(enc)
    453 
    454     if hasattr(locale, "strcoll"):
    455         def test_strcoll_3303(self):
    456             # test crasher from bug #3303
    457             self.assertRaises(TypeError, locale.strcoll, u"a", None)
    458 
    459     def test_setlocale_category(self):
    460         locale.setlocale(locale.LC_ALL)
    461         locale.setlocale(locale.LC_TIME)
    462         locale.setlocale(locale.LC_CTYPE)
    463         locale.setlocale(locale.LC_COLLATE)
    464         locale.setlocale(locale.LC_MONETARY)
    465         locale.setlocale(locale.LC_NUMERIC)
    466 
    467         # crasher from bug #7419
    468         self.assertRaises(locale.Error, locale.setlocale, 12345)
    469 
    470     def test_getsetlocale_issue1813(self):
    471         # Issue #1813: setting and getting the locale under a Turkish locale
    472         oldlocale = locale.getlocale()
    473         self.addCleanup(locale.setlocale, locale.LC_CTYPE, oldlocale)
    474         for loc in ('tr_TR', 'tr_TR.UTF-8', 'tr_TR.ISO8859-9'):
    475             try:
    476                 locale.setlocale(locale.LC_CTYPE, loc)
    477                 break
    478             except locale.Error:
    479                 continue
    480         else:
    481             # Unsupported locale on this system
    482             self.skipTest('test needs Turkish locale')
    483         loc = locale.getlocale()
    484         try:
    485             locale.setlocale(locale.LC_CTYPE, loc)
    486         except Exception as e:
    487             self.fail("Failed to set locale %r (default locale is %r): %r" %
    488                       (loc, oldlocale, e))
    489         self.assertEqual(loc, locale.getlocale())
    490 
    491     def test_normalize_issue12752(self):
    492         # Issue #1813 caused a regression where locale.normalize() would no
    493         # longer accept unicode strings.
    494         self.assertEqual(locale.normalize(u'en_US'), 'en_US.ISO8859-1')
    495 
    496     def test_setlocale_unicode(self):
    497         oldlocale = locale.getlocale()
    498         self.addCleanup(locale.setlocale, locale.LC_CTYPE, oldlocale)
    499 
    500         user_locale = locale.setlocale(locale.LC_CTYPE, '')
    501         unicode_locale = user_locale.decode('utf-8')
    502 
    503         user_locale2 = locale.setlocale(locale.LC_CTYPE, unicode_locale)
    504         self.assertEqual(user_locale, user_locale2)
    505 
    506 
    507 def test_main():
    508     tests = [
    509         TestMiscellaneous,
    510         TestFormatPatternArg,
    511         TestLocaleFormatString,
    512         TestEnUSNumberFormatting,
    513         TestCNumberFormatting,
    514         TestFrFRNumberFormatting,
    515     ]
    516     # SkipTest can't be raised inside unittests, handle it manually instead
    517     try:
    518         get_enUS_locale()
    519     except unittest.SkipTest as e:
    520         if verbose:
    521             print "Some tests will be disabled: %s" % e
    522     else:
    523         tests += [TestNumberFormatting, TestStringMethods]
    524     run_unittest(*tests)
    525 
    526 if __name__ == '__main__':
    527     test_main()
    528