Benjamin Peterson | ee8712c | 2008-05-20 21:35:26 +0000 | [diff] [blame] | 1 | from test import support |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 2 | from test.support import bigmemtest, _1G, _2G, _4G |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 3 | |
| 4 | import unittest |
| 5 | import operator |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 6 | import sys |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 7 | import functools |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 8 | |
| 9 | # Bigmem testing houserules: |
| 10 | # |
| 11 | # - Try not to allocate too many large objects. It's okay to rely on |
| 12 | # refcounting semantics, but don't forget that 's = create_largestring()' |
| 13 | # doesn't release the old 's' (if it exists) until well after its new |
| 14 | # value has been created. Use 'del s' before the create_largestring call. |
| 15 | # |
# - Do *not* compare large objects using assertEqual or similar. It's a
#   lengthy operation and the error message will be utterly useless due to
#   its size. To make sure a result has the right contents, it is better
#   to use the strip or count methods, or compare meaningful slices.
| 20 | # |
| 21 | # - Don't forget to test for large indices, offsets and results and such, |
| 22 | # in addition to large sizes. |
| 23 | # |
| 24 | # - When repeating an object (say, a substring, or a small list) to create |
| 25 | # a large object, make the subobject of a length that is not a power of |
| 26 | # 2. That way, int-wrapping problems are more easily detected. |
| 27 | # |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 28 | # - Despite the bigmemtest decorator, all tests will actually be called |
| 29 | # with a much smaller number too, in the normal test run (5Kb currently.) |
| 30 | # This is so the tests themselves get frequent testing. |
| 31 | # Consequently, always make all large allocations based on the |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 32 | # passed-in 'size', and don't rely on the size being very large. Also, |
| 33 | # memuse-per-size should remain sane (less than a few thousand); if your |
| 34 | # test uses more, adjust 'size' upward, instead. |
| 35 | |
# BEWARE: it seems that one failing test can cause subsequent tests to
# fail as well. I do not know whether it is due to memory fragmentation
# issues, or other specifics of the platform malloc() routine.
| 39 | |
# Width selector keyed on the interpreter's Unicode range: 4 when code
# points above 0xFFFF are representable, otherwise 2.
# NOTE(review): presumably the number of bytes per str character used for
# memuse estimates elsewhere in this file -- confirm against its users.
if sys.maxunicode > 0xFFFF:
    character_size = 4
else:
    character_size = 2
| 41 | |
| 42 | |
| 43 | class BaseStrTest: |
| 44 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 45 | @bigmemtest(size=_2G, memuse=2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 46 | def test_capitalize(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 47 | _ = self.from_latin1 |
| 48 | SUBSTR = self.from_latin1(' abc def ghi') |
| 49 | s = _('-') * size + SUBSTR |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 50 | caps = s.capitalize() |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 51 | self.assertEqual(caps[-len(SUBSTR):], |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 52 | SUBSTR.capitalize()) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 53 | self.assertEqual(caps.lstrip(_('-')), SUBSTR) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 54 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 55 | @bigmemtest(size=_2G + 10, memuse=1) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 56 | def test_center(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 57 | SUBSTR = self.from_latin1(' abc def ghi') |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 58 | s = SUBSTR.center(size) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 59 | self.assertEqual(len(s), size) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 60 | lpadsize = rpadsize = (len(s) - len(SUBSTR)) // 2 |
| 61 | if len(s) % 2: |
| 62 | lpadsize += 1 |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 63 | self.assertEqual(s[lpadsize:-rpadsize], SUBSTR) |
| 64 | self.assertEqual(s.strip(), SUBSTR.strip()) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 65 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 66 | @bigmemtest(size=_2G, memuse=2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 67 | def test_count(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 68 | _ = self.from_latin1 |
| 69 | SUBSTR = _(' abc def ghi') |
| 70 | s = _('.') * size + SUBSTR |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 71 | self.assertEqual(s.count(_('.')), size) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 72 | s += _('.') |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 73 | self.assertEqual(s.count(_('.')), size + 1) |
| 74 | self.assertEqual(s.count(_(' ')), 3) |
| 75 | self.assertEqual(s.count(_('i')), 1) |
| 76 | self.assertEqual(s.count(_('j')), 0) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 77 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 78 | @bigmemtest(size=_2G, memuse=2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 79 | def test_endswith(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 80 | _ = self.from_latin1 |
| 81 | SUBSTR = _(' abc def ghi') |
| 82 | s = _('-') * size + SUBSTR |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 83 | self.assertTrue(s.endswith(SUBSTR)) |
| 84 | self.assertTrue(s.endswith(s)) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 85 | s2 = _('...') + s |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 86 | self.assertTrue(s2.endswith(s)) |
| 87 | self.assertFalse(s.endswith(_('a') + SUBSTR)) |
| 88 | self.assertFalse(SUBSTR.endswith(s)) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 89 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 90 | @bigmemtest(size=_2G + 10, memuse=2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 91 | def test_expandtabs(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 92 | _ = self.from_latin1 |
| 93 | s = _('-') * size |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 94 | tabsize = 8 |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 95 | self.assertEqual(s.expandtabs(), s) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 96 | del s |
| 97 | slen, remainder = divmod(size, tabsize) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 98 | s = _(' \t') * slen |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 99 | s = s.expandtabs(tabsize) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 100 | self.assertEqual(len(s), size - remainder) |
| 101 | self.assertEqual(len(s.strip(_(' '))), 0) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 102 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 103 | @bigmemtest(size=_2G, memuse=2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 104 | def test_find(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 105 | _ = self.from_latin1 |
| 106 | SUBSTR = _(' abc def ghi') |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 107 | sublen = len(SUBSTR) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 108 | s = _('').join([SUBSTR, _('-') * size, SUBSTR]) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 109 | self.assertEqual(s.find(_(' ')), 0) |
| 110 | self.assertEqual(s.find(SUBSTR), 0) |
| 111 | self.assertEqual(s.find(_(' '), sublen), sublen + size) |
| 112 | self.assertEqual(s.find(SUBSTR, len(SUBSTR)), sublen + size) |
| 113 | self.assertEqual(s.find(_('i')), SUBSTR.find(_('i'))) |
| 114 | self.assertEqual(s.find(_('i'), sublen), |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 115 | sublen + size + SUBSTR.find(_('i'))) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 116 | self.assertEqual(s.find(_('i'), size), |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 117 | sublen + size + SUBSTR.find(_('i'))) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 118 | self.assertEqual(s.find(_('j')), -1) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 119 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 120 | @bigmemtest(size=_2G, memuse=2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 121 | def test_index(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 122 | _ = self.from_latin1 |
| 123 | SUBSTR = _(' abc def ghi') |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 124 | sublen = len(SUBSTR) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 125 | s = _('').join([SUBSTR, _('-') * size, SUBSTR]) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 126 | self.assertEqual(s.index(_(' ')), 0) |
| 127 | self.assertEqual(s.index(SUBSTR), 0) |
| 128 | self.assertEqual(s.index(_(' '), sublen), sublen + size) |
| 129 | self.assertEqual(s.index(SUBSTR, sublen), sublen + size) |
| 130 | self.assertEqual(s.index(_('i')), SUBSTR.index(_('i'))) |
| 131 | self.assertEqual(s.index(_('i'), sublen), |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 132 | sublen + size + SUBSTR.index(_('i'))) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 133 | self.assertEqual(s.index(_('i'), size), |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 134 | sublen + size + SUBSTR.index(_('i'))) |
| 135 | self.assertRaises(ValueError, s.index, _('j')) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 136 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 137 | @bigmemtest(size=_2G, memuse=2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 138 | def test_isalnum(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 139 | _ = self.from_latin1 |
| 140 | SUBSTR = _('123456') |
| 141 | s = _('a') * size + SUBSTR |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 142 | self.assertTrue(s.isalnum()) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 143 | s += _('.') |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 144 | self.assertFalse(s.isalnum()) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 145 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 146 | @bigmemtest(size=_2G, memuse=2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 147 | def test_isalpha(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 148 | _ = self.from_latin1 |
| 149 | SUBSTR = _('zzzzzzz') |
| 150 | s = _('a') * size + SUBSTR |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 151 | self.assertTrue(s.isalpha()) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 152 | s += _('.') |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 153 | self.assertFalse(s.isalpha()) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 154 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 155 | @bigmemtest(size=_2G, memuse=2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 156 | def test_isdigit(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 157 | _ = self.from_latin1 |
| 158 | SUBSTR = _('123456') |
| 159 | s = _('9') * size + SUBSTR |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 160 | self.assertTrue(s.isdigit()) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 161 | s += _('z') |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 162 | self.assertFalse(s.isdigit()) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 163 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 164 | @bigmemtest(size=_2G, memuse=2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 165 | def test_islower(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 166 | _ = self.from_latin1 |
| 167 | chars = _(''.join( |
| 168 | chr(c) for c in range(255) if not chr(c).isupper())) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 169 | repeats = size // len(chars) + 2 |
| 170 | s = chars * repeats |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 171 | self.assertTrue(s.islower()) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 172 | s += _('A') |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 173 | self.assertFalse(s.islower()) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 174 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 175 | @bigmemtest(size=_2G, memuse=2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 176 | def test_isspace(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 177 | _ = self.from_latin1 |
| 178 | whitespace = _(' \f\n\r\t\v') |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 179 | repeats = size // len(whitespace) + 2 |
| 180 | s = whitespace * repeats |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 181 | self.assertTrue(s.isspace()) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 182 | s += _('j') |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 183 | self.assertFalse(s.isspace()) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 184 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 185 | @bigmemtest(size=_2G, memuse=2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 186 | def test_istitle(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 187 | _ = self.from_latin1 |
| 188 | SUBSTR = _('123456') |
| 189 | s = _('').join([_('A'), _('a') * size, SUBSTR]) |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 190 | self.assertTrue(s.istitle()) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 191 | s += _('A') |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 192 | self.assertTrue(s.istitle()) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 193 | s += _('aA') |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 194 | self.assertFalse(s.istitle()) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 195 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 196 | @bigmemtest(size=_2G, memuse=2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 197 | def test_isupper(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 198 | _ = self.from_latin1 |
| 199 | chars = _(''.join( |
| 200 | chr(c) for c in range(255) if not chr(c).islower())) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 201 | repeats = size // len(chars) + 2 |
| 202 | s = chars * repeats |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 203 | self.assertTrue(s.isupper()) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 204 | s += _('a') |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 205 | self.assertFalse(s.isupper()) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 206 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 207 | @bigmemtest(size=_2G, memuse=2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 208 | def test_join(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 209 | _ = self.from_latin1 |
| 210 | s = _('A') * size |
| 211 | x = s.join([_('aaaaa'), _('bbbbb')]) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 212 | self.assertEqual(x.count(_('a')), 5) |
| 213 | self.assertEqual(x.count(_('b')), 5) |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 214 | self.assertTrue(x.startswith(_('aaaaaA'))) |
| 215 | self.assertTrue(x.endswith(_('Abbbbb'))) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 216 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 217 | @bigmemtest(size=_2G + 10, memuse=1) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 218 | def test_ljust(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 219 | _ = self.from_latin1 |
| 220 | SUBSTR = _(' abc def ghi') |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 221 | s = SUBSTR.ljust(size) |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 222 | self.assertTrue(s.startswith(SUBSTR + _(' '))) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 223 | self.assertEqual(len(s), size) |
| 224 | self.assertEqual(s.strip(), SUBSTR.strip()) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 225 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 226 | @bigmemtest(size=_2G + 10, memuse=2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 227 | def test_lower(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 228 | _ = self.from_latin1 |
| 229 | s = _('A') * size |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 230 | s = s.lower() |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 231 | self.assertEqual(len(s), size) |
| 232 | self.assertEqual(s.count(_('a')), size) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 233 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 234 | @bigmemtest(size=_2G + 10, memuse=1) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 235 | def test_lstrip(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 236 | _ = self.from_latin1 |
| 237 | SUBSTR = _('abc def ghi') |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 238 | s = SUBSTR.rjust(size) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 239 | self.assertEqual(len(s), size) |
| 240 | self.assertEqual(s.lstrip(), SUBSTR.lstrip()) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 241 | del s |
| 242 | s = SUBSTR.ljust(size) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 243 | self.assertEqual(len(s), size) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 244 | # Type-specific optimization |
| 245 | if isinstance(s, (str, bytes)): |
| 246 | stripped = s.lstrip() |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 247 | self.assertTrue(stripped is s) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 248 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 249 | @bigmemtest(size=_2G + 10, memuse=2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 250 | def test_replace(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 251 | _ = self.from_latin1 |
| 252 | replacement = _('a') |
| 253 | s = _(' ') * size |
| 254 | s = s.replace(_(' '), replacement) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 255 | self.assertEqual(len(s), size) |
| 256 | self.assertEqual(s.count(replacement), size) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 257 | s = s.replace(replacement, _(' '), size - 4) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 258 | self.assertEqual(len(s), size) |
| 259 | self.assertEqual(s.count(replacement), 4) |
| 260 | self.assertEqual(s[-10:], _(' aaaa')) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 261 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 262 | @bigmemtest(size=_2G, memuse=2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 263 | def test_rfind(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 264 | _ = self.from_latin1 |
| 265 | SUBSTR = _(' abc def ghi') |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 266 | sublen = len(SUBSTR) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 267 | s = _('').join([SUBSTR, _('-') * size, SUBSTR]) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 268 | self.assertEqual(s.rfind(_(' ')), sublen + size + SUBSTR.rfind(_(' '))) |
| 269 | self.assertEqual(s.rfind(SUBSTR), sublen + size) |
| 270 | self.assertEqual(s.rfind(_(' '), 0, size), SUBSTR.rfind(_(' '))) |
| 271 | self.assertEqual(s.rfind(SUBSTR, 0, sublen + size), 0) |
| 272 | self.assertEqual(s.rfind(_('i')), sublen + size + SUBSTR.rfind(_('i'))) |
| 273 | self.assertEqual(s.rfind(_('i'), 0, sublen), SUBSTR.rfind(_('i'))) |
| 274 | self.assertEqual(s.rfind(_('i'), 0, sublen + size), |
| 275 | SUBSTR.rfind(_('i'))) |
| 276 | self.assertEqual(s.rfind(_('j')), -1) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 277 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 278 | @bigmemtest(size=_2G, memuse=2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 279 | def test_rindex(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 280 | _ = self.from_latin1 |
| 281 | SUBSTR = _(' abc def ghi') |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 282 | sublen = len(SUBSTR) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 283 | s = _('').join([SUBSTR, _('-') * size, SUBSTR]) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 284 | self.assertEqual(s.rindex(_(' ')), |
| 285 | sublen + size + SUBSTR.rindex(_(' '))) |
| 286 | self.assertEqual(s.rindex(SUBSTR), sublen + size) |
| 287 | self.assertEqual(s.rindex(_(' '), 0, sublen + size - 1), |
| 288 | SUBSTR.rindex(_(' '))) |
| 289 | self.assertEqual(s.rindex(SUBSTR, 0, sublen + size), 0) |
| 290 | self.assertEqual(s.rindex(_('i')), |
| 291 | sublen + size + SUBSTR.rindex(_('i'))) |
| 292 | self.assertEqual(s.rindex(_('i'), 0, sublen), SUBSTR.rindex(_('i'))) |
| 293 | self.assertEqual(s.rindex(_('i'), 0, sublen + size), |
| 294 | SUBSTR.rindex(_('i'))) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 295 | self.assertRaises(ValueError, s.rindex, _('j')) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 296 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 297 | @bigmemtest(size=_2G + 10, memuse=1) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 298 | def test_rjust(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 299 | _ = self.from_latin1 |
| 300 | SUBSTR = _(' abc def ghi') |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 301 | s = SUBSTR.ljust(size) |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 302 | self.assertTrue(s.startswith(SUBSTR + _(' '))) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 303 | self.assertEqual(len(s), size) |
| 304 | self.assertEqual(s.strip(), SUBSTR.strip()) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 305 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 306 | @bigmemtest(size=_2G + 10, memuse=1) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 307 | def test_rstrip(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 308 | _ = self.from_latin1 |
| 309 | SUBSTR = _(' abc def ghi') |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 310 | s = SUBSTR.ljust(size) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 311 | self.assertEqual(len(s), size) |
| 312 | self.assertEqual(s.rstrip(), SUBSTR.rstrip()) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 313 | del s |
| 314 | s = SUBSTR.rjust(size) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 315 | self.assertEqual(len(s), size) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 316 | # Type-specific optimization |
| 317 | if isinstance(s, (str, bytes)): |
| 318 | stripped = s.rstrip() |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 319 | self.assertTrue(stripped is s) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 320 | |
| 321 | # The test takes about size bytes to build a string, and then about |
| 322 | # sqrt(size) substrings of sqrt(size) in size and a list to |
| 323 | # hold sqrt(size) items. It's close but just over 2x size. |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 324 | @bigmemtest(size=_2G, memuse=2.1) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 325 | def test_split_small(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 326 | _ = self.from_latin1 |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 327 | # Crudely calculate an estimate so that the result of s.split won't |
| 328 | # take up an inordinate amount of memory |
| 329 | chunksize = int(size ** 0.5 + 2) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 330 | SUBSTR = _('a') + _(' ') * chunksize |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 331 | s = SUBSTR * chunksize |
| 332 | l = s.split() |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 333 | self.assertEqual(len(l), chunksize) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 334 | expected = _('a') |
| 335 | for item in l: |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 336 | self.assertEqual(item, expected) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 337 | del l |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 338 | l = s.split(_('a')) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 339 | self.assertEqual(len(l), chunksize + 1) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 340 | expected = _(' ') * chunksize |
| 341 | for item in filter(None, l): |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 342 | self.assertEqual(item, expected) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 343 | |
| 344 | # Allocates a string of twice size (and briefly two) and a list of |
| 345 | # size. Because of internal affairs, the s.split() call produces a |
| 346 | # list of size times the same one-character string, so we only |
| 347 | # suffer for the list size. (Otherwise, it'd cost another 48 times |
| 348 | # size in bytes!) Nevertheless, a list of size takes |
| 349 | # 8*size bytes. |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 350 | @bigmemtest(size=_2G + 5, memuse=10) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 351 | def test_split_large(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 352 | _ = self.from_latin1 |
| 353 | s = _(' a') * size + _(' ') |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 354 | l = s.split() |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 355 | self.assertEqual(len(l), size) |
| 356 | self.assertEqual(set(l), set([_('a')])) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 357 | del l |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 358 | l = s.split(_('a')) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 359 | self.assertEqual(len(l), size + 1) |
| 360 | self.assertEqual(set(l), set([_(' ')])) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 361 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 362 | @bigmemtest(size=_2G, memuse=2.1) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 363 | def test_splitlines(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 364 | _ = self.from_latin1 |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 365 | # Crudely calculate an estimate so that the result of s.split won't |
| 366 | # take up an inordinate amount of memory |
| 367 | chunksize = int(size ** 0.5 + 2) // 2 |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 368 | SUBSTR = _(' ') * chunksize + _('\n') + _(' ') * chunksize + _('\r\n') |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 369 | s = SUBSTR * chunksize |
| 370 | l = s.splitlines() |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 371 | self.assertEqual(len(l), chunksize * 2) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 372 | expected = _(' ') * chunksize |
| 373 | for item in l: |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 374 | self.assertEqual(item, expected) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 375 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 376 | @bigmemtest(size=_2G, memuse=2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 377 | def test_startswith(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 378 | _ = self.from_latin1 |
| 379 | SUBSTR = _(' abc def ghi') |
| 380 | s = _('-') * size + SUBSTR |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 381 | self.assertTrue(s.startswith(s)) |
| 382 | self.assertTrue(s.startswith(_('-') * size)) |
| 383 | self.assertFalse(s.startswith(SUBSTR)) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 384 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 385 | @bigmemtest(size=_2G, memuse=1) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 386 | def test_strip(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 387 | _ = self.from_latin1 |
| 388 | SUBSTR = _(' abc def ghi ') |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 389 | s = SUBSTR.rjust(size) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 390 | self.assertEqual(len(s), size) |
| 391 | self.assertEqual(s.strip(), SUBSTR.strip()) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 392 | del s |
| 393 | s = SUBSTR.ljust(size) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 394 | self.assertEqual(len(s), size) |
| 395 | self.assertEqual(s.strip(), SUBSTR.strip()) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 396 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 397 | @bigmemtest(size=_2G, memuse=2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 398 | def test_swapcase(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 399 | _ = self.from_latin1 |
| 400 | SUBSTR = _("aBcDeFG12.'\xa9\x00") |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 401 | sublen = len(SUBSTR) |
| 402 | repeats = size // sublen + 2 |
| 403 | s = SUBSTR * repeats |
| 404 | s = s.swapcase() |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 405 | self.assertEqual(len(s), sublen * repeats) |
| 406 | self.assertEqual(s[:sublen * 3], SUBSTR.swapcase() * 3) |
| 407 | self.assertEqual(s[-sublen * 3:], SUBSTR.swapcase() * 3) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 408 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 409 | @bigmemtest(size=_2G, memuse=2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 410 | def test_title(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 411 | _ = self.from_latin1 |
| 412 | SUBSTR = _('SpaaHAaaAaham') |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 413 | s = SUBSTR * (size // len(SUBSTR) + 2) |
| 414 | s = s.title() |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 415 | self.assertTrue(s.startswith((SUBSTR * 3).title())) |
| 416 | self.assertTrue(s.endswith(SUBSTR.lower() * 3)) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 417 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 418 | @bigmemtest(size=_2G, memuse=2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 419 | def test_translate(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 420 | _ = self.from_latin1 |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 421 | SUBSTR = _('aZz.z.Aaz.') |
Georg Brandl | abc3877 | 2009-04-12 15:51:51 +0000 | [diff] [blame] | 422 | if isinstance(SUBSTR, str): |
| 423 | trans = { |
| 424 | ord(_('.')): _('-'), |
| 425 | ord(_('a')): _('!'), |
| 426 | ord(_('Z')): _('$'), |
| 427 | } |
| 428 | else: |
| 429 | trans = bytes.maketrans(b'.aZ', b'-!$') |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 430 | sublen = len(SUBSTR) |
| 431 | repeats = size // sublen + 2 |
| 432 | s = SUBSTR * repeats |
| 433 | s = s.translate(trans) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 434 | self.assertEqual(len(s), repeats * sublen) |
| 435 | self.assertEqual(s[:sublen], SUBSTR.translate(trans)) |
| 436 | self.assertEqual(s[-sublen:], SUBSTR.translate(trans)) |
| 437 | self.assertEqual(s.count(_('.')), 0) |
| 438 | self.assertEqual(s.count(_('!')), repeats * 2) |
| 439 | self.assertEqual(s.count(_('z')), repeats * 3) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 440 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 441 | @bigmemtest(size=_2G + 5, memuse=2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 442 | def test_upper(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 443 | _ = self.from_latin1 |
| 444 | s = _('a') * size |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 445 | s = s.upper() |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 446 | self.assertEqual(len(s), size) |
| 447 | self.assertEqual(s.count(_('A')), size) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 448 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 449 | @bigmemtest(size=_2G + 20, memuse=1) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 450 | def test_zfill(self, size): |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 451 | _ = self.from_latin1 |
| 452 | SUBSTR = _('-568324723598234') |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 453 | s = SUBSTR.zfill(size) |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 454 | self.assertTrue(s.endswith(_('0') + SUBSTR[1:])) |
| 455 | self.assertTrue(s.startswith(_('-0'))) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 456 | self.assertEqual(len(s), size) |
| 457 | self.assertEqual(s.count(_('0')), size - len(SUBSTR)) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 458 | |
| 459 | # This test is meaningful even with size < 2G, as long as the |
| 460 | # doubled string is > 2G (but it tests more if both are > 2G :) |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 461 | @bigmemtest(size=_1G + 2, memuse=3) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 462 | def test_concat(self, size): |
| 463 | _ = self.from_latin1 |
| 464 | s = _('.') * size |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 465 | self.assertEqual(len(s), size) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 466 | s = s + s |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 467 | self.assertEqual(len(s), size * 2) |
| 468 | self.assertEqual(s.count(_('.')), size * 2) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 469 | |
| 470 | # This test is meaningful even with size < 2G, as long as the |
| 471 | # repeated string is > 2G (but it tests more if both are > 2G :) |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 472 | @bigmemtest(size=_1G + 2, memuse=3) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 473 | def test_repeat(self, size): |
| 474 | _ = self.from_latin1 |
| 475 | s = _('.') * size |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 476 | self.assertEqual(len(s), size) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 477 | s = s * 2 |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 478 | self.assertEqual(len(s), size * 2) |
| 479 | self.assertEqual(s.count(_('.')), size * 2) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 480 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 481 | @bigmemtest(size=_2G + 20, memuse=2) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 482 | def test_slice_and_getitem(self, size): |
| 483 | _ = self.from_latin1 |
| 484 | SUBSTR = _('0123456789') |
| 485 | sublen = len(SUBSTR) |
| 486 | s = SUBSTR * (size // sublen) |
| 487 | stepsize = len(s) // 100 |
| 488 | stepsize = stepsize - (stepsize % sublen) |
| 489 | for i in range(0, len(s) - stepsize, stepsize): |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 490 | self.assertEqual(s[i], SUBSTR[0]) |
| 491 | self.assertEqual(s[i:i + sublen], SUBSTR) |
| 492 | self.assertEqual(s[i:i + sublen:2], SUBSTR[::2]) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 493 | if i > 0: |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 494 | self.assertEqual(s[i + sublen - 1:i - 1:-3], |
| 495 | SUBSTR[sublen::-3]) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 496 | # Make sure we do some slicing and indexing near the end of the |
| 497 | # string, too. |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 498 | self.assertEqual(s[len(s) - 1], SUBSTR[-1]) |
| 499 | self.assertEqual(s[-1], SUBSTR[-1]) |
| 500 | self.assertEqual(s[len(s) - 10], SUBSTR[0]) |
| 501 | self.assertEqual(s[-sublen], SUBSTR[0]) |
| 502 | self.assertEqual(s[len(s):], _('')) |
| 503 | self.assertEqual(s[len(s) - 1:], SUBSTR[-1:]) |
| 504 | self.assertEqual(s[-1:], SUBSTR[-1:]) |
| 505 | self.assertEqual(s[len(s) - sublen:], SUBSTR) |
| 506 | self.assertEqual(s[-sublen:], SUBSTR) |
| 507 | self.assertEqual(len(s[:]), len(s)) |
| 508 | self.assertEqual(len(s[:len(s) - 5]), len(s) - 5) |
| 509 | self.assertEqual(len(s[5:-5]), len(s) - 10) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 510 | |
| 511 | self.assertRaises(IndexError, operator.getitem, s, len(s)) |
| 512 | self.assertRaises(IndexError, operator.getitem, s, len(s) + 1) |
| 513 | self.assertRaises(IndexError, operator.getitem, s, len(s) + 1<<31) |
| 514 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 515 | @bigmemtest(size=_2G, memuse=2) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 516 | def test_contains(self, size): |
| 517 | _ = self.from_latin1 |
| 518 | SUBSTR = _('0123456789') |
| 519 | edge = _('-') * (size // 2) |
| 520 | s = _('').join([edge, SUBSTR, edge]) |
| 521 | del edge |
Benjamin Peterson | 577473f | 2010-01-19 00:09:57 +0000 | [diff] [blame] | 522 | self.assertIn(SUBSTR, s) |
Ezio Melotti | b58e0bd | 2010-01-23 15:40:09 +0000 | [diff] [blame] | 523 | self.assertNotIn(SUBSTR * 2, s) |
Benjamin Peterson | 577473f | 2010-01-19 00:09:57 +0000 | [diff] [blame] | 524 | self.assertIn(_('-'), s) |
Ezio Melotti | b58e0bd | 2010-01-23 15:40:09 +0000 | [diff] [blame] | 525 | self.assertNotIn(_('a'), s) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 526 | s += _('a') |
Benjamin Peterson | 577473f | 2010-01-19 00:09:57 +0000 | [diff] [blame] | 527 | self.assertIn(_('a'), s) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 528 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 529 | @bigmemtest(size=_2G + 10, memuse=2) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 530 | def test_compare(self, size): |
| 531 | _ = self.from_latin1 |
| 532 | s1 = _('-') * size |
| 533 | s2 = _('-') * size |
| 534 | self.assertEqual(s1, s2) |
| 535 | del s2 |
| 536 | s2 = s1 + _('a') |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 537 | self.assertFalse(s1 == s2) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 538 | del s2 |
| 539 | s2 = _('.') * size |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 540 | self.assertFalse(s1 == s2) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 541 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 542 | @bigmemtest(size=_2G + 10, memuse=1) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 543 | def test_hash(self, size): |
| 544 | # Not sure if we can do any meaningful tests here... Even if we |
| 545 | # start relying on the exact algorithm used, the result will be |
| 546 | # different depending on the size of the C 'long int'. Even this |
| 547 | # test is dodgy (there's no *guarantee* that the two things should |
| 548 | # have a different hash, even if they, in the current |
| 549 | # implementation, almost always do.) |
| 550 | _ = self.from_latin1 |
| 551 | s = _('\x00') * size |
| 552 | h1 = hash(s) |
| 553 | del s |
| 554 | s = _('\x00') * (size + 1) |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 555 | self.assertFalse(h1 == hash(s)) |
Antoine Pitrou | 7cdb495 | 2009-03-07 23:40:49 +0000 | [diff] [blame] | 556 | |
| 557 | |
class StrTest(unittest.TestCase, BaseStrTest):
    """Run the shared BaseStrTest checks on str, plus str-only tests."""

    def from_latin1(self, s):
        """Return *s* unchanged; the shared tests already pass str."""
        return s

    def basic_encode_test(self, size, enc, c='.', expectedsize=None):
        """Encode ``c * size`` with codec *enc* and check the result length.

        *expectedsize* is the expected length of the encoded bytes; it
        defaults to *size*.
        """
        if expectedsize is None:
            expectedsize = size

        try:
            s = c * size
            self.assertEqual(len(s.encode(enc)), expectedsize)
        finally:
            # Drop our reference to the big string on every exit path.
            s = None

    def setUp(self):
        # HACK: adjust memory use of tests inherited from BaseStrTest
        # according to character size.
        self._adjusted = {}
        for name in dir(BaseStrTest):
            if not name.startswith('test_'):
                continue
            meth = getattr(type(self), name)
            try:
                memuse = meth.memuse
            except AttributeError:
                continue
            meth.memuse = character_size * memuse
            # Remember the original value so tearDown() can restore it.
            self._adjusted[name] = memuse

    def tearDown(self):
        # Undo the memuse scaling applied in setUp().
        for name, memuse in self._adjusted.items():
            getattr(type(self), name).memuse = memuse

    # the utf8 encoder preallocates big time (4x the number of characters)
    @bigmemtest(size=_2G + 2, memuse=character_size + 4)
    def test_encode(self, size):
        return self.basic_encode_test(size, 'utf-8')

    @bigmemtest(size=_4G // 6 + 2, memuse=character_size + 1)
    def test_encode_raw_unicode_escape(self, size):
        try:
            return self.basic_encode_test(size, 'raw_unicode_escape')
        except MemoryError:
            pass # acceptable on 32-bit

    @bigmemtest(size=_4G // 5 + 70, memuse=character_size + 1)
    def test_encode_utf7(self, size):
        try:
            return self.basic_encode_test(size, 'utf7')
        except MemoryError:
            pass # acceptable on 32-bit

    @bigmemtest(size=_4G // 4 + 5, memuse=character_size + 4)
    def test_encode_utf32(self, size):
        try:
            # Expect 4 bytes per character plus 4 extra bytes.
            return self.basic_encode_test(size, 'utf32', expectedsize=4*size+4)
        except MemoryError:
            pass # acceptable on 32-bit

    @bigmemtest(size=_2G - 1, memuse=character_size + 1)
    def test_encode_ascii(self, size):
        return self.basic_encode_test(size, 'ascii', c='A')

    @bigmemtest(size=_2G + 10, memuse=character_size * 2)
    def test_format(self, size):
        s = '-' * size
        sf = '%s' % (s,)
        # Compare with == and assertTrue instead of assertEqual: on
        # failure assertEqual would try to render both huge strings into
        # the error message (see the house rules at the top of the file).
        self.assertTrue(s == sf)
        del sf
        sf = '..%s..' % (s,)
        self.assertEqual(len(sf), len(s) + 4)
        self.assertTrue(sf.startswith('..-'))
        self.assertTrue(sf.endswith('-..'))
        del s, sf

        # Now with a big format string and a small argument.
        size //= 2
        edge = '-' * size
        s = ''.join([edge, '%s', edge])
        del edge
        s = s % '...'
        self.assertEqual(len(s), size * 2 + 3)
        self.assertEqual(s.count('.'), 3)
        self.assertEqual(s.count('-'), size * 2)

    @bigmemtest(size=_2G + 10, memuse=character_size * 2)
    def test_repr_small(self, size):
        s = '-' * size
        s = repr(s)
        self.assertEqual(len(s), size + 2)
        self.assertEqual(s[0], "'")
        self.assertEqual(s[-1], "'")
        self.assertEqual(s.count('-'), size)
        del s
        # repr() will create a string four times as large as this 'binary
        # string', but we don't want to allocate much more than twice
        # size in total.  (We do extra testing in test_repr_large())
        size = size // 5 * 2
        s = '\x00' * size
        s = repr(s)
        self.assertEqual(len(s), size * 4 + 2)
        self.assertEqual(s[0], "'")
        self.assertEqual(s[-1], "'")
        self.assertEqual(s.count('\\'), size)
        self.assertEqual(s.count('0'), size * 2)

    @bigmemtest(size=_2G + 10, memuse=character_size * 5)
    def test_repr_large(self, size):
        s = '\x00' * size
        s = repr(s)
        self.assertEqual(len(s), size * 4 + 2)
        self.assertEqual(s[0], "'")
        self.assertEqual(s[-1], "'")
        self.assertEqual(s.count('\\'), size)
        self.assertEqual(s.count('0'), size * 2)

    @bigmemtest(size=_2G // 5 + 1, memuse=character_size * 7)
    def test_unicode_repr(self, size):
        # Use an assigned, but not printable code point.
        # It is in the range of the low surrogates \uDC00-\uDFFF.
        char = "\uDCBA"
        s = char * size
        try:
            for f in (repr, ascii):
                r = f(s)
                # Each character is escaped the same way as a lone one;
                # the 2 accounts for the surrounding quotes.
                self.assertEqual(len(r), 2 + (len(f(char)) - 2) * size)
                self.assertTrue(r.endswith(r"\udcba'"), r[-10:])
                r = None
        finally:
            # Drop our references to the big strings on every exit path.
            r = s = None

    # The character takes 4 bytes even in UCS-2 builds because it will
    # be decomposed into surrogates.
    @bigmemtest(size=_2G // 5 + 1, memuse=4 + character_size * 9)
    def test_unicode_repr_wide(self, size):
        char = "\U0001DCBA"
        s = char * size
        try:
            for f in (repr, ascii):
                r = f(s)
                self.assertEqual(len(r), 2 + (len(f(char)) - 2) * size)
                self.assertTrue(r.endswith(r"\U0001dcba'"), r[-12:])
                r = None
        finally:
            # Drop our references to the big strings on every exit path.
            r = s = None

    # The leading underscore keeps unittest from collecting this test.
    @bigmemtest(size=_4G // 5, memuse=character_size * (6 + 1))
    def _test_unicode_repr_overflow(self, size):
        # XXX not sure what this test is about
        char = "\uDCBA"
        s = char * size
        try:
            r = repr(s)
            self.assertTrue(s == eval(r))
        finally:
            r = s = None
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 714 | |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 715 | |
class BytesTest(unittest.TestCase, BaseStrTest):
    """Run the shared BaseStrTest checks on bytes objects."""

    def from_latin1(self, s):
        """Return the str *s* encoded to bytes with the latin1 codec."""
        return s.encode("latin1")

    @bigmemtest(size=_2G + 2, memuse=1 + character_size)
    def test_decode(self, size):
        # Decoding ASCII-only data as UTF-8 must preserve the length.
        data = self.from_latin1('.') * size
        decoded_length = len(data.decode('utf-8'))
        self.assertEqual(decoded_length, size)
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 725 | |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 726 | |
class BytearrayTest(unittest.TestCase, BaseStrTest):
    """Run the shared BaseStrTest checks on bytearray objects."""

    # Rebinding these names to None hides the inherited BaseStrTest
    # tests of the same name, so they are not run for bytearray.
    # NOTE(review): bytearray is unhashable, which explains test_hash;
    # the reason for dropping test_split_large is not visible here.
    test_hash = None
    test_split_large = None

    def from_latin1(self, s):
        """Return the str *s* as a bytearray of its latin1 encoding."""
        encoded = s.encode("latin1")
        return bytearray(encoded)

    @bigmemtest(size=_2G + 2, memuse=1 + character_size)
    def test_decode(self, size):
        # Decoding ASCII-only data as UTF-8 must preserve the length.
        data = self.from_latin1('.') * size
        decoded_length = len(data.decode('utf-8'))
        self.assertEqual(decoded_length, size)
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 739 | |
| 740 | class TupleTest(unittest.TestCase): |
| 741 | |
| 742 | # Tuples have a small, fixed-sized head and an array of pointers to |
| 743 | # data. Since we're testing 64-bit addressing, we can assume that the |
| 744 | # pointers are 8 bytes, and that thus that the tuples take up 8 bytes |
| 745 | # per size. |
| 746 | |
| 747 | # As a side-effect of testing long tuples, these tests happen to test |
| 748 | # having more than 2<<31 references to any given object. Hence the |
| 749 | # use of different types of objects as contents in different tests. |
| 750 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 751 | @bigmemtest(size=_2G + 2, memuse=16) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 752 | def test_compare(self, size): |
Guido van Rossum | ef87d6e | 2007-05-02 19:09:54 +0000 | [diff] [blame] | 753 | t1 = ('',) * size |
| 754 | t2 = ('',) * size |
Guido van Rossum | e61fd5b | 2007-07-11 12:20:59 +0000 | [diff] [blame] | 755 | self.assertEqual(t1, t2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 756 | del t2 |
Guido van Rossum | ef87d6e | 2007-05-02 19:09:54 +0000 | [diff] [blame] | 757 | t2 = ('',) * (size + 1) |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 758 | self.assertFalse(t1 == t2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 759 | del t2 |
| 760 | t2 = (1,) * size |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 761 | self.assertFalse(t1 == t2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 762 | |
| 763 | # Test concatenating into a single tuple of more than 2G in length, |
| 764 | # and concatenating a tuple of more than 2G in length separately, so |
| 765 | # the smaller test still gets run even if there isn't memory for the |
| 766 | # larger test (but we still let the tester know the larger test is |
| 767 | # skipped, in verbose mode.) |
| 768 | def basic_concat_test(self, size): |
| 769 | t = ((),) * size |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 770 | self.assertEqual(len(t), size) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 771 | t = t + t |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 772 | self.assertEqual(len(t), size * 2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 773 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 774 | @bigmemtest(size=_2G // 2 + 2, memuse=24) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 775 | def test_concat_small(self, size): |
| 776 | return self.basic_concat_test(size) |
| 777 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 778 | @bigmemtest(size=_2G + 2, memuse=24) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 779 | def test_concat_large(self, size): |
| 780 | return self.basic_concat_test(size) |
| 781 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 782 | @bigmemtest(size=_2G // 5 + 10, memuse=8 * 5) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 783 | def test_contains(self, size): |
| 784 | t = (1, 2, 3, 4, 5) * size |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 785 | self.assertEqual(len(t), size * 5) |
Benjamin Peterson | 577473f | 2010-01-19 00:09:57 +0000 | [diff] [blame] | 786 | self.assertIn(5, t) |
Ezio Melotti | b58e0bd | 2010-01-23 15:40:09 +0000 | [diff] [blame] | 787 | self.assertNotIn((1, 2, 3, 4, 5), t) |
| 788 | self.assertNotIn(0, t) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 789 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 790 | @bigmemtest(size=_2G + 10, memuse=8) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 791 | def test_hash(self, size): |
| 792 | t1 = (0,) * size |
| 793 | h1 = hash(t1) |
| 794 | del t1 |
| 795 | t2 = (0,) * (size + 1) |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 796 | self.assertFalse(h1 == hash(t2)) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 797 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 798 | @bigmemtest(size=_2G + 10, memuse=8) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 799 | def test_index_and_slice(self, size): |
| 800 | t = (None,) * size |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 801 | self.assertEqual(len(t), size) |
| 802 | self.assertEqual(t[-1], None) |
| 803 | self.assertEqual(t[5], None) |
| 804 | self.assertEqual(t[size - 1], None) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 805 | self.assertRaises(IndexError, operator.getitem, t, size) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 806 | self.assertEqual(t[:5], (None,) * 5) |
| 807 | self.assertEqual(t[-5:], (None,) * 5) |
| 808 | self.assertEqual(t[20:25], (None,) * 5) |
| 809 | self.assertEqual(t[-25:-20], (None,) * 5) |
| 810 | self.assertEqual(t[size - 5:], (None,) * 5) |
| 811 | self.assertEqual(t[size - 5:size], (None,) * 5) |
| 812 | self.assertEqual(t[size - 6:size - 2], (None,) * 4) |
| 813 | self.assertEqual(t[size:size], ()) |
| 814 | self.assertEqual(t[size:size+5], ()) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 815 | |
| 816 | # Like test_concat, split in two. |
| 817 | def basic_test_repeat(self, size): |
| 818 | t = ('',) * size |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 819 | self.assertEqual(len(t), size) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 820 | t = t * 2 |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 821 | self.assertEqual(len(t), size * 2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 822 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 823 | @bigmemtest(size=_2G // 2 + 2, memuse=24) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 824 | def test_repeat_small(self, size): |
| 825 | return self.basic_test_repeat(size) |
| 826 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 827 | @bigmemtest(size=_2G + 2, memuse=24) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 828 | def test_repeat_large(self, size): |
| 829 | return self.basic_test_repeat(size) |
| 830 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 831 | @bigmemtest(size=_1G - 1, memuse=12) |
Neal Norwitz | 3ce5d92 | 2008-08-24 07:08:55 +0000 | [diff] [blame] | 832 | def test_repeat_large_2(self, size): |
| 833 | return self.basic_test_repeat(size) |
| 834 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 835 | @bigmemtest(size=_1G - 1, memuse=9) |
Neal Norwitz | 3ce5d92 | 2008-08-24 07:08:55 +0000 | [diff] [blame] | 836 | def test_from_2G_generator(self, size): |
Antoine Pitrou | ea510eb | 2010-11-08 21:40:13 +0000 | [diff] [blame] | 837 | self.skipTest("test needs much more memory than advertised, see issue5438") |
Neal Norwitz | 3ce5d92 | 2008-08-24 07:08:55 +0000 | [diff] [blame] | 838 | try: |
| 839 | t = tuple(range(size)) |
| 840 | except MemoryError: |
| 841 | pass # acceptable on 32-bit |
| 842 | else: |
| 843 | count = 0 |
| 844 | for item in t: |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 845 | self.assertEqual(item, count) |
Neal Norwitz | 3ce5d92 | 2008-08-24 07:08:55 +0000 | [diff] [blame] | 846 | count += 1 |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 847 | self.assertEqual(count, size) |
Neal Norwitz | 3ce5d92 | 2008-08-24 07:08:55 +0000 | [diff] [blame] | 848 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 849 | @bigmemtest(size=_1G - 25, memuse=9) |
Neal Norwitz | 3ce5d92 | 2008-08-24 07:08:55 +0000 | [diff] [blame] | 850 | def test_from_almost_2G_generator(self, size): |
Antoine Pitrou | ea510eb | 2010-11-08 21:40:13 +0000 | [diff] [blame] | 851 | self.skipTest("test needs much more memory than advertised, see issue5438") |
Neal Norwitz | 3ce5d92 | 2008-08-24 07:08:55 +0000 | [diff] [blame] | 852 | try: |
| 853 | t = tuple(range(size)) |
| 854 | count = 0 |
| 855 | for item in t: |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 856 | self.assertEqual(item, count) |
Neal Norwitz | 3ce5d92 | 2008-08-24 07:08:55 +0000 | [diff] [blame] | 857 | count += 1 |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 858 | self.assertEqual(count, size) |
Neal Norwitz | 3ce5d92 | 2008-08-24 07:08:55 +0000 | [diff] [blame] | 859 | except MemoryError: |
| 860 | pass # acceptable, expected on 32-bit |
| 861 | |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 862 | # Like test_concat, split in two. |
def basic_test_repr(self, size):
    """Check the repr of a tuple of ``size`` zeros via length, ends and count.

    The full repr is never compared against an expected string; only its
    length, its first and last five characters and its number of '0'
    characters are inspected.
    """
    zeros = (0,) * size
    text = repr(zeros)
    # "(0, 0, ..., 0)": one digit per item, ", " between items, plus the
    # two parentheses -- three characters per item in total.
    self.assertEqual(len(text), size * 3)
    head, tail = text[:5], text[-5:]
    self.assertEqual(head, '(0, 0')
    self.assertEqual(tail, '0, 0)')
    self.assertEqual(text.count('0'), size)
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 871 | |
@bigmemtest(size=_2G // 3 + 2, memuse=8 + 3 * character_size)
def test_repr_small(self, size):
    """Run the shared tuple repr check with ``_2G // 3 + 2`` items."""
    return self.basic_test_repr(size)
| 875 | |
@bigmemtest(size=_2G + 2, memuse=8 + 3 * character_size)
def test_repr_large(self, size):
    """Run the shared tuple repr check with ``_2G + 2`` items."""
    return self.basic_test_repr(size)
| 879 | |
| 880 | class ListTest(unittest.TestCase): |
| 881 | |
| 882 | # Like tuples, lists have a small, fixed-sized head and an array of |
| 883 | # pointers to data, so 8 bytes per size. Also like tuples, we make the |
| 884 | # lists hold references to various objects to test their refcount |
| 885 | # limits. |
| 886 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 887 | @bigmemtest(size=_2G + 2, memuse=16) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 888 | def test_compare(self, size): |
Guido van Rossum | ef87d6e | 2007-05-02 19:09:54 +0000 | [diff] [blame] | 889 | l1 = [''] * size |
| 890 | l2 = [''] * size |
Guido van Rossum | e61fd5b | 2007-07-11 12:20:59 +0000 | [diff] [blame] | 891 | self.assertEqual(l1, l2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 892 | del l2 |
Guido van Rossum | ef87d6e | 2007-05-02 19:09:54 +0000 | [diff] [blame] | 893 | l2 = [''] * (size + 1) |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 894 | self.assertFalse(l1 == l2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 895 | del l2 |
| 896 | l2 = [2] * size |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 897 | self.assertFalse(l1 == l2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 898 | |
| 899 | # Test concatenating into a single list of more than 2G in length, |
| 900 | # and concatenating a list of more than 2G in length separately, so |
| 901 | # the smaller test still gets run even if there isn't memory for the |
| 902 | # larger test (but we still let the tester know the larger test is |
| 903 | # skipped, in verbose mode.) |
def basic_test_concat(self, size):
    """Concatenate a ``size``-item list with itself and check the lengths."""
    cells = [[]] * size
    self.assertEqual(len(cells), size)
    cells = cells + cells
    self.assertEqual(len(cells), 2 * size)
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 909 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 910 | @bigmemtest(size=_2G // 2 + 2, memuse=24) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 911 | def test_concat_small(self, size): |
| 912 | return self.basic_test_concat(size) |
| 913 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 914 | @bigmemtest(size=_2G + 2, memuse=24) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 915 | def test_concat_large(self, size): |
| 916 | return self.basic_test_concat(size) |
| 917 | |
def basic_test_inplace_concat(self, size):
    """Extend a list with itself via ``+=`` and check length and identity.

    Every slot refers to the same ``sys.stdout`` object, so items taken
    from either half of the doubled list must be identical.
    """
    streams = [sys.stdout] * size
    streams += streams
    self.assertEqual(len(streams), 2 * size)
    self.assertIs(streams[0], streams[-1])
    # One index on each side of the original/appended boundary.
    self.assertIs(streams[size - 1], streams[size + 1])
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 924 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 925 | @bigmemtest(size=_2G // 2 + 2, memuse=24) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 926 | def test_inplace_concat_small(self, size): |
| 927 | return self.basic_test_inplace_concat(size) |
| 928 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 929 | @bigmemtest(size=_2G + 2, memuse=24) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 930 | def test_inplace_concat_large(self, size): |
| 931 | return self.basic_test_inplace_concat(size) |
| 932 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 933 | @bigmemtest(size=_2G // 5 + 10, memuse=8 * 5) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 934 | def test_contains(self, size): |
| 935 | l = [1, 2, 3, 4, 5] * size |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 936 | self.assertEqual(len(l), size * 5) |
Benjamin Peterson | 577473f | 2010-01-19 00:09:57 +0000 | [diff] [blame] | 937 | self.assertIn(5, l) |
Ezio Melotti | b58e0bd | 2010-01-23 15:40:09 +0000 | [diff] [blame] | 938 | self.assertNotIn([1, 2, 3, 4, 5], l) |
| 939 | self.assertNotIn(0, l) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 940 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 941 | @bigmemtest(size=_2G + 10, memuse=8) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 942 | def test_hash(self, size): |
| 943 | l = [0] * size |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 944 | self.assertRaises(TypeError, hash, l) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 945 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 946 | @bigmemtest(size=_2G + 10, memuse=8) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 947 | def test_index_and_slice(self, size): |
| 948 | l = [None] * size |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 949 | self.assertEqual(len(l), size) |
| 950 | self.assertEqual(l[-1], None) |
| 951 | self.assertEqual(l[5], None) |
| 952 | self.assertEqual(l[size - 1], None) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 953 | self.assertRaises(IndexError, operator.getitem, l, size) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 954 | self.assertEqual(l[:5], [None] * 5) |
| 955 | self.assertEqual(l[-5:], [None] * 5) |
| 956 | self.assertEqual(l[20:25], [None] * 5) |
| 957 | self.assertEqual(l[-25:-20], [None] * 5) |
| 958 | self.assertEqual(l[size - 5:], [None] * 5) |
| 959 | self.assertEqual(l[size - 5:size], [None] * 5) |
| 960 | self.assertEqual(l[size - 6:size - 2], [None] * 4) |
| 961 | self.assertEqual(l[size:size], []) |
| 962 | self.assertEqual(l[size:size+5], []) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 963 | |
| 964 | l[size - 2] = 5 |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 965 | self.assertEqual(len(l), size) |
| 966 | self.assertEqual(l[-3:], [None, 5, None]) |
| 967 | self.assertEqual(l.count(5), 1) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 968 | self.assertRaises(IndexError, operator.setitem, l, size, 6) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 969 | self.assertEqual(len(l), size) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 970 | |
| 971 | l[size - 7:] = [1, 2, 3, 4, 5] |
| 972 | size -= 2 |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 973 | self.assertEqual(len(l), size) |
| 974 | self.assertEqual(l[-7:], [None, None, 1, 2, 3, 4, 5]) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 975 | |
| 976 | l[:7] = [1, 2, 3, 4, 5] |
| 977 | size -= 2 |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 978 | self.assertEqual(len(l), size) |
| 979 | self.assertEqual(l[:7], [1, 2, 3, 4, 5, None, None]) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 980 | |
| 981 | del l[size - 1] |
| 982 | size -= 1 |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 983 | self.assertEqual(len(l), size) |
| 984 | self.assertEqual(l[-1], 4) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 985 | |
| 986 | del l[-2:] |
| 987 | size -= 2 |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 988 | self.assertEqual(len(l), size) |
| 989 | self.assertEqual(l[-1], 2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 990 | |
| 991 | del l[0] |
| 992 | size -= 1 |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 993 | self.assertEqual(len(l), size) |
| 994 | self.assertEqual(l[0], 2) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 995 | |
| 996 | del l[:2] |
| 997 | size -= 2 |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 998 | self.assertEqual(len(l), size) |
| 999 | self.assertEqual(l[0], 4) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1000 | |
| 1001 | # Like test_concat, split in two. |
def basic_test_repeat(self, size):
    """Check ``list * n`` for an empty list and for a one-item list."""
    items = [] * size
    # Repeating an empty list gives an empty list, whatever the count.
    self.assertFalse(items)
    items = [''] * size
    self.assertEqual(len(items), size)
    items = items * 2
    self.assertEqual(len(items), 2 * size)
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1009 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 1010 | @bigmemtest(size=_2G // 2 + 2, memuse=24) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1011 | def test_repeat_small(self, size): |
| 1012 | return self.basic_test_repeat(size) |
| 1013 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 1014 | @bigmemtest(size=_2G + 2, memuse=24) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1015 | def test_repeat_large(self, size): |
| 1016 | return self.basic_test_repeat(size) |
| 1017 | |
def basic_test_inplace_repeat(self, size):
    """Check ``*=`` both growing to ``size`` items and doubling from it."""
    # Grow a one-item list to ``size`` items in place.
    items = ['']
    items *= size
    self.assertEqual(len(items), size)
    self.assertIs(items[0], items[-1])
    # Drop the first list before building the second one.
    del items

    # Double a ``size``-item list in place.
    items = [''] * size
    items *= 2
    self.assertEqual(len(items), 2 * size)
    self.assertIs(items[size - 1], items[-1])
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1029 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 1030 | @bigmemtest(size=_2G // 2 + 2, memuse=16) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1031 | def test_inplace_repeat_small(self, size): |
| 1032 | return self.basic_test_inplace_repeat(size) |
| 1033 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 1034 | @bigmemtest(size=_2G + 2, memuse=16) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1035 | def test_inplace_repeat_large(self, size): |
| 1036 | return self.basic_test_inplace_repeat(size) |
| 1037 | |
def basic_test_repr(self, size):
    """Check the repr of a list of ``size`` zeros via length, ends and count.

    The full repr is never compared against an expected string; only its
    length, its first and last five characters and its number of '0'
    characters are inspected.
    """
    zeros = [0] * size
    text = repr(zeros)
    # "[0, 0, ..., 0]": one digit per item, ", " between items, plus the
    # two brackets -- three characters per item in total.
    self.assertEqual(len(text), size * 3)
    head, tail = text[:5], text[-5:]
    self.assertEqual(head, '[0, 0')
    self.assertEqual(tail, '0, 0]')
    self.assertEqual(text.count('0'), size)
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1046 | |
@bigmemtest(size=_2G // 3 + 2, memuse=8 + 3 * character_size)
def test_repr_small(self, size):
    """Run the shared list repr check with ``_2G // 3 + 2`` items."""
    return self.basic_test_repr(size)
| 1050 | |
@bigmemtest(size=_2G + 2, memuse=8 + 3 * character_size)
def test_repr_large(self, size):
    """Run the shared list repr check with ``_2G + 2`` items."""
    return self.basic_test_repr(size)
| 1054 | |
| 1055 | # list overallocates ~1/8th of the total size (on first expansion) so |
| 1056 | # the single list.append call puts memuse at 9 bytes per size. |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 1057 | @bigmemtest(size=_2G, memuse=9) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1058 | def test_append(self, size): |
| 1059 | l = [object()] * size |
| 1060 | l.append(object()) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 1061 | self.assertEqual(len(l), size+1) |
Benjamin Peterson | c9c0f20 | 2009-06-30 23:06:06 +0000 | [diff] [blame] | 1062 | self.assertTrue(l[-3] is l[-2]) |
| 1063 | self.assertFalse(l[-2] is l[-1]) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1064 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 1065 | @bigmemtest(size=_2G // 5 + 2, memuse=8 * 5) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1066 | def test_count(self, size): |
| 1067 | l = [1, 2, 3, 4, 5] * size |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 1068 | self.assertEqual(l.count(1), size) |
| 1069 | self.assertEqual(l.count("1"), 0) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1070 | |
def basic_test_extend(self, size):
    """Extend a list with itself and check length and item identity.

    Every slot refers to the ``object`` type itself, so items taken from
    either half of the doubled list must be identical.
    """
    items = [object] * size
    items.extend(items)
    self.assertEqual(len(items), 2 * size)
    self.assertIs(items[0], items[-1])
    # One index on each side of the original/appended boundary.
    self.assertIs(items[size - 1], items[size + 1])
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1077 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 1078 | @bigmemtest(size=_2G // 2 + 2, memuse=16) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1079 | def test_extend_small(self, size): |
| 1080 | return self.basic_test_extend(size) |
| 1081 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 1082 | @bigmemtest(size=_2G + 2, memuse=16) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1083 | def test_extend_large(self, size): |
| 1084 | return self.basic_test_extend(size) |
| 1085 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 1086 | @bigmemtest(size=_2G // 5 + 2, memuse=8 * 5) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1087 | def test_index(self, size): |
Guido van Rossum | e2a383d | 2007-01-15 16:59:06 +0000 | [diff] [blame] | 1088 | l = [1, 2, 3, 4, 5] * size |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1089 | size *= 5 |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 1090 | self.assertEqual(l.index(1), 0) |
| 1091 | self.assertEqual(l.index(5, size - 5), size - 1) |
| 1092 | self.assertEqual(l.index(5, size - 5, size), size - 1) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1093 | self.assertRaises(ValueError, l.index, 1, size - 4, size) |
Guido van Rossum | e2a383d | 2007-01-15 16:59:06 +0000 | [diff] [blame] | 1094 | self.assertRaises(ValueError, l.index, 6) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1095 | |
| 1096 | # This test suffers from overallocation, just like test_append. |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 1097 | @bigmemtest(size=_2G + 10, memuse=9) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1098 | def test_insert(self, size): |
| 1099 | l = [1.0] * size |
| 1100 | l.insert(size - 1, "A") |
| 1101 | size += 1 |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 1102 | self.assertEqual(len(l), size) |
| 1103 | self.assertEqual(l[-3:], [1.0, "A", 1.0]) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1104 | |
| 1105 | l.insert(size + 1, "B") |
| 1106 | size += 1 |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 1107 | self.assertEqual(len(l), size) |
| 1108 | self.assertEqual(l[-3:], ["A", 1.0, "B"]) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1109 | |
| 1110 | l.insert(1, "C") |
| 1111 | size += 1 |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 1112 | self.assertEqual(len(l), size) |
| 1113 | self.assertEqual(l[:3], [1.0, "C", 1.0]) |
| 1114 | self.assertEqual(l[size - 3:], ["A", 1.0, "B"]) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1115 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 1116 | @bigmemtest(size=_2G // 5 + 4, memuse=8 * 5) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1117 | def test_pop(self, size): |
Guido van Rossum | ef87d6e | 2007-05-02 19:09:54 +0000 | [diff] [blame] | 1118 | l = ["a", "b", "c", "d", "e"] * size |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1119 | size *= 5 |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 1120 | self.assertEqual(len(l), size) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1121 | |
| 1122 | item = l.pop() |
| 1123 | size -= 1 |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 1124 | self.assertEqual(len(l), size) |
| 1125 | self.assertEqual(item, "e") |
| 1126 | self.assertEqual(l[-2:], ["c", "d"]) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1127 | |
| 1128 | item = l.pop(0) |
| 1129 | size -= 1 |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 1130 | self.assertEqual(len(l), size) |
| 1131 | self.assertEqual(item, "a") |
| 1132 | self.assertEqual(l[:2], ["b", "c"]) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1133 | |
| 1134 | item = l.pop(size - 2) |
| 1135 | size -= 1 |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 1136 | self.assertEqual(len(l), size) |
| 1137 | self.assertEqual(item, "c") |
| 1138 | self.assertEqual(l[-2:], ["b", "d"]) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1139 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 1140 | @bigmemtest(size=_2G + 10, memuse=8) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1141 | def test_remove(self, size): |
| 1142 | l = [10] * size |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 1143 | self.assertEqual(len(l), size) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1144 | |
| 1145 | l.remove(10) |
| 1146 | size -= 1 |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 1147 | self.assertEqual(len(l), size) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1148 | |
| 1149 | # Because of the earlier l.remove(), this append doesn't trigger |
| 1150 | # a resize. |
| 1151 | l.append(5) |
| 1152 | size += 1 |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 1153 | self.assertEqual(len(l), size) |
| 1154 | self.assertEqual(l[-2:], [10, 5]) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1155 | l.remove(5) |
| 1156 | size -= 1 |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 1157 | self.assertEqual(len(l), size) |
| 1158 | self.assertEqual(l[-2:], [10, 10]) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1159 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 1160 | @bigmemtest(size=_2G // 5 + 2, memuse=8 * 5) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1161 | def test_reverse(self, size): |
| 1162 | l = [1, 2, 3, 4, 5] * size |
| 1163 | l.reverse() |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 1164 | self.assertEqual(len(l), size * 5) |
| 1165 | self.assertEqual(l[-5:], [5, 4, 3, 2, 1]) |
| 1166 | self.assertEqual(l[:5], [5, 4, 3, 2, 1]) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1167 | |
Antoine Pitrou | 94190bb | 2011-10-04 10:22:36 +0200 | [diff] [blame] | 1168 | @bigmemtest(size=_2G // 5 + 2, memuse=8 * 5) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1169 | def test_sort(self, size): |
| 1170 | l = [1, 2, 3, 4, 5] * size |
| 1171 | l.sort() |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 1172 | self.assertEqual(len(l), size * 5) |
| 1173 | self.assertEqual(l.count(1), size) |
| 1174 | self.assertEqual(l[:10], [1] * 10) |
| 1175 | self.assertEqual(l[-10:], [5] * 10) |
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1176 | |
def test_main():
    """Run all five bigmem test case classes via ``support.run_unittest``."""
    test_classes = (
        StrTest,
        BytesTest,
        BytearrayTest,
        TupleTest,
        ListTest,
    )
    support.run_unittest(*test_classes)
Thomas Wouters | 477c8d5 | 2006-05-27 19:21:47 +0000 | [diff] [blame] | 1180 | |
if __name__ == '__main__':
    # When run as a script, an optional first command-line argument is
    # passed to support.set_memlimit() before the tests are started.
    cli_args = sys.argv[1:]
    if cli_args:
        support.set_memlimit(cli_args[0])
    test_main()