blob: d7925290206c2bf01e5232d8a00be036faea2cf4 [file] [log] [blame]
Walter Dörwald0fd583c2003-02-21 12:53:50 +00001"""
2Common tests shared by test_str, test_unicode, test_userstring and test_string.
3"""
Jeremy Hyltonf82b04e2000-07-10 17:08:42 +00004
Guido van Rossum360e4b82007-05-14 22:51:27 +00005import unittest, string, sys, struct
Benjamin Petersonee8712c2008-05-20 21:35:26 +00006from test import support
Raymond Hettinger53dbe392008-02-12 20:03:09 +00007from collections import UserList
Jeremy Hylton20f41b62000-07-11 03:31:55 +00008
class Sequence:
    """Bare-bones sequence wrapper.

    Only ``__len__`` and ``__getitem__`` are provided; both simply
    delegate to the wrapped object stored in ``self.seq``.
    """

    def __init__(self, seq='wxyz'):
        self.seq = seq

    def __len__(self):
        return len(self.seq)

    def __getitem__(self, i):
        return self.seq[i]
13
class BadSeq1(Sequence):
    """Sequence whose items are a mix of ints and a str.

    NOTE(review): presumably handed to string methods that must reject
    non-string items -- confirm against the callers further down the file.
    """

    def __init__(self):
        self.seq = [7, 'hello', 123]

    def __str__(self):
        template = '{0} {1} {2}'
        return template.format(*self.seq)
Jeremy Hyltonf82b04e2000-07-10 17:08:42 +000017
class BadSeq2(Sequence):
    """Sequence that misreports its length.

    It holds three items, yet ``__len__`` always answers 8.
    """

    def __init__(self):
        self.seq = ['a', 'b', 'c']

    def __len__(self):
        return 8
21
Georg Brandlc7885542007-03-06 19:16:20 +000022class BaseTest(unittest.TestCase):
23 # These tests are for buffers of values (bytes) and not
24 # specific to character interpretation, used for bytes objects
25 # and various string implementations
Jeremy Hyltonf82b04e2000-07-10 17:08:42 +000026
    # The type to be tested
    # Change in subclasses to change the behaviour of fixtype()
29 type2test = None
Jeremy Hyltonf82b04e2000-07-10 17:08:42 +000030
def fixtype(self, obj):
    """Convert the str objects inside *obj* to the type under test.

    Tests spell all their arguments as str objects; this helper turns
    them into ``self.__class__.type2test`` instances.  Lists, tuples
    and dicts (both keys and values) are converted recursively; any
    other object is returned unchanged.
    """
    convert = self.fixtype
    if isinstance(obj, str):
        return self.__class__.type2test(obj)
    if isinstance(obj, list):
        return [convert(item) for item in obj]
    if isinstance(obj, tuple):
        return tuple(convert(item) for item in obj)
    if isinstance(obj, dict):
        return {convert(key): convert(value) for key, value in obj.items()}
    return obj
Jeremy Hyltonf82b04e2000-07-10 17:08:42 +000048
def checkequal(self, result, obj, methodname, *args):
    """Check that ``obj.methodname(*args)`` returns *result*.

    *result*, *obj* and *args* are first passed through ``fixtype()``.
    When the method hands back the receiver object itself, the call is
    repeated on an instance of a subclass of the tested type, and that
    call must not return the very object it was invoked on.
    """
    expected = self.fixtype(result)
    receiver = self.fixtype(obj)
    call_args = self.fixtype(args)
    actual = getattr(receiver, methodname)(*call_args)
    self.assertEqual(expected, actual)

    if receiver is not actual:
        return

    # The original object came back: make sure that
    # this doesn't happen with subclasses.
    try:
        class subtype(self.__class__.type2test):
            pass
    except TypeError:
        # The tested type cannot be subclassed; skip the extra check.
        return

    derived = subtype(receiver)
    self.assertIsNot(derived, getattr(derived, methodname)(*call_args))
Jeremy Hyltonf82b04e2000-07-10 17:08:42 +000071
def checkraises(self, exc, obj, methodname, *args):
    """Check that ``obj.methodname(*args)`` raises *exc*.

    *obj* and *args* are converted with ``fixtype()`` first.  The method
    is looked up before ``assertRaises`` is entered, so a failing
    attribute lookup is not covered by the check.
    """
    target = self.fixtype(obj)
    call_args = self.fixtype(args)
    bound = getattr(target, methodname)
    self.assertRaises(exc, bound, *call_args)
Jeremy Hyltonf82b04e2000-07-10 17:08:42 +000081
def checkcall(self, obj, methodname, *args):
    """Call ``obj.methodname(*args)`` without checking the outcome.

    *obj* and *args* are converted with ``fixtype()`` first; the return
    value of the call is discarded.
    """
    target = self.fixtype(obj)
    call_args = self.fixtype(args)
    method = getattr(target, methodname)
    method(*call_args)
Walter Dörwald0fd583c2003-02-21 12:53:50 +000087
Walter Dörwald0fd583c2003-02-21 12:53:50 +000088 def test_count(self):
89 self.checkequal(3, 'aaa', 'count', 'a')
90 self.checkequal(0, 'aaa', 'count', 'b')
91 self.checkequal(3, 'aaa', 'count', 'a')
92 self.checkequal(0, 'aaa', 'count', 'b')
93 self.checkequal(3, 'aaa', 'count', 'a')
94 self.checkequal(0, 'aaa', 'count', 'b')
95 self.checkequal(0, 'aaa', 'count', 'b')
Thomas Wouters4d70c3d2006-06-08 14:42:34 +000096 self.checkequal(2, 'aaa', 'count', 'a', 1)
97 self.checkequal(0, 'aaa', 'count', 'a', 10)
Walter Dörwald0fd583c2003-02-21 12:53:50 +000098 self.checkequal(1, 'aaa', 'count', 'a', -1)
99 self.checkequal(3, 'aaa', 'count', 'a', -10)
Thomas Wouters4d70c3d2006-06-08 14:42:34 +0000100 self.checkequal(1, 'aaa', 'count', 'a', 0, 1)
101 self.checkequal(3, 'aaa', 'count', 'a', 0, 10)
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000102 self.checkequal(2, 'aaa', 'count', 'a', 0, -1)
103 self.checkequal(0, 'aaa', 'count', 'a', 0, -10)
Thomas Wouters4d70c3d2006-06-08 14:42:34 +0000104 self.checkequal(3, 'aaa', 'count', '', 1)
105 self.checkequal(1, 'aaa', 'count', '', 3)
106 self.checkequal(0, 'aaa', 'count', '', 10)
107 self.checkequal(2, 'aaa', 'count', '', -1)
108 self.checkequal(4, 'aaa', 'count', '', -10)
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000109
Amaury Forgeot d'Arcf2e93682008-09-26 22:48:41 +0000110 self.checkequal(1, '', 'count', '')
111 self.checkequal(0, '', 'count', '', 1, 1)
112 self.checkequal(0, '', 'count', '', sys.maxsize, 0)
113
114 self.checkequal(0, '', 'count', 'xx')
115 self.checkequal(0, '', 'count', 'xx', 1, 1)
116 self.checkequal(0, '', 'count', 'xx', sys.maxsize, 0)
117
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000118 self.checkraises(TypeError, 'hello', 'count')
119 self.checkraises(TypeError, 'hello', 'count', 42)
120
Raymond Hettinger57e74472005-02-20 09:54:53 +0000121 # For a variety of combinations,
122 # verify that str.count() matches an equivalent function
123 # replacing all occurrences and then differencing the string lengths
124 charset = ['', 'a', 'b']
125 digits = 7
126 base = len(charset)
127 teststrings = set()
Guido van Rossum805365e2007-05-07 22:24:25 +0000128 for i in range(base ** digits):
Raymond Hettinger57e74472005-02-20 09:54:53 +0000129 entry = []
Guido van Rossum805365e2007-05-07 22:24:25 +0000130 for j in range(digits):
Raymond Hettinger57e74472005-02-20 09:54:53 +0000131 i, m = divmod(i, base)
132 entry.append(charset[m])
133 teststrings.add(''.join(entry))
Guido van Rossum09549f42007-08-27 20:40:10 +0000134 teststrings = [self.fixtype(ts) for ts in teststrings]
Raymond Hettinger57e74472005-02-20 09:54:53 +0000135 for i in teststrings:
Raymond Hettinger57e74472005-02-20 09:54:53 +0000136 n = len(i)
137 for j in teststrings:
138 r1 = i.count(j)
139 if j:
Guido van Rossum09549f42007-08-27 20:40:10 +0000140 r2, rem = divmod(n - len(i.replace(j, self.fixtype(''))),
141 len(j))
Raymond Hettinger57e74472005-02-20 09:54:53 +0000142 else:
143 r2, rem = len(i)+1, 0
144 if rem or r1 != r2:
Thomas Wouters0e3f5912006-08-11 14:57:12 +0000145 self.assertEqual(rem, 0, '%s != 0 for %s' % (rem, i))
146 self.assertEqual(r1, r2, '%s != %s for %s' % (r1, r2, i))
Raymond Hettinger57e74472005-02-20 09:54:53 +0000147
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000148 def test_find(self):
149 self.checkequal(0, 'abcdefghiabc', 'find', 'abc')
150 self.checkequal(9, 'abcdefghiabc', 'find', 'abc', 1)
151 self.checkequal(-1, 'abcdefghiabc', 'find', 'def', 4)
152
Thomas Wouters4d70c3d2006-06-08 14:42:34 +0000153 self.checkequal(0, 'abc', 'find', '', 0)
154 self.checkequal(3, 'abc', 'find', '', 3)
155 self.checkequal(-1, 'abc', 'find', '', 4)
156
Christian Heimes9cd17752007-11-18 19:35:23 +0000157 # to check the ability to pass None as defaults
158 self.checkequal( 2, 'rrarrrrrrrrra', 'find', 'a')
159 self.checkequal(12, 'rrarrrrrrrrra', 'find', 'a', 4)
160 self.checkequal(-1, 'rrarrrrrrrrra', 'find', 'a', 4, 6)
161 self.checkequal(12, 'rrarrrrrrrrra', 'find', 'a', 4, None)
162 self.checkequal( 2, 'rrarrrrrrrrra', 'find', 'a', None, 6)
163
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000164 self.checkraises(TypeError, 'hello', 'find')
165 self.checkraises(TypeError, 'hello', 'find', 42)
166
Amaury Forgeot d'Arcf2e93682008-09-26 22:48:41 +0000167 self.checkequal(0, '', 'find', '')
168 self.checkequal(-1, '', 'find', '', 1, 1)
169 self.checkequal(-1, '', 'find', '', sys.maxsize, 0)
170
171 self.checkequal(-1, '', 'find', 'xx')
172 self.checkequal(-1, '', 'find', 'xx', 1, 1)
173 self.checkequal(-1, '', 'find', 'xx', sys.maxsize, 0)
174
Antoine Pitrou74edda02010-01-02 21:51:33 +0000175 # issue 7458
176 self.checkequal(-1, 'ab', 'find', 'xxx', sys.maxsize + 1, 0)
177
Raymond Hettinger7cbf1bc2005-02-20 04:07:08 +0000178 # For a variety of combinations,
179 # verify that str.find() matches __contains__
180 # and that the found substring is really at that location
181 charset = ['', 'a', 'b', 'c']
182 digits = 5
183 base = len(charset)
184 teststrings = set()
Guido van Rossum805365e2007-05-07 22:24:25 +0000185 for i in range(base ** digits):
Raymond Hettinger7cbf1bc2005-02-20 04:07:08 +0000186 entry = []
Guido van Rossum805365e2007-05-07 22:24:25 +0000187 for j in range(digits):
Raymond Hettinger7cbf1bc2005-02-20 04:07:08 +0000188 i, m = divmod(i, base)
189 entry.append(charset[m])
190 teststrings.add(''.join(entry))
Guido van Rossum09549f42007-08-27 20:40:10 +0000191 teststrings = [self.fixtype(ts) for ts in teststrings]
Raymond Hettinger7cbf1bc2005-02-20 04:07:08 +0000192 for i in teststrings:
Raymond Hettinger7cbf1bc2005-02-20 04:07:08 +0000193 for j in teststrings:
194 loc = i.find(j)
195 r1 = (loc != -1)
196 r2 = j in i
Antoine Pitrou2e544fb2010-01-02 21:55:17 +0000197 self.assertEqual(r1, r2)
Raymond Hettinger7cbf1bc2005-02-20 04:07:08 +0000198 if loc != -1:
199 self.assertEqual(i[loc:loc+len(j)], j)
200
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000201 def test_rfind(self):
202 self.checkequal(9, 'abcdefghiabc', 'rfind', 'abc')
203 self.checkequal(12, 'abcdefghiabc', 'rfind', '')
204 self.checkequal(0, 'abcdefghiabc', 'rfind', 'abcd')
205 self.checkequal(-1, 'abcdefghiabc', 'rfind', 'abcz')
206
Thomas Wouters4d70c3d2006-06-08 14:42:34 +0000207 self.checkequal(3, 'abc', 'rfind', '', 0)
208 self.checkequal(3, 'abc', 'rfind', '', 3)
209 self.checkequal(-1, 'abc', 'rfind', '', 4)
210
Christian Heimes9cd17752007-11-18 19:35:23 +0000211 # to check the ability to pass None as defaults
212 self.checkequal(12, 'rrarrrrrrrrra', 'rfind', 'a')
213 self.checkequal(12, 'rrarrrrrrrrra', 'rfind', 'a', 4)
214 self.checkequal(-1, 'rrarrrrrrrrra', 'rfind', 'a', 4, 6)
215 self.checkequal(12, 'rrarrrrrrrrra', 'rfind', 'a', 4, None)
216 self.checkequal( 2, 'rrarrrrrrrrra', 'rfind', 'a', None, 6)
217
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000218 self.checkraises(TypeError, 'hello', 'rfind')
219 self.checkraises(TypeError, 'hello', 'rfind', 42)
220
Antoine Pitrouda2ecaf2010-01-02 21:40:36 +0000221 # For a variety of combinations,
222 # verify that str.rfind() matches __contains__
223 # and that the found substring is really at that location
224 charset = ['', 'a', 'b', 'c']
225 digits = 5
226 base = len(charset)
227 teststrings = set()
228 for i in range(base ** digits):
229 entry = []
230 for j in range(digits):
231 i, m = divmod(i, base)
232 entry.append(charset[m])
233 teststrings.add(''.join(entry))
234 teststrings = [self.fixtype(ts) for ts in teststrings]
235 for i in teststrings:
236 for j in teststrings:
237 loc = i.rfind(j)
238 r1 = (loc != -1)
239 r2 = j in i
Antoine Pitrou2e544fb2010-01-02 21:55:17 +0000240 self.assertEqual(r1, r2)
Antoine Pitrouda2ecaf2010-01-02 21:40:36 +0000241 if loc != -1:
242 self.assertEqual(i[loc:loc+len(j)], j)
243
Antoine Pitrou74edda02010-01-02 21:51:33 +0000244 # issue 7458
245 self.checkequal(-1, 'ab', 'rfind', 'xxx', sys.maxsize + 1, 0)
246
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000247 def test_index(self):
248 self.checkequal(0, 'abcdefghiabc', 'index', '')
249 self.checkequal(3, 'abcdefghiabc', 'index', 'def')
250 self.checkequal(0, 'abcdefghiabc', 'index', 'abc')
251 self.checkequal(9, 'abcdefghiabc', 'index', 'abc', 1)
252
253 self.checkraises(ValueError, 'abcdefghiabc', 'index', 'hib')
254 self.checkraises(ValueError, 'abcdefghiab', 'index', 'abc', 1)
255 self.checkraises(ValueError, 'abcdefghi', 'index', 'ghi', 8)
256 self.checkraises(ValueError, 'abcdefghi', 'index', 'ghi', -1)
257
Christian Heimes9cd17752007-11-18 19:35:23 +0000258 # to check the ability to pass None as defaults
259 self.checkequal( 2, 'rrarrrrrrrrra', 'index', 'a')
260 self.checkequal(12, 'rrarrrrrrrrra', 'index', 'a', 4)
261 self.checkraises(ValueError, 'rrarrrrrrrrra', 'index', 'a', 4, 6)
262 self.checkequal(12, 'rrarrrrrrrrra', 'index', 'a', 4, None)
263 self.checkequal( 2, 'rrarrrrrrrrra', 'index', 'a', None, 6)
264
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000265 self.checkraises(TypeError, 'hello', 'index')
266 self.checkraises(TypeError, 'hello', 'index', 42)
267
268 def test_rindex(self):
269 self.checkequal(12, 'abcdefghiabc', 'rindex', '')
270 self.checkequal(3, 'abcdefghiabc', 'rindex', 'def')
271 self.checkequal(9, 'abcdefghiabc', 'rindex', 'abc')
272 self.checkequal(0, 'abcdefghiabc', 'rindex', 'abc', 0, -1)
273
274 self.checkraises(ValueError, 'abcdefghiabc', 'rindex', 'hib')
275 self.checkraises(ValueError, 'defghiabc', 'rindex', 'def', 1)
276 self.checkraises(ValueError, 'defghiabc', 'rindex', 'abc', 0, -1)
277 self.checkraises(ValueError, 'abcdefghi', 'rindex', 'ghi', 0, 8)
278 self.checkraises(ValueError, 'abcdefghi', 'rindex', 'ghi', 0, -1)
279
Christian Heimes9cd17752007-11-18 19:35:23 +0000280 # to check the ability to pass None as defaults
281 self.checkequal(12, 'rrarrrrrrrrra', 'rindex', 'a')
282 self.checkequal(12, 'rrarrrrrrrrra', 'rindex', 'a', 4)
283 self.checkraises(ValueError, 'rrarrrrrrrrra', 'rindex', 'a', 4, 6)
284 self.checkequal(12, 'rrarrrrrrrrra', 'rindex', 'a', 4, None)
285 self.checkequal( 2, 'rrarrrrrrrrra', 'rindex', 'a', None, 6)
286
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000287 self.checkraises(TypeError, 'hello', 'rindex')
288 self.checkraises(TypeError, 'hello', 'rindex', 42)
289
Guido van Rossumcd16bf62007-06-13 18:07:49 +0000290 def test_lower(self):
291 self.checkequal('hello', 'HeLLo', 'lower')
292 self.checkequal('hello', 'hello', 'lower')
293 self.checkraises(TypeError, 'hello', 'lower', 42)
294
295 def test_upper(self):
296 self.checkequal('HELLO', 'HeLLo', 'upper')
297 self.checkequal('HELLO', 'HELLO', 'upper')
298 self.checkraises(TypeError, 'hello', 'upper', 42)
299
300 def test_expandtabs(self):
301 self.checkequal('abc\rab def\ng hi', 'abc\rab\tdef\ng\thi', 'expandtabs')
302 self.checkequal('abc\rab def\ng hi', 'abc\rab\tdef\ng\thi', 'expandtabs', 8)
303 self.checkequal('abc\rab def\ng hi', 'abc\rab\tdef\ng\thi', 'expandtabs', 4)
304 self.checkequal('abc\r\nab def\ng hi', 'abc\r\nab\tdef\ng\thi', 'expandtabs', 4)
305 self.checkequal('abc\rab def\ng hi', 'abc\rab\tdef\ng\thi', 'expandtabs')
306 self.checkequal('abc\rab def\ng hi', 'abc\rab\tdef\ng\thi', 'expandtabs', 8)
307 self.checkequal('abc\r\nab\r\ndef\ng\r\nhi', 'abc\r\nab\r\ndef\ng\r\nhi', 'expandtabs', 4)
308 self.checkequal(' a\n b', ' \ta\n\tb', 'expandtabs', 1)
309
310 self.checkraises(TypeError, 'hello', 'expandtabs', 42, 42)
311 # This test is only valid when sizeof(int) == sizeof(void*) == 4.
Christian Heimesa37d4c62007-12-04 23:02:19 +0000312 if sys.maxsize < (1 << 32) and struct.calcsize('P') == 4:
Guido van Rossumcd16bf62007-06-13 18:07:49 +0000313 self.checkraises(OverflowError,
Christian Heimesa37d4c62007-12-04 23:02:19 +0000314 '\ta\n\tb', 'expandtabs', sys.maxsize)
Guido van Rossumcd16bf62007-06-13 18:07:49 +0000315
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000316 def test_split(self):
Hye-Shik Chang75c00ef2004-01-05 00:29:51 +0000317 # by a char
318 self.checkequal(['a', 'b', 'c', 'd'], 'a|b|c|d', 'split', '|')
Thomas Wouters477c8d52006-05-27 19:21:47 +0000319 self.checkequal(['a|b|c|d'], 'a|b|c|d', 'split', '|', 0)
Hye-Shik Chang75c00ef2004-01-05 00:29:51 +0000320 self.checkequal(['a', 'b|c|d'], 'a|b|c|d', 'split', '|', 1)
321 self.checkequal(['a', 'b', 'c|d'], 'a|b|c|d', 'split', '|', 2)
322 self.checkequal(['a', 'b', 'c', 'd'], 'a|b|c|d', 'split', '|', 3)
323 self.checkequal(['a', 'b', 'c', 'd'], 'a|b|c|d', 'split', '|', 4)
Thomas Wouters477c8d52006-05-27 19:21:47 +0000324 self.checkequal(['a', 'b', 'c', 'd'], 'a|b|c|d', 'split', '|',
Christian Heimesa37d4c62007-12-04 23:02:19 +0000325 sys.maxsize-2)
Hye-Shik Chang75c00ef2004-01-05 00:29:51 +0000326 self.checkequal(['a|b|c|d'], 'a|b|c|d', 'split', '|', 0)
327 self.checkequal(['a', '', 'b||c||d'], 'a||b||c||d', 'split', '|', 2)
328 self.checkequal(['endcase ', ''], 'endcase |', 'split', '|')
Thomas Wouters477c8d52006-05-27 19:21:47 +0000329 self.checkequal(['', ' startcase'], '| startcase', 'split', '|')
330 self.checkequal(['', 'bothcase', ''], '|bothcase|', 'split', '|')
Hye-Shik Chang75c00ef2004-01-05 00:29:51 +0000331 self.checkequal(['a', '', 'b\x00c\x00d'], 'a\x00\x00b\x00c\x00d', 'split', '\x00', 2)
332
Thomas Wouters477c8d52006-05-27 19:21:47 +0000333 self.checkequal(['a']*20, ('a|'*20)[:-1], 'split', '|')
334 self.checkequal(['a']*15 +['a|a|a|a|a'],
335 ('a|'*20)[:-1], 'split', '|', 15)
336
Hye-Shik Chang75c00ef2004-01-05 00:29:51 +0000337 # by string
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000338 self.checkequal(['a', 'b', 'c', 'd'], 'a//b//c//d', 'split', '//')
Hye-Shik Chang75c00ef2004-01-05 00:29:51 +0000339 self.checkequal(['a', 'b//c//d'], 'a//b//c//d', 'split', '//', 1)
340 self.checkequal(['a', 'b', 'c//d'], 'a//b//c//d', 'split', '//', 2)
341 self.checkequal(['a', 'b', 'c', 'd'], 'a//b//c//d', 'split', '//', 3)
342 self.checkequal(['a', 'b', 'c', 'd'], 'a//b//c//d', 'split', '//', 4)
Thomas Wouters477c8d52006-05-27 19:21:47 +0000343 self.checkequal(['a', 'b', 'c', 'd'], 'a//b//c//d', 'split', '//',
Christian Heimesa37d4c62007-12-04 23:02:19 +0000344 sys.maxsize-10)
Hye-Shik Chang75c00ef2004-01-05 00:29:51 +0000345 self.checkequal(['a//b//c//d'], 'a//b//c//d', 'split', '//', 0)
346 self.checkequal(['a', '', 'b////c////d'], 'a////b////c////d', 'split', '//', 2)
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000347 self.checkequal(['endcase ', ''], 'endcase test', 'split', 'test')
Thomas Wouters477c8d52006-05-27 19:21:47 +0000348 self.checkequal(['', ' begincase'], 'test begincase', 'split', 'test')
349 self.checkequal(['', ' bothcase ', ''], 'test bothcase test',
350 'split', 'test')
351 self.checkequal(['a', 'bc'], 'abbbc', 'split', 'bb')
352 self.checkequal(['', ''], 'aaa', 'split', 'aaa')
353 self.checkequal(['aaa'], 'aaa', 'split', 'aaa', 0)
354 self.checkequal(['ab', 'ab'], 'abbaab', 'split', 'ba')
355 self.checkequal(['aaaa'], 'aaaa', 'split', 'aab')
356 self.checkequal([''], '', 'split', 'aaa')
357 self.checkequal(['aa'], 'aa', 'split', 'aaa')
358 self.checkequal(['A', 'bobb'], 'Abbobbbobb', 'split', 'bbobb')
359 self.checkequal(['A', 'B', ''], 'AbbobbBbbobb', 'split', 'bbobb')
360
361 self.checkequal(['a']*20, ('aBLAH'*20)[:-4], 'split', 'BLAH')
362 self.checkequal(['a']*20, ('aBLAH'*20)[:-4], 'split', 'BLAH', 19)
363 self.checkequal(['a']*18 + ['aBLAHa'], ('aBLAH'*20)[:-4],
364 'split', 'BLAH', 18)
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000365
Hye-Shik Chang75c00ef2004-01-05 00:29:51 +0000366 # argument type
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000367 self.checkraises(TypeError, 'hello', 'split', 42, 42, 42)
368
Thomas Wouters477c8d52006-05-27 19:21:47 +0000369 # null case
370 self.checkraises(ValueError, 'hello', 'split', '')
371 self.checkraises(ValueError, 'hello', 'split', '', 0)
372
Hye-Shik Chang3ae811b2003-12-15 18:49:53 +0000373 def test_rsplit(self):
Hye-Shik Chang75c00ef2004-01-05 00:29:51 +0000374 # by a char
375 self.checkequal(['a', 'b', 'c', 'd'], 'a|b|c|d', 'rsplit', '|')
376 self.checkequal(['a|b|c', 'd'], 'a|b|c|d', 'rsplit', '|', 1)
377 self.checkequal(['a|b', 'c', 'd'], 'a|b|c|d', 'rsplit', '|', 2)
378 self.checkequal(['a', 'b', 'c', 'd'], 'a|b|c|d', 'rsplit', '|', 3)
379 self.checkequal(['a', 'b', 'c', 'd'], 'a|b|c|d', 'rsplit', '|', 4)
Thomas Wouters477c8d52006-05-27 19:21:47 +0000380 self.checkequal(['a', 'b', 'c', 'd'], 'a|b|c|d', 'rsplit', '|',
Christian Heimesa37d4c62007-12-04 23:02:19 +0000381 sys.maxsize-100)
Hye-Shik Chang75c00ef2004-01-05 00:29:51 +0000382 self.checkequal(['a|b|c|d'], 'a|b|c|d', 'rsplit', '|', 0)
383 self.checkequal(['a||b||c', '', 'd'], 'a||b||c||d', 'rsplit', '|', 2)
384 self.checkequal(['', ' begincase'], '| begincase', 'rsplit', '|')
Thomas Wouters477c8d52006-05-27 19:21:47 +0000385 self.checkequal(['endcase ', ''], 'endcase |', 'rsplit', '|')
386 self.checkequal(['', 'bothcase', ''], '|bothcase|', 'rsplit', '|')
387
Hye-Shik Chang75c00ef2004-01-05 00:29:51 +0000388 self.checkequal(['a\x00\x00b', 'c', 'd'], 'a\x00\x00b\x00c\x00d', 'rsplit', '\x00', 2)
389
Thomas Wouters477c8d52006-05-27 19:21:47 +0000390 self.checkequal(['a']*20, ('a|'*20)[:-1], 'rsplit', '|')
391 self.checkequal(['a|a|a|a|a']+['a']*15,
392 ('a|'*20)[:-1], 'rsplit', '|', 15)
393
Hye-Shik Chang75c00ef2004-01-05 00:29:51 +0000394 # by string
395 self.checkequal(['a', 'b', 'c', 'd'], 'a//b//c//d', 'rsplit', '//')
396 self.checkequal(['a//b//c', 'd'], 'a//b//c//d', 'rsplit', '//', 1)
397 self.checkequal(['a//b', 'c', 'd'], 'a//b//c//d', 'rsplit', '//', 2)
398 self.checkequal(['a', 'b', 'c', 'd'], 'a//b//c//d', 'rsplit', '//', 3)
399 self.checkequal(['a', 'b', 'c', 'd'], 'a//b//c//d', 'rsplit', '//', 4)
Thomas Wouters477c8d52006-05-27 19:21:47 +0000400 self.checkequal(['a', 'b', 'c', 'd'], 'a//b//c//d', 'rsplit', '//',
Christian Heimesa37d4c62007-12-04 23:02:19 +0000401 sys.maxsize-5)
Hye-Shik Chang75c00ef2004-01-05 00:29:51 +0000402 self.checkequal(['a//b//c//d'], 'a//b//c//d', 'rsplit', '//', 0)
403 self.checkequal(['a////b////c', '', 'd'], 'a////b////c////d', 'rsplit', '//', 2)
404 self.checkequal(['', ' begincase'], 'test begincase', 'rsplit', 'test')
Thomas Wouters477c8d52006-05-27 19:21:47 +0000405 self.checkequal(['endcase ', ''], 'endcase test', 'rsplit', 'test')
406 self.checkequal(['', ' bothcase ', ''], 'test bothcase test',
407 'rsplit', 'test')
408 self.checkequal(['ab', 'c'], 'abbbc', 'rsplit', 'bb')
409 self.checkequal(['', ''], 'aaa', 'rsplit', 'aaa')
410 self.checkequal(['aaa'], 'aaa', 'rsplit', 'aaa', 0)
411 self.checkequal(['ab', 'ab'], 'abbaab', 'rsplit', 'ba')
412 self.checkequal(['aaaa'], 'aaaa', 'rsplit', 'aab')
413 self.checkequal([''], '', 'rsplit', 'aaa')
414 self.checkequal(['aa'], 'aa', 'rsplit', 'aaa')
415 self.checkequal(['bbob', 'A'], 'bbobbbobbA', 'rsplit', 'bbobb')
416 self.checkequal(['', 'B', 'A'], 'bbobbBbbobbA', 'rsplit', 'bbobb')
417
418 self.checkequal(['a']*20, ('aBLAH'*20)[:-4], 'rsplit', 'BLAH')
419 self.checkequal(['a']*20, ('aBLAH'*20)[:-4], 'rsplit', 'BLAH', 19)
420 self.checkequal(['aBLAHa'] + ['a']*18, ('aBLAH'*20)[:-4],
421 'rsplit', 'BLAH', 18)
Hye-Shik Chang75c00ef2004-01-05 00:29:51 +0000422
Hye-Shik Chang75c00ef2004-01-05 00:29:51 +0000423 # argument type
424 self.checkraises(TypeError, 'hello', 'rsplit', 42, 42, 42)
Hye-Shik Chang3ae811b2003-12-15 18:49:53 +0000425
Thomas Wouters477c8d52006-05-27 19:21:47 +0000426 # null case
427 self.checkraises(ValueError, 'hello', 'rsplit', '')
428 self.checkraises(ValueError, 'hello', 'rsplit', '', 0)
429
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000430 def test_replace(self):
Thomas Wouters477c8d52006-05-27 19:21:47 +0000431 EQ = self.checkequal
432
433 # Operations on the empty string
434 EQ("", "", "replace", "", "")
Thomas Wouters4d70c3d2006-06-08 14:42:34 +0000435 EQ("A", "", "replace", "", "A")
Thomas Wouters477c8d52006-05-27 19:21:47 +0000436 EQ("", "", "replace", "A", "")
437 EQ("", "", "replace", "A", "A")
438 EQ("", "", "replace", "", "", 100)
Christian Heimesa37d4c62007-12-04 23:02:19 +0000439 EQ("", "", "replace", "", "", sys.maxsize)
Thomas Wouters477c8d52006-05-27 19:21:47 +0000440
441 # interleave (from=="", 'to' gets inserted everywhere)
442 EQ("A", "A", "replace", "", "")
443 EQ("*A*", "A", "replace", "", "*")
444 EQ("*1A*1", "A", "replace", "", "*1")
445 EQ("*-#A*-#", "A", "replace", "", "*-#")
446 EQ("*-A*-A*-", "AA", "replace", "", "*-")
447 EQ("*-A*-A*-", "AA", "replace", "", "*-", -1)
Christian Heimesa37d4c62007-12-04 23:02:19 +0000448 EQ("*-A*-A*-", "AA", "replace", "", "*-", sys.maxsize)
Thomas Wouters477c8d52006-05-27 19:21:47 +0000449 EQ("*-A*-A*-", "AA", "replace", "", "*-", 4)
450 EQ("*-A*-A*-", "AA", "replace", "", "*-", 3)
451 EQ("*-A*-A", "AA", "replace", "", "*-", 2)
452 EQ("*-AA", "AA", "replace", "", "*-", 1)
453 EQ("AA", "AA", "replace", "", "*-", 0)
454
455 # single character deletion (from=="A", to=="")
456 EQ("", "A", "replace", "A", "")
457 EQ("", "AAA", "replace", "A", "")
458 EQ("", "AAA", "replace", "A", "", -1)
Christian Heimesa37d4c62007-12-04 23:02:19 +0000459 EQ("", "AAA", "replace", "A", "", sys.maxsize)
Thomas Wouters477c8d52006-05-27 19:21:47 +0000460 EQ("", "AAA", "replace", "A", "", 4)
461 EQ("", "AAA", "replace", "A", "", 3)
462 EQ("A", "AAA", "replace", "A", "", 2)
463 EQ("AA", "AAA", "replace", "A", "", 1)
464 EQ("AAA", "AAA", "replace", "A", "", 0)
465 EQ("", "AAAAAAAAAA", "replace", "A", "")
466 EQ("BCD", "ABACADA", "replace", "A", "")
467 EQ("BCD", "ABACADA", "replace", "A", "", -1)
Christian Heimesa37d4c62007-12-04 23:02:19 +0000468 EQ("BCD", "ABACADA", "replace", "A", "", sys.maxsize)
Thomas Wouters477c8d52006-05-27 19:21:47 +0000469 EQ("BCD", "ABACADA", "replace", "A", "", 5)
470 EQ("BCD", "ABACADA", "replace", "A", "", 4)
471 EQ("BCDA", "ABACADA", "replace", "A", "", 3)
472 EQ("BCADA", "ABACADA", "replace", "A", "", 2)
473 EQ("BACADA", "ABACADA", "replace", "A", "", 1)
474 EQ("ABACADA", "ABACADA", "replace", "A", "", 0)
475 EQ("BCD", "ABCAD", "replace", "A", "")
476 EQ("BCD", "ABCADAA", "replace", "A", "")
477 EQ("BCD", "BCD", "replace", "A", "")
478 EQ("*************", "*************", "replace", "A", "")
479 EQ("^A^", "^"+"A"*1000+"^", "replace", "A", "", 999)
480
481 # substring deletion (from=="the", to=="")
482 EQ("", "the", "replace", "the", "")
483 EQ("ater", "theater", "replace", "the", "")
484 EQ("", "thethe", "replace", "the", "")
485 EQ("", "thethethethe", "replace", "the", "")
486 EQ("aaaa", "theatheatheathea", "replace", "the", "")
487 EQ("that", "that", "replace", "the", "")
488 EQ("thaet", "thaet", "replace", "the", "")
489 EQ("here and re", "here and there", "replace", "the", "")
490 EQ("here and re and re", "here and there and there",
Christian Heimesa37d4c62007-12-04 23:02:19 +0000491 "replace", "the", "", sys.maxsize)
Thomas Wouters477c8d52006-05-27 19:21:47 +0000492 EQ("here and re and re", "here and there and there",
493 "replace", "the", "", -1)
494 EQ("here and re and re", "here and there and there",
495 "replace", "the", "", 3)
496 EQ("here and re and re", "here and there and there",
497 "replace", "the", "", 2)
498 EQ("here and re and there", "here and there and there",
499 "replace", "the", "", 1)
500 EQ("here and there and there", "here and there and there",
501 "replace", "the", "", 0)
502 EQ("here and re and re", "here and there and there", "replace", "the", "")
503
504 EQ("abc", "abc", "replace", "the", "")
505 EQ("abcdefg", "abcdefg", "replace", "the", "")
506
507 # substring deletion (from=="bob", to=="")
508 EQ("bob", "bbobob", "replace", "bob", "")
509 EQ("bobXbob", "bbobobXbbobob", "replace", "bob", "")
510 EQ("aaaaaaa", "aaaaaaabob", "replace", "bob", "")
511 EQ("aaaaaaa", "aaaaaaa", "replace", "bob", "")
512
513 # single character replace in place (len(from)==len(to)==1)
514 EQ("Who goes there?", "Who goes there?", "replace", "o", "o")
515 EQ("WhO gOes there?", "Who goes there?", "replace", "o", "O")
Christian Heimesa37d4c62007-12-04 23:02:19 +0000516 EQ("WhO gOes there?", "Who goes there?", "replace", "o", "O", sys.maxsize)
Thomas Wouters477c8d52006-05-27 19:21:47 +0000517 EQ("WhO gOes there?", "Who goes there?", "replace", "o", "O", -1)
518 EQ("WhO gOes there?", "Who goes there?", "replace", "o", "O", 3)
519 EQ("WhO gOes there?", "Who goes there?", "replace", "o", "O", 2)
520 EQ("WhO goes there?", "Who goes there?", "replace", "o", "O", 1)
521 EQ("Who goes there?", "Who goes there?", "replace", "o", "O", 0)
522
523 EQ("Who goes there?", "Who goes there?", "replace", "a", "q")
524 EQ("who goes there?", "Who goes there?", "replace", "W", "w")
525 EQ("wwho goes there?ww", "WWho goes there?WW", "replace", "W", "w")
526 EQ("Who goes there!", "Who goes there?", "replace", "?", "!")
527 EQ("Who goes there!!", "Who goes there??", "replace", "?", "!")
528
529 EQ("Who goes there?", "Who goes there?", "replace", ".", "!")
530
531 # substring replace in place (len(from)==len(to) > 1)
532 EQ("Th** ** a t**sue", "This is a tissue", "replace", "is", "**")
Christian Heimesa37d4c62007-12-04 23:02:19 +0000533 EQ("Th** ** a t**sue", "This is a tissue", "replace", "is", "**", sys.maxsize)
Thomas Wouters477c8d52006-05-27 19:21:47 +0000534 EQ("Th** ** a t**sue", "This is a tissue", "replace", "is", "**", -1)
535 EQ("Th** ** a t**sue", "This is a tissue", "replace", "is", "**", 4)
536 EQ("Th** ** a t**sue", "This is a tissue", "replace", "is", "**", 3)
537 EQ("Th** ** a tissue", "This is a tissue", "replace", "is", "**", 2)
538 EQ("Th** is a tissue", "This is a tissue", "replace", "is", "**", 1)
539 EQ("This is a tissue", "This is a tissue", "replace", "is", "**", 0)
540 EQ("cobob", "bobob", "replace", "bob", "cob")
541 EQ("cobobXcobocob", "bobobXbobobob", "replace", "bob", "cob")
542 EQ("bobob", "bobob", "replace", "bot", "bot")
543
544 # replace single character (len(from)==1, len(to)>1)
545 EQ("ReyKKjaviKK", "Reykjavik", "replace", "k", "KK")
546 EQ("ReyKKjaviKK", "Reykjavik", "replace", "k", "KK", -1)
Christian Heimesa37d4c62007-12-04 23:02:19 +0000547 EQ("ReyKKjaviKK", "Reykjavik", "replace", "k", "KK", sys.maxsize)
Thomas Wouters477c8d52006-05-27 19:21:47 +0000548 EQ("ReyKKjaviKK", "Reykjavik", "replace", "k", "KK", 2)
549 EQ("ReyKKjavik", "Reykjavik", "replace", "k", "KK", 1)
550 EQ("Reykjavik", "Reykjavik", "replace", "k", "KK", 0)
551 EQ("A----B----C----", "A.B.C.", "replace", ".", "----")
552
553 EQ("Reykjavik", "Reykjavik", "replace", "q", "KK")
554
555 # replace substring (len(from)>1, len(to)!=len(from))
556 EQ("ham, ham, eggs and ham", "spam, spam, eggs and spam",
557 "replace", "spam", "ham")
558 EQ("ham, ham, eggs and ham", "spam, spam, eggs and spam",
Christian Heimesa37d4c62007-12-04 23:02:19 +0000559 "replace", "spam", "ham", sys.maxsize)
Thomas Wouters477c8d52006-05-27 19:21:47 +0000560 EQ("ham, ham, eggs and ham", "spam, spam, eggs and spam",
561 "replace", "spam", "ham", -1)
562 EQ("ham, ham, eggs and ham", "spam, spam, eggs and spam",
563 "replace", "spam", "ham", 4)
564 EQ("ham, ham, eggs and ham", "spam, spam, eggs and spam",
565 "replace", "spam", "ham", 3)
566 EQ("ham, ham, eggs and spam", "spam, spam, eggs and spam",
567 "replace", "spam", "ham", 2)
568 EQ("ham, spam, eggs and spam", "spam, spam, eggs and spam",
569 "replace", "spam", "ham", 1)
570 EQ("spam, spam, eggs and spam", "spam, spam, eggs and spam",
571 "replace", "spam", "ham", 0)
572
573 EQ("bobob", "bobobob", "replace", "bobob", "bob")
574 EQ("bobobXbobob", "bobobobXbobobob", "replace", "bobob", "bob")
575 EQ("BOBOBOB", "BOBOBOB", "replace", "bob", "bobby")
576
Guido van Rossum39478e82007-08-27 17:23:59 +0000577 # XXX Commented out. Is there any reason to support buffer objects
578 # as arguments for str.replace()? GvR
Guido van Rossum254348e2007-11-21 19:29:53 +0000579## ba = bytearray('a')
580## bb = bytearray('b')
Guido van Rossum39478e82007-08-27 17:23:59 +0000581## EQ("bbc", "abc", "replace", ba, bb)
582## EQ("aac", "abc", "replace", bb, ba)
Thomas Wouters0e3f5912006-08-11 14:57:12 +0000583
Thomas Wouters477c8d52006-05-27 19:21:47 +0000584 #
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000585 self.checkequal('one@two!three!', 'one!two!three!', 'replace', '!', '@', 1)
586 self.checkequal('onetwothree', 'one!two!three!', 'replace', '!', '')
587 self.checkequal('one@two@three!', 'one!two!three!', 'replace', '!', '@', 2)
588 self.checkequal('one@two@three@', 'one!two!three!', 'replace', '!', '@', 3)
589 self.checkequal('one@two@three@', 'one!two!three!', 'replace', '!', '@', 4)
590 self.checkequal('one!two!three!', 'one!two!three!', 'replace', '!', '@', 0)
591 self.checkequal('one@two@three@', 'one!two!three!', 'replace', '!', '@')
592 self.checkequal('one!two!three!', 'one!two!three!', 'replace', 'x', '@')
593 self.checkequal('one!two!three!', 'one!two!three!', 'replace', 'x', '@', 2)
594 self.checkequal('-a-b-c-', 'abc', 'replace', '', '-')
595 self.checkequal('-a-b-c', 'abc', 'replace', '', '-', 3)
596 self.checkequal('abc', 'abc', 'replace', '', '-', 0)
597 self.checkequal('', '', 'replace', '', '')
598 self.checkequal('abc', 'abc', 'replace', 'ab', '--', 0)
599 self.checkequal('abc', 'abc', 'replace', 'xy', '--')
600 # Next three for SF bug 422088: [OSF1 alpha] string.replace(); died with
601 # MemoryError due to empty result (platform malloc issue when requesting
602 # 0 bytes).
603 self.checkequal('', '123', 'replace', '123', '')
604 self.checkequal('', '123123', 'replace', '123', '')
605 self.checkequal('x', '123x123', 'replace', '123', '')
606
607 self.checkraises(TypeError, 'hello', 'replace')
608 self.checkraises(TypeError, 'hello', 'replace', 42)
609 self.checkraises(TypeError, 'hello', 'replace', 42, 'h')
610 self.checkraises(TypeError, 'hello', 'replace', 'h', 42)
611
def test_replace_overflow(self):
    # Check that replace() detects an oversized result on 32-bit machines.
    # Each call below would need a result of at least 2**16 * 2**16 == 2**32
    # characters, which exceeds sys.maxsize only when it is 2**31 - 1.
    # Everywhere else the test is reported as skipped instead of silently
    # counting as a pass.
    if sys.maxsize != 2147483647 or struct.calcsize("P") > 4:
        self.skipTest("overflow check only applies to 32-bit platforms")
    A2_16 = "A" * (2**16)
    self.checkraises(OverflowError, A2_16, "replace", "", A2_16)
    self.checkraises(OverflowError, A2_16, "replace", "A", A2_16)
    self.checkraises(OverflowError, A2_16, "replace", "AA", A2_16+A2_16)
620
Georg Brandlc7885542007-03-06 19:16:20 +0000621
622
class CommonTest(BaseTest):
    # This test case contains tests that can be used for all
    # string-like classes.  Currently these are str, unicode,
    # UserString and the string module.

    def test_hash(self):
        # SF bug 1054139: += optimization was not invalidating cached hash value
        a = self.type2test('DNSSEC')
        b = self.type2test('')
        for c in a:
            b += c
            # Hash after every append so a stale cached hash would be
            # carried into the final comparison.
            hash(b)
        self.assertEqual(hash(a), hash(b))

    def test_capitalize(self):
        self.checkequal(' hello ', ' hello ', 'capitalize')
        self.checkequal('Hello ', 'Hello ', 'capitalize')
        self.checkequal('Hello ', 'hello ', 'capitalize')
        self.checkequal('Aaaa', 'aaaa', 'capitalize')
        self.checkequal('Aaaa', 'AaAa', 'capitalize')

        # check that titlecased chars are lowered correctly
        # \u1ffc is the titlecased char
        self.checkequal('\u1ffc\u1ff3\u1ff3\u1ff3',
                        '\u1ff3\u1ff3\u1ffc\u1ffc', 'capitalize')
        # check with cased non-letter chars
        self.checkequal('\u24c5\u24e8\u24e3\u24d7\u24de\u24dd',
                        '\u24c5\u24ce\u24c9\u24bd\u24c4\u24c3', 'capitalize')
        self.checkequal('\u24c5\u24e8\u24e3\u24d7\u24de\u24dd',
                        '\u24df\u24e8\u24e3\u24d7\u24de\u24dd', 'capitalize')
        self.checkequal('\u2160\u2171\u2172',
                        '\u2160\u2161\u2162', 'capitalize')
        self.checkequal('\u2160\u2171\u2172',
                        '\u2170\u2171\u2172', 'capitalize')
        # check with Ll chars with no upper - nothing changes here
        self.checkequal('\u019b\u1d00\u1d86\u0221\u1fb7',
                        '\u019b\u1d00\u1d86\u0221\u1fb7', 'capitalize')

        self.checkraises(TypeError, 'hello', 'capitalize', 42)

    def test_lower(self):
        self.checkequal('hello', 'HeLLo', 'lower')
        self.checkequal('hello', 'hello', 'lower')
        self.checkraises(TypeError, 'hello', 'lower', 42)

    def test_upper(self):
        self.checkequal('HELLO', 'HeLLo', 'upper')
        self.checkequal('HELLO', 'HELLO', 'upper')
        self.checkraises(TypeError, 'hello', 'upper', 42)

    def test_expandtabs(self):
        # The column count restarts after '\r' and '\n', so with the default
        # tab size of 8 "ab\t" is padded with 6 spaces and "g\t" with 7;
        # with a tab size of 4 the padding is 2 and 3 spaces respectively.
        self.checkequal('abc\rab      def\ng       hi',
                        'abc\rab\tdef\ng\thi', 'expandtabs')
        self.checkequal('abc\rab      def\ng       hi',
                        'abc\rab\tdef\ng\thi', 'expandtabs', 8)
        self.checkequal('abc\rab  def\ng   hi',
                        'abc\rab\tdef\ng\thi', 'expandtabs', 4)
        self.checkequal('abc\r\nab  def\ng   hi',
                        'abc\r\nab\tdef\ng\thi', 'expandtabs', 4)
        self.checkequal('abc\rab      def\ng       hi',
                        'abc\rab\tdef\ng\thi', 'expandtabs')
        self.checkequal('abc\rab      def\ng       hi',
                        'abc\rab\tdef\ng\thi', 'expandtabs', 8)
        # No tabs at all: the string comes back unchanged.
        self.checkequal('abc\r\nab\r\ndef\ng\r\nhi',
                        'abc\r\nab\r\ndef\ng\r\nhi', 'expandtabs', 4)

        self.checkraises(TypeError, 'hello', 'expandtabs', 42, 42)

    def test_additional_split(self):
        self.checkequal(['this', 'is', 'the', 'split', 'function'],
                        'this is the split function', 'split')

        # by whitespace
        self.checkequal(['a', 'b', 'c', 'd'], 'a b c d ', 'split')
        self.checkequal(['a', 'b c d'], 'a b c d', 'split', None, 1)
        self.checkequal(['a', 'b', 'c d'], 'a b c d', 'split', None, 2)
        self.checkequal(['a', 'b', 'c', 'd'], 'a b c d', 'split', None, 3)
        self.checkequal(['a', 'b', 'c', 'd'], 'a b c d', 'split', None, 4)
        self.checkequal(['a', 'b', 'c', 'd'], 'a b c d', 'split', None,
                        sys.maxsize-1)
        self.checkequal(['a b c d'], 'a b c d', 'split', None, 0)
        self.checkequal(['a b c d'], ' a b c d', 'split', None, 0)
        self.checkequal(['a', 'b', 'c d'], 'a b c d', 'split', None, 2)

        self.checkequal([], ' ', 'split')
        self.checkequal(['a'], ' a ', 'split')
        self.checkequal(['a', 'b'], ' a b ', 'split')
        self.checkequal(['a', 'b '], ' a b ', 'split', None, 1)
        self.checkequal(['a', 'b c '], ' a b c ', 'split', None, 1)
        self.checkequal(['a', 'b', 'c '], ' a b c ', 'split', None, 2)
        self.checkequal(['a', 'b'], '\n\ta \t\r b \v ', 'split')
        aaa = ' a '*20
        self.checkequal(['a']*20, aaa, 'split')
        self.checkequal(['a'] + [aaa[4:]], aaa, 'split', None, 1)
        self.checkequal(['a']*19 + ['a '], aaa, 'split', None, 19)

        # mixed use of str and unicode
        self.checkequal(['a', 'b', 'c d'], 'a b c d', 'split', ' ', 2)

    def test_additional_rsplit(self):
        self.checkequal(['this', 'is', 'the', 'rsplit', 'function'],
                        'this is the rsplit function', 'rsplit')

        # by whitespace
        self.checkequal(['a', 'b', 'c', 'd'], 'a b c d ', 'rsplit')
        self.checkequal(['a b c', 'd'], 'a b c d', 'rsplit', None, 1)
        self.checkequal(['a b', 'c', 'd'], 'a b c d', 'rsplit', None, 2)
        self.checkequal(['a', 'b', 'c', 'd'], 'a b c d', 'rsplit', None, 3)
        self.checkequal(['a', 'b', 'c', 'd'], 'a b c d', 'rsplit', None, 4)
        self.checkequal(['a', 'b', 'c', 'd'], 'a b c d', 'rsplit', None,
                        sys.maxsize-20)
        self.checkequal(['a b c d'], 'a b c d', 'rsplit', None, 0)
        self.checkequal(['a b c d'], 'a b c d ', 'rsplit', None, 0)
        self.checkequal(['a b', 'c', 'd'], 'a b c d', 'rsplit', None, 2)

        self.checkequal([], ' ', 'rsplit')
        self.checkequal(['a'], ' a ', 'rsplit')
        self.checkequal(['a', 'b'], ' a b ', 'rsplit')
        self.checkequal([' a', 'b'], ' a b ', 'rsplit', None, 1)
        self.checkequal([' a b', 'c'], ' a b c ', 'rsplit',
                        None, 1)
        self.checkequal([' a', 'b', 'c'], ' a b c ', 'rsplit',
                        None, 2)
        self.checkequal(['a', 'b'], '\n\ta \t\r b \v ', 'rsplit', None, 88)
        aaa = ' a '*20
        self.checkequal(['a']*20, aaa, 'rsplit')
        self.checkequal([aaa[:-4]] + ['a'], aaa, 'rsplit', None, 1)
        # After 18 splits from the right the unsplit remainder is the first
        # two 'a's with the two spaces that separate them in aaa.
        self.checkequal([' a  a'] + ['a']*18, aaa, 'rsplit', None, 18)

        # mixed use of str and unicode
        self.checkequal(['a b', 'c', 'd'], 'a b c d', 'rsplit', ' ', 2)

    def test_strip(self):
        self.checkequal('hello', ' hello ', 'strip')
        self.checkequal('hello ', ' hello ', 'lstrip')
        self.checkequal(' hello', ' hello ', 'rstrip')
        self.checkequal('hello', 'hello', 'strip')

        # strip/lstrip/rstrip with None arg
        self.checkequal('hello', ' hello ', 'strip', None)
        self.checkequal('hello ', ' hello ', 'lstrip', None)
        self.checkequal(' hello', ' hello ', 'rstrip', None)
        self.checkequal('hello', 'hello', 'strip', None)

        # strip/lstrip/rstrip with str arg
        self.checkequal('hello', 'xyzzyhelloxyzzy', 'strip', 'xyz')
        self.checkequal('helloxyzzy', 'xyzzyhelloxyzzy', 'lstrip', 'xyz')
        self.checkequal('xyzzyhello', 'xyzzyhelloxyzzy', 'rstrip', 'xyz')
        self.checkequal('hello', 'hello', 'strip', 'xyz')

        self.checkraises(TypeError, 'hello', 'strip', 42, 42)
        self.checkraises(TypeError, 'hello', 'lstrip', 42, 42)
        self.checkraises(TypeError, 'hello', 'rstrip', 42, 42)

    def test_ljust(self):
        # Expected values are padded on the right up to the requested width.
        self.checkequal('abc       ', 'abc', 'ljust', 10)
        self.checkequal('abc   ', 'abc', 'ljust', 6)
        # Widths not larger than the string leave it unchanged.
        self.checkequal('abc', 'abc', 'ljust', 3)
        self.checkequal('abc', 'abc', 'ljust', 2)
        self.checkequal('abc*******', 'abc', 'ljust', 10, '*')
        self.checkraises(TypeError, 'abc', 'ljust')

    def test_rjust(self):
        # Expected values are padded on the left up to the requested width.
        self.checkequal('       abc', 'abc', 'rjust', 10)
        self.checkequal('   abc', 'abc', 'rjust', 6)
        # Widths not larger than the string leave it unchanged.
        self.checkequal('abc', 'abc', 'rjust', 3)
        self.checkequal('abc', 'abc', 'rjust', 2)
        self.checkequal('*******abc', 'abc', 'rjust', 10, '*')
        self.checkraises(TypeError, 'abc', 'rjust')

    def test_center(self):
        # With an odd amount of padding the extra fill character goes on the
        # right here (3 left / 4 right for width 10, 1 left / 2 right for
        # width 6), matching the '*' case below.
        self.checkequal('   abc    ', 'abc', 'center', 10)
        self.checkequal(' abc  ', 'abc', 'center', 6)
        # Widths not larger than the string leave it unchanged.
        self.checkequal('abc', 'abc', 'center', 3)
        self.checkequal('abc', 'abc', 'center', 2)
        self.checkequal('***abc****', 'abc', 'center', 10, '*')
        self.checkraises(TypeError, 'abc', 'center')

    def test_swapcase(self):
        self.checkequal('hEllO CoMPuTErS', 'HeLLo cOmpUteRs', 'swapcase')

        self.checkraises(TypeError, 'hello', 'swapcase', 42)

    def test_zfill(self):
        self.checkequal('123', '123', 'zfill', 2)
        self.checkequal('123', '123', 'zfill', 3)
        self.checkequal('0123', '123', 'zfill', 4)
        # A leading sign stays in front of the inserted zeros.
        self.checkequal('+123', '+123', 'zfill', 3)
        self.checkequal('+123', '+123', 'zfill', 4)
        self.checkequal('+0123', '+123', 'zfill', 5)
        self.checkequal('-123', '-123', 'zfill', 3)
        self.checkequal('-123', '-123', 'zfill', 4)
        self.checkequal('-0123', '-123', 'zfill', 5)
        self.checkequal('000', '', 'zfill', 3)
        self.checkequal('34', '34', 'zfill', 1)
        self.checkequal('0034', '34', 'zfill', 4)

        self.checkraises(TypeError, '123', 'zfill')
814
815class MixinStrUnicodeUserStringTest:
816 # additional tests that only work for
817 # stringlike objects, i.e. str, unicode, UserString
818 # (but not the string module)
819
def test_islower(self):
    # Each row is (expected result, subject string).
    cases = (
        (False, ''),
        (True, 'a'),
        (False, 'A'),
        (False, '\n'),
        (True, 'abc'),
        (False, 'aBc'),
        (True, 'abc\n'),
    )
    for expected, subject in cases:
        self.checkequal(expected, subject, 'islower')
    # An extra positional argument must be rejected.
    self.checkraises(TypeError, 'abc', 'islower', 42)
829
def test_isupper(self):
    # Each row is (expected result, subject string).
    cases = (
        (False, ''),
        (False, 'a'),
        (True, 'A'),
        (False, '\n'),
        (True, 'ABC'),
        (False, 'AbC'),
        (True, 'ABC\n'),
    )
    for expected, subject in cases:
        self.checkequal(expected, subject, 'isupper')
    # An extra positional argument must be rejected.
    self.checkraises(TypeError, 'abc', 'isupper', 42)
839
def test_istitle(self):
    # Each row is (expected result, subject string).
    cases = (
        (False, ''),
        (False, 'a'),
        (True, 'A'),
        (False, '\n'),
        (True, 'A Titlecased Line'),
        (True, 'A\nTitlecased Line'),
        (True, 'A Titlecased, Line'),
        (False, 'Not a capitalized String'),
        (False, 'Not\ta Titlecase String'),
        (False, 'Not--a Titlecase String'),
        (False, 'NOT'),
    )
    for expected, subject in cases:
        self.checkequal(expected, subject, 'istitle')
    # An extra positional argument must be rejected.
    self.checkraises(TypeError, 'abc', 'istitle', 42)
853
def test_isspace(self):
    # Each row is (expected result, subject string).
    cases = (
        (False, ''),
        (False, 'a'),
        (True, ' '),
        (True, '\t'),
        (True, '\r'),
        (True, '\n'),
        (True, ' \t\r\n'),
        (False, ' \t\r\na'),
    )
    for expected, subject in cases:
        self.checkequal(expected, subject, 'isspace')
    # An extra positional argument must be rejected.
    self.checkraises(TypeError, 'abc', 'isspace', 42)
864
def test_isalpha(self):
    # Each row is (expected result, subject string).
    cases = (
        (False, ''),
        (True, 'a'),
        (True, 'A'),
        (False, '\n'),
        (True, 'abc'),
        (False, 'aBc123'),
        (False, 'abc\n'),
    )
    for expected, subject in cases:
        self.checkequal(expected, subject, 'isalpha')
    # An extra positional argument must be rejected.
    self.checkraises(TypeError, 'abc', 'isalpha', 42)
874
def test_isalnum(self):
    # Each row is (expected result, subject string).
    cases = (
        (False, ''),
        (True, 'a'),
        (True, 'A'),
        (False, '\n'),
        (True, '123abc456'),
        (True, 'a1b3c'),
        (False, 'aBc000 '),
        (False, 'abc\n'),
    )
    for expected, subject in cases:
        self.checkequal(expected, subject, 'isalnum')
    # An extra positional argument must be rejected.
    self.checkraises(TypeError, 'abc', 'isalnum', 42)
885
def test_isdigit(self):
    # Each row is (expected result, subject string).
    cases = (
        (False, ''),
        (False, 'a'),
        (True, '0'),
        (True, '0123456789'),
        (False, '0123456789a'),
    )
    for expected, subject in cases:
        self.checkequal(expected, subject, 'isdigit')

    # An extra positional argument must be rejected.
    self.checkraises(TypeError, 'abc', 'isdigit', 42)
894
def test_title(self):
    # Each row is (expected title-cased result, subject string).
    cases = (
        (' Hello ', ' hello '),
        ('Hello ', 'hello '),
        ('Hello ', 'Hello '),
        ('Format This As Title String', "fOrMaT thIs aS titLe String"),
        ('Format,This-As*Title;String', "fOrMaT,thIs-aS*titLe;String"),
        ('Getint', "getInt"),
    )
    for expected, subject in cases:
        self.checkequal(expected, subject, 'title')
    # An extra positional argument must be rejected.
    self.checkraises(TypeError, 'hello', 'title', 42)
903
def test_splitlines(self):
    # Each row is (expected list, subject[, keepends]).
    cases = (
        (['abc', 'def', '', 'ghi'], "abc\ndef\n\rghi"),
        (['abc', 'def', '', 'ghi'], "abc\ndef\n\r\nghi"),
        (['abc', 'def', 'ghi'], "abc\ndef\r\nghi"),
        (['abc', 'def', 'ghi'], "abc\ndef\r\nghi\n"),
        (['abc', 'def', 'ghi', ''], "abc\ndef\r\nghi\n\r"),
        (['', 'abc', 'def', 'ghi', ''], "\nabc\ndef\r\nghi\n\r"),
        # With a true keepends argument the line terminators are retained.
        (['\n', 'abc\n', 'def\r\n', 'ghi\n', '\r'], "\nabc\ndef\r\nghi\n\r", 1),
    )
    for expected, subject, *keepends in cases:
        self.checkequal(expected, subject, 'splitlines', *keepends)

    # Two positional arguments are one too many.
    self.checkraises(TypeError, 'abc', 'splitlines', 42, 42)
914
def test_startswith(self):
    # Every row is (expected, subject, prefix[, start[, end]]).
    plain_cases = (
        (True, 'hello', 'he'),
        (True, 'hello', 'hello'),
        (False, 'hello', 'hello world'),
        (True, 'hello', ''),
        (False, 'hello', 'ello'),
        (True, 'hello', 'ello', 1),
        (True, 'hello', 'o', 4),
        (False, 'hello', 'o', 5),
        (True, 'hello', '', 5),
        (False, 'hello', 'lo', 6),
        (True, 'helloworld', 'lowo', 3),
        (True, 'helloworld', 'lowo', 3, 7),
        (False, 'helloworld', 'lowo', 3, 6),
    )
    # test negative indices
    negative_cases = (
        (True, 'hello', 'he', 0, -1),
        (True, 'hello', 'he', -53, -1),
        (False, 'hello', 'hello', 0, -1),
        (False, 'hello', 'hello world', -1, -10),
        (False, 'hello', 'ello', -5),
        (True, 'hello', 'ello', -4),
        (False, 'hello', 'o', -2),
        (True, 'hello', 'o', -1),
        (True, 'hello', '', -3, -3),
        (False, 'hello', 'lo', -9),
    )
    for expected, subject, *call_args in plain_cases + negative_cases:
        self.checkequal(expected, subject, 'startswith', *call_args)

    # The prefix is required and must not be an int.
    self.checkraises(TypeError, 'hello', 'startswith')
    self.checkraises(TypeError, 'hello', 'startswith', 42)

    # test tuple arguments
    tuple_cases = (
        (True, 'hello', ('he', 'ha')),
        (False, 'hello', ('lo', 'llo')),
        (True, 'hello', ('hellox', 'hello')),
        (False, 'hello', ()),
        (True, 'helloworld', ('hellowo', 'rld', 'lowo'), 3),
        (False, 'helloworld', ('hellowo', 'ello', 'rld'), 3),
        (True, 'hello', ('lo', 'he'), 0, -1),
        (False, 'hello', ('he', 'hel'), 0, 1),
        (True, 'hello', ('he', 'hel'), 0, 2),
    )
    for expected, subject, *call_args in tuple_cases:
        self.checkequal(expected, subject, 'startswith', *call_args)

    # Tuple members are type-checked as well.
    self.checkraises(TypeError, 'hello', 'startswith', (42,))
959
def test_endswith(self):
    # Every row is (expected, subject, suffix[, start[, end]]).
    plain_cases = (
        (True, 'hello', 'lo'),
        (False, 'hello', 'he'),
        (True, 'hello', ''),
        (False, 'hello', 'hello world'),
        (False, 'helloworld', 'worl'),
        (True, 'helloworld', 'worl', 3, 9),
        (True, 'helloworld', 'world', 3, 12),
        (True, 'helloworld', 'lowo', 1, 7),
        (True, 'helloworld', 'lowo', 2, 7),
        (True, 'helloworld', 'lowo', 3, 7),
        (False, 'helloworld', 'lowo', 4, 7),
        (False, 'helloworld', 'lowo', 3, 8),
        (False, 'ab', 'ab', 0, 1),
        (False, 'ab', 'ab', 0, 0),
    )
    # test negative indices
    negative_cases = (
        (True, 'hello', 'lo', -2),
        (False, 'hello', 'he', -2),
        (True, 'hello', '', -3, -3),
        (False, 'hello', 'hello world', -10, -2),
        (False, 'helloworld', 'worl', -6),
        (True, 'helloworld', 'worl', -5, -1),
        (True, 'helloworld', 'worl', -5, 9),
        (True, 'helloworld', 'world', -7, 12),
        (True, 'helloworld', 'lowo', -99, -3),
        (True, 'helloworld', 'lowo', -8, -3),
        (True, 'helloworld', 'lowo', -7, -3),
        (False, 'helloworld', 'lowo', 3, -4),
        (False, 'helloworld', 'lowo', -8, -2),
    )
    for expected, subject, *call_args in plain_cases + negative_cases:
        self.checkequal(expected, subject, 'endswith', *call_args)

    # The suffix is required and must not be an int.
    self.checkraises(TypeError, 'hello', 'endswith')
    self.checkraises(TypeError, 'hello', 'endswith', 42)

    # test tuple arguments
    tuple_cases = (
        (False, 'hello', ('he', 'ha')),
        (True, 'hello', ('lo', 'llo')),
        (True, 'hello', ('hellox', 'hello')),
        (False, 'hello', ()),
        (True, 'helloworld', ('hellowo', 'rld', 'lowo'), 3),
        (False, 'helloworld', ('hellowo', 'ello', 'rld'), 3, -1),
        (True, 'hello', ('hell', 'ell'), 0, -1),
        (False, 'hello', ('he', 'hel'), 0, 1),
        (True, 'hello', ('he', 'hell'), 0, 4),
    )
    for expected, subject, *call_args in tuple_cases:
        self.checkequal(expected, subject, 'endswith', *call_args)

    # Tuple members are type-checked as well.
    self.checkraises(TypeError, 'hello', 'endswith', (42,))
1008
def test___contains__(self):
    # Each row is (expected result, container string, item looked up).
    cases = (
        (True, '', ''),
        (True, 'abc', ''),
        (False, 'abc', '\0'),
        (True, '\0abc', '\0'),
        (True, 'abc\0', '\0'),
        (True, '\0abc', 'a'),
        (True, 'asdf', 'asdf'),
        (False, 'asd', 'asdf'),
        (False, '', 'asdf'),
    )
    for expected, container, item in cases:
        self.checkequal(expected, container, '__contains__', item)
Walter Dörwald0fd583c2003-02-21 12:53:50 +00001019
def test_subscript(self):
    # Each row is (expected result, key passed to 'abc'.__getitem__).
    # Index 0 appears twice, as in the original sequence of checks.
    cases = (
        ('a', 0),
        ('c', -1),
        ('a', 0),
        ('abc', slice(0, 3)),
        ('abc', slice(0, 1000)),
        ('a', slice(0, 1)),
        ('', slice(0, 0)),
    )
    for expected, key in cases:
        self.checkequal(expected, 'abc', '__getitem__', key)

    # A string is not a valid subscript.
    self.checkraises(TypeError, 'abc', '__getitem__', 'def')
1030
def test_slice(self):
    # Each row is (expected result, (start, stop)) for slicing 'abc'.
    cases = (
        ('abc', (0, 1000)),
        ('abc', (0, 3)),
        ('ab', (0, 2)),
        ('bc', (1, 3)),
        ('b', (1, 2)),
        ('', (2, 2)),
        ('', (1000, 1000)),
        ('', (2000, 1000)),
        ('', (2, 1)),
    )
    for expected, bounds in cases:
        self.checkequal(expected, 'abc', '__getitem__', slice(*bounds))

    # A string is not a valid subscript.
    self.checkraises(TypeError, 'abc', '__getitem__', 'def')
Walter Dörwald0fd583c2003-02-21 12:53:50 +00001043
def test_extended_getslice(self):
    # Test extended slicing by comparing with list slicing.
    s = string.ascii_letters + string.digits
    reference = list(s)
    indices = (0, None, 1, 3, 41, -1, -2, -37)
    # Skip step 0 (invalid): the step values omit the leading 0.
    steps = indices[1:]
    for start in indices:
        for stop in indices:
            for step in steps:
                extended = slice(start, stop, step)
                self.checkequal("".join(reference[extended]), s,
                                '__getitem__', extended)
1055
def test_mul(self):
    # Each row is (expected result, repeat count) for 'abc' * count.
    cases = (
        ('', -1),
        ('', 0),
        ('abc', 1),
        ('abcabcabc', 3),
    )
    for expected, count in cases:
        self.checkequal(expected, 'abc', '__mul__', count)
    # A missing or non-integer count is a TypeError.
    self.checkraises(TypeError, 'abc', '__mul__')
    self.checkraises(TypeError, 'abc', '__mul__', '')
    # XXX: on a 64-bit system, this doesn't raise an overflow error,
    # but either raises a MemoryError, or succeeds (if you have 54TiB)
    #self.checkraises(OverflowError, 10000*'abc', '__mul__', 2000000000)
Walter Dörwald0fd583c2003-02-21 12:53:50 +00001066
def test_join(self):
    # join now works with any sequence type
    # moved here, because the argument order is
    # different in string.join (see the test in
    # test.test_string.StringTest.test_join)
    # Each row is (expected result, separator, iterable of parts).
    cases = (
        ('a b c d', ' ', ['a', 'b', 'c', 'd']),
        ('abcd', '', ('a', 'b', 'c', 'd')),
        ('bd', '', ('', 'b', '', 'd')),
        ('ac', '', ('a', '', 'c', '')),
        ('w x y z', ' ', Sequence()),
        ('abc', 'a', ('abc',)),
        ('z', 'a', UserList(['z'])),
        ('a.b.c', '.', ['a', 'b', 'c']),
    )
    for expected, separator, parts in cases:
        self.checkequal(expected, separator, 'join', parts)
    self.assertRaises(TypeError, '.'.join, ['a', 'b', 3])
    for i in [5, 25, 125]:
        piece = 'a' * i
        # i copies of the piece separated by '-', without a trailing '-'.
        expected = ((piece + '-') * i)[:-1]
        self.checkequal(expected, '-', 'join', [piece] * i)
        self.checkequal(expected, '-', 'join', (piece,) * i)

    #self.checkequal(str(BadSeq1()), ' ', 'join', BadSeq1())
    self.checkequal('a b c', ' ', 'join', BadSeq2())

    self.checkraises(TypeError, ' ', 'join')
    self.checkraises(TypeError, ' ', 'join', 7)
    self.checkraises(TypeError, ' ', 'join', [1, 2, bytes()])

    def f():
        # Raises TypeError (int + str) when the generator is first advanced.
        yield 4 + ""

    # The TypeError raised inside the generator must reach the caller with
    # its own message (which mentions '+'), not one substituted by join().
    try:
        self.fixtype(' ').join(f())
    except TypeError as e:
        if '+' not in str(e):
            self.fail('join() ate exception message')
    else:
        self.fail('exception not raised')
Walter Dörwald0fd583c2003-02-21 12:53:50 +00001102
def test_formatting(self):
    # Each row is (expected result, format string, operand).
    # The "%c" / "a" row appears twice, as in the original checks.
    basic_cases = (
        ('+hello+', '+%s+', 'hello'),
        ('+10+', '+%d+', 10),
        ('a', "%c", "a"),
        ('a', "%c", "a"),
        ('"', "%c", 34),
        ('$', "%c", 36),
        ('10', "%d", 10),
        ('\x7f', "%c", 0x7f),
    )
    for expected, fmt, operand in basic_cases:
        self.checkequal(expected, fmt, '__mod__', operand)

    # unicode raises ValueError, str raises OverflowError
    for ordinal in (-100, 0x200000):
        self.checkraises((ValueError, OverflowError), '%c', '__mod__', ordinal)

    # An integer just beyond sys.maxsize.
    longvalue = sys.maxsize + 10
    slongvalue = str(longvalue)
    integer_cases = (
        (' 42', '%3ld', 42),
        ('42', '%d', 42.0),
        (slongvalue, '%d', longvalue),
    )
    for expected, fmt, operand in integer_cases:
        self.checkequal(expected, fmt, '__mod__', operand)
    # Only checked via checkcall: no expected text is given for the
    # float form of the large value.
    self.checkcall('%d', '__mod__', float(longvalue))
    for float_fmt in ('%07.2f', '%07.2F'):
        self.checkequal('0042.00', float_fmt, '__mod__', 42)

    # Each row is (exception, format string[, operand]).
    malformed_cases = (
        (TypeError, 'abc'),
        (TypeError, '%(foo)s', 42),
        (TypeError, '%s%s', (42,)),
        (TypeError, '%c', (None,)),
        (ValueError, '%(foo', {}),
        (TypeError, '%(foo)s %(bar)s', ('foo', 42)),
        (TypeError, '%d', "42"),  # not numeric
        (TypeError, '%d', (42+0j)),  # no int conversion provided
    )
    for exc, fmt, *operand in malformed_cases:
        self.checkraises(exc, fmt, '__mod__', *operand)

    # argument names with properly nested brackets are supported
    self.checkequal('bar', '%((foo))s', '__mod__', {'(foo)': 'bar'})

    # 100 is a magic number in PyUnicode_Format, this forces a resize
    self.checkequal(103*'a'+'x', '%sx', '__mod__', 103*'a')

    # Each row is (exception, format string, operand tuple).
    star_cases = (
        (TypeError, '%*s', ('foo', 'bar')),
        (TypeError, '%10.*f', ('foo', 42.)),
        (ValueError, '%10', (42,)),
    )
    for exc, fmt, operand in star_cases:
        self.checkraises(exc, fmt, '__mod__', operand)
1144
def test_floatformatting(self):
    # float formatting
    # Build '%.0f' ... '%.99f' and apply each to 60 growing values; the
    # results are only passed to checkcall, not compared to a literal.
    for precision in range(100):
        fmt = '%%.%if' % precision
        value = 0.01
        for _ in range(60):
            value = value * 3.14159265359 / 3.0 * 10.0
            self.checkcall(fmt, "__mod__", value)
Walter Dörwald0fd583c2003-02-21 12:53:50 +00001153
def test_inplace_rewrites(self):
    # Check that strings don't copy and modify cached single-character strings
    # Each row is (expected, subject, method[, args...]).  Every
    # transforming call is followed by a case check on the same
    # single-character source string.
    steps = (
        ('a', 'A', 'lower'),
        (True, 'A', 'isupper'),
        ('A', 'a', 'upper'),
        (True, 'a', 'islower'),

        ('a', 'A', 'replace', 'A', 'a'),
        (True, 'A', 'isupper'),

        ('A', 'a', 'capitalize'),
        (True, 'a', 'islower'),

        ('A', 'a', 'swapcase'),
        (True, 'a', 'islower'),

        ('A', 'a', 'title'),
        (True, 'a', 'islower'),
    )
    for expected, subject, *call in steps:
        self.checkequal(expected, subject, *call)
1172
def test_partition(self):

    self.checkequal(('this is the par', 'ti', 'tion method'),
                    'this is the partition method', 'partition', 'ti')

    # from raymond's original specification
    S = 'http://www.python.org'
    # Each row is (expected 3-tuple, separator).
    cases = (
        (('http', '://', 'www.python.org'), '://'),
        (('http://www.python.org', '', ''), '?'),
        (('', 'http://', 'www.python.org'), 'http://'),
        (('http://www.python.', 'org', ''), 'org'),
    )
    for expected, separator in cases:
        self.checkequal(expected, S, 'partition', separator)

    # An empty separator is a ValueError, None is a TypeError.
    self.checkraises(ValueError, S, 'partition', '')
    self.checkraises(TypeError, S, 'partition', None)
1187
def test_rpartition(self):

    self.checkequal(('this is the rparti', 'ti', 'on method'),
                    'this is the rpartition method', 'rpartition', 'ti')

    # from raymond's original specification
    S = 'http://www.python.org'
    # Each row is (expected 3-tuple, separator).
    cases = (
        (('http', '://', 'www.python.org'), '://'),
        (('', '', 'http://www.python.org'), '?'),
        (('', 'http://', 'www.python.org'), 'http://'),
        (('http://www.python.', 'org', ''), 'org'),
    )
    for expected, separator in cases:
        self.checkequal(expected, S, 'rpartition', separator)

    # An empty separator is a ValueError, None is a TypeError.
    self.checkraises(ValueError, S, 'rpartition', '')
    self.checkraises(TypeError, S, 'rpartition', None)
1202
def test_none_arguments(self):
    # issue 11828
    s = 'hello'
    # Each row is (expected, method, substring, start[, end]); None is
    # passed explicitly for start and/or end.
    cases = (
        (2, 'find', 'l', None),
        (3, 'find', 'l', -2, None),
        (2, 'find', 'l', None, -2),
        (0, 'find', 'h', None, None),

        (3, 'rfind', 'l', None),
        (3, 'rfind', 'l', -2, None),
        (2, 'rfind', 'l', None, -2),
        (0, 'rfind', 'h', None, None),

        (2, 'index', 'l', None),
        (3, 'index', 'l', -2, None),
        (2, 'index', 'l', None, -2),
        (0, 'index', 'h', None, None),

        (3, 'rindex', 'l', None),
        (3, 'rindex', 'l', -2, None),
        (2, 'rindex', 'l', None, -2),
        (0, 'rindex', 'h', None, None),

        (2, 'count', 'l', None),
        (1, 'count', 'l', -2, None),
        (1, 'count', 'l', None, -2),
        (0, 'count', 'x', None, None),

        (True, 'endswith', 'o', None),
        (True, 'endswith', 'lo', -2, None),
        (True, 'endswith', 'l', None, -2),
        (False, 'endswith', 'x', None, None),

        (True, 'startswith', 'h', None),
        (True, 'startswith', 'l', -2, None),
        (True, 'startswith', 'h', None, -2),
        (False, 'startswith', 'x', None, None),
    )
    for expected, method, *call_args in cases:
        self.checkequal(expected, s, method, *call_args)
1240
1241 def test_find_etc_raise_correct_error_messages(self):
1242 # issue 11828
1243 s = 'hello'
1244 x = 'x'
Ezio Melottiaf928422011-04-20 21:56:21 +03001245 self.assertRaisesRegex(TypeError, r'^find\(', s.find,
Jesus Ceaac451502011-04-20 17:09:23 +02001246 x, None, None, None)
Ezio Melottiaf928422011-04-20 21:56:21 +03001247 self.assertRaisesRegex(TypeError, r'^rfind\(', s.rfind,
Jesus Ceaac451502011-04-20 17:09:23 +02001248 x, None, None, None)
Ezio Melottiaf928422011-04-20 21:56:21 +03001249 self.assertRaisesRegex(TypeError, r'^index\(', s.index,
Jesus Ceaac451502011-04-20 17:09:23 +02001250 x, None, None, None)
Ezio Melottiaf928422011-04-20 21:56:21 +03001251 self.assertRaisesRegex(TypeError, r'^rindex\(', s.rindex,
Jesus Ceaac451502011-04-20 17:09:23 +02001252 x, None, None, None)
Ezio Melottiaf928422011-04-20 21:56:21 +03001253 self.assertRaisesRegex(TypeError, r'^count\(', s.count,
Jesus Ceaac451502011-04-20 17:09:23 +02001254 x, None, None, None)
Ezio Melottiaf928422011-04-20 21:56:21 +03001255 self.assertRaisesRegex(TypeError, r'^startswith\(', s.startswith,
Jesus Ceaac451502011-04-20 17:09:23 +02001256 x, None, None, None)
Ezio Melottiaf928422011-04-20 21:56:21 +03001257 self.assertRaisesRegex(TypeError, r'^endswith\(', s.endswith,
Jesus Ceaac451502011-04-20 17:09:23 +02001258 x, None, None, None)
1259
Walter Dörwald57d88e52004-08-26 16:53:04 +00001260
class MixinStrUnicodeTest:
    # Additional tests that only work with str and unicode.

    def test_bug1001011(self):
        # Make sure join returns a NEW object for single item sequences
        # involving a subclass.
        # Make sure that it is of the appropriate type.
        # Check the optimisation still occurs for standard objects.
        base = self.type2test

        class Derived(base):
            pass

        def check_single_item_join(new_separator):
            # new_separator() is called afresh for each join.
            # Subclass instance: the result is a distinct object of the
            # base type.
            item = Derived("abcd")
            joined = new_separator().join([item])
            self.assertIsNot(item, joined)
            self.assertIs(type(joined), base)

            # Exact base-type instance: the very same object comes back.
            item = base("abcd")
            joined = new_separator().join([item])
            self.assertIs(item, joined)

        check_single_item_join(base)

        # Should also test mixed-type join.
        if base is not str:
            self.fail("unexpected type for MixinStrUnicodeTest %r" % base)
        check_single_item_join(lambda: "")