blob: eafc89a294d516809b43f401287ebd221e415583 [file] [log] [blame]
Walter Dörwald0fd583c2003-02-21 12:53:50 +00001"""
2Common tests shared by test_str, test_unicode, test_userstring and test_string.
3"""
Jeremy Hyltonf82b04e2000-07-10 17:08:42 +00004
Walter Dörwald0fd583c2003-02-21 12:53:50 +00005import unittest, string, sys
6from test import test_support
Jeremy Hylton20f41b62000-07-11 03:31:55 +00007from UserList import UserList
8
Jeremy Hyltonf82b04e2000-07-10 17:08:42 +00009class Sequence:
Walter Dörwald0fd583c2003-02-21 12:53:50 +000010 def __init__(self, seq='wxyz'): self.seq = seq
Jeremy Hyltonf82b04e2000-07-10 17:08:42 +000011 def __len__(self): return len(self.seq)
12 def __getitem__(self, i): return self.seq[i]
13
14class BadSeq1(Sequence):
15 def __init__(self): self.seq = [7, 'hello', 123L]
16
17class BadSeq2(Sequence):
18 def __init__(self): self.seq = ['a', 'b', 'c']
19 def __len__(self): return 8
20
Walter Dörwald0fd583c2003-02-21 12:53:50 +000021class CommonTest(unittest.TestCase):
22 # This testcase contains test that can be used in all
23 # stringlike classes. Currently this is str, unicode
24 # UserString and the string module.
Jeremy Hyltonf82b04e2000-07-10 17:08:42 +000025
Walter Dörwald0fd583c2003-02-21 12:53:50 +000026 # The type to be tested
27 # Change in subclasses to change the behaviour of fixtesttype()
28 type2test = None
Jeremy Hyltonf82b04e2000-07-10 17:08:42 +000029
Walter Dörwald0fd583c2003-02-21 12:53:50 +000030 # All tests pass their arguments to the testing methods
31 # as str objects. fixtesttype() can be used to propagate
32 # these arguments to the appropriate type
33 def fixtype(self, obj):
34 if isinstance(obj, str):
35 return self.__class__.type2test(obj)
36 elif isinstance(obj, list):
37 return [self.fixtype(x) for x in obj]
38 elif isinstance(obj, tuple):
39 return tuple([self.fixtype(x) for x in obj])
40 elif isinstance(obj, dict):
41 return dict([
42 (self.fixtype(key), self.fixtype(value))
43 for (key, value) in obj.iteritems()
44 ])
45 else:
46 return obj
Jeremy Hyltonf82b04e2000-07-10 17:08:42 +000047
Walter Dörwald0fd583c2003-02-21 12:53:50 +000048 # check that object.method(*args) returns result
49 def checkequal(self, result, object, methodname, *args):
50 result = self.fixtype(result)
51 object = self.fixtype(object)
52 args = self.fixtype(args)
53 realresult = getattr(object, methodname)(*args)
54 self.assertEqual(
55 result,
56 realresult
57 )
58 # if the original is returned make sure that
59 # this doesn't happen with subclasses
60 if object == realresult:
61 class subtype(self.__class__.type2test):
62 pass
63 object = subtype(object)
64 realresult = getattr(object, methodname)(*args)
65 self.assert_(object is not realresult)
Jeremy Hyltonf82b04e2000-07-10 17:08:42 +000066
Walter Dörwald0fd583c2003-02-21 12:53:50 +000067 # check that object.method(*args) raises exc
68 def checkraises(self, exc, object, methodname, *args):
69 object = self.fixtype(object)
70 args = self.fixtype(args)
71 self.assertRaises(
72 exc,
73 getattr(object, methodname),
74 *args
75 )
Jeremy Hyltonf82b04e2000-07-10 17:08:42 +000076
Walter Dörwald0fd583c2003-02-21 12:53:50 +000077 # call object.method(*args) without any checks
78 def checkcall(self, object, methodname, *args):
79 object = self.fixtype(object)
80 args = self.fixtype(args)
81 getattr(object, methodname)(*args)
82
83 def test_capitalize(self):
84 self.checkequal(' hello ', ' hello ', 'capitalize')
85 self.checkequal('Hello ', 'Hello ','capitalize')
86 self.checkequal('Hello ', 'hello ','capitalize')
87 self.checkequal('Aaaa', 'aaaa', 'capitalize')
88 self.checkequal('Aaaa', 'AaAa', 'capitalize')
89
90 self.checkraises(TypeError, 'hello', 'capitalize', 42)
91
92 def test_count(self):
93 self.checkequal(3, 'aaa', 'count', 'a')
94 self.checkequal(0, 'aaa', 'count', 'b')
95 self.checkequal(3, 'aaa', 'count', 'a')
96 self.checkequal(0, 'aaa', 'count', 'b')
97 self.checkequal(3, 'aaa', 'count', 'a')
98 self.checkequal(0, 'aaa', 'count', 'b')
99 self.checkequal(0, 'aaa', 'count', 'b')
100 self.checkequal(1, 'aaa', 'count', 'a', -1)
101 self.checkequal(3, 'aaa', 'count', 'a', -10)
102 self.checkequal(2, 'aaa', 'count', 'a', 0, -1)
103 self.checkequal(0, 'aaa', 'count', 'a', 0, -10)
104
105 self.checkraises(TypeError, 'hello', 'count')
106 self.checkraises(TypeError, 'hello', 'count', 42)
107
108 def test_find(self):
109 self.checkequal(0, 'abcdefghiabc', 'find', 'abc')
110 self.checkequal(9, 'abcdefghiabc', 'find', 'abc', 1)
111 self.checkequal(-1, 'abcdefghiabc', 'find', 'def', 4)
112
113 self.checkraises(TypeError, 'hello', 'find')
114 self.checkraises(TypeError, 'hello', 'find', 42)
115
116 def test_rfind(self):
117 self.checkequal(9, 'abcdefghiabc', 'rfind', 'abc')
118 self.checkequal(12, 'abcdefghiabc', 'rfind', '')
119 self.checkequal(0, 'abcdefghiabc', 'rfind', 'abcd')
120 self.checkequal(-1, 'abcdefghiabc', 'rfind', 'abcz')
121
122 self.checkraises(TypeError, 'hello', 'rfind')
123 self.checkraises(TypeError, 'hello', 'rfind', 42)
124
125 def test_index(self):
126 self.checkequal(0, 'abcdefghiabc', 'index', '')
127 self.checkequal(3, 'abcdefghiabc', 'index', 'def')
128 self.checkequal(0, 'abcdefghiabc', 'index', 'abc')
129 self.checkequal(9, 'abcdefghiabc', 'index', 'abc', 1)
130
131 self.checkraises(ValueError, 'abcdefghiabc', 'index', 'hib')
132 self.checkraises(ValueError, 'abcdefghiab', 'index', 'abc', 1)
133 self.checkraises(ValueError, 'abcdefghi', 'index', 'ghi', 8)
134 self.checkraises(ValueError, 'abcdefghi', 'index', 'ghi', -1)
135
136 self.checkraises(TypeError, 'hello', 'index')
137 self.checkraises(TypeError, 'hello', 'index', 42)
138
139 def test_rindex(self):
140 self.checkequal(12, 'abcdefghiabc', 'rindex', '')
141 self.checkequal(3, 'abcdefghiabc', 'rindex', 'def')
142 self.checkequal(9, 'abcdefghiabc', 'rindex', 'abc')
143 self.checkequal(0, 'abcdefghiabc', 'rindex', 'abc', 0, -1)
144
145 self.checkraises(ValueError, 'abcdefghiabc', 'rindex', 'hib')
146 self.checkraises(ValueError, 'defghiabc', 'rindex', 'def', 1)
147 self.checkraises(ValueError, 'defghiabc', 'rindex', 'abc', 0, -1)
148 self.checkraises(ValueError, 'abcdefghi', 'rindex', 'ghi', 0, 8)
149 self.checkraises(ValueError, 'abcdefghi', 'rindex', 'ghi', 0, -1)
150
151 self.checkraises(TypeError, 'hello', 'rindex')
152 self.checkraises(TypeError, 'hello', 'rindex', 42)
153
154 def test_lower(self):
155 self.checkequal('hello', 'HeLLo', 'lower')
156 self.checkequal('hello', 'hello', 'lower')
157 self.checkraises(TypeError, 'hello', 'lower', 42)
158
159 def test_upper(self):
160 self.checkequal('HELLO', 'HeLLo', 'upper')
161 self.checkequal('HELLO', 'HELLO', 'upper')
162 self.checkraises(TypeError, 'hello', 'upper', 42)
163
164 def test_expandtabs(self):
165 self.checkequal('abc\rab def\ng hi', 'abc\rab\tdef\ng\thi', 'expandtabs')
166 self.checkequal('abc\rab def\ng hi', 'abc\rab\tdef\ng\thi', 'expandtabs', 8)
167 self.checkequal('abc\rab def\ng hi', 'abc\rab\tdef\ng\thi', 'expandtabs', 4)
168 self.checkequal('abc\r\nab def\ng hi', 'abc\r\nab\tdef\ng\thi', 'expandtabs', 4)
169 self.checkequal('abc\rab def\ng hi', 'abc\rab\tdef\ng\thi', 'expandtabs')
170 self.checkequal('abc\rab def\ng hi', 'abc\rab\tdef\ng\thi', 'expandtabs', 8)
171 self.checkequal('abc\r\nab\r\ndef\ng\r\nhi', 'abc\r\nab\r\ndef\ng\r\nhi', 'expandtabs', 4)
172
173 self.checkraises(TypeError, 'hello', 'expandtabs', 42, 42)
174
175 def test_split(self):
176 self.checkequal(['this', 'is', 'the', 'split', 'function'],
177 'this is the split function', 'split')
178 self.checkequal(['a', 'b', 'c', 'd'], 'a|b|c|d', 'split', '|')
179 self.checkequal(['a', 'b', 'c|d'], 'a|b|c|d', 'split', '|', 2)
180 self.checkequal(['a', 'b c d'], 'a b c d', 'split', None, 1)
181 self.checkequal(['a', 'b', 'c d'], 'a b c d', 'split', None, 2)
182 self.checkequal(['a', 'b', 'c', 'd'], 'a b c d', 'split', None, 3)
183 self.checkequal(['a', 'b', 'c', 'd'], 'a b c d', 'split', None, 4)
184 self.checkequal(['a b c d'], 'a b c d', 'split', None, 0)
185 self.checkequal(['a', 'b', 'c d'], 'a b c d', 'split', None, 2)
186 self.checkequal(['a', 'b', 'c', 'd'], 'a b c d ', 'split')
187 self.checkequal(['a', 'b', 'c', 'd'], 'a//b//c//d', 'split', '//')
188 self.checkequal(['endcase ', ''], 'endcase test', 'split', 'test')
189
190 self.checkraises(TypeError, 'hello', 'split', 42, 42, 42)
191
Hye-Shik Chang3ae811b2003-12-15 18:49:53 +0000192 def test_rsplit(self):
193 self.checkequal(['this', 'is', 'the', 'rsplit', 'function'],
194 'this is the rsplit function', 'rsplit')
195 self.checkequal(['a', 'b', 'c', 'd'], 'a|b|c|d', 'rsplit', '|')
196 self.checkequal(['a|b', 'c', 'd'], 'a|b|c|d', 'rsplit', '|', 2)
197 self.checkequal(['a b c', 'd'], 'a b c d', 'rsplit', None, 1)
198 self.checkequal(['a b', 'c', 'd'], 'a b c d', 'rsplit', None, 2)
199 self.checkequal(['a', 'b', 'c', 'd'], 'a b c d', 'rsplit', None, 3)
200 self.checkequal(['a', 'b', 'c', 'd'], 'a b c d', 'rsplit', None, 4)
201 self.checkequal(['a b c d'], 'a b c d', 'rsplit', None, 0)
202 self.checkequal(['a, b, c', 'd'], 'a, b, c, d', 'rsplit', ', ', 1)
203 self.checkequal(['a, b', 'c', 'd'], 'a, b, c, d', 'rsplit', ', ', 2)
204 self.checkequal(['a', 'b', 'c', 'd'], 'a, b, c, d', 'rsplit', ', ', 3)
205 self.checkequal(['a', 'b', 'c', 'd'], 'a, b, c, d', 'rsplit', ', ', 4)
206 self.checkequal(['a, b, c, d'], 'a, b, c, d', 'rsplit', ', ', 0)
207 self.checkequal(['a b', 'c', 'd'], 'a b c d', 'rsplit', None, 2)
208 self.checkequal(['a\x00b', 'c'], 'a\x00b\x00c', 'rsplit', '\x00', 1)
209 self.checkequal(['', ''], 'abcd', 'rsplit', 'abcd')
210 self.checkequal([u'a b', u'c', u'd'], 'a b c d', 'rsplit', u' ', 2)
Hye-Shik Chang7fc4cf52003-12-23 09:10:16 +0000211 self.checkequal(['', ' endcase'], '| endcase', 'rsplit', '|')
212 self.checkequal(['', ' endcase'], 'test endcase', 'rsplit', 'test')
Hye-Shik Chang3ae811b2003-12-15 18:49:53 +0000213
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000214 def test_strip(self):
215 self.checkequal('hello', ' hello ', 'strip')
216 self.checkequal('hello ', ' hello ', 'lstrip')
217 self.checkequal(' hello', ' hello ', 'rstrip')
218 self.checkequal('hello', 'hello', 'strip')
219
Neal Norwitzffe33b72003-04-10 22:35:32 +0000220 # strip/lstrip/rstrip with None arg
221 self.checkequal('hello', ' hello ', 'strip', None)
222 self.checkequal('hello ', ' hello ', 'lstrip', None)
223 self.checkequal(' hello', ' hello ', 'rstrip', None)
224 self.checkequal('hello', 'hello', 'strip', None)
225
226 # strip/lstrip/rstrip with str arg
227 self.checkequal('hello', 'xyzzyhelloxyzzy', 'strip', 'xyz')
228 self.checkequal('helloxyzzy', 'xyzzyhelloxyzzy', 'lstrip', 'xyz')
229 self.checkequal('xyzzyhello', 'xyzzyhelloxyzzy', 'rstrip', 'xyz')
230 self.checkequal('hello', 'hello', 'strip', 'xyz')
231
232 # strip/lstrip/rstrip with unicode arg
233 if test_support.have_unicode:
234 self.checkequal(unicode('hello', 'ascii'), 'xyzzyhelloxyzzy',
235 'strip', unicode('xyz', 'ascii'))
236 self.checkequal(unicode('helloxyzzy', 'ascii'), 'xyzzyhelloxyzzy',
237 'lstrip', unicode('xyz', 'ascii'))
238 self.checkequal(unicode('xyzzyhello', 'ascii'), 'xyzzyhelloxyzzy',
239 'rstrip', unicode('xyz', 'ascii'))
240 self.checkequal(unicode('hello', 'ascii'), 'hello',
241 'strip', unicode('xyz', 'ascii'))
242
243 self.checkraises(TypeError, 'hello', 'strip', 42, 42)
244 self.checkraises(TypeError, 'hello', 'lstrip', 42, 42)
245 self.checkraises(TypeError, 'hello', 'rstrip', 42, 42)
246
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000247 def test_ljust(self):
248 self.checkequal('abc ', 'abc', 'ljust', 10)
249 self.checkequal('abc ', 'abc', 'ljust', 6)
250 self.checkequal('abc', 'abc', 'ljust', 3)
251 self.checkequal('abc', 'abc', 'ljust', 2)
Raymond Hettinger4f8f9762003-11-26 08:21:35 +0000252 self.checkequal('abc*******', 'abc', 'ljust', 10, '*')
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000253 self.checkraises(TypeError, 'abc', 'ljust')
254
255 def test_rjust(self):
256 self.checkequal(' abc', 'abc', 'rjust', 10)
257 self.checkequal(' abc', 'abc', 'rjust', 6)
258 self.checkequal('abc', 'abc', 'rjust', 3)
259 self.checkequal('abc', 'abc', 'rjust', 2)
Raymond Hettinger4f8f9762003-11-26 08:21:35 +0000260 self.checkequal('*******abc', 'abc', 'rjust', 10, '*')
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000261 self.checkraises(TypeError, 'abc', 'rjust')
262
263 def test_center(self):
264 self.checkequal(' abc ', 'abc', 'center', 10)
265 self.checkequal(' abc ', 'abc', 'center', 6)
266 self.checkequal('abc', 'abc', 'center', 3)
267 self.checkequal('abc', 'abc', 'center', 2)
Raymond Hettinger4f8f9762003-11-26 08:21:35 +0000268 self.checkequal('***abc****', 'abc', 'center', 10, '*')
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000269 self.checkraises(TypeError, 'abc', 'center')
270
271 def test_swapcase(self):
272 self.checkequal('hEllO CoMPuTErS', 'HeLLo cOmpUteRs', 'swapcase')
273
274 self.checkraises(TypeError, 'hello', 'swapcase', 42)
275
276 def test_replace(self):
277 self.checkequal('one@two!three!', 'one!two!three!', 'replace', '!', '@', 1)
278 self.checkequal('onetwothree', 'one!two!three!', 'replace', '!', '')
279 self.checkequal('one@two@three!', 'one!two!three!', 'replace', '!', '@', 2)
280 self.checkequal('one@two@three@', 'one!two!three!', 'replace', '!', '@', 3)
281 self.checkequal('one@two@three@', 'one!two!three!', 'replace', '!', '@', 4)
282 self.checkequal('one!two!three!', 'one!two!three!', 'replace', '!', '@', 0)
283 self.checkequal('one@two@three@', 'one!two!three!', 'replace', '!', '@')
284 self.checkequal('one!two!three!', 'one!two!three!', 'replace', 'x', '@')
285 self.checkequal('one!two!three!', 'one!two!three!', 'replace', 'x', '@', 2)
286 self.checkequal('-a-b-c-', 'abc', 'replace', '', '-')
287 self.checkequal('-a-b-c', 'abc', 'replace', '', '-', 3)
288 self.checkequal('abc', 'abc', 'replace', '', '-', 0)
289 self.checkequal('', '', 'replace', '', '')
290 self.checkequal('abc', 'abc', 'replace', 'ab', '--', 0)
291 self.checkequal('abc', 'abc', 'replace', 'xy', '--')
292 # Next three for SF bug 422088: [OSF1 alpha] string.replace(); died with
293 # MemoryError due to empty result (platform malloc issue when requesting
294 # 0 bytes).
295 self.checkequal('', '123', 'replace', '123', '')
296 self.checkequal('', '123123', 'replace', '123', '')
297 self.checkequal('x', '123x123', 'replace', '123', '')
298
299 self.checkraises(TypeError, 'hello', 'replace')
300 self.checkraises(TypeError, 'hello', 'replace', 42)
301 self.checkraises(TypeError, 'hello', 'replace', 42, 'h')
302 self.checkraises(TypeError, 'hello', 'replace', 'h', 42)
303
304 def test_zfill(self):
305 self.checkequal('123', '123', 'zfill', 2)
306 self.checkequal('123', '123', 'zfill', 3)
307 self.checkequal('0123', '123', 'zfill', 4)
308 self.checkequal('+123', '+123', 'zfill', 3)
309 self.checkequal('+123', '+123', 'zfill', 4)
310 self.checkequal('+0123', '+123', 'zfill', 5)
311 self.checkequal('-123', '-123', 'zfill', 3)
312 self.checkequal('-123', '-123', 'zfill', 4)
313 self.checkequal('-0123', '-123', 'zfill', 5)
314 self.checkequal('000', '', 'zfill', 3)
315 self.checkequal('34', '34', 'zfill', 1)
316 self.checkequal('0034', '34', 'zfill', 4)
317
318 self.checkraises(TypeError, '123', 'zfill')
319
320class MixinStrUnicodeUserStringTest:
321 # additional tests that only work for
322 # stringlike objects, i.e. str, unicode, UserString
323 # (but not the string module)
324
325 def test_islower(self):
326 self.checkequal(False, '', 'islower')
327 self.checkequal(True, 'a', 'islower')
328 self.checkequal(False, 'A', 'islower')
329 self.checkequal(False, '\n', 'islower')
330 self.checkequal(True, 'abc', 'islower')
331 self.checkequal(False, 'aBc', 'islower')
332 self.checkequal(True, 'abc\n', 'islower')
333 self.checkraises(TypeError, 'abc', 'islower', 42)
334
335 def test_isupper(self):
336 self.checkequal(False, '', 'isupper')
337 self.checkequal(False, 'a', 'isupper')
338 self.checkequal(True, 'A', 'isupper')
339 self.checkequal(False, '\n', 'isupper')
340 self.checkequal(True, 'ABC', 'isupper')
341 self.checkequal(False, 'AbC', 'isupper')
342 self.checkequal(True, 'ABC\n', 'isupper')
343 self.checkraises(TypeError, 'abc', 'isupper', 42)
344
345 def test_istitle(self):
346 self.checkequal(False, '', 'istitle')
347 self.checkequal(False, 'a', 'istitle')
348 self.checkequal(True, 'A', 'istitle')
349 self.checkequal(False, '\n', 'istitle')
350 self.checkequal(True, 'A Titlecased Line', 'istitle')
351 self.checkequal(True, 'A\nTitlecased Line', 'istitle')
352 self.checkequal(True, 'A Titlecased, Line', 'istitle')
353 self.checkequal(False, 'Not a capitalized String', 'istitle')
354 self.checkequal(False, 'Not\ta Titlecase String', 'istitle')
355 self.checkequal(False, 'Not--a Titlecase String', 'istitle')
356 self.checkequal(False, 'NOT', 'istitle')
357 self.checkraises(TypeError, 'abc', 'istitle', 42)
358
359 def test_isspace(self):
360 self.checkequal(False, '', 'isspace')
361 self.checkequal(False, 'a', 'isspace')
362 self.checkequal(True, ' ', 'isspace')
363 self.checkequal(True, '\t', 'isspace')
364 self.checkequal(True, '\r', 'isspace')
365 self.checkequal(True, '\n', 'isspace')
366 self.checkequal(True, ' \t\r\n', 'isspace')
367 self.checkequal(False, ' \t\r\na', 'isspace')
368 self.checkraises(TypeError, 'abc', 'isspace', 42)
369
370 def test_isalpha(self):
371 self.checkequal(False, '', 'isalpha')
372 self.checkequal(True, 'a', 'isalpha')
373 self.checkequal(True, 'A', 'isalpha')
374 self.checkequal(False, '\n', 'isalpha')
375 self.checkequal(True, 'abc', 'isalpha')
376 self.checkequal(False, 'aBc123', 'isalpha')
377 self.checkequal(False, 'abc\n', 'isalpha')
378 self.checkraises(TypeError, 'abc', 'isalpha', 42)
379
380 def test_isalnum(self):
381 self.checkequal(False, '', 'isalnum')
382 self.checkequal(True, 'a', 'isalnum')
383 self.checkequal(True, 'A', 'isalnum')
384 self.checkequal(False, '\n', 'isalnum')
385 self.checkequal(True, '123abc456', 'isalnum')
386 self.checkequal(True, 'a1b3c', 'isalnum')
387 self.checkequal(False, 'aBc000 ', 'isalnum')
388 self.checkequal(False, 'abc\n', 'isalnum')
389 self.checkraises(TypeError, 'abc', 'isalnum', 42)
390
391 def test_isdigit(self):
392 self.checkequal(False, '', 'isdigit')
393 self.checkequal(False, 'a', 'isdigit')
394 self.checkequal(True, '0', 'isdigit')
395 self.checkequal(True, '0123456789', 'isdigit')
396 self.checkequal(False, '0123456789a', 'isdigit')
397
398 self.checkraises(TypeError, 'abc', 'isdigit', 42)
399
400 def test_title(self):
401 self.checkequal(' Hello ', ' hello ', 'title')
402 self.checkequal('Hello ', 'hello ', 'title')
403 self.checkequal('Hello ', 'Hello ', 'title')
404 self.checkequal('Format This As Title String', "fOrMaT thIs aS titLe String", 'title')
405 self.checkequal('Format,This-As*Title;String', "fOrMaT,thIs-aS*titLe;String", 'title', )
406 self.checkequal('Getint', "getInt", 'title')
407 self.checkraises(TypeError, 'hello', 'title', 42)
408
409 def test_splitlines(self):
410 self.checkequal(['abc', 'def', '', 'ghi'], "abc\ndef\n\rghi", 'splitlines')
411 self.checkequal(['abc', 'def', '', 'ghi'], "abc\ndef\n\r\nghi", 'splitlines')
412 self.checkequal(['abc', 'def', 'ghi'], "abc\ndef\r\nghi", 'splitlines')
413 self.checkequal(['abc', 'def', 'ghi'], "abc\ndef\r\nghi\n", 'splitlines')
414 self.checkequal(['abc', 'def', 'ghi', ''], "abc\ndef\r\nghi\n\r", 'splitlines')
415 self.checkequal(['', 'abc', 'def', 'ghi', ''], "\nabc\ndef\r\nghi\n\r", 'splitlines')
416 self.checkequal(['\n', 'abc\n', 'def\r\n', 'ghi\n', '\r'], "\nabc\ndef\r\nghi\n\r", 'splitlines', 1)
417
418 self.checkraises(TypeError, 'abc', 'splitlines', 42, 42)
419
420 def test_startswith(self):
421 self.checkequal(True, 'hello', 'startswith', 'he')
422 self.checkequal(True, 'hello', 'startswith', 'hello')
423 self.checkequal(False, 'hello', 'startswith', 'hello world')
424 self.checkequal(True, 'hello', 'startswith', '')
425 self.checkequal(False, 'hello', 'startswith', 'ello')
426 self.checkequal(True, 'hello', 'startswith', 'ello', 1)
427 self.checkequal(True, 'hello', 'startswith', 'o', 4)
428 self.checkequal(False, 'hello', 'startswith', 'o', 5)
429 self.checkequal(True, 'hello', 'startswith', '', 5)
430 self.checkequal(False, 'hello', 'startswith', 'lo', 6)
431 self.checkequal(True, 'helloworld', 'startswith', 'lowo', 3)
432 self.checkequal(True, 'helloworld', 'startswith', 'lowo', 3, 7)
433 self.checkequal(False, 'helloworld', 'startswith', 'lowo', 3, 6)
434
435 # test negative indices
436 self.checkequal(True, 'hello', 'startswith', 'he', 0, -1)
437 self.checkequal(True, 'hello', 'startswith', 'he', -53, -1)
438 self.checkequal(False, 'hello', 'startswith', 'hello', 0, -1)
439 self.checkequal(False, 'hello', 'startswith', 'hello world', -1, -10)
440 self.checkequal(False, 'hello', 'startswith', 'ello', -5)
441 self.checkequal(True, 'hello', 'startswith', 'ello', -4)
442 self.checkequal(False, 'hello', 'startswith', 'o', -2)
443 self.checkequal(True, 'hello', 'startswith', 'o', -1)
444 self.checkequal(True, 'hello', 'startswith', '', -3, -3)
445 self.checkequal(False, 'hello', 'startswith', 'lo', -9)
446
447 self.checkraises(TypeError, 'hello', 'startswith')
448 self.checkraises(TypeError, 'hello', 'startswith', 42)
449
450 def test_endswith(self):
451 self.checkequal(True, 'hello', 'endswith', 'lo')
452 self.checkequal(False, 'hello', 'endswith', 'he')
453 self.checkequal(True, 'hello', 'endswith', '')
454 self.checkequal(False, 'hello', 'endswith', 'hello world')
455 self.checkequal(False, 'helloworld', 'endswith', 'worl')
456 self.checkequal(True, 'helloworld', 'endswith', 'worl', 3, 9)
457 self.checkequal(True, 'helloworld', 'endswith', 'world', 3, 12)
458 self.checkequal(True, 'helloworld', 'endswith', 'lowo', 1, 7)
459 self.checkequal(True, 'helloworld', 'endswith', 'lowo', 2, 7)
460 self.checkequal(True, 'helloworld', 'endswith', 'lowo', 3, 7)
461 self.checkequal(False, 'helloworld', 'endswith', 'lowo', 4, 7)
462 self.checkequal(False, 'helloworld', 'endswith', 'lowo', 3, 8)
463 self.checkequal(False, 'ab', 'endswith', 'ab', 0, 1)
464 self.checkequal(False, 'ab', 'endswith', 'ab', 0, 0)
465
466 # test negative indices
467 self.checkequal(True, 'hello', 'endswith', 'lo', -2)
468 self.checkequal(False, 'hello', 'endswith', 'he', -2)
469 self.checkequal(True, 'hello', 'endswith', '', -3, -3)
470 self.checkequal(False, 'hello', 'endswith', 'hello world', -10, -2)
471 self.checkequal(False, 'helloworld', 'endswith', 'worl', -6)
472 self.checkequal(True, 'helloworld', 'endswith', 'worl', -5, -1)
473 self.checkequal(True, 'helloworld', 'endswith', 'worl', -5, 9)
474 self.checkequal(True, 'helloworld', 'endswith', 'world', -7, 12)
475 self.checkequal(True, 'helloworld', 'endswith', 'lowo', -99, -3)
476 self.checkequal(True, 'helloworld', 'endswith', 'lowo', -8, -3)
477 self.checkequal(True, 'helloworld', 'endswith', 'lowo', -7, -3)
478 self.checkequal(False, 'helloworld', 'endswith', 'lowo', 3, -4)
479 self.checkequal(False, 'helloworld', 'endswith', 'lowo', -8, -2)
480
481 self.checkraises(TypeError, 'hello', 'endswith')
482 self.checkraises(TypeError, 'hello', 'endswith', 42)
483
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000484 def test___contains__(self):
485 self.checkequal(True, '', '__contains__', '') # vereq('' in '', True)
486 self.checkequal(True, 'abc', '__contains__', '') # vereq('' in 'abc', True)
487 self.checkequal(False, 'abc', '__contains__', '\0') # vereq('\0' in 'abc', False)
488 self.checkequal(True, '\0abc', '__contains__', '\0') # vereq('\0' in '\0abc', True)
489 self.checkequal(True, 'abc\0', '__contains__', '\0') # vereq('\0' in 'abc\0', True)
490 self.checkequal(True, '\0abc', '__contains__', 'a') # vereq('a' in '\0abc', True)
491 self.checkequal(True, 'asdf', '__contains__', 'asdf') # vereq('asdf' in 'asdf', True)
492 self.checkequal(False, 'asd', '__contains__', 'asdf') # vereq('asdf' in 'asd', False)
493 self.checkequal(False, '', '__contains__', 'asdf') # vereq('asdf' in '', False)
494
495 def test_subscript(self):
496 self.checkequal(u'a', 'abc', '__getitem__', 0)
497 self.checkequal(u'c', 'abc', '__getitem__', -1)
498 self.checkequal(u'a', 'abc', '__getitem__', 0L)
499 self.checkequal(u'abc', 'abc', '__getitem__', slice(0, 3))
500 self.checkequal(u'abc', 'abc', '__getitem__', slice(0, 1000))
501 self.checkequal(u'a', 'abc', '__getitem__', slice(0, 1))
502 self.checkequal(u'', 'abc', '__getitem__', slice(0, 0))
503 # FIXME What about negative indizes? This is handled differently by [] and __getitem__(slice)
504
505 self.checkraises(TypeError, 'abc', '__getitem__', 'def')
506
507 def test_slice(self):
508 self.checkequal('abc', 'abc', '__getslice__', 0, 1000)
509 self.checkequal('abc', 'abc', '__getslice__', 0, 3)
510 self.checkequal('ab', 'abc', '__getslice__', 0, 2)
511 self.checkequal('bc', 'abc', '__getslice__', 1, 3)
512 self.checkequal('b', 'abc', '__getslice__', 1, 2)
513 self.checkequal('', 'abc', '__getslice__', 2, 2)
514 self.checkequal('', 'abc', '__getslice__', 1000, 1000)
515 self.checkequal('', 'abc', '__getslice__', 2000, 1000)
516 self.checkequal('', 'abc', '__getslice__', 2, 1)
517 # FIXME What about negative indizes? This is handled differently by [] and __getslice__
518
519 self.checkraises(TypeError, 'abc', '__getslice__', 'def')
520
521 def test_mul(self):
522 self.checkequal('', 'abc', '__mul__', -1)
523 self.checkequal('', 'abc', '__mul__', 0)
524 self.checkequal('abc', 'abc', '__mul__', 1)
525 self.checkequal('abcabcabc', 'abc', '__mul__', 3)
526 self.checkraises(TypeError, 'abc', '__mul__')
527 self.checkraises(TypeError, 'abc', '__mul__', '')
Neal Norwitz15ff0e92003-02-23 23:15:26 +0000528 self.checkraises(OverflowError, 10000*'abc', '__mul__', 2000000000)
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000529
530 def test_join(self):
531 # join now works with any sequence type
532 # moved here, because the argument order is
533 # different in string.join (see the test in
534 # test.test_string.StringTest.test_join)
535 self.checkequal('a b c d', ' ', 'join', ['a', 'b', 'c', 'd'])
536 self.checkequal('abcd', '', 'join', ('a', 'b', 'c', 'd'))
537 self.checkequal('w x y z', ' ', 'join', Sequence())
538 self.checkequal('abc', 'a', 'join', ('abc',))
539 self.checkequal('z', 'a', 'join', UserList(['z']))
540 if test_support.have_unicode:
541 self.checkequal(unicode('a.b.c'), unicode('.'), 'join', ['a', 'b', 'c'])
542 self.checkequal(unicode('a.b.c'), '.', 'join', [unicode('a'), 'b', 'c'])
543 self.checkequal(unicode('a.b.c'), '.', 'join', ['a', unicode('b'), 'c'])
544 self.checkequal(unicode('a.b.c'), '.', 'join', ['a', 'b', unicode('c')])
545 self.checkraises(TypeError, '.', 'join', ['a', unicode('b'), 3])
546 for i in [5, 25, 125]:
547 self.checkequal(((('a' * i) + '-') * i)[:-1], '-', 'join',
548 ['a' * i] * i)
549 self.checkequal(((('a' * i) + '-') * i)[:-1], '-', 'join',
550 ('a' * i,) * i)
551
552 self.checkraises(TypeError, ' ', 'join', BadSeq1())
553 self.checkequal('a b c', ' ', 'join', BadSeq2())
554
555 self.checkraises(TypeError, ' ', 'join')
556 self.checkraises(TypeError, ' ', 'join', 7)
557 self.checkraises(TypeError, ' ', 'join', Sequence([7, 'hello', 123L]))
558
559 def test_formatting(self):
560 self.checkequal('+hello+', '+%s+', '__mod__', 'hello')
561 self.checkequal('+10+', '+%d+', '__mod__', 10)
562 self.checkequal('a', "%c", '__mod__', "a")
563 self.checkequal('a', "%c", '__mod__', "a")
564 self.checkequal('"', "%c", '__mod__', 34)
565 self.checkequal('$', "%c", '__mod__', 36)
566 self.checkequal('10', "%d", '__mod__', 10)
Walter Dörwald43440a62003-03-31 18:07:50 +0000567 self.checkequal('\x7f', "%c", '__mod__', 0x7f)
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000568
569 for ordinal in (-100, 0x200000):
570 # unicode raises ValueError, str raises OverflowError
571 self.checkraises((ValueError, OverflowError), '%c', '__mod__', ordinal)
572
573 self.checkequal(' 42', '%3ld', '__mod__', 42)
574 self.checkequal('0042.00', '%07.2f', '__mod__', 42)
Raymond Hettinger9bfe5332003-08-27 04:55:52 +0000575 self.checkequal('0042.00', '%07.2F', '__mod__', 42)
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000576
577 self.checkraises(TypeError, 'abc', '__mod__')
578 self.checkraises(TypeError, '%(foo)s', '__mod__', 42)
579 self.checkraises(TypeError, '%s%s', '__mod__', (42,))
580 self.checkraises(TypeError, '%c', '__mod__', (None,))
581 self.checkraises(ValueError, '%(foo', '__mod__', {})
582 self.checkraises(TypeError, '%(foo)s %(bar)s', '__mod__', ('foo', 42))
583
584 # argument names with properly nested brackets are supported
585 self.checkequal('bar', '%((foo))s', '__mod__', {'(foo)': 'bar'})
586
587 # 100 is a magic number in PyUnicode_Format, this forces a resize
588 self.checkequal(103*'a'+'x', '%sx', '__mod__', 103*'a')
589
590 self.checkraises(TypeError, '%*s', '__mod__', ('foo', 'bar'))
591 self.checkraises(TypeError, '%10.*f', '__mod__', ('foo', 42.))
592 self.checkraises(ValueError, '%10', '__mod__', (42,))
593
594 def test_floatformatting(self):
595 # float formatting
596 for prec in xrange(100):
597 format = '%%.%if' % prec
598 value = 0.01
599 for x in xrange(60):
600 value = value * 3.141592655 / 3.0 * 10.0
601 # The formatfloat() code in stringobject.c and
602 # unicodeobject.c uses a 120 byte buffer and switches from
603 # 'f' formatting to 'g' at precision 50, so we expect
604 # OverflowErrors for the ranges x < 50 and prec >= 67.
605 if x < 50 and prec >= 67:
606 self.checkraises(OverflowError, format, "__mod__", value)
607 else:
608 self.checkcall(format, "__mod__", value)
609
610class MixinStrStringUserStringTest:
611 # Additional tests for 8bit strings, i.e. str, UserString and
612 # the string module
613
614 def test_maketrans(self):
615 self.assertEqual(
616 ''.join(map(chr, xrange(256))).replace('abc', 'xyz'),
617 string.maketrans('abc', 'xyz')
618 )
619 self.assertRaises(ValueError, string.maketrans, 'abc', 'xyzw')
620
621 def test_translate(self):
622 table = string.maketrans('abc', 'xyz')
623 self.checkequal('xyzxyz', 'xyzabcdef', 'translate', table, 'def')
624
625 table = string.maketrans('a', 'A')
626 self.checkequal('Abc', 'abc', 'translate', table)
627 self.checkequal('xyz', 'xyz', 'translate', table)
628 self.checkequal('yz', 'xyz', 'translate', table, 'x')
629 self.checkraises(ValueError, 'xyz', 'translate', 'too short', 'strip')
630 self.checkraises(ValueError, 'xyz', 'translate', 'too short')
Jeremy Hyltonf82b04e2000-07-10 17:08:42 +0000631
632
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000633class MixinStrUserStringTest:
634 # Additional tests that only work with
635 # 8bit compatible object, i.e. str and UserString
Jeremy Hyltonf82b04e2000-07-10 17:08:42 +0000636
Walter Dörwald0fd583c2003-02-21 12:53:50 +0000637 def test_encoding_decoding(self):
638 codecs = [('rot13', 'uryyb jbeyq'),
639 ('base64', 'aGVsbG8gd29ybGQ=\n'),
640 ('hex', '68656c6c6f20776f726c64'),
641 ('uu', 'begin 666 <data>\n+:&5L;&\\@=V]R;&0 \n \nend\n')]
642 for encoding, data in codecs:
643 self.checkequal(data, 'hello world', 'encode', encoding)
644 self.checkequal('hello world', data, 'decode', encoding)
645 # zlib is optional, so we make the test optional too...
646 try:
647 import zlib
648 except ImportError:
649 pass
650 else:
651 data = 'x\x9c\xcbH\xcd\xc9\xc9W(\xcf/\xcaI\x01\x00\x1a\x0b\x04]'
652 self.checkequal(data, 'hello world', 'encode', 'zlib')
653 self.checkequal('hello world', data, 'decode', 'zlib')
Walter Dörwald97951de2003-03-26 14:31:25 +0000654
655 self.checkraises(TypeError, 'xyz', 'decode', 42)
656 self.checkraises(TypeError, 'xyz', 'encode', 42)