blob: a44184fbc77a1eb12a20cb99ea140375aea4bb29 [file] [log] [blame]
Greg Ward3dc94e12002-08-22 18:37:50 +00001#
Greg Ward61864102004-06-03 01:59:41 +00002# Test suite for the textwrap module.
Greg Ward3dc94e12002-08-22 18:37:50 +00003#
4# Original tests written by Greg Ward <gward@python.net>.
5# Converted to PyUnit by Peter Hansen <peter@engcorp.com>.
6# Currently maintained by Greg Ward.
7#
8# $Id$
9#
10
Greg Ward90c0b072002-08-22 18:11:10 +000011import unittest
12
Antoine Pitrou389dec82013-08-12 22:39:09 +020013from textwrap import TextWrapper, wrap, fill, dedent, indent, shorten
Greg Ward90c0b072002-08-22 18:11:10 +000014
15
class BaseTestCase(unittest.TestCase):
    '''Parent class with utility methods for textwrap tests.'''

    def show(self, textin):
        '''Render *textin* for use inside an assertion failure message.

        A list becomes one numbered line per item (or " no lines" when it
        is empty); a string becomes its repr followed by a newline.  Any
        other value falls back to its repr, so that formatting the failure
        message can never itself raise and hide the real mismatch.
        '''
        if isinstance(textin, list):
            rendered = [" %d: %r" % (i, line)
                        for i, line in enumerate(textin)]
            return "\n".join(rendered) if rendered else " no lines"
        if isinstance(textin, str):
            return " %s\n" % repr(textin)
        # Neither a list nor a str (e.g. None or a tuple): still produce
        # something printable instead of failing on an unbound local.
        return " %r\n" % (textin,)

    def check(self, result, expect):
        '''Assert result == expect, showing both values on failure.'''
        self.assertEqual(result, expect,
            'expected:\n%s\nbut got:\n%s' % (
                self.show(expect), self.show(result)))

    def check_wrap(self, text, width, expect, **kwargs):
        '''Assert that wrap(text, width, **kwargs) returns *expect*.'''
        result = wrap(text, width, **kwargs)
        self.check(result, expect)

    def check_split(self, text, expect):
        '''Assert that self.wrapper._split(text) returns *expect*.

        Subclasses using this helper must create self.wrapper in setUp().
        '''
        result = self.wrapper._split(text)
        self.assertEqual(result, expect,
                         "\nexpected %r\n"
                         "but got %r" % (expect, result))
Greg Ward715debd2002-08-22 21:16:25 +000044
Greg Ward90c0b072002-08-22 18:11:10 +000045
class WrapTestCase(BaseTestCase):
    '''Tests for wrap()/fill() and for TextWrapper's chunk splitting.

    Expected values that depend on runs of several spaces are spelled
    with explicit ``" " * n`` so the exact widths are unambiguous.
    '''

    def setUp(self):
        # Shared wrapper used by check_split() and test_split().
        self.wrapper = TextWrapper(width=45)

    def test_simple(self):
        # Simple case: just words, spaces, and a bit of punctuation

        text = "Hello there, how are you this fine day? I'm glad to hear it!"

        self.check_wrap(text, 12,
                        ["Hello there,",
                         "how are you",
                         "this fine",
                         "day? I'm",
                         "glad to hear",
                         "it!"])
        self.check_wrap(text, 42,
                        ["Hello there, how are you this fine day?",
                         "I'm glad to hear it!"])
        self.check_wrap(text, 80, [text])

    def test_empty_string(self):
        # Check that wrapping the empty string returns an empty list.
        self.check_wrap("", 6, [])
        self.check_wrap("", 6, [], drop_whitespace=False)

    def test_empty_string_with_initial_indent(self):
        # Check that the empty string is not indented.
        self.check_wrap("", 6, [], initial_indent="++")
        self.check_wrap("", 6, [], initial_indent="++", drop_whitespace=False)

    def test_whitespace(self):
        # Whitespace munging and end-of-sentence detection

        text = """\
This is a paragraph that already has
line breaks. But some of its lines are much longer than the others,
so it needs to be wrapped.
Some lines are \ttabbed too.
What a mess!
"""

        # fix_sentence_endings=True separates sentences by exactly two
        # spaces; the space + tab after "are" expands to two spaces.
        expect = ["This is a paragraph that already has line",
                  "breaks." + " " * 2 + "But some of its lines are much",
                  "longer than the others, so it needs to be",
                  "wrapped." + " " * 2 + "Some lines are" + " " * 2 +
                  "tabbed too." + " " * 2 + "What a",
                  "mess!"]

        wrapper = TextWrapper(45, fix_sentence_endings=True)
        result = wrapper.wrap(text)
        self.check(result, expect)

        result = wrapper.fill(text)
        self.check(result, '\n'.join(expect))

        # Default tabsize is 8: tabs advance to columns 8, 16, 24 and 32.
        text = "\tTest\tdefault\t\ttabsize."
        expect = [" " * 8 + "Test" + " " * 4 + "default" + " " * 9 +
                  "tabsize."]
        self.check_wrap(text, 80, expect)

        # With tabsize=4 the tabs advance to columns 4, 12, 20 and 24.
        text = "\tTest\tcustom\t\ttabsize."
        expect = [" " * 4 + "Test" + " " * 4 + "custom" + " " * 6 +
                  "tabsize."]
        self.check_wrap(text, 80, expect, tabsize=4)

    def test_fix_sentence_endings(self):
        wrapper = TextWrapper(60, fix_sentence_endings=True)

        # SF #847346: ensure that fix_sentence_endings=True does the
        # right thing even on input short enough that it doesn't need to
        # be wrapped.
        text = "A short line. Note the single space."
        expect = ["A short line." + " " * 2 + "Note the single space."]
        self.check(wrapper.wrap(text), expect)

        # Test some of the hairy end cases that _fix_sentence_endings()
        # is supposed to handle (the easy stuff is tested in
        # test_whitespace() above).
        text = "Well, Doctor? What do you think?"
        expect = ["Well, Doctor?" + " " * 2 + "What do you think?"]
        self.check(wrapper.wrap(text), expect)

        text = "Well, Doctor?\nWhat do you think?"
        self.check(wrapper.wrap(text), expect)

        text = 'I say, chaps! Anyone for "tennis?"\nHmmph!'
        expect = ['I say, chaps!' + ' ' * 2 + 'Anyone for "tennis?"' +
                  ' ' * 2 + 'Hmmph!']
        self.check(wrapper.wrap(text), expect)

        # Whitespace at line ends is dropped, so no double space shows up
        # when every sentence lands on its own line.
        wrapper.width = 20
        expect = ['I say, chaps!', 'Anyone for "tennis?"', 'Hmmph!']
        self.check(wrapper.wrap(text), expect)

        text = 'And she said, "Go to hell!"\nCan you believe that?'
        expect = ['And she said, "Go to',
                  'hell!"' + ' ' * 2 + 'Can you',
                  'believe that?']
        self.check(wrapper.wrap(text), expect)

        wrapper.width = 60
        expect = ['And she said, "Go to hell!"' + ' ' * 2 +
                  'Can you believe that?']
        self.check(wrapper.wrap(text), expect)

        # A period inside a word is not a sentence ending.
        text = 'File stdio.h is nice.'
        expect = ['File stdio.h is nice.']
        self.check(wrapper.wrap(text), expect)

    def test_wrap_short(self):
        # Wrapping to make short lines longer

        text = "This is a\nshort paragraph."

        self.check_wrap(text, 20, ["This is a short",
                                   "paragraph."])
        self.check_wrap(text, 40, ["This is a short paragraph."])

    def test_wrap_short_1line(self):
        # Test endcases

        text = "This is a short line."

        self.check_wrap(text, 30, ["This is a short line."])
        self.check_wrap(text, 30, ["(1) This is a short line."],
                        initial_indent="(1) ")

    def test_hyphenated(self):
        # Test breaking hyphenated words

        text = ("this-is-a-useful-feature-for-"
                "reformatting-posts-from-tim-peters'ly")

        self.check_wrap(text, 40,
                        ["this-is-a-useful-feature-for-",
                         "reformatting-posts-from-tim-peters'ly"])
        self.check_wrap(text, 41,
                        ["this-is-a-useful-feature-for-",
                         "reformatting-posts-from-tim-peters'ly"])
        self.check_wrap(text, 42,
                        ["this-is-a-useful-feature-for-reformatting-",
                         "posts-from-tim-peters'ly"])
        # The test tests current behavior but is not testing parts of the API.
        expect = ("this-|is-|a-|useful-|feature-|for-|"
                  "reformatting-|posts-|from-|tim-|peters'ly").split('|')
        self.check_wrap(text, 1, expect, break_long_words=False)
        self.check_split(text, expect)

        self.check_split('e-mail', ['e-mail'])
        self.check_split('Jelly-O', ['Jelly-O'])
        # The test tests current behavior but is not testing parts of the API.
        self.check_split('half-a-crown', 'half-|a-|crown'.split('|'))

    def test_hyphenated_numbers(self):
        # Test that hyphenated numbers (eg. dates) are not broken like words.
        text = ("Python 1.0.0 was released on 1994-01-26. Python 1.0.1 was\n"
                "released on 1994-02-15.")

        self.check_wrap(text, 30, ['Python 1.0.0 was released on',
                                   '1994-01-26. Python 1.0.1 was',
                                   'released on 1994-02-15.'])
        self.check_wrap(text, 40, ['Python 1.0.0 was released on 1994-01-26.',
                                   'Python 1.0.1 was released on 1994-02-15.'])
        self.check_wrap(text, 1, text.split(), break_long_words=False)

        text = "I do all my shopping at 7-11."
        self.check_wrap(text, 25, ["I do all my shopping at",
                                   "7-11."])
        self.check_wrap(text, 27, ["I do all my shopping at",
                                   "7-11."])
        self.check_wrap(text, 29, ["I do all my shopping at 7-11."])
        self.check_wrap(text, 1, text.split(), break_long_words=False)

    def test_em_dash(self):
        # Test text with em-dashes
        text = "Em-dashes should be written -- thus."
        self.check_wrap(text, 25,
                        ["Em-dashes should be",
                         "written -- thus."])

        # Probe the boundaries of the properly written em-dash,
        # ie. " -- ".
        self.check_wrap(text, 29,
                        ["Em-dashes should be written",
                         "-- thus."])
        expect = ["Em-dashes should be written --",
                  "thus."]
        self.check_wrap(text, 30, expect)
        self.check_wrap(text, 35, expect)
        self.check_wrap(text, 36,
                        ["Em-dashes should be written -- thus."])

        # The improperly written em-dash is handled too, because
        # it's adjacent to non-whitespace on both sides.
        text = "You can also do--this or even---this."
        expect = ["You can also do",
                  "--this or even",
                  "---this."]
        self.check_wrap(text, 15, expect)
        self.check_wrap(text, 16, expect)
        expect = ["You can also do--",
                  "this or even---",
                  "this."]
        self.check_wrap(text, 17, expect)
        self.check_wrap(text, 19, expect)
        expect = ["You can also do--this or even",
                  "---this."]
        self.check_wrap(text, 29, expect)
        self.check_wrap(text, 31, expect)
        expect = ["You can also do--this or even---",
                  "this."]
        self.check_wrap(text, 32, expect)
        self.check_wrap(text, 35, expect)

        # All of the above behaviour could be deduced by probing the
        # _split() method.
        text = "Here's an -- em-dash and--here's another---and another!"
        expect = ["Here's", " ", "an", " ", "--", " ", "em-", "dash", " ",
                  "and", "--", "here's", " ", "another", "---",
                  "and", " ", "another!"]
        self.check_split(text, expect)

        text = "and then--bam!--he was gone"
        expect = ["and", " ", "then", "--", "bam!", "--",
                  "he", " ", "was", " ", "gone"]
        self.check_split(text, expect)

    def test_unix_options(self):
        # Test that Unix-style command-line options are wrapped correctly.
        # Both Optik (OptionParser) and Docutils rely on this behaviour!

        text = "You should use the -n option, or --dry-run in its long form."
        self.check_wrap(text, 20,
                        ["You should use the",
                         "-n option, or --dry-",
                         "run in its long",
                         "form."])
        self.check_wrap(text, 21,
                        ["You should use the -n",
                         "option, or --dry-run",
                         "in its long form."])
        expect = ["You should use the -n option, or",
                  "--dry-run in its long form."]
        self.check_wrap(text, 32, expect)
        self.check_wrap(text, 34, expect)
        self.check_wrap(text, 35, expect)
        self.check_wrap(text, 38, expect)
        expect = ["You should use the -n option, or --dry-",
                  "run in its long form."]
        self.check_wrap(text, 39, expect)
        self.check_wrap(text, 41, expect)
        expect = ["You should use the -n option, or --dry-run",
                  "in its long form."]
        self.check_wrap(text, 42, expect)

        # Again, all of the above can be deduced from _split().
        text = "the -n option, or --dry-run or --dryrun"
        expect = ["the", " ", "-n", " ", "option,", " ", "or", " ",
                  "--dry-", "run", " ", "or", " ", "--dryrun"]
        self.check_split(text, expect)

    def test_funky_hyphens(self):
        # Screwy edge cases cooked up by David Goodger.  All reported
        # in SF bug #596434.
        self.check_split("what the--hey!", ["what", " ", "the", "--", "hey!"])
        self.check_split("what the--", ["what", " ", "the--"])
        self.check_split("what the--.", ["what", " ", "the--."])
        self.check_split("--text--.", ["--text--."])

        # When I first read bug #596434, this is what I thought David
        # was talking about.  I was wrong; these have always worked
        # fine.  The real problem is tested in test_funky_parens()
        # below...
        self.check_split("--option", ["--option"])
        self.check_split("--option-opt", ["--option-", "opt"])
        self.check_split("foo --option-opt bar",
                         ["foo", " ", "--option-", "opt", " ", "bar"])

    def test_punct_hyphens(self):
        # Oh bother, SF #965425 found another problem with hyphens --
        # hyphenated words in single quotes weren't handled correctly.
        # In fact, the bug is that *any* punctuation around a hyphenated
        # word was handled incorrectly, except for a leading "--", which
        # was special-cased for Optik and Docutils.  So test a variety
        # of styles of punctuation around a hyphenated word.
        # (Actually this is based on an Optik bug report, #813077).
        self.check_split("the 'wibble-wobble' widget",
                         ['the', ' ', "'wibble-", "wobble'", ' ', 'widget'])
        self.check_split('the "wibble-wobble" widget',
                         ['the', ' ', '"wibble-', 'wobble"', ' ', 'widget'])
        self.check_split("the (wibble-wobble) widget",
                         ['the', ' ', "(wibble-", "wobble)", ' ', 'widget'])
        self.check_split("the ['wibble-wobble'] widget",
                         ['the', ' ', "['wibble-", "wobble']", ' ', 'widget'])

        # The test tests current behavior but is not testing parts of the API.
        self.check_split("what-d'you-call-it.",
                         "what-d'you-|call-|it.".split('|'))

    def test_funky_parens(self):
        # Second part of SF bug #596434: long option strings inside
        # parentheses.
        self.check_split("foo (--option) bar",
                         ["foo", " ", "(--option)", " ", "bar"])

        # Related stuff -- make sure parens work in simpler contexts.
        self.check_split("foo (bar) baz",
                         ["foo", " ", "(bar)", " ", "baz"])
        self.check_split("blah (ding dong), wubba",
                         ["blah", " ", "(ding", " ", "dong),",
                          " ", "wubba"])

    def test_drop_whitespace_false(self):
        # Check that drop_whitespace=False preserves whitespace.
        # SF patch #1581073
        # The input contains a 4-space and a 5-space run; with
        # drop_whitespace=False each run must survive verbatim.
        text = (" This is a" + " " * 4 + "sentence with" + " " * 5 +
                "much whitespace.")
        self.check_wrap(text, 10,
                        [" This is a", " " * 4, "sentence ",
                         "with" + " " * 5, "much white", "space."],
                        drop_whitespace=False)

    def test_drop_whitespace_false_whitespace_only(self):
        # Check that drop_whitespace=False preserves a whitespace-only string.
        self.check_wrap(" " * 3, 6, [" " * 3], drop_whitespace=False)

    def test_drop_whitespace_false_whitespace_only_with_indent(self):
        # Check that a whitespace-only string gets indented (when
        # drop_whitespace is False): 2 spaces of indent + 3 of text.
        self.check_wrap(" " * 3, 6, [" " * 5], drop_whitespace=False,
                        initial_indent=" " * 2)

    def test_drop_whitespace_whitespace_only(self):
        # Check drop_whitespace on a whitespace-only string.
        self.check_wrap(" " * 2, 6, [])

    def test_drop_whitespace_leading_whitespace(self):
        # Check that drop_whitespace does not drop leading whitespace (if
        # followed by non-whitespace).
        # SF bug #622849 reported inconsistent handling of leading
        # whitespace; let's test that a bit, shall we?
        text = " This is a sentence with leading whitespace."
        self.check_wrap(text, 50,
                        [" This is a sentence with leading whitespace."])
        self.check_wrap(text, 30,
                        [" This is a sentence with", "leading whitespace."])

    def test_drop_whitespace_whitespace_line(self):
        # Check that drop_whitespace skips the whole line if a non-leading
        # line consists only of whitespace.
        # The 4-space gap cannot share a 6-column line with either word.
        text = "abcd" + " " * 4 + "efgh"
        # Include the result for drop_whitespace=False for comparison.
        self.check_wrap(text, 6, ["abcd", " " * 4, "efgh"],
                        drop_whitespace=False)
        self.check_wrap(text, 6, ["abcd", "efgh"])

    def test_drop_whitespace_whitespace_only_with_indent(self):
        # Check that initial_indent is not applied to a whitespace-only
        # string.  This checks a special case of the fact that dropping
        # whitespace occurs before indenting.
        self.check_wrap(" " * 2, 6, [], initial_indent="++")

    def test_drop_whitespace_whitespace_indent(self):
        # Check that drop_whitespace does not drop whitespace indents.
        # This checks a special case of the fact that dropping whitespace
        # occurs before indenting.
        self.check_wrap("abcd efgh", 6, ["  abcd", "  efgh"],
                        initial_indent="  ", subsequent_indent="  ")

    def test_split(self):
        # Ensure that the standard _split() method works as advertised
        # in the comments

        text = "Hello there -- you goof-ball, use the -b option!"

        result = self.wrapper._split(text)
        self.check(result,
             ["Hello", " ", "there", " ", "--", " ", "you", " ", "goof-",
              "ball,", " ", "use", " ", "the", " ", "-b", " ",  "option!"])

    def test_break_on_hyphens(self):
        # Ensure that the break_on_hyphens attributes work
        text = "yaba daba-doo"
        self.check_wrap(text, 10, ["yaba daba-", "doo"],
                        break_on_hyphens=True)
        self.check_wrap(text, 10, ["yaba", "daba-doo"],
                        break_on_hyphens=False)

    def test_bad_width(self):
        # Ensure that width <= 0 is caught.
        text = "Whatever, it doesn't matter."
        self.assertRaises(ValueError, wrap, text, 0)
        self.assertRaises(ValueError, wrap, text, -1)

    def test_no_split_at_umlaut(self):
        text = "Die Empf\xe4nger-Auswahl"
        self.check_wrap(text, 13, ["Die", "Empf\xe4nger-", "Auswahl"])

    def test_umlaut_followed_by_dash(self):
        text = "aa \xe4\xe4-\xe4\xe4"
        self.check_wrap(text, 7, ["aa \xe4\xe4-", "\xe4\xe4"])
446
Greg Ward90c0b072002-08-22 18:11:10 +0000447
class MaxLinesTestCase(BaseTestCase):
    '''Tests for the max_lines and placeholder options of wrap().'''

    text = "Hello there, how are you this fine day? I'm glad to hear it!"

    def test_simple(self):
        self.check_wrap(self.text, 12,
                        ["Hello [...]"],
                        max_lines=0)
        self.check_wrap(self.text, 12,
                        ["Hello [...]"],
                        max_lines=1)
        self.check_wrap(self.text, 12,
                        ["Hello there,",
                         "how [...]"],
                        max_lines=2)
        self.check_wrap(self.text, 13,
                        ["Hello there,",
                         "how are [...]"],
                        max_lines=2)
        self.check_wrap(self.text, 80, [self.text], max_lines=1)
        self.check_wrap(self.text, 12,
                        ["Hello there,",
                         "how are you",
                         "this fine",
                         "day? I'm",
                         "glad to hear",
                         "it!"],
                        max_lines=6)

    def test_spaces(self):
        # strip spaces before placeholder
        self.check_wrap(self.text, 12,
                        ["Hello there,",
                         "how are you",
                         "this fine",
                         "day? [...]"],
                        max_lines=4)
        # placeholder at the start of line
        self.check_wrap(self.text, 6,
                        ["Hello",
                         "[...]"],
                        max_lines=2)
        # final spaces
        self.check_wrap(self.text + ' ' * 10, 12,
                        ["Hello there,",
                         "how are you",
                         "this fine",
                         "day? I'm",
                         "glad to hear",
                         "it!"],
                        max_lines=6)

    def test_placeholder(self):
        self.check_wrap(self.text, 12,
                        ["Hello..."],
                        max_lines=1,
                        placeholder='...')
        self.check_wrap(self.text, 12,
                        ["Hello there,",
                         "how are..."],
                        max_lines=2,
                        placeholder='...')
        # long placeholder and indentation
        # The stripped placeholder is 14 characters wide, so a 4-space
        # indent on the truncated line (4 + 14 > 16) must be rejected...
        with self.assertRaises(ValueError):
            wrap(self.text, 16, initial_indent=' ' * 4,
                 max_lines=1, placeholder=' [truncated]...')
        with self.assertRaises(ValueError):
            wrap(self.text, 16, subsequent_indent=' ' * 4,
                 max_lines=2, placeholder=' [truncated]...')
        # ...while a 2-space indent on that line (2 + 14 == 16) just fits.
        # Only the indent of the line that receives the placeholder counts.
        self.check_wrap(self.text, 16,
                        [" " * 4 + "Hello there,",
                         " " * 2 + "[truncated]..."],
                        max_lines=2,
                        initial_indent=' ' * 4,
                        subsequent_indent=' ' * 2,
                        placeholder=' [truncated]...')
        self.check_wrap(self.text, 16,
                        [" " * 2 + "[truncated]..."],
                        max_lines=1,
                        initial_indent=' ' * 2,
                        subsequent_indent=' ' * 4,
                        placeholder=' [truncated]...')
        # Without max_lines the placeholder is never used, however long.
        self.check_wrap(self.text, 80, [self.text], placeholder='.' * 1000)
530
531
class LongWordTestCase(BaseTestCase):
    '''Tests for words longer than the wrapping width.'''

    def setUp(self):
        self.wrapper = TextWrapper()
        self.text = '''\
Did you say "supercalifragilisticexpialidocious?"
How *do* you spell that odd word, anyways?
'''

    def test_break_long(self):
        # Wrap text with long words and lots of punctuation

        self.check_wrap(self.text, 30,
                        ['Did you say "supercalifragilis',
                         'ticexpialidocious?" How *do*',
                         'you spell that odd word,',
                         'anyways?'])
        self.check_wrap(self.text, 50,
                        ['Did you say "supercalifragilisticexpialidocious?"',
                         'How *do* you spell that odd word, anyways?'])

        # SF bug 797650.  Prevent an infinite loop by making sure that at
        # least one character gets split off on every pass.
        # The indent (15) is wider than the width (10), so every
        # continuation line is the full indent plus a single character.
        pad = ' ' * 15
        self.check_wrap('-'*10+'hello', 10,
                        ['----------',
                         pad + 'h',
                         pad + 'e',
                         pad + 'l',
                         pad + 'l',
                         pad + 'o'],
                        subsequent_indent=pad)

        # bug 1146.  Prevent a long word to be wrongly wrapped when the
        # preceding word is exactly one character shorter than the width
        self.check_wrap(self.text, 12,
                        ['Did you say ',
                         '"supercalifr',
                         'agilisticexp',
                         'ialidocious?',
                         '" How *do*',
                         'you spell',
                         'that odd',
                         'word,',
                         'anyways?'])

    def test_nobreak_long(self):
        # Test with break_long_words disabled
        self.wrapper.break_long_words = 0
        self.wrapper.width = 30
        expect = ['Did you say',
                  '"supercalifragilisticexpialidocious?"',
                  'How *do* you spell that odd',
                  'word, anyways?'
                  ]
        result = self.wrapper.wrap(self.text)
        self.check(result, expect)

        # Same thing with kwargs passed to standalone wrap() function.
        result = wrap(self.text, width=30, break_long_words=0)
        self.check(result, expect)

    def test_max_lines_long(self):
        # The broken-up long word leaves no room for the placeholder, so
        # the placeholder gets a line of its own.
        self.check_wrap(self.text, 12,
                        ['Did you say ',
                         '"supercalifr',
                         'agilisticexp',
                         '[...]'],
                        max_lines=4)
599
Greg Ward90c0b072002-08-22 18:11:10 +0000600
class IndentTestCases(BaseTestCase):
    '''Tests for the initial_indent/subsequent_indent options of
    wrap() and fill().'''

    # called before each test method
    def setUp(self):
        self.text = '''\
This paragraph will be filled, first without any indentation,
and then with some (including a hanging indent).'''

    def test_fill(self):
        # Test the fill() method

        expect = '''\
This paragraph will be filled, first
without any indentation, and then with
some (including a hanging indent).'''

        result = fill(self.text, 40)
        self.check(result, expect)

    def test_initial_indent(self):
        # Test initial_indent parameter

        # A 5-space indent leaves 35 columns on the first line, which is
        # one too few for "first" to fit after "filled,".
        first_indent = " " * 5
        expect = [first_indent + "This paragraph will be filled,",
                  "first without any indentation, and then",
                  "with some (including a hanging indent)."]
        result = wrap(self.text, 40, initial_indent=first_indent)
        self.check(result, expect)

        expect = "\n".join(expect)
        result = fill(self.text, 40, initial_indent=first_indent)
        self.check(result, expect)

    def test_subsequent_indent(self):
        # Test subsequent_indent parameter

        # Bullet on the first line, 4-space hanging indent afterwards.
        expect = "\n".join([
            "  * This paragraph will be filled, first",
            "    without any indentation, and then",
            "    with some (including a hanging",
            "    indent)."])

        result = fill(self.text, 40,
                      initial_indent="  * ", subsequent_indent=" " * 4)
        self.check(result, expect)
648
649
# Despite the similar names, DedentTestCase is *not* the inverse
# of IndentTestCases (the wrap()/fill() indentation tests above)!
652class DedentTestCase(unittest.TestCase):
653
Thomas Wouters0e3f5912006-08-11 14:57:12 +0000654 def assertUnchanged(self, text):
655 """assert that dedent() has no effect on 'text'"""
Ezio Melottib3aedd42010-11-20 19:04:17 +0000656 self.assertEqual(text, dedent(text))
Thomas Wouters0e3f5912006-08-11 14:57:12 +0000657
Greg Ward9e082f42003-05-08 01:58:26 +0000658 def test_dedent_nomargin(self):
659 # No lines indented.
660 text = "Hello there.\nHow are you?\nOh good, I'm glad."
Thomas Wouters0e3f5912006-08-11 14:57:12 +0000661 self.assertUnchanged(text)
Greg Ward9e082f42003-05-08 01:58:26 +0000662
663 # Similar, with a blank line.
664 text = "Hello there.\n\nBoo!"
Thomas Wouters0e3f5912006-08-11 14:57:12 +0000665 self.assertUnchanged(text)
Greg Ward9e082f42003-05-08 01:58:26 +0000666
667 # Some lines indented, but overall margin is still zero.
668 text = "Hello there.\n This is indented."
Thomas Wouters0e3f5912006-08-11 14:57:12 +0000669 self.assertUnchanged(text)
Greg Ward9e082f42003-05-08 01:58:26 +0000670
671 # Again, add a blank line.
672 text = "Hello there.\n\n Boo!\n"
Thomas Wouters0e3f5912006-08-11 14:57:12 +0000673 self.assertUnchanged(text)
Greg Ward9e082f42003-05-08 01:58:26 +0000674
675 def test_dedent_even(self):
676 # All lines indented by two spaces.
677 text = " Hello there.\n How are ya?\n Oh good."
678 expect = "Hello there.\nHow are ya?\nOh good."
Ezio Melottib3aedd42010-11-20 19:04:17 +0000679 self.assertEqual(expect, dedent(text))
Greg Ward9e082f42003-05-08 01:58:26 +0000680
681 # Same, with blank lines.
682 text = " Hello there.\n\n How are ya?\n Oh good.\n"
683 expect = "Hello there.\n\nHow are ya?\nOh good.\n"
Ezio Melottib3aedd42010-11-20 19:04:17 +0000684 self.assertEqual(expect, dedent(text))
Greg Ward9e082f42003-05-08 01:58:26 +0000685
686 # Now indent one of the blank lines.
687 text = " Hello there.\n \n How are ya?\n Oh good.\n"
688 expect = "Hello there.\n\nHow are ya?\nOh good.\n"
Ezio Melottib3aedd42010-11-20 19:04:17 +0000689 self.assertEqual(expect, dedent(text))
Greg Ward9e082f42003-05-08 01:58:26 +0000690
691 def test_dedent_uneven(self):
692 # Lines indented unevenly.
693 text = '''\
694 def foo():
695 while 1:
696 return foo
697 '''
698 expect = '''\
699def foo():
700 while 1:
701 return foo
702'''
Ezio Melottib3aedd42010-11-20 19:04:17 +0000703 self.assertEqual(expect, dedent(text))
Greg Ward9e082f42003-05-08 01:58:26 +0000704
705 # Uneven indentation with a blank line.
706 text = " Foo\n Bar\n\n Baz\n"
707 expect = "Foo\n Bar\n\n Baz\n"
Ezio Melottib3aedd42010-11-20 19:04:17 +0000708 self.assertEqual(expect, dedent(text))
Greg Ward9e082f42003-05-08 01:58:26 +0000709
710 # Uneven indentation with a whitespace-only line.
711 text = " Foo\n Bar\n \n Baz\n"
712 expect = "Foo\n Bar\n\n Baz\n"
Ezio Melottib3aedd42010-11-20 19:04:17 +0000713 self.assertEqual(expect, dedent(text))
Greg Ward9e082f42003-05-08 01:58:26 +0000714
Thomas Wouters0e3f5912006-08-11 14:57:12 +0000715 # dedent() should not mangle internal tabs
716 def test_dedent_preserve_internal_tabs(self):
717 text = " hello\tthere\n how are\tyou?"
718 expect = "hello\tthere\nhow are\tyou?"
Ezio Melottib3aedd42010-11-20 19:04:17 +0000719 self.assertEqual(expect, dedent(text))
Thomas Wouters0e3f5912006-08-11 14:57:12 +0000720
721 # make sure that it preserves tabs when it's not making any
722 # changes at all
Ezio Melottib3aedd42010-11-20 19:04:17 +0000723 self.assertEqual(expect, dedent(expect))
Thomas Wouters0e3f5912006-08-11 14:57:12 +0000724
725 # dedent() should not mangle tabs in the margin (i.e.
726 # tabs and spaces both count as margin, but are *not*
727 # considered equivalent)
def test_dedent_preserve_margin_tabs(self):
    """Check how dedent() treats tabs that are part of the margin.

    Tabs and spaces both count as margin characters, but they are never
    treated as equivalent: only a prefix that is character-for-character
    identical on every line may be removed.
    """
    # Two spaces on one line, a tab on the other: nothing in common.
    text = "  hello there\n\thow are you?"
    self.assertUnchanged(text)

    # Same effect even if we have 8 spaces: a tab is not "8 spaces".
    # The run is built with a repeat so that its width is unmistakable.
    text = " " * 8 + "hello there\n\thow are you?"
    self.assertUnchanged(text)

    # dedent() only removes whitespace that can be uniformly removed!
    text = "\thello there\n\thow are you?"
    expect = "hello there\nhow are you?"
    self.assertEqual(expect, dedent(text))

    # Identical space+tab margins are removed as a whole.
    text = "  \thello there\n  \thow are you?"
    self.assertEqual(expect, dedent(text))

    text = "  \t  hello there\n  \t  how are you?"
    self.assertEqual(expect, dedent(text))

    # The second line is indented past the common "  \t" margin; the
    # extra two spaces must be kept.
    text = "  \thello there\n  \t  how are you?"
    expect = "hello there\n  how are you?"
    self.assertEqual(expect, dedent(text))

    # Test margin is smaller than smallest indent: the three margins
    # ("  \t", "   \t", " \t") only share their first space, so exactly
    # one space is stripped from each line.
    text = "  \thello there\n   \thow are you?\n \tI'm fine, thanks"
    expect = " \thello there\n  \thow are you?\n\tI'm fine, thanks"
    self.assertEqual(expect, dedent(text))
755
Greg Ward9e082f42003-05-08 01:58:26 +0000756
Nick Coghlan4fae8cd2012-06-11 23:07:51 +1000757# Test textwrap.indent
class IndentTestCase(unittest.TestCase):
    """Tests for textwrap.indent(), alone and round-tripped through dedent()."""

    # The examples used for tests. If any of these change, the expected
    # results in the various test cases must also be updated.
    # The roundtrip cases are separate, because textwrap.dedent doesn't
    # handle Windows line endings
    ROUNDTRIP_CASES = (
        # Basic test case
        "Hi.\nThis is a test.\nTesting.",
        # Include a blank line
        "Hi.\nThis is a test.\n\nTesting.",
        # Include leading and trailing blank lines
        "\nHi.\nThis is a test.\nTesting.\n",
    )
    CASES = ROUNDTRIP_CASES + (
        # Use Windows line endings
        "Hi.\r\nThis is a test.\r\nTesting.\r\n",
        # Pathological case
        "\nHi.\r\nThis is a test.\n\r\nTesting.\r\n\n",
    )

    # CASES indented with a one-space prefix under the default predicate,
    # i.e. only lines that are not whitespace-only receive the prefix.
    # Shared by the implicit-default and explicit-default (None) tests.
    _DEFAULT_INDENTED = (
        # Basic test case
        " Hi.\n This is a test.\n Testing.",
        # Include a blank line
        " Hi.\n This is a test.\n\n Testing.",
        # Include leading and trailing blank lines
        "\n Hi.\n This is a test.\n Testing.\n",
        # Use Windows line endings
        " Hi.\r\n This is a test.\r\n Testing.\r\n",
        # Pathological case
        "\n Hi.\r\n This is a test.\n\r\n Testing.\r\n\n",
    )

    def _check_indent(self, expected, prefix, *predicate):
        """Indent every entry of CASES and compare it with *expected*.

        *expected* holds one result per entry of CASES, in the same
        order.  *predicate* is either empty (indent() is then called
        with two arguments) or a single value passed on as indent()'s
        third argument.
        """
        # zip() stops at the shorter sequence, so a case added to CASES
        # without a matching expectation would otherwise go unchecked.
        self.assertEqual(len(expected), len(self.CASES),
                         "one expected result is required per entry of CASES")
        for text, expect in zip(self.CASES, expected):
            # subTest reports which input failed and lets the remaining
            # cases run instead of stopping at the first mismatch.
            with self.subTest(text=text):
                self.assertEqual(indent(text, prefix, *predicate), expect)

    def _check_roundtrip(self, prefix):
        """Assert that dedent() undoes indent() for each ROUNDTRIP_CASES entry."""
        for text in self.ROUNDTRIP_CASES:
            with self.subTest(text=text):
                self.assertEqual(dedent(indent(text, prefix)), text)

    def test_indent_nomargin_default(self):
        # indent should do nothing if 'prefix' is empty.
        self._check_indent(self.CASES, '')

    def test_indent_nomargin_explicit_default(self):
        # The same as test_indent_nomargin_default, but explicitly
        # requesting the default behaviour by passing None as the predicate
        self._check_indent(self.CASES, '', None)

    def test_indent_nomargin_all_lines(self):
        # The same as test_indent_nomargin_default, but using the
        # optional predicate argument
        self._check_indent(self.CASES, '', lambda line: True)

    def test_indent_no_lines(self):
        # Explicitly skip indenting any lines
        self._check_indent(self.CASES, ' ', lambda line: False)

    def test_roundtrip_spaces(self):
        # A whitespace prefix should roundtrip with dedent
        self._check_roundtrip(' ')

    def test_roundtrip_tabs(self):
        # A whitespace prefix should roundtrip with dedent
        self._check_roundtrip('\t\t')

    def test_roundtrip_mixed(self):
        # A whitespace prefix should roundtrip with dedent
        self._check_roundtrip(' \t \t ')

    def test_indent_default(self):
        # Test default indenting of lines that are not whitespace only
        self._check_indent(self._DEFAULT_INDENTED, ' ')

    def test_indent_explicit_default(self):
        # Passing None as the predicate must behave exactly like
        # omitting it
        self._check_indent(self._DEFAULT_INDENTED, ' ', None)

    def test_indent_all_lines(self):
        # Add 'prefix' to all lines, including whitespace-only ones.
        expected = (
            # Basic test case
            " Hi.\n This is a test.\n Testing.",
            # Include a blank line
            " Hi.\n This is a test.\n \n Testing.",
            # Include leading and trailing blank lines
            " \n Hi.\n This is a test.\n Testing.\n",
            # Use Windows line endings
            " Hi.\r\n This is a test.\r\n Testing.\r\n",
            # Pathological case
            " \n Hi.\r\n This is a test.\n \r\n Testing.\r\n \n",
        )
        self._check_indent(expected, ' ', lambda line: True)

    def test_indent_empty_lines(self):
        # Add 'prefix' solely to whitespace-only lines.
        expected = (
            # Basic test case
            "Hi.\nThis is a test.\nTesting.",
            # Include a blank line
            "Hi.\nThis is a test.\n \nTesting.",
            # Include leading and trailing blank lines
            " \nHi.\nThis is a test.\nTesting.\n",
            # Use Windows line endings
            "Hi.\r\nThis is a test.\r\nTesting.\r\n",
            # Pathological case
            " \nHi.\r\nThis is a test.\n \r\nTesting.\r\n \n",
        )
        self._check_indent(expected, ' ', lambda line: not line.strip())
890
891
class ShortenTestCase(BaseTestCase):
    """Tests for textwrap.shorten()."""

    def check_shorten(self, text, width, expect, **kwargs):
        """Shorten *text* to *width* and compare the outcome with *expect*.

        Any extra keyword arguments are forwarded to shorten().
        """
        self.check(shorten(text, width, **kwargs), expect)

    def test_simple(self):
        # Simple case: just words, spaces, and a bit of punctuation
        sentence = "Hello there, how are you this fine day? I'm glad to hear it!"
        full_width = len(sentence)

        self.check_shorten(sentence, 18, "Hello there, [...]")
        # Text that already fits is returned as is.
        self.check_shorten(sentence, full_width, sentence)
        # One column short: the last word gives way to the placeholder.
        self.check_shorten(
            sentence, full_width - 1,
            "Hello there, how are you this fine day? I'm glad to [...]")

    def test_placeholder(self):
        # Same sentence as test_simple, with caller-supplied placeholders.
        sentence = "Hello there, how are you this fine day? I'm glad to hear it!"
        full_width = len(sentence)

        self.check_shorten(sentence, 17, "Hello there,$$", placeholder='$$')
        self.check_shorten(sentence, 18, "Hello there, how$$",
                           placeholder='$$')
        self.check_shorten(sentence, 18, "Hello there, $$", placeholder=' $$')
        self.check_shorten(sentence, full_width, sentence, placeholder='$$')
        self.check_shorten(
            sentence, full_width - 1,
            "Hello there, how are you this fine day? I'm glad to hear$$",
            placeholder='$$')

    def test_empty_string(self):
        # Nothing to shorten: the empty string comes back empty.
        self.check_shorten("", 6, "")

    def test_whitespace(self):
        # Whitespace collapsing
        paragraph = """
            This is a paragraph that already has
            line breaks and \t tabs too."""
        self.check_shorten(
            paragraph, 62,
            "This is a paragraph that already has line breaks and tabs too.")
        self.check_shorten(
            paragraph, 61,
            "This is a paragraph that already has line breaks and [...]")

        padded = "hello world! "
        self.check_shorten(padded, 12, "hello world!")
        self.check_shorten(padded, 11, "hello [...]")
        # The leading space is trimmed from the placeholder
        # (it would be ugly otherwise).
        self.check_shorten(padded, 10, "[...]")

    def test_width_too_small_for_placeholder(self):
        long_word = "x" * 20
        # A placeholder exactly as wide as the width is accepted...
        shorten(long_word, width=8, placeholder="(......)")
        # ...but one character wider is rejected.
        with self.assertRaises(ValueError):
            shorten(long_word, width=8, placeholder="(.......)")

    def test_first_word_too_long_but_placeholder_fits(self):
        # No word fits, so only the (stripped) placeholder remains.
        self.check_shorten("Helloo", 5, "[...]")
Antoine Pitrou389dec82013-08-12 22:39:09 +0200947
Greg Wardf6765782002-08-22 18:35:49 +0000948
# Run the whole suite when this file is executed as a script.
if __name__ == "__main__":
    unittest.main()