| # | 
 | # Test script for the textwrap module. | 
 | # | 
 | # Original tests written by Greg Ward <gward@python.net>. | 
 | # Converted to PyUnit by Peter Hansen <peter@engcorp.com>. | 
 | # Currently maintained by Greg Ward. | 
 | # | 
 | # $Id$ | 
 | # | 
 |  | 
 | import unittest | 
 | from test import test_support | 
 |  | 
 | from textwrap import TextWrapper, wrap, fill, dedent | 
 |  | 
 |  | 
 | class BaseTestCase(unittest.TestCase): | 
 |     '''Parent class with utility methods for textwrap tests.''' | 
 |  | 
 |     def show(self, textin): | 
 |         if isinstance(textin, list): | 
 |             result = [] | 
 |             for i in range(len(textin)): | 
 |                 result.append("  %d: %r" % (i, textin[i])) | 
 |             result = '\n'.join(result) | 
 |         elif isinstance(textin, basestring): | 
 |             result = "  %s\n" % repr(textin) | 
 |         return result | 
 |  | 
 |  | 
 |     def check(self, result, expect): | 
 |         self.assertEquals(result, expect, | 
 |             'expected:\n%s\nbut got:\n%s' % ( | 
 |                 self.show(expect), self.show(result))) | 
 |  | 
 |     def check_wrap(self, text, width, expect, **kwargs): | 
 |         result = wrap(text, width, **kwargs) | 
 |         self.check(result, expect) | 
 |  | 
 |     def check_split(self, text, expect): | 
 |         result = self.wrapper._split(text) | 
 |         self.assertEquals(result, expect, | 
 |                           "\nexpected %r\n" | 
 |                           "but got  %r" % (expect, result)) | 
 |  | 
 |  | 
 | class WrapTestCase(BaseTestCase): | 
 |  | 
 |     def setUp(self): | 
 |         self.wrapper = TextWrapper(width=45, fix_sentence_endings=True) | 
 |  | 
 |     def test_simple(self): | 
 |         # Simple case: just words, spaces, and a bit of punctuation | 
 |  | 
 |         text = "Hello there, how are you this fine day?  I'm glad to hear it!" | 
 |  | 
 |         self.check_wrap(text, 12, | 
 |                         ["Hello there,", | 
 |                          "how are you", | 
 |                          "this fine", | 
 |                          "day?  I'm", | 
 |                          "glad to hear", | 
 |                          "it!"]) | 
 |         self.check_wrap(text, 42, | 
 |                         ["Hello there, how are you this fine day?", | 
 |                          "I'm glad to hear it!"]) | 
 |         self.check_wrap(text, 80, [text]) | 
 |  | 
 |  | 
 |     def test_whitespace(self): | 
 |         # Whitespace munging and end-of-sentence detection | 
 |  | 
 |         text = """\ | 
 | This is a paragraph that already has | 
 | line breaks.  But some of its lines are much longer than the others, | 
 | so it needs to be wrapped. | 
 | Some lines are \ttabbed too. | 
 | What a mess! | 
 | """ | 
 |  | 
 |         expect = ["This is a paragraph that already has line", | 
 |                   "breaks.  But some of its lines are much", | 
 |                   "longer than the others, so it needs to be", | 
 |                   "wrapped.  Some lines are  tabbed too.  What a", | 
 |                   "mess!"] | 
 |  | 
 |         result = self.wrapper.wrap(text) | 
 |         self.check(result, expect) | 
 |  | 
 |         result = self.wrapper.fill(text) | 
 |         self.check(result, '\n'.join(expect)) | 
 |  | 
 |  | 
 |     def test_wrap_short(self): | 
 |         # Wrapping to make short lines longer | 
 |  | 
 |         text = "This is a\nshort paragraph." | 
 |  | 
 |         self.check_wrap(text, 20, ["This is a short", | 
 |                                    "paragraph."]) | 
 |         self.check_wrap(text, 40, ["This is a short paragraph."]) | 
 |  | 
 |  | 
 |     def test_wrap_short_1line(self): | 
 |         # Test endcases | 
 |  | 
 |         text = "This is a short line." | 
 |  | 
 |         self.check_wrap(text, 30, ["This is a short line."]) | 
 |         self.check_wrap(text, 30, ["(1) This is a short line."], | 
 |                         initial_indent="(1) ") | 
 |  | 
 |  | 
 |     def test_hyphenated(self): | 
 |         # Test breaking hyphenated words | 
 |  | 
 |         text = ("this-is-a-useful-feature-for-" | 
 |                 "reformatting-posts-from-tim-peters'ly") | 
 |  | 
 |         self.check_wrap(text, 40, | 
 |                         ["this-is-a-useful-feature-for-", | 
 |                          "reformatting-posts-from-tim-peters'ly"]) | 
 |         self.check_wrap(text, 41, | 
 |                         ["this-is-a-useful-feature-for-", | 
 |                          "reformatting-posts-from-tim-peters'ly"]) | 
 |         self.check_wrap(text, 42, | 
 |                         ["this-is-a-useful-feature-for-reformatting-", | 
 |                          "posts-from-tim-peters'ly"]) | 
 |  | 
 |     def test_em_dash(self): | 
 |         # Test text with em-dashes | 
 |         text = "Em-dashes should be written -- thus." | 
 |         self.check_wrap(text, 25, | 
 |                         ["Em-dashes should be", | 
 |                          "written -- thus."]) | 
 |  | 
 |         # Probe the boundaries of the properly written em-dash, | 
 |         # ie. " -- ". | 
 |         self.check_wrap(text, 29, | 
 |                         ["Em-dashes should be written", | 
 |                          "-- thus."]) | 
 |         expect = ["Em-dashes should be written --", | 
 |                   "thus."] | 
 |         self.check_wrap(text, 30, expect) | 
 |         self.check_wrap(text, 35, expect) | 
 |         self.check_wrap(text, 36, | 
 |                         ["Em-dashes should be written -- thus."]) | 
 |  | 
 |         # The improperly written em-dash is handled too, because | 
 |         # it's adjacent to non-whitespace on both sides. | 
 |         text = "You can also do--this or even---this." | 
 |         expect = ["You can also do", | 
 |                   "--this or even", | 
 |                   "---this."] | 
 |         self.check_wrap(text, 15, expect) | 
 |         self.check_wrap(text, 16, expect) | 
 |         expect = ["You can also do--", | 
 |                   "this or even---", | 
 |                   "this."] | 
 |         self.check_wrap(text, 17, expect) | 
 |         self.check_wrap(text, 19, expect) | 
 |         expect = ["You can also do--this or even", | 
 |                   "---this."] | 
 |         self.check_wrap(text, 29, expect) | 
 |         self.check_wrap(text, 31, expect) | 
 |         expect = ["You can also do--this or even---", | 
 |                   "this."] | 
 |         self.check_wrap(text, 32, expect) | 
 |         self.check_wrap(text, 35, expect) | 
 |  | 
 |         # All of the above behaviour could be deduced by probing the | 
 |         # _split() method. | 
 |         text = "Here's an -- em-dash and--here's another---and another!" | 
 |         expect = ["Here's", " ", "an", " ", "--", " ", "em-", "dash", " ", | 
 |                   "and", "--", "here's", " ", "another", "---", | 
 |                   "and", " ", "another!"] | 
 |         self.check_split(text, expect) | 
 |  | 
 |         text = "and then--bam!--he was gone" | 
 |         expect = ["and", " ", "then", "--", "bam!", "--", | 
 |                   "he", " ", "was", " ", "gone"] | 
 |         self.check_split(text, expect) | 
 |  | 
 |  | 
 |     def test_unix_options (self): | 
 |         # Test that Unix-style command-line options are wrapped correctly. | 
 |         # Both Optik (OptionParser) and Docutils rely on this behaviour! | 
 |  | 
 |         text = "You should use the -n option, or --dry-run in its long form." | 
 |         self.check_wrap(text, 20, | 
 |                         ["You should use the", | 
 |                          "-n option, or --dry-", | 
 |                          "run in its long", | 
 |                          "form."]) | 
 |         self.check_wrap(text, 21, | 
 |                         ["You should use the -n", | 
 |                          "option, or --dry-run", | 
 |                          "in its long form."]) | 
 |         expect = ["You should use the -n option, or", | 
 |                   "--dry-run in its long form."] | 
 |         self.check_wrap(text, 32, expect) | 
 |         self.check_wrap(text, 34, expect) | 
 |         self.check_wrap(text, 35, expect) | 
 |         self.check_wrap(text, 38, expect) | 
 |         expect = ["You should use the -n option, or --dry-", | 
 |                   "run in its long form."] | 
 |         self.check_wrap(text, 39, expect) | 
 |         self.check_wrap(text, 41, expect) | 
 |         expect = ["You should use the -n option, or --dry-run", | 
 |                   "in its long form."] | 
 |         self.check_wrap(text, 42, expect) | 
 |  | 
 |         # Again, all of the above can be deduced from _split(). | 
 |         text = "the -n option, or --dry-run or --dryrun" | 
 |         expect = ["the", " ", "-n", " ", "option,", " ", "or", " ", | 
 |                   "--dry-", "run", " ", "or", " ", "--dryrun"] | 
 |         self.check_split(text, expect) | 
 |  | 
 |     def test_funky_hyphens (self): | 
 |         # Screwy edge cases cooked up by David Goodger.  All reported | 
 |         # in SF bug #596434. | 
 |         self.check_split("what the--hey!", ["what", " ", "the", "--", "hey!"]) | 
 |         self.check_split("what the--", ["what", " ", "the--"]) | 
 |         self.check_split("what the--.", ["what", " ", "the--."]) | 
 |         self.check_split("--text--.", ["--text--."]) | 
 |  | 
 |         # When I first read bug #596434, this is what I thought David | 
 |         # was talking about.  I was wrong; these have always worked | 
 |         # fine.  The real problem is tested in test_funky_parens() | 
 |         # below... | 
 |         self.check_split("--option", ["--option"]) | 
 |         self.check_split("--option-opt", ["--option-", "opt"]) | 
 |         self.check_split("foo --option-opt bar", | 
 |                          ["foo", " ", "--option-", "opt", " ", "bar"]) | 
 |  | 
 |     def test_funky_parens (self): | 
 |         # Second part of SF bug #596434: long option strings inside | 
 |         # parentheses. | 
 |         self.check_split("foo (--option) bar", | 
 |                          ["foo", " ", "(--option)", " ", "bar"]) | 
 |  | 
 |         # Related stuff -- make sure parens work in simpler contexts. | 
 |         self.check_split("foo (bar) baz", | 
 |                          ["foo", " ", "(bar)", " ", "baz"]) | 
 |         self.check_split("blah (ding dong), wubba", | 
 |                          ["blah", " ", "(ding", " ", "dong),", | 
 |                           " ", "wubba"]) | 
 |  | 
 |     def test_initial_whitespace(self): | 
 |         # SF bug #622849 reported inconsistent handling of leading | 
 |         # whitespace; let's test that a bit, shall we? | 
 |         text = " This is a sentence with leading whitespace." | 
 |         self.check_wrap(text, 50, | 
 |                         [" This is a sentence with leading whitespace."]) | 
 |         self.check_wrap(text, 30, | 
 |                         [" This is a sentence with", "leading whitespace."]) | 
 |  | 
 |     def test_unicode(self): | 
 |         # *Very* simple test of wrapping Unicode strings.  I'm sure | 
 |         # there's more to it than this, but let's at least make | 
 |         # sure textwrap doesn't crash on Unicode input! | 
 |         text = u"Hello there, how are you today?" | 
 |         self.check_wrap(text, 50, [u"Hello there, how are you today?"]) | 
 |         self.check_wrap(text, 20, [u"Hello there, how are", "you today?"]) | 
 |         olines = self.wrapper.wrap(text) | 
 |         assert isinstance(olines, list) and isinstance(olines[0], unicode) | 
 |         otext = self.wrapper.fill(text) | 
 |         assert isinstance(otext, unicode) | 
 |  | 
 |     def test_split(self): | 
 |         # Ensure that the standard _split() method works as advertised | 
 |         # in the comments | 
 |  | 
 |         text = "Hello there -- you goof-ball, use the -b option!" | 
 |  | 
 |         result = self.wrapper._split(text) | 
 |         self.check(result, | 
 |              ["Hello", " ", "there", " ", "--", " ", "you", " ", "goof-", | 
 |               "ball,", " ", "use", " ", "the", " ", "-b", " ",  "option!"]) | 
 |  | 
 |     def test_bad_width(self): | 
 |         # Ensure that width <= 0 is caught. | 
 |         text = "Whatever, it doesn't matter." | 
 |         self.assertRaises(ValueError, wrap, text, 0) | 
 |         self.assertRaises(ValueError, wrap, text, -1) | 
 |  | 
 |  | 
 | class LongWordTestCase (BaseTestCase): | 
 |     def setUp(self): | 
 |         self.wrapper = TextWrapper() | 
 |         self.text = '''\ | 
 | Did you say "supercalifragilisticexpialidocious?" | 
 | How *do* you spell that odd word, anyways? | 
 | ''' | 
 |  | 
 |     def test_break_long(self): | 
 |         # Wrap text with long words and lots of punctuation | 
 |  | 
 |         self.check_wrap(self.text, 30, | 
 |                         ['Did you say "supercalifragilis', | 
 |                          'ticexpialidocious?" How *do*', | 
 |                          'you spell that odd word,', | 
 |                          'anyways?']) | 
 |         self.check_wrap(self.text, 50, | 
 |                         ['Did you say "supercalifragilisticexpialidocious?"', | 
 |                          'How *do* you spell that odd word, anyways?']) | 
 |  | 
 |         # SF bug 797650.  Prevent an infinite loop by making sure that at | 
 |         # least one character gets split off on every pass. | 
 |         self.check_wrap('-'*10+'hello', 10, | 
 |                         ['----------', | 
 |                          '               h', | 
 |                          '               e', | 
 |                          '               l', | 
 |                          '               l', | 
 |                          '               o'], | 
 |                         subsequent_indent = ' '*15) | 
 |  | 
 |     def test_nobreak_long(self): | 
 |         # Test with break_long_words disabled | 
 |         self.wrapper.break_long_words = 0 | 
 |         self.wrapper.width = 30 | 
 |         expect = ['Did you say', | 
 |                   '"supercalifragilisticexpialidocious?"', | 
 |                   'How *do* you spell that odd', | 
 |                   'word, anyways?' | 
 |                   ] | 
 |         result = self.wrapper.wrap(self.text) | 
 |         self.check(result, expect) | 
 |  | 
 |         # Same thing with kwargs passed to standalone wrap() function. | 
 |         result = wrap(self.text, width=30, break_long_words=0) | 
 |         self.check(result, expect) | 
 |  | 
 |  | 
 | class IndentTestCases(BaseTestCase): | 
 |  | 
 |     # called before each test method | 
 |     def setUp(self): | 
 |         self.text = '''\ | 
 | This paragraph will be filled, first without any indentation, | 
 | and then with some (including a hanging indent).''' | 
 |  | 
 |  | 
 |     def test_fill(self): | 
 |         # Test the fill() method | 
 |  | 
 |         expect = '''\ | 
 | This paragraph will be filled, first | 
 | without any indentation, and then with | 
 | some (including a hanging indent).''' | 
 |  | 
 |         result = fill(self.text, 40) | 
 |         self.check(result, expect) | 
 |  | 
 |  | 
 |     def test_initial_indent(self): | 
 |         # Test initial_indent parameter | 
 |  | 
 |         expect = ["     This paragraph will be filled,", | 
 |                   "first without any indentation, and then", | 
 |                   "with some (including a hanging indent)."] | 
 |         result = wrap(self.text, 40, initial_indent="     ") | 
 |         self.check(result, expect) | 
 |  | 
 |         expect = "\n".join(expect) | 
 |         result = fill(self.text, 40, initial_indent="     ") | 
 |         self.check(result, expect) | 
 |  | 
 |  | 
 |     def test_subsequent_indent(self): | 
 |         # Test subsequent_indent parameter | 
 |  | 
 |         expect = '''\ | 
 |   * This paragraph will be filled, first | 
 |     without any indentation, and then | 
 |     with some (including a hanging | 
 |     indent).''' | 
 |  | 
 |         result = fill(self.text, 40, | 
 |                       initial_indent="  * ", subsequent_indent="    ") | 
 |         self.check(result, expect) | 
 |  | 
 |  | 
 | # Despite the similar names, DedentTestCase is *not* the inverse | 
 | # of IndentTestCase! | 
 | class DedentTestCase(unittest.TestCase): | 
 |  | 
 |     def test_dedent_nomargin(self): | 
 |         # No lines indented. | 
 |         text = "Hello there.\nHow are you?\nOh good, I'm glad." | 
 |         self.assertEquals(dedent(text), text) | 
 |  | 
 |         # Similar, with a blank line. | 
 |         text = "Hello there.\n\nBoo!" | 
 |         self.assertEquals(dedent(text), text) | 
 |  | 
 |         # Some lines indented, but overall margin is still zero. | 
 |         text = "Hello there.\n  This is indented." | 
 |         self.assertEquals(dedent(text), text) | 
 |  | 
 |         # Again, add a blank line. | 
 |         text = "Hello there.\n\n  Boo!\n" | 
 |         self.assertEquals(dedent(text), text) | 
 |  | 
 |     def test_dedent_even(self): | 
 |         # All lines indented by two spaces. | 
 |         text = "  Hello there.\n  How are ya?\n  Oh good." | 
 |         expect = "Hello there.\nHow are ya?\nOh good." | 
 |         self.assertEquals(dedent(text), expect) | 
 |  | 
 |         # Same, with blank lines. | 
 |         text = "  Hello there.\n\n  How are ya?\n  Oh good.\n" | 
 |         expect = "Hello there.\n\nHow are ya?\nOh good.\n" | 
 |         self.assertEquals(dedent(text), expect) | 
 |  | 
 |         # Now indent one of the blank lines. | 
 |         text = "  Hello there.\n  \n  How are ya?\n  Oh good.\n" | 
 |         expect = "Hello there.\n\nHow are ya?\nOh good.\n" | 
 |         self.assertEquals(dedent(text), expect) | 
 |  | 
 |     def test_dedent_uneven(self): | 
 |         # Lines indented unevenly. | 
 |         text = '''\ | 
 |         def foo(): | 
 |             while 1: | 
 |                 return foo | 
 |         ''' | 
 |         expect = '''\ | 
 | def foo(): | 
 |     while 1: | 
 |         return foo | 
 | ''' | 
 |         self.assertEquals(dedent(text), expect) | 
 |  | 
 |         # Uneven indentation with a blank line. | 
 |         text = "  Foo\n    Bar\n\n   Baz\n" | 
 |         expect = "Foo\n  Bar\n\n Baz\n" | 
 |         self.assertEquals(dedent(text), expect) | 
 |  | 
 |         # Uneven indentation with a whitespace-only line. | 
 |         text = "  Foo\n    Bar\n \n   Baz\n" | 
 |         expect = "Foo\n  Bar\n\n Baz\n" | 
 |         self.assertEquals(dedent(text), expect) | 
 |  | 
 |  | 
 |  | 
 | def test_main(): | 
 |     test_support.run_unittest(WrapTestCase, | 
 |                               LongWordTestCase, | 
 |                               IndentTestCases, | 
 |                               DedentTestCase) | 
 |  | 
 | if __name__ == '__main__': | 
 |     test_main() |