mirror of
				https://github.com/python/cpython.git
				synced 2025-10-22 14:42:22 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			510 lines
		
	
	
	
		
			19 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			510 lines
		
	
	
	
		
			19 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| #
 | |
| # Test suite for the textwrap module.
 | |
| #
 | |
| # Original tests written by Greg Ward <gward@python.net>.
 | |
| # Converted to PyUnit by Peter Hansen <peter@engcorp.com>.
 | |
| # Currently maintained by Greg Ward.
 | |
| #
 | |
| # $Id$
 | |
| #
 | |
| 
 | |
| import unittest
 | |
| from test import test_support
 | |
| 
 | |
| from textwrap import TextWrapper, wrap, fill, dedent
 | |
| 
 | |
| 
 | |
| class BaseTestCase(unittest.TestCase):
 | |
|     '''Parent class with utility methods for textwrap tests.'''
 | |
| 
 | |
|     def show(self, textin):
 | |
|         if isinstance(textin, list):
 | |
|             result = []
 | |
|             for i in range(len(textin)):
 | |
|                 result.append("  %d: %r" % (i, textin[i]))
 | |
|             result = '\n'.join(result)
 | |
|         elif isinstance(textin, basestring):
 | |
|             result = "  %s\n" % repr(textin)
 | |
|         return result
 | |
| 
 | |
| 
 | |
|     def check(self, result, expect):
 | |
|         self.assertEquals(result, expect,
 | |
|             'expected:\n%s\nbut got:\n%s' % (
 | |
|                 self.show(expect), self.show(result)))
 | |
| 
 | |
|     def check_wrap(self, text, width, expect, **kwargs):
 | |
|         result = wrap(text, width, **kwargs)
 | |
|         self.check(result, expect)
 | |
| 
 | |
|     def check_split(self, text, expect):
 | |
|         result = self.wrapper._split(text)
 | |
|         self.assertEquals(result, expect,
 | |
|                           "\nexpected %r\n"
 | |
|                           "but got  %r" % (expect, result))
 | |
| 
 | |
| 
 | |
| class WrapTestCase(BaseTestCase):
 | |
| 
 | |
|     def setUp(self):
 | |
|         self.wrapper = TextWrapper(width=45)
 | |
| 
 | |
|     def test_simple(self):
 | |
|         # Simple case: just words, spaces, and a bit of punctuation
 | |
| 
 | |
|         text = "Hello there, how are you this fine day?  I'm glad to hear it!"
 | |
| 
 | |
|         self.check_wrap(text, 12,
 | |
|                         ["Hello there,",
 | |
|                          "how are you",
 | |
|                          "this fine",
 | |
|                          "day?  I'm",
 | |
|                          "glad to hear",
 | |
|                          "it!"])
 | |
|         self.check_wrap(text, 42,
 | |
|                         ["Hello there, how are you this fine day?",
 | |
|                          "I'm glad to hear it!"])
 | |
|         self.check_wrap(text, 80, [text])
 | |
| 
 | |
| 
 | |
|     def test_whitespace(self):
 | |
|         # Whitespace munging and end-of-sentence detection
 | |
| 
 | |
|         text = """\
 | |
| This is a paragraph that already has
 | |
| line breaks.  But some of its lines are much longer than the others,
 | |
| so it needs to be wrapped.
 | |
| Some lines are \ttabbed too.
 | |
| What a mess!
 | |
| """
 | |
| 
 | |
|         expect = ["This is a paragraph that already has line",
 | |
|                   "breaks.  But some of its lines are much",
 | |
|                   "longer than the others, so it needs to be",
 | |
|                   "wrapped.  Some lines are  tabbed too.  What a",
 | |
|                   "mess!"]
 | |
| 
 | |
|         wrapper = TextWrapper(45, fix_sentence_endings=True)
 | |
|         result = wrapper.wrap(text)
 | |
|         self.check(result, expect)
 | |
| 
 | |
|         result = wrapper.fill(text)
 | |
|         self.check(result, '\n'.join(expect))
 | |
| 
 | |
|     def test_fix_sentence_endings(self):
 | |
|         wrapper = TextWrapper(60, fix_sentence_endings=True)
 | |
| 
 | |
|         # SF #847346: ensure that fix_sentence_endings=True does the
 | |
|         # right thing even on input short enough that it doesn't need to
 | |
|         # be wrapped.
 | |
|         text = "A short line. Note the single space."
 | |
|         expect = ["A short line.  Note the single space."]
 | |
|         self.check(wrapper.wrap(text), expect)
 | |
| 
 | |
|         # Test some of the hairy end cases that _fix_sentence_endings()
 | |
|         # is supposed to handle (the easy stuff is tested in
 | |
|         # test_whitespace() above).
 | |
|         text = "Well, Doctor? What do you think?"
 | |
|         expect = ["Well, Doctor?  What do you think?"]
 | |
|         self.check(wrapper.wrap(text), expect)
 | |
| 
 | |
|         text = "Well, Doctor?\nWhat do you think?"
 | |
|         self.check(wrapper.wrap(text), expect)
 | |
| 
 | |
|         text = 'I say, chaps! Anyone for "tennis?"\nHmmph!'
 | |
|         expect = ['I say, chaps!  Anyone for "tennis?"  Hmmph!']
 | |
|         self.check(wrapper.wrap(text), expect)
 | |
| 
 | |
|         wrapper.width = 20
 | |
|         expect = ['I say, chaps!', 'Anyone for "tennis?"', 'Hmmph!']
 | |
|         self.check(wrapper.wrap(text), expect)
 | |
| 
 | |
|         text = 'And she said, "Go to hell!"\nCan you believe that?'
 | |
|         expect = ['And she said, "Go to',
 | |
|                   'hell!"  Can you',
 | |
|                   'believe that?']
 | |
|         self.check(wrapper.wrap(text), expect)
 | |
| 
 | |
|         wrapper.width = 60
 | |
|         expect = ['And she said, "Go to hell!"  Can you believe that?']
 | |
|         self.check(wrapper.wrap(text), expect)
 | |
| 
 | |
|     def test_wrap_short(self):
 | |
|         # Wrapping to make short lines longer
 | |
| 
 | |
|         text = "This is a\nshort paragraph."
 | |
| 
 | |
|         self.check_wrap(text, 20, ["This is a short",
 | |
|                                    "paragraph."])
 | |
|         self.check_wrap(text, 40, ["This is a short paragraph."])
 | |
| 
 | |
| 
 | |
|     def test_wrap_short_1line(self):
 | |
|         # Test endcases
 | |
| 
 | |
|         text = "This is a short line."
 | |
| 
 | |
|         self.check_wrap(text, 30, ["This is a short line."])
 | |
|         self.check_wrap(text, 30, ["(1) This is a short line."],
 | |
|                         initial_indent="(1) ")
 | |
| 
 | |
| 
 | |
|     def test_hyphenated(self):
 | |
|         # Test breaking hyphenated words
 | |
| 
 | |
|         text = ("this-is-a-useful-feature-for-"
 | |
|                 "reformatting-posts-from-tim-peters'ly")
 | |
| 
 | |
|         self.check_wrap(text, 40,
 | |
|                         ["this-is-a-useful-feature-for-",
 | |
|                          "reformatting-posts-from-tim-peters'ly"])
 | |
|         self.check_wrap(text, 41,
 | |
|                         ["this-is-a-useful-feature-for-",
 | |
|                          "reformatting-posts-from-tim-peters'ly"])
 | |
|         self.check_wrap(text, 42,
 | |
|                         ["this-is-a-useful-feature-for-reformatting-",
 | |
|                          "posts-from-tim-peters'ly"])
 | |
| 
 | |
|     def test_em_dash(self):
 | |
|         # Test text with em-dashes
 | |
|         text = "Em-dashes should be written -- thus."
 | |
|         self.check_wrap(text, 25,
 | |
|                         ["Em-dashes should be",
 | |
|                          "written -- thus."])
 | |
| 
 | |
|         # Probe the boundaries of the properly written em-dash,
 | |
|         # ie. " -- ".
 | |
|         self.check_wrap(text, 29,
 | |
|                         ["Em-dashes should be written",
 | |
|                          "-- thus."])
 | |
|         expect = ["Em-dashes should be written --",
 | |
|                   "thus."]
 | |
|         self.check_wrap(text, 30, expect)
 | |
|         self.check_wrap(text, 35, expect)
 | |
|         self.check_wrap(text, 36,
 | |
|                         ["Em-dashes should be written -- thus."])
 | |
| 
 | |
|         # The improperly written em-dash is handled too, because
 | |
|         # it's adjacent to non-whitespace on both sides.
 | |
|         text = "You can also do--this or even---this."
 | |
|         expect = ["You can also do",
 | |
|                   "--this or even",
 | |
|                   "---this."]
 | |
|         self.check_wrap(text, 15, expect)
 | |
|         self.check_wrap(text, 16, expect)
 | |
|         expect = ["You can also do--",
 | |
|                   "this or even---",
 | |
|                   "this."]
 | |
|         self.check_wrap(text, 17, expect)
 | |
|         self.check_wrap(text, 19, expect)
 | |
|         expect = ["You can also do--this or even",
 | |
|                   "---this."]
 | |
|         self.check_wrap(text, 29, expect)
 | |
|         self.check_wrap(text, 31, expect)
 | |
|         expect = ["You can also do--this or even---",
 | |
|                   "this."]
 | |
|         self.check_wrap(text, 32, expect)
 | |
|         self.check_wrap(text, 35, expect)
 | |
| 
 | |
|         # All of the above behaviour could be deduced by probing the
 | |
|         # _split() method.
 | |
|         text = "Here's an -- em-dash and--here's another---and another!"
 | |
|         expect = ["Here's", " ", "an", " ", "--", " ", "em-", "dash", " ",
 | |
|                   "and", "--", "here's", " ", "another", "---",
 | |
|                   "and", " ", "another!"]
 | |
|         self.check_split(text, expect)
 | |
| 
 | |
|         text = "and then--bam!--he was gone"
 | |
|         expect = ["and", " ", "then", "--", "bam!", "--",
 | |
|                   "he", " ", "was", " ", "gone"]
 | |
|         self.check_split(text, expect)
 | |
| 
 | |
| 
 | |
|     def test_unix_options (self):
 | |
|         # Test that Unix-style command-line options are wrapped correctly.
 | |
|         # Both Optik (OptionParser) and Docutils rely on this behaviour!
 | |
| 
 | |
|         text = "You should use the -n option, or --dry-run in its long form."
 | |
|         self.check_wrap(text, 20,
 | |
|                         ["You should use the",
 | |
|                          "-n option, or --dry-",
 | |
|                          "run in its long",
 | |
|                          "form."])
 | |
|         self.check_wrap(text, 21,
 | |
|                         ["You should use the -n",
 | |
|                          "option, or --dry-run",
 | |
|                          "in its long form."])
 | |
|         expect = ["You should use the -n option, or",
 | |
|                   "--dry-run in its long form."]
 | |
|         self.check_wrap(text, 32, expect)
 | |
|         self.check_wrap(text, 34, expect)
 | |
|         self.check_wrap(text, 35, expect)
 | |
|         self.check_wrap(text, 38, expect)
 | |
|         expect = ["You should use the -n option, or --dry-",
 | |
|                   "run in its long form."]
 | |
|         self.check_wrap(text, 39, expect)
 | |
|         self.check_wrap(text, 41, expect)
 | |
|         expect = ["You should use the -n option, or --dry-run",
 | |
|                   "in its long form."]
 | |
|         self.check_wrap(text, 42, expect)
 | |
| 
 | |
|         # Again, all of the above can be deduced from _split().
 | |
|         text = "the -n option, or --dry-run or --dryrun"
 | |
|         expect = ["the", " ", "-n", " ", "option,", " ", "or", " ",
 | |
|                   "--dry-", "run", " ", "or", " ", "--dryrun"]
 | |
|         self.check_split(text, expect)
 | |
| 
 | |
|     def test_funky_hyphens (self):
 | |
|         # Screwy edge cases cooked up by David Goodger.  All reported
 | |
|         # in SF bug #596434.
 | |
|         self.check_split("what the--hey!", ["what", " ", "the", "--", "hey!"])
 | |
|         self.check_split("what the--", ["what", " ", "the--"])
 | |
|         self.check_split("what the--.", ["what", " ", "the--."])
 | |
|         self.check_split("--text--.", ["--text--."])
 | |
| 
 | |
|         # When I first read bug #596434, this is what I thought David
 | |
|         # was talking about.  I was wrong; these have always worked
 | |
|         # fine.  The real problem is tested in test_funky_parens()
 | |
|         # below...
 | |
|         self.check_split("--option", ["--option"])
 | |
|         self.check_split("--option-opt", ["--option-", "opt"])
 | |
|         self.check_split("foo --option-opt bar",
 | |
|                          ["foo", " ", "--option-", "opt", " ", "bar"])
 | |
| 
 | |
|     def test_punct_hyphens(self):
 | |
|         # Oh bother, SF #965425 found another problem with hyphens --
 | |
|         # hyphenated words in single quotes weren't handled correctly.
 | |
|         # In fact, the bug is that *any* punctuation around a hyphenated
 | |
|         # word was handled incorrectly, except for a leading "--", which
 | |
|         # was special-cased for Optik and Docutils.  So test a variety
 | |
|         # of styles of punctuation around a hyphenated word.
 | |
|         # (Actually this is based on an Optik bug report, #813077).
 | |
|         self.check_split("the 'wibble-wobble' widget",
 | |
|                          ['the', ' ', "'wibble-", "wobble'", ' ', 'widget'])
 | |
|         self.check_split('the "wibble-wobble" widget',
 | |
|                          ['the', ' ', '"wibble-', 'wobble"', ' ', 'widget'])
 | |
|         self.check_split("the (wibble-wobble) widget",
 | |
|                          ['the', ' ', "(wibble-", "wobble)", ' ', 'widget'])
 | |
|         self.check_split("the ['wibble-wobble'] widget",
 | |
|                          ['the', ' ', "['wibble-", "wobble']", ' ', 'widget'])
 | |
| 
 | |
|     def test_funky_parens (self):
 | |
|         # Second part of SF bug #596434: long option strings inside
 | |
|         # parentheses.
 | |
|         self.check_split("foo (--option) bar",
 | |
|                          ["foo", " ", "(--option)", " ", "bar"])
 | |
| 
 | |
|         # Related stuff -- make sure parens work in simpler contexts.
 | |
|         self.check_split("foo (bar) baz",
 | |
|                          ["foo", " ", "(bar)", " ", "baz"])
 | |
|         self.check_split("blah (ding dong), wubba",
 | |
|                          ["blah", " ", "(ding", " ", "dong),",
 | |
|                           " ", "wubba"])
 | |
| 
 | |
|     def test_initial_whitespace(self):
 | |
|         # SF bug #622849 reported inconsistent handling of leading
 | |
|         # whitespace; let's test that a bit, shall we?
 | |
|         text = " This is a sentence with leading whitespace."
 | |
|         self.check_wrap(text, 50,
 | |
|                         [" This is a sentence with leading whitespace."])
 | |
|         self.check_wrap(text, 30,
 | |
|                         [" This is a sentence with", "leading whitespace."])
 | |
| 
 | |
|     def test_unicode(self):
 | |
|         # *Very* simple test of wrapping Unicode strings.  I'm sure
 | |
|         # there's more to it than this, but let's at least make
 | |
|         # sure textwrap doesn't crash on Unicode input!
 | |
|         text = u"Hello there, how are you today?"
 | |
|         self.check_wrap(text, 50, [u"Hello there, how are you today?"])
 | |
|         self.check_wrap(text, 20, [u"Hello there, how are", "you today?"])
 | |
|         olines = self.wrapper.wrap(text)
 | |
|         assert isinstance(olines, list) and isinstance(olines[0], unicode)
 | |
|         otext = self.wrapper.fill(text)
 | |
|         assert isinstance(otext, unicode)
 | |
| 
 | |
|     def test_split(self):
 | |
|         # Ensure that the standard _split() method works as advertised
 | |
|         # in the comments
 | |
| 
 | |
|         text = "Hello there -- you goof-ball, use the -b option!"
 | |
| 
 | |
|         result = self.wrapper._split(text)
 | |
|         self.check(result,
 | |
|              ["Hello", " ", "there", " ", "--", " ", "you", " ", "goof-",
 | |
|               "ball,", " ", "use", " ", "the", " ", "-b", " ",  "option!"])
 | |
| 
 | |
|     def test_bad_width(self):
 | |
|         # Ensure that width <= 0 is caught.
 | |
|         text = "Whatever, it doesn't matter."
 | |
|         self.assertRaises(ValueError, wrap, text, 0)
 | |
|         self.assertRaises(ValueError, wrap, text, -1)
 | |
| 
 | |
| 
 | |
| class LongWordTestCase (BaseTestCase):
 | |
|     def setUp(self):
 | |
|         self.wrapper = TextWrapper()
 | |
|         self.text = '''\
 | |
| Did you say "supercalifragilisticexpialidocious?"
 | |
| How *do* you spell that odd word, anyways?
 | |
| '''
 | |
| 
 | |
|     def test_break_long(self):
 | |
|         # Wrap text with long words and lots of punctuation
 | |
| 
 | |
|         self.check_wrap(self.text, 30,
 | |
|                         ['Did you say "supercalifragilis',
 | |
|                          'ticexpialidocious?" How *do*',
 | |
|                          'you spell that odd word,',
 | |
|                          'anyways?'])
 | |
|         self.check_wrap(self.text, 50,
 | |
|                         ['Did you say "supercalifragilisticexpialidocious?"',
 | |
|                          'How *do* you spell that odd word, anyways?'])
 | |
| 
 | |
|         # SF bug 797650.  Prevent an infinite loop by making sure that at
 | |
|         # least one character gets split off on every pass.
 | |
|         self.check_wrap('-'*10+'hello', 10,
 | |
|                         ['----------',
 | |
|                          '               h',
 | |
|                          '               e',
 | |
|                          '               l',
 | |
|                          '               l',
 | |
|                          '               o'],
 | |
|                         subsequent_indent = ' '*15)
 | |
| 
 | |
|     def test_nobreak_long(self):
 | |
|         # Test with break_long_words disabled
 | |
|         self.wrapper.break_long_words = 0
 | |
|         self.wrapper.width = 30
 | |
|         expect = ['Did you say',
 | |
|                   '"supercalifragilisticexpialidocious?"',
 | |
|                   'How *do* you spell that odd',
 | |
|                   'word, anyways?'
 | |
|                   ]
 | |
|         result = self.wrapper.wrap(self.text)
 | |
|         self.check(result, expect)
 | |
| 
 | |
|         # Same thing with kwargs passed to standalone wrap() function.
 | |
|         result = wrap(self.text, width=30, break_long_words=0)
 | |
|         self.check(result, expect)
 | |
| 
 | |
| 
 | |
| class IndentTestCases(BaseTestCase):
 | |
| 
 | |
|     # called before each test method
 | |
|     def setUp(self):
 | |
|         self.text = '''\
 | |
| This paragraph will be filled, first without any indentation,
 | |
| and then with some (including a hanging indent).'''
 | |
| 
 | |
| 
 | |
|     def test_fill(self):
 | |
|         # Test the fill() method
 | |
| 
 | |
|         expect = '''\
 | |
| This paragraph will be filled, first
 | |
| without any indentation, and then with
 | |
| some (including a hanging indent).'''
 | |
| 
 | |
|         result = fill(self.text, 40)
 | |
|         self.check(result, expect)
 | |
| 
 | |
| 
 | |
|     def test_initial_indent(self):
 | |
|         # Test initial_indent parameter
 | |
| 
 | |
|         expect = ["     This paragraph will be filled,",
 | |
|                   "first without any indentation, and then",
 | |
|                   "with some (including a hanging indent)."]
 | |
|         result = wrap(self.text, 40, initial_indent="     ")
 | |
|         self.check(result, expect)
 | |
| 
 | |
|         expect = "\n".join(expect)
 | |
|         result = fill(self.text, 40, initial_indent="     ")
 | |
|         self.check(result, expect)
 | |
| 
 | |
| 
 | |
|     def test_subsequent_indent(self):
 | |
|         # Test subsequent_indent parameter
 | |
| 
 | |
|         expect = '''\
 | |
|   * This paragraph will be filled, first
 | |
|     without any indentation, and then
 | |
|     with some (including a hanging
 | |
|     indent).'''
 | |
| 
 | |
|         result = fill(self.text, 40,
 | |
|                       initial_indent="  * ", subsequent_indent="    ")
 | |
|         self.check(result, expect)
 | |
| 
 | |
| 
 | |
| # Despite the similar names, DedentTestCase is *not* the inverse
 | |
| # of IndentTestCase!
 | |
| class DedentTestCase(unittest.TestCase):
 | |
| 
 | |
|     def test_dedent_nomargin(self):
 | |
|         # No lines indented.
 | |
|         text = "Hello there.\nHow are you?\nOh good, I'm glad."
 | |
|         self.assertEquals(dedent(text), text)
 | |
| 
 | |
|         # Similar, with a blank line.
 | |
|         text = "Hello there.\n\nBoo!"
 | |
|         self.assertEquals(dedent(text), text)
 | |
| 
 | |
|         # Some lines indented, but overall margin is still zero.
 | |
|         text = "Hello there.\n  This is indented."
 | |
|         self.assertEquals(dedent(text), text)
 | |
| 
 | |
|         # Again, add a blank line.
 | |
|         text = "Hello there.\n\n  Boo!\n"
 | |
|         self.assertEquals(dedent(text), text)
 | |
| 
 | |
|     def test_dedent_even(self):
 | |
|         # All lines indented by two spaces.
 | |
|         text = "  Hello there.\n  How are ya?\n  Oh good."
 | |
|         expect = "Hello there.\nHow are ya?\nOh good."
 | |
|         self.assertEquals(dedent(text), expect)
 | |
| 
 | |
|         # Same, with blank lines.
 | |
|         text = "  Hello there.\n\n  How are ya?\n  Oh good.\n"
 | |
|         expect = "Hello there.\n\nHow are ya?\nOh good.\n"
 | |
|         self.assertEquals(dedent(text), expect)
 | |
| 
 | |
|         # Now indent one of the blank lines.
 | |
|         text = "  Hello there.\n  \n  How are ya?\n  Oh good.\n"
 | |
|         expect = "Hello there.\n\nHow are ya?\nOh good.\n"
 | |
|         self.assertEquals(dedent(text), expect)
 | |
| 
 | |
|     def test_dedent_uneven(self):
 | |
|         # Lines indented unevenly.
 | |
|         text = '''\
 | |
|         def foo():
 | |
|             while 1:
 | |
|                 return foo
 | |
|         '''
 | |
|         expect = '''\
 | |
| def foo():
 | |
|     while 1:
 | |
|         return foo
 | |
| '''
 | |
|         self.assertEquals(dedent(text), expect)
 | |
| 
 | |
|         # Uneven indentation with a blank line.
 | |
|         text = "  Foo\n    Bar\n\n   Baz\n"
 | |
|         expect = "Foo\n  Bar\n\n Baz\n"
 | |
|         self.assertEquals(dedent(text), expect)
 | |
| 
 | |
|         # Uneven indentation with a whitespace-only line.
 | |
|         text = "  Foo\n    Bar\n \n   Baz\n"
 | |
|         expect = "Foo\n  Bar\n\n Baz\n"
 | |
|         self.assertEquals(dedent(text), expect)
 | |
| 
 | |
| 
 | |
| 
 | |
| def test_main():
 | |
|     test_support.run_unittest(WrapTestCase,
 | |
|                               LongWordTestCase,
 | |
|                               IndentTestCases,
 | |
|                               DedentTestCase)
 | |
| 
 | |
| if __name__ == '__main__':
 | |
|     test_main()
 | 
