home *** CD-ROM | disk | FTP | other *** search
- #
- # Test script for the textwrap module.
- #
- # Original tests written by Greg Ward <gward@python.net>.
- # Converted to PyUnit by Peter Hansen <peter@engcorp.com>.
- # Currently maintained by Greg Ward.
- #
- # $Id: test_textwrap.py,v 1.22.8.1 2003/08/30 14:52:35 rhettinger Exp $
- #
-
- import unittest
- from test import test_support
-
- from textwrap import TextWrapper, wrap, fill, dedent
-
-
- class BaseTestCase(unittest.TestCase):
- '''Parent class with utility methods for textwrap tests.'''
-
- def show(self, textin):
- if isinstance(textin, list):
- result = []
- for i in range(len(textin)):
- result.append(" %d: %r" % (i, textin[i]))
- result = '\n'.join(result)
- elif isinstance(textin, (str, unicode)):
- result = " %s\n" % repr(textin)
- return result
-
-
- def check(self, result, expect):
- self.assertEquals(result, expect,
- 'expected:\n%s\nbut got:\n%s' % (
- self.show(expect), self.show(result)))
-
- def check_wrap(self, text, width, expect, **kwargs):
- result = wrap(text, width, **kwargs)
- self.check(result, expect)
-
- def check_split(self, text, expect):
- result = self.wrapper._split(text)
- self.assertEquals(result, expect,
- "\nexpected %r\n"
- "but got %r" % (expect, result))
-
-
- class WrapTestCase(BaseTestCase):
-
- def setUp(self):
- self.wrapper = TextWrapper(width=45, fix_sentence_endings=True)
-
- def test_simple(self):
- # Simple case: just words, spaces, and a bit of punctuation
-
- text = "Hello there, how are you this fine day? I'm glad to hear it!"
-
- self.check_wrap(text, 12,
- ["Hello there,",
- "how are you",
- "this fine",
- "day? I'm",
- "glad to hear",
- "it!"])
- self.check_wrap(text, 42,
- ["Hello there, how are you this fine day?",
- "I'm glad to hear it!"])
- self.check_wrap(text, 80, [text])
-
-
- def test_whitespace(self):
- # Whitespace munging and end-of-sentence detection
-
- text = """\
- This is a paragraph that already has
- line breaks. But some of its lines are much longer than the others,
- so it needs to be wrapped.
- Some lines are \ttabbed too.
- What a mess!
- """
-
- expect = ["This is a paragraph that already has line",
- "breaks. But some of its lines are much",
- "longer than the others, so it needs to be",
- "wrapped. Some lines are tabbed too. What a",
- "mess!"]
-
- result = self.wrapper.wrap(text)
- self.check(result, expect)
-
- result = self.wrapper.fill(text)
- self.check(result, '\n'.join(expect))
-
-
- def test_wrap_short(self):
- # Wrapping to make short lines longer
-
- text = "This is a\nshort paragraph."
-
- self.check_wrap(text, 20, ["This is a short",
- "paragraph."])
- self.check_wrap(text, 40, ["This is a short paragraph."])
-
-
- def test_wrap_short_1line(self):
- # Test endcases
-
- text = "This is a short line."
-
- self.check_wrap(text, 30, ["This is a short line."])
- self.check_wrap(text, 30, ["(1) This is a short line."],
- initial_indent="(1) ")
-
-
- def test_hyphenated(self):
- # Test breaking hyphenated words
-
- text = ("this-is-a-useful-feature-for-"
- "reformatting-posts-from-tim-peters'ly")
-
- self.check_wrap(text, 40,
- ["this-is-a-useful-feature-for-",
- "reformatting-posts-from-tim-peters'ly"])
- self.check_wrap(text, 41,
- ["this-is-a-useful-feature-for-",
- "reformatting-posts-from-tim-peters'ly"])
- self.check_wrap(text, 42,
- ["this-is-a-useful-feature-for-reformatting-",
- "posts-from-tim-peters'ly"])
-
- def test_em_dash(self):
- # Test text with em-dashes
- text = "Em-dashes should be written -- thus."
- self.check_wrap(text, 25,
- ["Em-dashes should be",
- "written -- thus."])
-
- # Probe the boundaries of the properly written em-dash,
- # ie. " -- ".
- self.check_wrap(text, 29,
- ["Em-dashes should be written",
- "-- thus."])
- expect = ["Em-dashes should be written --",
- "thus."]
- self.check_wrap(text, 30, expect)
- self.check_wrap(text, 35, expect)
- self.check_wrap(text, 36,
- ["Em-dashes should be written -- thus."])
-
- # The improperly written em-dash is handled too, because
- # it's adjacent to non-whitespace on both sides.
- text = "You can also do--this or even---this."
- expect = ["You can also do",
- "--this or even",
- "---this."]
- self.check_wrap(text, 15, expect)
- self.check_wrap(text, 16, expect)
- expect = ["You can also do--",
- "this or even---",
- "this."]
- self.check_wrap(text, 17, expect)
- self.check_wrap(text, 19, expect)
- expect = ["You can also do--this or even",
- "---this."]
- self.check_wrap(text, 29, expect)
- self.check_wrap(text, 31, expect)
- expect = ["You can also do--this or even---",
- "this."]
- self.check_wrap(text, 32, expect)
- self.check_wrap(text, 35, expect)
-
- # All of the above behaviour could be deduced by probing the
- # _split() method.
- text = "Here's an -- em-dash and--here's another---and another!"
- expect = ["Here's", " ", "an", " ", "--", " ", "em-", "dash", " ",
- "and", "--", "here's", " ", "another", "---",
- "and", " ", "another!"]
- self.check_split(text, expect)
-
- text = "and then--bam!--he was gone"
- expect = ["and", " ", "then", "--", "bam!", "--",
- "he", " ", "was", " ", "gone"]
- self.check_split(text, expect)
-
-
- def test_unix_options (self):
- # Test that Unix-style command-line options are wrapped correctly.
- # Both Optik (OptionParser) and Docutils rely on this behaviour!
-
- text = "You should use the -n option, or --dry-run in its long form."
- self.check_wrap(text, 20,
- ["You should use the",
- "-n option, or --dry-",
- "run in its long",
- "form."])
- self.check_wrap(text, 21,
- ["You should use the -n",
- "option, or --dry-run",
- "in its long form."])
- expect = ["You should use the -n option, or",
- "--dry-run in its long form."]
- self.check_wrap(text, 32, expect)
- self.check_wrap(text, 34, expect)
- self.check_wrap(text, 35, expect)
- self.check_wrap(text, 38, expect)
- expect = ["You should use the -n option, or --dry-",
- "run in its long form."]
- self.check_wrap(text, 39, expect)
- self.check_wrap(text, 41, expect)
- expect = ["You should use the -n option, or --dry-run",
- "in its long form."]
- self.check_wrap(text, 42, expect)
-
- # Again, all of the above can be deduced from _split().
- text = "the -n option, or --dry-run or --dryrun"
- expect = ["the", " ", "-n", " ", "option,", " ", "or", " ",
- "--dry-", "run", " ", "or", " ", "--dryrun"]
- self.check_split(text, expect)
-
- def test_funky_hyphens (self):
- # Screwy edge cases cooked up by David Goodger. All reported
- # in SF bug #596434.
- self.check_split("what the--hey!", ["what", " ", "the", "--", "hey!"])
- self.check_split("what the--", ["what", " ", "the--"])
- self.check_split("what the--.", ["what", " ", "the--."])
- self.check_split("--text--.", ["--text--."])
-
- # When I first read bug #596434, this is what I thought David
- # was talking about. I was wrong; these have always worked
- # fine. The real problem is tested in test_funky_parens()
- # below...
- self.check_split("--option", ["--option"])
- self.check_split("--option-opt", ["--option-", "opt"])
- self.check_split("foo --option-opt bar",
- ["foo", " ", "--option-", "opt", " ", "bar"])
-
- def test_funky_parens (self):
- # Second part of SF bug #596434: long option strings inside
- # parentheses.
- self.check_split("foo (--option) bar",
- ["foo", " ", "(--option)", " ", "bar"])
-
- # Related stuff -- make sure parens work in simpler contexts.
- self.check_split("foo (bar) baz",
- ["foo", " ", "(bar)", " ", "baz"])
- self.check_split("blah (ding dong), wubba",
- ["blah", " ", "(ding", " ", "dong),",
- " ", "wubba"])
-
- def test_initial_whitespace(self):
- # SF bug #622849 reported inconsistent handling of leading
- # whitespace; let's test that a bit, shall we?
- text = " This is a sentence with leading whitespace."
- self.check_wrap(text, 50,
- [" This is a sentence with leading whitespace."])
- self.check_wrap(text, 30,
- [" This is a sentence with", "leading whitespace."])
-
- def test_unicode(self):
- # *Very* simple test of wrapping Unicode strings. I'm sure
- # there's more to it than this, but let's at least make
- # sure textwrap doesn't crash on Unicode input!
- text = u"Hello there, how are you today?"
- self.check_wrap(text, 50, [u"Hello there, how are you today?"])
- self.check_wrap(text, 20, [u"Hello there, how are", "you today?"])
- olines = self.wrapper.wrap(text)
- assert isinstance(olines, list) and isinstance(olines[0], unicode)
- otext = self.wrapper.fill(text)
- assert isinstance(otext, unicode)
-
- def test_split(self):
- # Ensure that the standard _split() method works as advertised
- # in the comments
-
- text = "Hello there -- you goof-ball, use the -b option!"
-
- result = self.wrapper._split(text)
- self.check(result,
- ["Hello", " ", "there", " ", "--", " ", "you", " ", "goof-",
- "ball,", " ", "use", " ", "the", " ", "-b", " ", "option!"])
-
- def test_bad_width(self):
- # Ensure that width <= 0 is caught.
- text = "Whatever, it doesn't matter."
- self.assertRaises(ValueError, wrap, text, 0)
- self.assertRaises(ValueError, wrap, text, -1)
-
-
- class LongWordTestCase (BaseTestCase):
- def setUp(self):
- self.wrapper = TextWrapper()
- self.text = '''\
- Did you say "supercalifragilisticexpialidocious?"
- How *do* you spell that odd word, anyways?
- '''
-
- def test_break_long(self):
- # Wrap text with long words and lots of punctuation
-
- self.check_wrap(self.text, 30,
- ['Did you say "supercalifragilis',
- 'ticexpialidocious?" How *do*',
- 'you spell that odd word,',
- 'anyways?'])
- self.check_wrap(self.text, 50,
- ['Did you say "supercalifragilisticexpialidocious?"',
- 'How *do* you spell that odd word, anyways?'])
-
- # SF bug 797650. Prevent an infinite loop by making sure that at
- # least one character gets split off on every pass.
- self.check_wrap('-'*10+'hello', 10,
- ['----------',
- ' h',
- ' e',
- ' l',
- ' l',
- ' o'],
- subsequent_indent = ' '*15)
-
- def test_nobreak_long(self):
- # Test with break_long_words disabled
- self.wrapper.break_long_words = 0
- self.wrapper.width = 30
- expect = ['Did you say',
- '"supercalifragilisticexpialidocious?"',
- 'How *do* you spell that odd',
- 'word, anyways?'
- ]
- result = self.wrapper.wrap(self.text)
- self.check(result, expect)
-
- # Same thing with kwargs passed to standalone wrap() function.
- result = wrap(self.text, width=30, break_long_words=0)
- self.check(result, expect)
-
-
- class IndentTestCases(BaseTestCase):
-
- # called before each test method
- def setUp(self):
- self.text = '''\
- This paragraph will be filled, first without any indentation,
- and then with some (including a hanging indent).'''
-
-
- def test_fill(self):
- # Test the fill() method
-
- expect = '''\
- This paragraph will be filled, first
- without any indentation, and then with
- some (including a hanging indent).'''
-
- result = fill(self.text, 40)
- self.check(result, expect)
-
-
- def test_initial_indent(self):
- # Test initial_indent parameter
-
- expect = [" This paragraph will be filled,",
- "first without any indentation, and then",
- "with some (including a hanging indent)."]
- result = wrap(self.text, 40, initial_indent=" ")
- self.check(result, expect)
-
- expect = "\n".join(expect)
- result = fill(self.text, 40, initial_indent=" ")
- self.check(result, expect)
-
-
- def test_subsequent_indent(self):
- # Test subsequent_indent parameter
-
- expect = '''\
- * This paragraph will be filled, first
- without any indentation, and then
- with some (including a hanging
- indent).'''
-
- result = fill(self.text, 40,
- initial_indent=" * ", subsequent_indent=" ")
- self.check(result, expect)
-
-
- # Despite the similar names, DedentTestCase is *not* the inverse
- # of IndentTestCase!
- class DedentTestCase(unittest.TestCase):
-
- def test_dedent_nomargin(self):
- # No lines indented.
- text = "Hello there.\nHow are you?\nOh good, I'm glad."
- self.assertEquals(dedent(text), text)
-
- # Similar, with a blank line.
- text = "Hello there.\n\nBoo!"
- self.assertEquals(dedent(text), text)
-
- # Some lines indented, but overall margin is still zero.
- text = "Hello there.\n This is indented."
- self.assertEquals(dedent(text), text)
-
- # Again, add a blank line.
- text = "Hello there.\n\n Boo!\n"
- self.assertEquals(dedent(text), text)
-
- def test_dedent_even(self):
- # All lines indented by two spaces.
- text = " Hello there.\n How are ya?\n Oh good."
- expect = "Hello there.\nHow are ya?\nOh good."
- self.assertEquals(dedent(text), expect)
-
- # Same, with blank lines.
- text = " Hello there.\n\n How are ya?\n Oh good.\n"
- expect = "Hello there.\n\nHow are ya?\nOh good.\n"
- self.assertEquals(dedent(text), expect)
-
- # Now indent one of the blank lines.
- text = " Hello there.\n \n How are ya?\n Oh good.\n"
- expect = "Hello there.\n\nHow are ya?\nOh good.\n"
- self.assertEquals(dedent(text), expect)
-
- def test_dedent_uneven(self):
- # Lines indented unevenly.
- text = '''\
- def foo():
- while 1:
- return foo
- '''
- expect = '''\
- def foo():
- while 1:
- return foo
- '''
- self.assertEquals(dedent(text), expect)
-
- # Uneven indentation with a blank line.
- text = " Foo\n Bar\n\n Baz\n"
- expect = "Foo\n Bar\n\n Baz\n"
- self.assertEquals(dedent(text), expect)
-
- # Uneven indentation with a whitespace-only line.
- text = " Foo\n Bar\n \n Baz\n"
- expect = "Foo\n Bar\n\n Baz\n"
- self.assertEquals(dedent(text), expect)
-
-
-
- def test_main():
- test_support.run_unittest(WrapTestCase,
- LongWordTestCase,
- IndentTestCases,
- DedentTestCase)
-
- if __name__ == '__main__':
- test_main()
-