| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702
703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080 |
- #
- # Test suite for the textwrap module.
- #
- # Original tests written by Greg Ward <gward@python.net>.
- # Converted to PyUnit by Peter Hansen <peter@engcorp.com>.
- # Currently maintained by Greg Ward.
- #
- # $Id$
- #
- import unittest
- from textwrap import TextWrapper, wrap, fill, dedent, indent, shorten
class BaseTestCase(unittest.TestCase):
    '''Parent class with utility methods for textwrap tests.'''

    def show(self, textin):
        """Render *textin* for inclusion in an assertion failure message.

        A list is rendered as one numbered ``repr`` per line (or the text
        " no lines" when it is empty).  Anything else -- normally a string --
        is rendered as its ``repr`` followed by a newline, so an unexpected
        result type still produces a readable message instead of raising
        UnboundLocalError while the failure is being reported.
        """
        if isinstance(textin, list):
            if not textin:
                return " no lines"
            return "\n".join(
                " %d: %r" % (index, line) for index, line in enumerate(textin))
        return " %r\n" % (textin,)

    def check(self, result, expect):
        """Assert that *result* equals *expect*, showing both on failure."""
        self.assertEqual(result, expect,
                         'expected:\n%s\nbut got:\n%s' % (
                             self.show(expect), self.show(result)))

    def check_wrap(self, text, width, expect, **kwargs):
        """Wrap *text* to *width* with textwrap.wrap() and compare to *expect*.

        Extra keyword arguments are forwarded to wrap() unchanged.
        """
        result = wrap(text, width, **kwargs)
        self.check(result, expect)

    def check_split(self, text, expect):
        """Compare the chunks ``self.wrapper._split(text)`` yields to *expect*.

        Relies on ``self.wrapper`` having been created by the subclass.
        """
        result = self.wrapper._split(text)
        self.assertEqual(result, expect,
                         "\nexpected %r\n"
                         "but got %r" % (expect, result))
class WrapTestCase(BaseTestCase):
    """Tests for wrap()/fill() and for TextWrapper's chunk splitting."""

    def setUp(self):
        # Wrapper used by check_split() and test_split().
        self.wrapper = TextWrapper(width=45)

    def test_simple(self):
        # Simple case: just words, spaces, and a bit of punctuation
        text = "Hello there, how are you this fine day? I'm glad to hear it!"

        self.check_wrap(text, 12,
                        ["Hello there,",
                         "how are you",
                         "this fine",
                         "day? I'm",
                         "glad to hear",
                         "it!"])
        self.check_wrap(text, 42,
                        ["Hello there, how are you this fine day?",
                         "I'm glad to hear it!"])
        self.check_wrap(text, 80, [text])

    def test_empty_string(self):
        # Check that wrapping the empty string returns an empty list.
        self.check_wrap("", 6, [])
        self.check_wrap("", 6, [], drop_whitespace=False)

    def test_empty_string_with_initial_indent(self):
        # Check that the empty string is not indented.
        self.check_wrap("", 6, [], initial_indent="++")
        self.check_wrap("", 6, [], initial_indent="++", drop_whitespace=False)

    def test_whitespace(self):
        # Whitespace munging and end-of-sentence detection
        text = (
            "This is a paragraph that already has\n"
            "line breaks. But some of its lines are much longer than the others,\n"
            "so it needs to be wrapped.\n"
            "Some lines are \ttabbed too.\n"
            "What a mess!\n"
        )

        # fix_sentence_endings puts exactly two spaces after a sentence end;
        # the tab after "are " expands to one space, giving "are  tabbed".
        expect = ["This is a paragraph that already has line",
                  "breaks.  But some of its lines are much",
                  "longer than the others, so it needs to be",
                  "wrapped.  Some lines are  tabbed too.  What a",
                  "mess!"]

        wrapper = TextWrapper(45, fix_sentence_endings=True)
        result = wrapper.wrap(text)
        self.check(result, expect)

        result = wrapper.fill(text)
        self.check(result, '\n'.join(expect))

        # Tabs expand to the next multiple of tabsize (8 by default), and
        # leading whitespace on the first line is kept.
        text = "\tTest\tdefault\t\ttabsize."
        expect = [" " * 8 + "Test" + " " * 4 + "default" + " " * 9 + "tabsize."]
        self.check_wrap(text, 80, expect)

        text = "\tTest\tcustom\t\ttabsize."
        expect = [" " * 4 + "Test" + " " * 4 + "custom" + " " * 6 + "tabsize."]
        self.check_wrap(text, 80, expect, tabsize=4)

    def test_fix_sentence_endings(self):
        wrapper = TextWrapper(60, fix_sentence_endings=True)

        # SF #847346: ensure that fix_sentence_endings=True does the
        # right thing even on input short enough that it doesn't need to
        # be wrapped.
        text = "A short line. Note the single space."
        expect = ["A short line.  Note the single space."]
        self.check(wrapper.wrap(text), expect)

        # Test some of the hairy end cases that _fix_sentence_endings()
        # is supposed to handle (the easy stuff is tested in
        # test_whitespace() above).
        text = "Well, Doctor? What do you think?"
        expect = ["Well, Doctor?  What do you think?"]
        self.check(wrapper.wrap(text), expect)

        text = "Well, Doctor?\nWhat do you think?"
        self.check(wrapper.wrap(text), expect)

        text = 'I say, chaps! Anyone for "tennis?"\nHmmph!'
        expect = ['I say, chaps!  Anyone for "tennis?"  Hmmph!']
        self.check(wrapper.wrap(text), expect)

        wrapper.width = 20
        expect = ['I say, chaps!', 'Anyone for "tennis?"', 'Hmmph!']
        self.check(wrapper.wrap(text), expect)

        text = 'And she said, "Go to hell!"\nCan you believe that?'
        expect = ['And she said, "Go to',
                  'hell!"  Can you',
                  'believe that?']
        self.check(wrapper.wrap(text), expect)

        wrapper.width = 60
        expect = ['And she said, "Go to hell!"  Can you believe that?']
        self.check(wrapper.wrap(text), expect)

        # A period inside a word ("stdio.h") is not a sentence ending.
        text = 'File stdio.h is nice.'
        expect = ['File stdio.h is nice.']
        self.check(wrapper.wrap(text), expect)

    def test_wrap_short(self):
        # Wrapping to make short lines longer
        text = "This is a\nshort paragraph."

        self.check_wrap(text, 20, ["This is a short",
                                   "paragraph."])
        self.check_wrap(text, 40, ["This is a short paragraph."])

    def test_wrap_short_1line(self):
        # Test endcases
        text = "This is a short line."

        self.check_wrap(text, 30, ["This is a short line."])
        self.check_wrap(text, 30, ["(1) This is a short line."],
                        initial_indent="(1) ")

    def test_hyphenated(self):
        # Test breaking hyphenated words
        text = ("this-is-a-useful-feature-for-"
                "reformatting-posts-from-tim-peters'ly")

        self.check_wrap(text, 40,
                        ["this-is-a-useful-feature-for-",
                         "reformatting-posts-from-tim-peters'ly"])
        self.check_wrap(text, 41,
                        ["this-is-a-useful-feature-for-",
                         "reformatting-posts-from-tim-peters'ly"])
        self.check_wrap(text, 42,
                        ["this-is-a-useful-feature-for-reformatting-",
                         "posts-from-tim-peters'ly"])
        # The test tests current behavior but is not testing parts of the API.
        expect = ("this-|is-|a-|useful-|feature-|for-|"
                  "reformatting-|posts-|from-|tim-|peters'ly").split('|')
        self.check_wrap(text, 1, expect, break_long_words=False)
        self.check_split(text, expect)

        self.check_split('e-mail', ['e-mail'])
        self.check_split('Jelly-O', ['Jelly-O'])
        # The test tests current behavior but is not testing parts of the API.
        self.check_split('half-a-crown', 'half-|a-|crown'.split('|'))

    def test_hyphenated_numbers(self):
        # Test that hyphenated numbers (eg. dates) are not broken like words.
        text = ("Python 1.0.0 was released on 1994-01-26. Python 1.0.1 was\n"
                "released on 1994-02-15.")

        self.check_wrap(text, 30, ['Python 1.0.0 was released on',
                                   '1994-01-26. Python 1.0.1 was',
                                   'released on 1994-02-15.'])
        self.check_wrap(text, 40, ['Python 1.0.0 was released on 1994-01-26.',
                                   'Python 1.0.1 was released on 1994-02-15.'])
        self.check_wrap(text, 1, text.split(), break_long_words=False)

        text = "I do all my shopping at 7-11."
        self.check_wrap(text, 25, ["I do all my shopping at",
                                   "7-11."])
        self.check_wrap(text, 27, ["I do all my shopping at",
                                   "7-11."])
        self.check_wrap(text, 29, ["I do all my shopping at 7-11."])
        self.check_wrap(text, 1, text.split(), break_long_words=False)

    def test_em_dash(self):
        # Test text with em-dashes
        text = "Em-dashes should be written -- thus."
        self.check_wrap(text, 25,
                        ["Em-dashes should be",
                         "written -- thus."])

        # Probe the boundaries of the properly written em-dash,
        # ie. " -- ".
        self.check_wrap(text, 29,
                        ["Em-dashes should be written",
                         "-- thus."])
        expect = ["Em-dashes should be written --",
                  "thus."]
        self.check_wrap(text, 30, expect)
        self.check_wrap(text, 35, expect)
        self.check_wrap(text, 36,
                        ["Em-dashes should be written -- thus."])

        # The improperly written em-dash is handled too, because
        # it's adjacent to non-whitespace on both sides.
        text = "You can also do--this or even---this."
        expect = ["You can also do",
                  "--this or even",
                  "---this."]
        self.check_wrap(text, 15, expect)
        self.check_wrap(text, 16, expect)
        expect = ["You can also do--",
                  "this or even---",
                  "this."]
        self.check_wrap(text, 17, expect)
        self.check_wrap(text, 19, expect)
        expect = ["You can also do--this or even",
                  "---this."]
        self.check_wrap(text, 29, expect)
        self.check_wrap(text, 31, expect)
        expect = ["You can also do--this or even---",
                  "this."]
        self.check_wrap(text, 32, expect)
        self.check_wrap(text, 35, expect)

        # All of the above behaviour could be deduced by probing the
        # _split() method.
        text = "Here's an -- em-dash and--here's another---and another!"
        expect = ["Here's", " ", "an", " ", "--", " ", "em-", "dash", " ",
                  "and", "--", "here's", " ", "another", "---",
                  "and", " ", "another!"]
        self.check_split(text, expect)

        text = "and then--bam!--he was gone"
        expect = ["and", " ", "then", "--", "bam!", "--",
                  "he", " ", "was", " ", "gone"]
        self.check_split(text, expect)

    def test_unix_options(self):
        # Test that Unix-style command-line options are wrapped correctly.
        # Both Optik (OptionParser) and Docutils rely on this behaviour!
        text = "You should use the -n option, or --dry-run in its long form."
        self.check_wrap(text, 20,
                        ["You should use the",
                         "-n option, or --dry-",
                         "run in its long",
                         "form."])
        self.check_wrap(text, 21,
                        ["You should use the -n",
                         "option, or --dry-run",
                         "in its long form."])
        expect = ["You should use the -n option, or",
                  "--dry-run in its long form."]
        self.check_wrap(text, 32, expect)
        self.check_wrap(text, 34, expect)
        self.check_wrap(text, 35, expect)
        self.check_wrap(text, 38, expect)
        expect = ["You should use the -n option, or --dry-",
                  "run in its long form."]
        self.check_wrap(text, 39, expect)
        self.check_wrap(text, 41, expect)
        expect = ["You should use the -n option, or --dry-run",
                  "in its long form."]
        self.check_wrap(text, 42, expect)

        # Again, all of the above can be deduced from _split().
        text = "the -n option, or --dry-run or --dryrun"
        expect = ["the", " ", "-n", " ", "option,", " ", "or", " ",
                  "--dry-", "run", " ", "or", " ", "--dryrun"]
        self.check_split(text, expect)

    def test_funky_hyphens(self):
        # Screwy edge cases cooked up by David Goodger.  All reported
        # in SF bug #596434.
        self.check_split("what the--hey!", ["what", " ", "the", "--", "hey!"])
        self.check_split("what the--", ["what", " ", "the--"])
        self.check_split("what the--.", ["what", " ", "the--."])
        self.check_split("--text--.", ["--text--."])

        # When I first read bug #596434, this is what I thought David
        # was talking about.  I was wrong; these have always worked
        # fine.  The real problem is tested in test_funky_parens()
        # below...
        self.check_split("--option", ["--option"])
        self.check_split("--option-opt", ["--option-", "opt"])
        self.check_split("foo --option-opt bar",
                         ["foo", " ", "--option-", "opt", " ", "bar"])

    def test_punct_hyphens(self):
        # Oh bother, SF #965425 found another problem with hyphens --
        # hyphenated words in single quotes weren't handled correctly.
        # In fact, the bug is that *any* punctuation around a hyphenated
        # word was handled incorrectly, except for a leading "--", which
        # was special-cased for Optik and Docutils.  So test a variety
        # of styles of punctuation around a hyphenated word.
        # (Actually this is based on an Optik bug report, #813077).
        self.check_split("the 'wibble-wobble' widget",
                         ['the', ' ', "'wibble-", "wobble'", ' ', 'widget'])
        self.check_split('the "wibble-wobble" widget',
                         ['the', ' ', '"wibble-', 'wobble"', ' ', 'widget'])
        self.check_split("the (wibble-wobble) widget",
                         ['the', ' ', "(wibble-", "wobble)", ' ', 'widget'])
        self.check_split("the ['wibble-wobble'] widget",
                         ['the', ' ', "['wibble-", "wobble']", ' ', 'widget'])

        # The test tests current behavior but is not testing parts of the API.
        self.check_split("what-d'you-call-it.",
                         "what-d'you-|call-|it.".split('|'))

    def test_funky_parens(self):
        # Second part of SF bug #596434: long option strings inside
        # parentheses.
        self.check_split("foo (--option) bar",
                         ["foo", " ", "(--option)", " ", "bar"])

        # Related stuff -- make sure parens work in simpler contexts.
        self.check_split("foo (bar) baz",
                         ["foo", " ", "(bar)", " ", "baz"])
        self.check_split("blah (ding dong), wubba",
                         ["blah", " ", "(ding", " ", "dong),",
                          " ", "wubba"])

    def test_drop_whitespace_false(self):
        # Check that drop_whitespace=False preserves whitespace.
        # SF patch #1581073
        # The runs of 4 and 5 spaces are what force whitespace-only and
        # whitespace-terminated lines at width 10.
        text = " This is a    sentence with     much whitespace."
        self.check_wrap(text, 10,
                        [" This is a", "    ", "sentence ",
                         "with     ", "much white", "space."],
                        drop_whitespace=False)

    def test_drop_whitespace_false_whitespace_only(self):
        # Check that drop_whitespace=False preserves a whitespace-only string.
        self.check_wrap(" ", 6, [" "], drop_whitespace=False)

    def test_drop_whitespace_false_whitespace_only_with_indent(self):
        # Check that a whitespace-only string gets indented (when
        # drop_whitespace is False): the result is indent + text.
        self.check_wrap("   ", 6, ["  " + "   "], drop_whitespace=False,
                        initial_indent="  ")

    def test_drop_whitespace_whitespace_only(self):
        # Check drop_whitespace on a whitespace-only string.
        self.check_wrap(" ", 6, [])

    def test_drop_whitespace_leading_whitespace(self):
        # Check that drop_whitespace does not drop leading whitespace (if
        # followed by non-whitespace).
        # SF bug #622849 reported inconsistent handling of leading
        # whitespace; let's test that a bit, shall we?
        text = " This is a sentence with leading whitespace."
        self.check_wrap(text, 50,
                        [" This is a sentence with leading whitespace."])
        self.check_wrap(text, 30,
                        [" This is a sentence with", "leading whitespace."])

    def test_drop_whitespace_whitespace_line(self):
        # Check that drop_whitespace skips the whole line if a non-leading
        # line consists only of whitespace.
        # Four spaces: too wide to share a 6-column line with either word.
        text = "abcd    efgh"
        # Include the result for drop_whitespace=False for comparison.
        self.check_wrap(text, 6, ["abcd", "    ", "efgh"],
                        drop_whitespace=False)
        self.check_wrap(text, 6, ["abcd", "efgh"])

    def test_drop_whitespace_whitespace_only_with_indent(self):
        # Check that initial_indent is not applied to a whitespace-only
        # string.  This checks a special case of the fact that dropping
        # whitespace occurs before indenting.
        self.check_wrap(" ", 6, [], initial_indent="++")

    def test_drop_whitespace_whitespace_indent(self):
        # Check that drop_whitespace does not drop whitespace indents.
        # This checks a special case of the fact that dropping whitespace
        # occurs before indenting.
        self.check_wrap("abcd efgh", 6, [" abcd", " efgh"],
                        initial_indent=" ", subsequent_indent=" ")

    def test_split(self):
        # Ensure that the standard _split() method works as advertised
        # in the comments
        text = "Hello there -- you goof-ball, use the -b option!"

        result = self.wrapper._split(text)
        self.check(result,
                   ["Hello", " ", "there", " ", "--", " ", "you", " ", "goof-",
                    "ball,", " ", "use", " ", "the", " ", "-b", " ", "option!"])

    def test_break_on_hyphens(self):
        # Ensure that the break_on_hyphens attributes work
        text = "yaba daba-doo"
        self.check_wrap(text, 10, ["yaba daba-", "doo"],
                        break_on_hyphens=True)
        self.check_wrap(text, 10, ["yaba", "daba-doo"],
                        break_on_hyphens=False)

    def test_bad_width(self):
        # Ensure that width <= 0 is caught.
        text = "Whatever, it doesn't matter."
        self.assertRaises(ValueError, wrap, text, 0)
        self.assertRaises(ValueError, wrap, text, -1)

    def test_no_split_at_umlaut(self):
        text = "Die Empf\xe4nger-Auswahl"
        self.check_wrap(text, 13, ["Die", "Empf\xe4nger-", "Auswahl"])

    def test_umlaut_followed_by_dash(self):
        text = "aa \xe4\xe4-\xe4\xe4"
        self.check_wrap(text, 7, ["aa \xe4\xe4-", "\xe4\xe4"])

    def test_non_breaking_space(self):
        # A no-break space must never be used as a wrap point.
        text = 'This is a sentence with non-breaking\N{NO-BREAK SPACE}space.'

        self.check_wrap(text, 20,
                        ['This is a sentence',
                         'with non-',
                         'breaking\N{NO-BREAK SPACE}space.'],
                        break_on_hyphens=True)

        self.check_wrap(text, 20,
                        ['This is a sentence',
                         'with',
                         'non-breaking\N{NO-BREAK SPACE}space.'],
                        break_on_hyphens=False)

    def test_narrow_non_breaking_space(self):
        # Same as above for the narrow no-break space.
        text = ('This is a sentence with non-breaking'
                '\N{NARROW NO-BREAK SPACE}space.')

        self.check_wrap(text, 20,
                        ['This is a sentence',
                         'with non-',
                         'breaking\N{NARROW NO-BREAK SPACE}space.'],
                        break_on_hyphens=True)

        self.check_wrap(text, 20,
                        ['This is a sentence',
                         'with',
                         'non-breaking\N{NARROW NO-BREAK SPACE}space.'],
                        break_on_hyphens=False)
class MaxLinesTestCase(BaseTestCase):
    """Tests for the max_lines / placeholder truncation options of wrap()."""

    text = "Hello there, how are you this fine day? I'm glad to hear it!"

    def test_simple(self):
        self.check_wrap(self.text, 12,
                        ["Hello [...]"],
                        max_lines=0)
        self.check_wrap(self.text, 12,
                        ["Hello [...]"],
                        max_lines=1)
        self.check_wrap(self.text, 12,
                        ["Hello there,",
                         "how [...]"],
                        max_lines=2)
        self.check_wrap(self.text, 13,
                        ["Hello there,",
                         "how are [...]"],
                        max_lines=2)
        self.check_wrap(self.text, 80, [self.text], max_lines=1)
        self.check_wrap(self.text, 12,
                        ["Hello there,",
                         "how are you",
                         "this fine",
                         "day? I'm",
                         "glad to hear",
                         "it!"],
                        max_lines=6)

    def test_spaces(self):
        # strip spaces before placeholder
        self.check_wrap(self.text, 12,
                        ["Hello there,",
                         "how are you",
                         "this fine",
                         "day? [...]"],
                        max_lines=4)
        # placeholder at the start of line
        self.check_wrap(self.text, 6,
                        ["Hello",
                         "[...]"],
                        max_lines=2)
        # final spaces
        self.check_wrap(self.text + ' ' * 10, 12,
                        ["Hello there,",
                         "how are you",
                         "this fine",
                         "day? I'm",
                         "glad to hear",
                         "it!"],
                        max_lines=6)

    def test_placeholder(self):
        self.check_wrap(self.text, 12,
                        ["Hello..."],
                        max_lines=1,
                        placeholder='...')
        self.check_wrap(self.text, 12,
                        ["Hello there,",
                         "how are..."],
                        max_lines=2,
                        placeholder='...')
        # long placeholder and indentation
        # A 4-column indent plus the 14-column stripped placeholder exceeds
        # the width of 16, which wrap() rejects with ValueError.
        with self.assertRaises(ValueError):
            wrap(self.text, 16, initial_indent='    ',
                 max_lines=1, placeholder=' [truncated]...')
        with self.assertRaises(ValueError):
            wrap(self.text, 16, subsequent_indent='    ',
                 max_lines=2, placeholder=' [truncated]...')
        # A 2-column indent on the truncated line fits exactly (2 + 14 == 16).
        self.check_wrap(self.text, 16,
                        ["    Hello there,",
                         "  [truncated]..."],
                        max_lines=2,
                        initial_indent='    ',
                        subsequent_indent='  ',
                        placeholder=' [truncated]...')
        self.check_wrap(self.text, 16,
                        ["  [truncated]..."],
                        max_lines=1,
                        initial_indent='  ',
                        subsequent_indent='    ',
                        placeholder=' [truncated]...')
        # Without max_lines the placeholder length is irrelevant.
        self.check_wrap(self.text, 80, [self.text], placeholder='.' * 1000)

    def test_placeholder_backtrack(self):
        # Test special case when max_lines insufficient, but what
        # would be last wrapped line so long the placeholder cannot
        # be added there without violence. So, textwrap backtracks,
        # adding placeholder to the penultimate line.
        text = 'Good grief Python features are advancing quickly!'
        self.check_wrap(text, 12,
                        ['Good grief', 'Python*****'],
                        max_lines=3,
                        placeholder='*****')
class LongWordTestCase(BaseTestCase):
    """Tests for words longer than the wrap width (break_long_words)."""

    def setUp(self):
        self.wrapper = TextWrapper()
        self.text = (
            'Did you say "supercalifragilisticexpialidocious?"\n'
            'How *do* you spell that odd word, anyways?\n'
        )

    def test_break_long(self):
        # Wrap text with long words and lots of punctuation

        self.check_wrap(self.text, 30,
                        ['Did you say "supercalifragilis',
                         'ticexpialidocious?" How *do*',
                         'you spell that odd word,',
                         'anyways?'])
        self.check_wrap(self.text, 50,
                        ['Did you say "supercalifragilisticexpialidocious?"',
                         'How *do* you spell that odd word, anyways?'])

        # SF bug 797650.  Prevent an infinite loop by making sure that at
        # least one character gets split off on every pass.
        # The indent (15) is wider than the width (10), so every continuation
        # line is the full indent followed by a single character.
        subsequent_indent = ' ' * 15
        self.check_wrap('-' * 10 + 'hello', 10,
                        ['-' * 10] + [subsequent_indent + ch for ch in 'hello'],
                        subsequent_indent=subsequent_indent)

        # bug 1146.  Prevent a long word to be wrongly wrapped when the
        # preceding word is exactly one character shorter than the width
        self.check_wrap(self.text, 12,
                        ['Did you say ',
                         '"supercalifr',
                         'agilisticexp',
                         'ialidocious?',
                         '" How *do*',
                         'you spell',
                         'that odd',
                         'word,',
                         'anyways?'])

    def test_nobreak_long(self):
        # Test with break_long_words disabled
        self.wrapper.break_long_words = 0
        self.wrapper.width = 30
        expect = ['Did you say',
                  '"supercalifragilisticexpialidocious?"',
                  'How *do* you spell that odd',
                  'word, anyways?'
                  ]
        result = self.wrapper.wrap(self.text)
        self.check(result, expect)

        # Same thing with kwargs passed to standalone wrap() function.
        result = wrap(self.text, width=30, break_long_words=0)
        self.check(result, expect)

    def test_max_lines_long(self):
        # Truncation by max_lines in the middle of a broken long word.
        self.check_wrap(self.text, 12,
                        ['Did you say ',
                         '"supercalifr',
                         'agilisticexp',
                         '[...]'],
                        max_lines=4)
class LongWordWithHyphensTestCase(BaseTestCase):
    """Tests for how break_long_words and break_on_hyphens interact.

    Each test lists its (text, width, expected lines, wrap options) cases and
    feeds them to check_wrap() in order.
    """

    # Result of wrapping text2 at width 10 with default options; every test
    # below ends with this same check.
    _TEXT2_AT_10 = ['1234567890', '-123456789', '0--this_is', '_a_very_lo',
                    'ng_option_', 'indeed-', 'good-bye"']

    # The compound name that must stay in one piece when long words are
    # not broken.
    _UNBROKEN = '2-succinyl-6-hydroxy-2,4-cyclohexadiene-1-carboxylate'

    def setUp(self):
        self.wrapper = TextWrapper()
        self.text1 = (
            'We used enyzme 2-succinyl-6-hydroxy-2,4-cyclohexadiene-1-'
            'carboxylate synthase.\n'
        )
        self.text2 = (
            '1234567890-1234567890--this_is_a_very_long_option_indeed-'
            'good-bye"\n'
        )

    def _run_cases(self, cases):
        # Apply check_wrap() to each (text, width, expected, options) tuple.
        for text, width, want, options in cases:
            self.check_wrap(text, width, want, **options)

    def test_break_long_words_on_hyphen(self):
        self._run_cases([
            (self.text1, 50,
             ['We used enyzme 2-succinyl-6-hydroxy-2,4-',
              'cyclohexadiene-1-carboxylate synthase.'],
             {}),
            (self.text1, 10,
             ['We used', 'enyzme 2-', 'succinyl-', '6-hydroxy-', '2,4-',
              'cyclohexad', 'iene-1-', 'carboxylat', 'e', 'synthase.'],
             {}),
            (self.text2, 10, list(self._TEXT2_AT_10), {}),
        ])

    def test_break_long_words_not_on_hyphen(self):
        options = {'break_on_hyphens': False}
        self._run_cases([
            (self.text1, 50,
             ['We used enyzme 2-succinyl-6-hydroxy-2,4-cyclohexad',
              'iene-1-carboxylate synthase.'],
             options),
            (self.text1, 10,
             ['We used', 'enyzme 2-s', 'uccinyl-6-', 'hydroxy-2,',
              '4-cyclohex', 'adiene-1-c', 'arboxylate', 'synthase.'],
             options),
            (self.text2, 10, list(self._TEXT2_AT_10), {}),
        ])

    def test_break_on_hyphen_but_not_long_words(self):
        options = {'break_long_words': False}
        self._run_cases([
            (self.text1, 50,
             ['We used enyzme', self._UNBROKEN, 'synthase.'],
             options),
            (self.text1, 10,
             ['We used', 'enyzme', self._UNBROKEN, 'synthase.'],
             options),
            (self.text2, 10, list(self._TEXT2_AT_10), {}),
        ])

    def test_do_not_break_long_words_or_on_hyphens(self):
        options = {'break_long_words': False, 'break_on_hyphens': False}
        self._run_cases([
            (self.text1, 50,
             ['We used enyzme', self._UNBROKEN, 'synthase.'],
             options),
            (self.text1, 10,
             ['We used', 'enyzme', self._UNBROKEN, 'synthase.'],
             options),
            (self.text2, 10, list(self._TEXT2_AT_10), {}),
        ])
class IndentTestCases(BaseTestCase):
    """Tests for the initial_indent / subsequent_indent options."""

    # called before each test method
    def setUp(self):
        self.text = (
            "This paragraph will be filled, first without any indentation,\n"
            "and then with some (including a hanging indent)."
        )

    def test_fill(self):
        # Test the fill() method

        expect = (
            "This paragraph will be filled, first\n"
            "without any indentation, and then with\n"
            "some (including a hanging indent)."
        )

        result = fill(self.text, 40)
        self.check(result, expect)

    def test_initial_indent(self):
        # Test initial_indent parameter
        # The 5-column indent is what pushes "first" onto the second line
        # at width 40; later lines are not indented.
        expect = ["     This paragraph will be filled,",
                  "first without any indentation, and then",
                  "with some (including a hanging indent)."]
        result = wrap(self.text, 40, initial_indent="     ")
        self.check(result, expect)

        expect = "\n".join(expect)
        result = fill(self.text, 40, initial_indent="     ")
        self.check(result, expect)

    def test_subsequent_indent(self):
        # Test subsequent_indent parameter
        # Hanging indent: a 4-column bullet prefix on the first line and
        # 4 spaces on every following line.
        expect = (
            "  * This paragraph will be filled, first\n"
            "    without any indentation, and then\n"
            "    with some (including a hanging\n"
            "    indent)."
        )

        result = fill(self.text, 40,
                      initial_indent="  * ", subsequent_indent="    ")
        self.check(result, expect)
- # Despite the similar names, DedentTestCase is *not* the inverse
- # of IndentTestCase!
class DedentTestCase(unittest.TestCase):
    """Tests for textwrap.dedent().

    Margin widths matter in every case below, so inputs whose meaning depends
    on an exact number of spaces spell the indentation out explicitly.
    """

    def assertUnchanged(self, text):
        """assert that dedent() has no effect on 'text'"""
        self.assertEqual(text, dedent(text))

    def test_dedent_nomargin(self):
        # No lines indented.
        text = "Hello there.\nHow are you?\nOh good, I'm glad."
        self.assertUnchanged(text)

        # Similar, with a blank line.
        text = "Hello there.\n\nBoo!"
        self.assertUnchanged(text)

        # Some lines indented, but overall margin is still zero.
        text = "Hello there.\n  This is indented."
        self.assertUnchanged(text)

        # Again, add a blank line.
        text = "Hello there.\n\n  Boo!\n"
        self.assertUnchanged(text)

    def test_dedent_even(self):
        # All lines indented by two spaces.
        text = "  Hello there.\n  How are ya?\n  Oh good."
        expect = "Hello there.\nHow are ya?\nOh good."
        self.assertEqual(expect, dedent(text))

        # Same, with blank lines.
        text = "  Hello there.\n\n  How are ya?\n  Oh good.\n"
        expect = "Hello there.\n\nHow are ya?\nOh good.\n"
        self.assertEqual(expect, dedent(text))

        # Now indent one of the blank lines.
        text = "  Hello there.\n  \n  How are ya?\n  Oh good.\n"
        expect = "Hello there.\n\nHow are ya?\nOh good.\n"
        self.assertEqual(expect, dedent(text))

    def test_dedent_uneven(self):
        # Lines indented unevenly.
        # The common 8-space margin is removed; the relative indentation
        # stays, and the trailing whitespace-only line becomes empty.
        text = (
            "        def foo():\n"
            "            while 1:\n"
            "                return foo\n"
            "        "
        )
        expect = (
            "def foo():\n"
            "    while 1:\n"
            "        return foo\n"
        )
        self.assertEqual(expect, dedent(text))

        # Uneven indentation with a blank line.
        text = "  Foo\n    Bar\n\n   Baz\n"
        expect = "Foo\n  Bar\n\n Baz\n"
        self.assertEqual(expect, dedent(text))

        # Uneven indentation with a whitespace-only line.
        text = "  Foo\n    Bar\n \n   Baz\n"
        expect = "Foo\n  Bar\n\n Baz\n"
        self.assertEqual(expect, dedent(text))

    def test_dedent_declining(self):
        # Uneven indentation with declining indent level.
        text = "     Foo\n    Bar\n"  # 5 spaces, then 4
        expect = " Foo\nBar\n"
        self.assertEqual(expect, dedent(text))

        # Declining indent level with blank line.
        text = "     Foo\n\n    Bar\n"  # 5 spaces, blank, then 4
        expect = " Foo\n\nBar\n"
        self.assertEqual(expect, dedent(text))

        # Declining indent level with whitespace only line.
        text = "     Foo\n    \n    Bar\n"  # 5 spaces, then 4, then 4
        expect = " Foo\n\nBar\n"
        self.assertEqual(expect, dedent(text))

    # dedent() should not mangle internal tabs
    def test_dedent_preserve_internal_tabs(self):
        text = "  hello\tthere\n  how are\tyou?"
        expect = "hello\tthere\nhow are\tyou?"
        self.assertEqual(expect, dedent(text))

        # make sure that it preserves tabs when it's not making any
        # changes at all
        self.assertEqual(expect, dedent(expect))

    # dedent() should not mangle tabs in the margin (i.e.
    # tabs and spaces both count as margin, but are *not*
    # considered equivalent)
    def test_dedent_preserve_margin_tabs(self):
        text = "  hello there\n\thow are you?"
        self.assertUnchanged(text)

        # same effect even if we have 8 spaces
        text = " " * 8 + "hello there\n\thow are you?"
        self.assertUnchanged(text)

        # dedent() only removes whitespace that can be uniformly removed!
        text = "\thello there\n\thow are you?"
        expect = "hello there\nhow are you?"
        self.assertEqual(expect, dedent(text))

        text = "  \thello there\n  \thow are you?"
        self.assertEqual(expect, dedent(text))

        text = "  \t  hello there\n  \t  how are you?"
        self.assertEqual(expect, dedent(text))

        text = "  \thello there\n  \t  how are you?"
        expect = "hello there\n  how are you?"
        self.assertEqual(expect, dedent(text))

        # test margin is smaller than smallest indent
        # Margins are 2 spaces+tab, 3 spaces+tab and 1 space+tab, so only a
        # single leading space is common to all three lines.
        text = "  \thello there\n   \thow are you?\n \tI'm fine, thanks"
        expect = " \thello there\n  \thow are you?\n\tI'm fine, thanks"
        self.assertEqual(expect, dedent(text))
- # Test textwrap.indent
class IndentTestCase(unittest.TestCase):
    """Tests for textwrap.indent(), alone and round-tripped through dedent().

    The table-driven tests pair every entry of CASES with an entry of an
    "expected" tuple; _paired_cases() fails loudly when the two tables
    have different lengths instead of letting zip() silently drop cases.
    """

    # The examples used for tests. If any of these change, the expected
    # results in the various test cases must also be updated.
    # The roundtrip cases are separate, because textwrap.dedent doesn't
    # handle Windows line endings
    ROUNDTRIP_CASES = (
        # Basic test case
        "Hi.\nThis is a test.\nTesting.",
        # Include a blank line
        "Hi.\nThis is a test.\n\nTesting.",
        # Include leading and trailing blank lines
        "\nHi.\nThis is a test.\nTesting.\n",
    )
    CASES = ROUNDTRIP_CASES + (
        # Use Windows line endings
        "Hi.\r\nThis is a test.\r\nTesting.\r\n",
        # Pathological case
        "\nHi.\r\nThis is a test.\n\r\nTesting.\r\n\n",
    )

    # Expected results for CASES when only lines that are not
    # whitespace-only receive the prefix ' ' (shared by the implicit- and
    # explicit-default tests, which must agree).
    _DEFAULT_EXPECTED = (
        # Basic test case
        " Hi.\n This is a test.\n Testing.",
        # Include a blank line
        " Hi.\n This is a test.\n\n Testing.",
        # Include leading and trailing blank lines
        "\n Hi.\n This is a test.\n Testing.\n",
        # Use Windows line endings
        " Hi.\r\n This is a test.\r\n Testing.\r\n",
        # Pathological case
        "\n Hi.\r\n This is a test.\n\r\n Testing.\r\n\n",
    )

    @staticmethod
    def _always(line):
        """Predicate that selects every line."""
        return True

    @staticmethod
    def _never(line):
        """Predicate that selects no line."""
        return False

    @staticmethod
    def _is_blank(line):
        """Predicate that selects only empty or whitespace-only lines."""
        return not line.strip()

    def _paired_cases(self, expected):
        """Return (text, expect) pairs for CASES and *expected*.

        Fails the running test if the two tables differ in length, since
        zip() would otherwise silently skip the unmatched entries.
        """
        self.assertEqual(len(expected), len(self.CASES),
                         "expected results are out of sync with CASES")
        return zip(self.CASES, expected)

    def test_indent_nomargin_default(self):
        # indent should do nothing if 'prefix' is empty.
        for text in self.CASES:
            with self.subTest(text=text):
                self.assertEqual(indent(text, ''), text)

    def test_indent_nomargin_explicit_default(self):
        # The same as test_indent_nomargin, but explicitly requesting
        # the default behaviour by passing None as the predicate
        for text in self.CASES:
            with self.subTest(text=text):
                self.assertEqual(indent(text, '', None), text)

    def test_indent_nomargin_all_lines(self):
        # The same as test_indent_nomargin, but using the optional
        # predicate argument
        for text in self.CASES:
            with self.subTest(text=text):
                self.assertEqual(indent(text, '', self._always), text)

    def test_indent_no_lines(self):
        # Explicitly skip indenting any lines
        for text in self.CASES:
            with self.subTest(text=text):
                self.assertEqual(indent(text, ' ', self._never), text)

    def test_roundtrip_spaces(self):
        # A whitespace prefix should roundtrip with dedent
        for text in self.ROUNDTRIP_CASES:
            with self.subTest(text=text):
                self.assertEqual(dedent(indent(text, ' ')), text)

    def test_roundtrip_tabs(self):
        # A whitespace prefix should roundtrip with dedent
        for text in self.ROUNDTRIP_CASES:
            with self.subTest(text=text):
                self.assertEqual(dedent(indent(text, '\t\t')), text)

    def test_roundtrip_mixed(self):
        # A whitespace prefix should roundtrip with dedent
        for text in self.ROUNDTRIP_CASES:
            with self.subTest(text=text):
                self.assertEqual(dedent(indent(text, ' \t \t ')), text)

    def test_indent_default(self):
        # Test default indenting of lines that are not whitespace only
        prefix = ' '
        for text, expect in self._paired_cases(self._DEFAULT_EXPECTED):
            with self.subTest(text=text):
                # Two-argument call on purpose: exercises the implicit default.
                self.assertEqual(indent(text, prefix), expect)

    def test_indent_explicit_default(self):
        # Test default indenting of lines that are not whitespace only
        prefix = ' '
        for text, expect in self._paired_cases(self._DEFAULT_EXPECTED):
            with self.subTest(text=text):
                # Passing None explicitly must match the implicit default.
                self.assertEqual(indent(text, prefix, None), expect)

    def test_indent_all_lines(self):
        # Add 'prefix' to all lines, including whitespace-only ones.
        prefix = ' '
        expected = (
            # Basic test case
            " Hi.\n This is a test.\n Testing.",
            # Include a blank line
            " Hi.\n This is a test.\n \n Testing.",
            # Include leading and trailing blank lines
            " \n Hi.\n This is a test.\n Testing.\n",
            # Use Windows line endings
            " Hi.\r\n This is a test.\r\n Testing.\r\n",
            # Pathological case
            " \n Hi.\r\n This is a test.\n \r\n Testing.\r\n \n",
        )
        for text, expect in self._paired_cases(expected):
            with self.subTest(text=text):
                self.assertEqual(indent(text, prefix, self._always), expect)

    def test_indent_empty_lines(self):
        # Add 'prefix' solely to whitespace-only lines.
        prefix = ' '
        expected = (
            # Basic test case
            "Hi.\nThis is a test.\nTesting.",
            # Include a blank line
            "Hi.\nThis is a test.\n \nTesting.",
            # Include leading and trailing blank lines
            " \nHi.\nThis is a test.\nTesting.\n",
            # Use Windows line endings
            "Hi.\r\nThis is a test.\r\nTesting.\r\n",
            # Pathological case
            " \nHi.\r\nThis is a test.\n \r\nTesting.\r\n \n",
        )
        for text, expect in self._paired_cases(expected):
            with self.subTest(text=text):
                self.assertEqual(indent(text, prefix, self._is_blank), expect)
class ShortenTestCase(BaseTestCase):
    """Tests for textwrap.shorten()."""

    def check_shorten(self, text, width, expect, **kwargs):
        """Shorten *text* to *width* and pass the result and *expect* to check().

        Extra keyword arguments are forwarded to shorten() unchanged.
        """
        self.check(shorten(text, width, **kwargs), expect)

    def test_simple(self):
        # Simple case: just words, spaces, and a bit of punctuation
        sentence = ("Hello there, how are you this fine day? "
                    "I'm glad to hear it!")
        full_width = len(sentence)
        self.check_shorten(sentence, 18, "Hello there, [...]")
        # Text that already fits comes back untouched.
        self.check_shorten(sentence, full_width, sentence)
        # One column short: the last word gives way to the placeholder.
        self.check_shorten(
            sentence, full_width - 1,
            "Hello there, how are you this fine day? I'm glad to [...]")

    def test_placeholder(self):
        sentence = ("Hello there, how are you this fine day? "
                    "I'm glad to hear it!")
        full_width = len(sentence)
        self.check_shorten(sentence, 17, "Hello there,$$", placeholder='$$')
        self.check_shorten(sentence, 18, "Hello there, how$$",
                           placeholder='$$')
        self.check_shorten(sentence, 18, "Hello there, $$",
                           placeholder=' $$')
        self.check_shorten(sentence, full_width, sentence, placeholder='$$')
        self.check_shorten(
            sentence, full_width - 1,
            "Hello there, how are you this fine day? I'm glad to hear$$",
            placeholder='$$')

    def test_empty_string(self):
        self.check_shorten("", 6, "")

    def test_whitespace(self):
        # Whitespace collapsing
        paragraph = ("\n"
                     "This is a paragraph that already has\n"
                     "line breaks and \t tabs too.")
        collapsed = ("This is a paragraph that already has line "
                     "breaks and tabs too.")
        truncated = ("This is a paragraph that already has line "
                     "breaks and [...]")
        self.check_shorten(paragraph, 62, collapsed)
        self.check_shorten(paragraph, 61, truncated)

        padded = "hello world! "
        self.check_shorten(padded, 12, "hello world!")
        self.check_shorten(padded, 11, "hello [...]")
        # The leading space is trimmed from the placeholder
        # (it would be ugly otherwise).
        self.check_shorten(padded, 10, "[...]")

    def test_width_too_small_for_placeholder(self):
        long_word = "x" * 20
        # A placeholder exactly as wide as the width is accepted...
        shorten(long_word, width=8, placeholder="(......)")
        # ...but one character wider is rejected.
        with self.assertRaises(ValueError):
            shorten(long_word, width=8, placeholder="(.......)")

    def test_first_word_too_long_but_placeholder_fits(self):
        self.check_shorten("Helloo", 5, "[...]")
# Script entry point: hand control to unittest's command-line runner.
if __name__ == "__main__":
    unittest.main()
|