# python/Lib/textwrap.py

"""Text wrapping and filling.
"""

# Copyright (C) 1999-2001 Gregory P. Ward.
# Copyright (C) 2002, 2003 Python Software Foundation.
# Written by Greg Ward <gward@python.net>
import re

# Public API of this module; everything else is an implementation detail.
__all__ = ['TextWrapper', 'wrap', 'fill', 'dedent', 'indent', 'shorten']
7db96d56Sopenharmony_ci
# Hardcode the recognized whitespace characters to the US-ASCII
# whitespace characters.  The main reason for doing this is that
# some Unicode spaces (like \u00a0) are non-breaking whitespaces.
_whitespace = '\t\n\x0b\x0c\r '

class TextWrapper:
    """
    Object for wrapping/filling text.  The public interface consists of
    the wrap() and fill() methods; the other methods are just there for
    subclasses to override in order to tweak the default behaviour.
    If you want to completely replace the main wrapping algorithm,
    you'll probably have to override _wrap_chunks().

    Several instance attributes control various aspects of wrapping:
      width (default: 70)
        the maximum width of wrapped lines (unless break_long_words
        is false)
      initial_indent (default: "")
        string that will be prepended to the first line of wrapped
        output.  Counts towards the line's width.
      subsequent_indent (default: "")
        string that will be prepended to all lines save the first
        of wrapped output; also counts towards each line's width.
      expand_tabs (default: true)
        Expand tabs in input text to spaces before further processing.
        Each tab will become 0 .. 'tabsize' spaces, depending on its position
        in its line.  If false, each tab is treated as a single character.
      tabsize (default: 8)
        Expand tabs in input text to 0 .. 'tabsize' spaces, unless
        'expand_tabs' is false.
      replace_whitespace (default: true)
        Replace all whitespace characters in the input text by spaces
        after tab expansion.  Note that if expand_tabs is false and
        replace_whitespace is true, every tab will be converted to a
        single space!
      fix_sentence_endings (default: false)
        Ensure that sentence-ending punctuation is always followed
        by two spaces.  Off by default because the algorithm is
        (unavoidably) imperfect.
      break_long_words (default: true)
        Break words longer than 'width'.  If false, those words will not
        be broken, and some lines might be longer than 'width'.
      break_on_hyphens (default: true)
        Allow breaking hyphenated words. If true, wrapping will occur
        preferably on whitespaces and right after hyphens part of
        compound words.
      drop_whitespace (default: true)
        Drop leading and trailing whitespace from lines.
      max_lines (default: None)
        Truncate wrapped lines.
      placeholder (default: ' [...]')
        Append to the last line of truncated text.
    """

    # Translation table for str.translate(): maps every recognized
    # whitespace character to a plain space.
    unicode_whitespace_trans = dict.fromkeys(map(ord, _whitespace), ord(' '))

    # This funky little regex is just the trick for splitting
    # text up into word-wrappable chunks.  E.g.
    #   "Hello there -- you goof-ball, use the -b option!"
    # splits into
    #   Hello/ /there/ /--/ /you/ /goof-/ball,/ /use/ /the/ /-b/ /option!
    # (after stripping out empty strings).
    word_punct = r'[\w!"\'&.,?]'
    letter = r'[^\d\W]'
    whitespace = r'[%s]' % re.escape(_whitespace)
    nowhitespace = '[^' + whitespace[1:]
    wordsep_re = re.compile(r'''
        ( # any whitespace
          %(ws)s+
        | # em-dash between words
          (?<=%(wp)s) -{2,} (?=\w)
        | # word, possibly hyphenated
          %(nws)s+? (?:
            # hyphenated word
              -(?: (?<=%(lt)s{2}-) | (?<=%(lt)s-%(lt)s-))
              (?= %(lt)s -? %(lt)s)
            | # end of word
              (?=%(ws)s|\Z)
            | # em-dash
              (?<=%(wp)s) (?=-{2,}\w)
            )
        )''' % {'wp': word_punct, 'lt': letter,
                'ws': whitespace, 'nws': nowhitespace},
        re.VERBOSE)
    # The pattern fragments are only needed to build the regex above;
    # remove them so they do not linger as class attributes.
    del word_punct, letter, nowhitespace

    # This less funky little regex just splits on recognized spaces. E.g.
    #   "Hello there -- you goof-ball, use the -b option!"
    # splits into
    #   Hello/ /there/ /--/ /you/ /goof-ball,/ /use/ /the/ /-b/ /option!/
    wordsep_simple_re = re.compile(r'(%s+)' % whitespace)
    del whitespace

    # XXX this is not locale- or charset-aware -- string.lowercase
    # is US-ASCII only (and therefore English-only)
    sentence_end_re = re.compile(r'[a-z]'             # lowercase letter
                                 r'[\.\!\?]'          # sentence-ending punct.
                                 r'[\"\']?'           # optional end-of-quote
                                 r'\Z')               # end of chunk

    def __init__(self,
                 width=70,
                 initial_indent="",
                 subsequent_indent="",
                 expand_tabs=True,
                 replace_whitespace=True,
                 fix_sentence_endings=False,
                 break_long_words=True,
                 drop_whitespace=True,
                 break_on_hyphens=True,
                 tabsize=8,
                 *,
                 max_lines=None,
                 placeholder=' [...]'):
        """Store the wrapping options as same-named instance attributes.

        No validation happens here; an invalid 'width' or an oversized
        'placeholder' is only reported (as ValueError) by _wrap_chunks().
        """
        self.width = width
        self.initial_indent = initial_indent
        self.subsequent_indent = subsequent_indent
        self.expand_tabs = expand_tabs
        self.replace_whitespace = replace_whitespace
        self.fix_sentence_endings = fix_sentence_endings
        self.break_long_words = break_long_words
        self.drop_whitespace = drop_whitespace
        self.break_on_hyphens = break_on_hyphens
        self.tabsize = tabsize
        self.max_lines = max_lines
        self.placeholder = placeholder


    # -- Private methods -----------------------------------------------
    # (possibly useful for subclasses to override)

    def _munge_whitespace(self, text):
        """_munge_whitespace(text : string) -> string

        Munge whitespace in text: expand tabs and convert all other
        whitespace characters to spaces.  Eg. " foo\\tbar\\n\\nbaz"
        becomes " foo    bar  baz".
        """
        if self.expand_tabs:
            text = text.expandtabs(self.tabsize)
        if self.replace_whitespace:
            text = text.translate(self.unicode_whitespace_trans)
        return text


    def _split(self, text):
        """_split(text : string) -> [string]

        Split the text to wrap into indivisible chunks.  Chunks are
        not quite the same as words; see _wrap_chunks() for full
        details.  As an example, the text
          Look, goof-ball -- use the -b option!
        breaks into the following chunks:
          'Look,', ' ', 'goof-', 'ball', ' ', '--', ' ',
          'use', ' ', 'the', ' ', '-b', ' ', 'option!'
        if break_on_hyphens is true, or in:
          'Look,', ' ', 'goof-ball', ' ', '--', ' ',
          'use', ' ', 'the', ' ', '-b', ' ', 'option!'
        otherwise.
        """
        # Truthiness (not identity with True) decides, matching how
        # _handle_long_word() reads the same option.
        if self.break_on_hyphens:
            chunks = self.wordsep_re.split(text)
        else:
            chunks = self.wordsep_simple_re.split(text)
        # re.split() with a capturing group yields empty strings between
        # adjacent matches; they carry no content, so drop them.
        return [c for c in chunks if c]

    def _fix_sentence_endings(self, chunks):
        """_fix_sentence_endings(chunks : [string])

        Correct for sentence endings buried in 'chunks'.  Eg. when the
        original text contains "... foo.\\nBar ...", munge_whitespace()
        and split() will convert that to [..., "foo.", " ", "Bar", ...]
        which has one too few spaces; this method simply changes the one
        space to two.  'chunks' is modified in place; nothing is returned.
        """
        i = 0
        patsearch = self.sentence_end_re.search
        while i < len(chunks)-1:
            if chunks[i+1] == " " and patsearch(chunks[i]):
                chunks[i+1] = "  "
                # Skip the space chunk that was just widened.
                i += 2
            else:
                i += 1

    def _handle_long_word(self, reversed_chunks, cur_line, cur_len, width):
        """_handle_long_word(chunks : [string],
                             cur_line : [string],
                             cur_len : int, width : int)

        Handle a chunk of text (most likely a word, not whitespace) that
        is too long to fit in any line.  The chunk in question is the
        last element of 'reversed_chunks'; both 'reversed_chunks' and
        'cur_line' are modified in place.
        """
        # Figure out when indent is larger than the specified width, and make
        # sure at least one character is stripped off on every pass
        if width < 1:
            space_left = 1
        else:
            space_left = width - cur_len

        # If we're allowed to break long words, then do so: put as much
        # of the next chunk onto the current line as will fit.
        if self.break_long_words:
            end = space_left
            chunk = reversed_chunks[-1]
            if self.break_on_hyphens and len(chunk) > space_left:
                # break after last hyphen, but only if there are
                # non-hyphens before it
                hyphen = chunk.rfind('-', 0, space_left)
                if hyphen > 0 and any(c != '-' for c in chunk[:hyphen]):
                    end = hyphen + 1
            cur_line.append(chunk[:end])
            reversed_chunks[-1] = chunk[end:]

        # Otherwise, we have to preserve the long word intact.  Only add
        # it to the current line if there's nothing already there --
        # that minimizes how much we violate the width constraint.
        elif not cur_line:
            cur_line.append(reversed_chunks.pop())

        # If we're not allowed to break long words, and there's already
        # text on the current line, do nothing.  Next time through the
        # main loop of _wrap_chunks(), we'll wind up here again, but
        # cur_len will be zero, so the next line will be entirely
        # devoted to the long word that we can't handle right now.

    def _wrap_chunks(self, chunks):
        """_wrap_chunks(chunks : [string]) -> [string]

        Wrap a sequence of text chunks and return a list of lines of
        length 'self.width' or less.  (If 'break_long_words' is false,
        some lines may be longer than this.)  Chunks correspond roughly
        to words and the whitespace between them: each chunk is
        indivisible (modulo 'break_long_words'), but a line break can
        come between any two chunks.  Chunks should not have internal
        whitespace; ie. a chunk is either all whitespace or a "word".
        Whitespace chunks will be removed from the beginning and end of
        lines, but apart from that whitespace is preserved.

        The 'chunks' list is consumed: it is reversed in place and
        chunks are popped from it as lines are built.

        Raises ValueError if 'self.width' is not positive, or if
        'max_lines' is set and the placeholder cannot fit on a line.
        """
        lines = []
        if self.width <= 0:
            raise ValueError("invalid width %r (must be > 0)" % self.width)
        if self.max_lines is not None:
            # The placeholder lands on the last permitted line; pick the
            # indent that line would get.
            if self.max_lines > 1:
                indent = self.subsequent_indent
            else:
                indent = self.initial_indent
            if len(indent) + len(self.placeholder.lstrip()) > self.width:
                raise ValueError("placeholder too large for max width")

        # Arrange in reverse order so items can be efficiently popped
        # from a stack of chunks.
        chunks.reverse()

        while chunks:

            # Start the list of chunks that will make up the current line.
            # cur_len is just the length of all the chunks in cur_line.
            cur_line = []
            cur_len = 0

            # Figure out which static string will prefix this line.
            if lines:
                indent = self.subsequent_indent
            else:
                indent = self.initial_indent

            # Maximum width for this line.
            width = self.width - len(indent)

            # First chunk on line is whitespace -- drop it, unless this
            # is the very beginning of the text (ie. no lines started yet).
            if self.drop_whitespace and chunks[-1].strip() == '' and lines:
                del chunks[-1]

            while chunks:
                chunk_len = len(chunks[-1])

                # Can at least squeeze this chunk onto the current line.
                if cur_len + chunk_len <= width:
                    cur_line.append(chunks.pop())
                    cur_len += chunk_len

                # Nope, this line is full.
                else:
                    break

            # The current line is full, and the next chunk is too big to
            # fit on *any* line (not just this one).
            if chunks and len(chunks[-1]) > width:
                self._handle_long_word(chunks, cur_line, cur_len, width)
                cur_len = sum(map(len, cur_line))

            # If the last chunk on this line is all whitespace, drop it.
            if self.drop_whitespace and cur_line and cur_line[-1].strip() == '':
                cur_len -= len(cur_line[-1])
                del cur_line[-1]

            if cur_line:
                # Emit the line as-is when there is no line limit, when
                # this is not yet the last permitted line, or when it is
                # the last permitted line but all remaining text (ignoring
                # one droppable whitespace chunk) already fits on it.
                if (self.max_lines is None or
                    len(lines) + 1 < self.max_lines or
                    (not chunks or
                     self.drop_whitespace and
                     len(chunks) == 1 and
                     not chunks[0].strip()) and cur_len <= width):
                    # Convert current line back to a string and store it in
                    # list of all lines (return value).
                    lines.append(indent + ''.join(cur_line))
                else:
                    # Truncation: peel chunks off the end of the line
                    # until the placeholder fits after a non-blank chunk.
                    while cur_line:
                        if (cur_line[-1].strip() and
                            cur_len + len(self.placeholder) <= width):
                            cur_line.append(self.placeholder)
                            lines.append(indent + ''.join(cur_line))
                            break
                        cur_len -= len(cur_line[-1])
                        del cur_line[-1]
                    else:
                        # Nothing on this line could host the placeholder.
                        # Try the end of the previous line; failing that,
                        # the placeholder gets a line of its own.
                        if lines:
                            prev_line = lines[-1].rstrip()
                            if (len(prev_line) + len(self.placeholder) <=
                                    self.width):
                                lines[-1] = prev_line + self.placeholder
                                # Leaves the outer 'while chunks' loop.
                                break
                        lines.append(indent + self.placeholder.lstrip())
                    # Output was truncated: stop processing chunks.
                    break

        return lines

    def _split_chunks(self, text):
        """_split_chunks(text : string) -> [string]

        Normalize whitespace in 'text' with _munge_whitespace() and
        split the result into chunks with _split().
        """
        text = self._munge_whitespace(text)
        return self._split(text)

    # -- Public interface ----------------------------------------------

    def wrap(self, text):
        """wrap(text : string) -> [string]

        Reformat the single paragraph in 'text' so it fits in lines of
        no more than 'self.width' columns, and return a list of wrapped
        lines.  Tabs in 'text' are expanded with string.expandtabs(),
        and all other whitespace characters (including newline) are
        converted to space.
        """
        chunks = self._split_chunks(text)
        if self.fix_sentence_endings:
            self._fix_sentence_endings(chunks)
        return self._wrap_chunks(chunks)

    def fill(self, text):
        """fill(text : string) -> string

        Reformat the single paragraph in 'text' to fit in lines of no
        more than 'self.width' columns, and return a new string
        containing the entire wrapped paragraph.
        """
        return "\n".join(self.wrap(text))
7db96d56Sopenharmony_ci
7db96d56Sopenharmony_ci
# -- Convenience interface ---------------------------------------------
7db96d56Sopenharmony_ci
def wrap(text, width=70, **kwargs):
    """Wrap a single paragraph of text, returning a list of wrapped lines.

    Reformat the single paragraph in 'text' so it fits in lines of no
    more than 'width' columns, and return a list of wrapped lines.  By
    default, tabs in 'text' are expanded with string.expandtabs(), and
    all other whitespace characters (including newline) are converted to
    space.  See TextWrapper class for available keyword args to customize
    wrapping behaviour.

    A fresh TextWrapper is built on every call from 'width' and
    'kwargs'.
    """
    w = TextWrapper(width=width, **kwargs)
    return w.wrap(text)
7db96d56Sopenharmony_ci
def fill(text, width=70, **kwargs):
    """Fill a single paragraph of text, returning a new string.

    Reformat the single paragraph in 'text' to fit in lines of no more
    than 'width' columns, and return a new string containing the entire
    wrapped paragraph.  As with wrap(), tabs are expanded and other
    whitespace characters converted to space.  See TextWrapper class for
    available keyword args to customize wrapping behaviour.

    A fresh TextWrapper is built on every call from 'width' and
    'kwargs'.
    """
    w = TextWrapper(width=width, **kwargs)
    return w.fill(text)
7db96d56Sopenharmony_ci
def shorten(text, width, **kwargs):
    """Collapse and truncate the given text to fit in the given width.

    The text first has its whitespace collapsed.  If it then fits in
    the *width*, it is returned as is.  Otherwise, as many words
    as possible are joined and then the placeholder is appended::

        >>> textwrap.shorten("Hello  world!", width=12)
        'Hello world!'
        >>> textwrap.shorten("Hello  world!", width=11)
        'Hello [...]'

    Remaining keyword arguments are passed to TextWrapper; 'max_lines'
    is always forced to 1.
    """
    w = TextWrapper(width=width, max_lines=1, **kwargs)
    # str.split() with no arguments already ignores leading and trailing
    # whitespace, so no separate strip() is needed before collapsing.
    return w.fill(' '.join(text.split()))
7db96d56Sopenharmony_ci
7db96d56Sopenharmony_ci
# -- Loosely related functionality -------------------------------------
7db96d56Sopenharmony_ci
# Matches lines that consist solely of spaces and/or tabs.
_whitespace_only_re = re.compile('^[ \t]+$', re.MULTILINE)
# Captures the leading spaces/tabs of every line that has some
# non-whitespace content.
_leading_whitespace_re = re.compile('(^[ \t]*)(?:[^ \t\n])', re.MULTILINE)

def dedent(text):
    """Remove any common leading whitespace from every line in `text`.

    This can be used to make triple-quoted strings line up with the left
    edge of the display, while still presenting them in the source code
    in indented form.

    Note that tabs and spaces are both treated as whitespace, but they
    are not equal: the lines "  hello" and "\\thello" are
    considered to have no common leading whitespace.

    Entirely blank lines are normalized to a newline character.
    """
    # Blank out whitespace-only lines first so they neither constrain
    # the margin nor keep their stray spaces/tabs.
    text = _whitespace_only_re.sub('', text)

    # Look for the longest leading string of spaces and tabs common to
    # all lines.
    margin = None
    for line_indent in _leading_whitespace_re.findall(text):
        if margin is None:
            margin = line_indent

        # Current line more deeply indented than previous winner:
        # no change (previous winner is still on top).
        elif line_indent.startswith(margin):
            pass

        # Current line consistent with and no deeper than previous winner:
        # it's the new winner.
        elif margin.startswith(line_indent):
            margin = line_indent

        # Find the largest common whitespace between current line and previous
        # winner.
        else:
            for i, (x, y) in enumerate(zip(margin, line_indent)):
                if x != y:
                    margin = margin[:i]
                    break

        # An empty margin can never grow again, so stop scanning.
        if not margin:
            break

    if margin:
        # margin contains only spaces and tabs, so it is safe to embed
        # in the pattern without escaping.
        text = re.sub(r'(?m)^' + margin, '', text)
    return text
7db96d56Sopenharmony_ci
7db96d56Sopenharmony_ci
def indent(text, prefix, predicate=None):
    """Adds 'prefix' to the beginning of selected lines in 'text'.

    If 'predicate' is provided, 'prefix' will only be added to the lines
    where 'predicate(line)' is True. If 'predicate' is not provided,
    it will default to adding 'prefix' to all non-empty lines that do not
    consist solely of whitespace characters.

    Each line is passed to 'predicate' with its line ending still
    attached, and line endings are preserved in the result.
    """
    if predicate is None:
        # Default rule: a line qualifies when something is left after
        # stripping whitespace.
        def predicate(line):
            return line.strip()

    # splitlines(True) keeps the line terminators, so joining the pieces
    # reproduces the original text apart from the inserted prefixes.
    return ''.join(
        prefix + line if predicate(line) else line
        for line in text.splitlines(True)
    )
7db96d56Sopenharmony_ci
7db96d56Sopenharmony_ci
if __name__ == "__main__":
    # Minimal manual smoke test: the first line has no indentation, so
    # dedent() has no common margin to remove and prints the text as is.
    print(dedent("Hello there.\n  This is indented."))