You can not select more than 25 topics
			Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
		
		
		
		
		
			
		
			
				
					441 lines
				
				17 KiB
			
		
		
			
		
	
	
					441 lines
				
				17 KiB
			| 
											3 years ago
// Partial port of Python's textwrap module, version 3.9.0 (wrap, fill and dedent functions only):
 | ||
|  | // https://github.com/python/cpython/blob/v3.9.0b4/Lib/textwrap.py
 | ||
|  | 
 | ||
|  | 'use strict' | ||
|  | 
 | ||
|  | /* | ||
|  |  * Text wrapping and filling. | ||
|  |  */ | ||
|  | 
 | ||
|  | // Copyright (C) 1999-2001 Gregory P. Ward.
 | ||
|  | // Copyright (C) 2002, 2003 Python Software Foundation.
 | ||
|  | // Copyright (C) 2020 argparse.js authors
 | ||
|  | // Originally written by Greg Ward <gward@python.net>
 | ||
|  | 
 | ||
|  | // Hardcode the recognized whitespace characters to the US-ASCII
 | ||
|  | // whitespace characters.  The main reason for doing this is that
 | ||
|  | // some Unicode spaces (like \u00a0) are non-breaking whitespaces.
 | ||
|  | //
 | ||
// This less funky little regex just splits on recognized whitespace. E.g.
 | ||
|  | //   "Hello there -- you goof-ball, use the -b option!"
 | ||
|  | // splits into
 | ||
|  | //   Hello/ /there/ /--/ /you/ /goof-ball,/ /use/ /the/ /-b/ /option!/
 | ||
const wordsep_simple_re = /([\t\n\x0b\x0c\r ]+)/

class TextWrapper {
    /*
     *  Object for wrapping/filling text.  The public interface consists of
     *  the wrap() and fill() methods; the other methods are just there for
     *  subclasses to override in order to tweak the default behaviour.
     *  If you want to completely replace the main wrapping algorithm,
     *  you'll probably have to override _wrap_chunks().
     *
     *  Several instance attributes control various aspects of wrapping:
     *    width (default: 70)
     *      the maximum width of wrapped lines (unless break_long_words
     *      is false)
     *    initial_indent (default: "")
     *      string that will be prepended to the first line of wrapped
     *      output.  Counts towards the line's width.
     *    subsequent_indent (default: "")
     *      string that will be prepended to all lines save the first
     *      of wrapped output; also counts towards each line's width.
     *    expand_tabs (default: true)
     *      Expand tabs in input text to spaces before further processing.
     *      Each tab will become 0 .. 'tabsize' spaces, depending on its position
     *      in its line.  If false, each tab is treated as a single character.
     *    tabsize (default: 8)
     *      Expand tabs in input text to 0 .. 'tabsize' spaces, unless
     *      'expand_tabs' is false.
     *    replace_whitespace (default: true)
     *      Replace all whitespace characters in the input text by spaces
     *      after tab expansion.  Note that if expand_tabs is false and
     *      replace_whitespace is true, every tab will be converted to a
     *      single space!
     *    fix_sentence_endings (default: false)
     *      Stored on the instance, but not implemented in this port:
     *      wrap() never adjusts sentence endings.
     *    break_long_words (default: true)
     *      Break words longer than 'width'.  If false, those words will not
     *      be broken, and some lines might be longer than 'width'.
     *    break_on_hyphens (default: true)
     *      Stored on the instance, but _split() in this port only ever
     *      splits on whitespace, so hyphenated words are never broken
     *      at the hyphen.
     *    drop_whitespace (default: true)
     *      Drop leading and trailing whitespace from lines.
     *    max_lines (default: undefined)
     *      Truncate wrapped lines.  undefined or null means "no limit".
     *    placeholder (default: ' [...]')
     *      Append to the last line of truncated text.
     */

    constructor(options = {}) {
        const {
            width = 70,
            initial_indent = '',
            subsequent_indent = '',
            expand_tabs = true,
            replace_whitespace = true,
            fix_sentence_endings = false,
            break_long_words = true,
            drop_whitespace = true,
            break_on_hyphens = true,
            tabsize = 8,
            max_lines = undefined,
            placeholder = ' [...]'
        } = options

        this.width = width
        this.initial_indent = initial_indent
        this.subsequent_indent = subsequent_indent
        this.expand_tabs = expand_tabs
        this.replace_whitespace = replace_whitespace
        this.fix_sentence_endings = fix_sentence_endings
        this.break_long_words = break_long_words
        this.drop_whitespace = drop_whitespace
        this.break_on_hyphens = break_on_hyphens
        this.tabsize = tabsize
        this.max_lines = max_lines
        this.placeholder = placeholder
    }


    // -- Private methods -----------------------------------------------
    // (possibly useful for subclasses to override)

    _munge_whitespace(text) {
        /*
         *  _munge_whitespace(text : string) -> string
         *
         *  Munge whitespace in text: expand tabs and convert all other
         *  whitespace characters to spaces.  Eg. " foo\tbar\n\nbaz"
         *  becomes " foo    bar  baz".
         */
        if (this.expand_tabs) {
            // Column-aware expansion (like Python's str.expandtabs): each tab
            // pads to the next multiple of tabsize; the column counter restarts
            // after a line break.  A tabsize <= 0 simply removes tabs.
            const tabsize = this.tabsize
            let column = 0
            let expanded = ''
            for (const ch of text) {
                if (ch === '\t') {
                    if (tabsize > 0) {
                        const pad = tabsize - (column % tabsize)
                        expanded += ' '.repeat(pad)
                        column += pad
                    }
                } else {
                    expanded += ch
                    column = (ch === '\n' || ch === '\r') ? 0 : column + 1
                }
            }
            text = expanded
        }
        if (this.replace_whitespace) {
            text = text.replace(/[\t\n\x0b\x0c\r]/g, ' ')
        }
        return text
    }

    _split(text) {
        /*
         *  _split(text : string) -> [string]
         *
         *  Split the text to wrap into indivisible chunks.  Chunks are
         *  not quite the same as words; see _wrap_chunks() for full
         *  details.  This port only splits on runs of whitespace, so
         *  the text
         *    Look, goof-ball -- use the -b option!
         *  breaks into the following chunks:
         *    'Look,', ' ', 'goof-ball', ' ', '--', ' ',
         *    'use', ' ', 'the', ' ', '-b', ' ', 'option!'
         *  Empty chunks produced by the split are discarded.
         */
        return text.split(wordsep_simple_re).filter(Boolean)
    }

    _handle_long_word(reversed_chunks, cur_line, cur_len, width) {
        /*
         *  _handle_long_word(chunks : [string],
         *                    cur_line : [string],
         *                    cur_len : int, width : int)
         *
         *  Handle a chunk of text (most likely a word, not whitespace) that
         *  is too long to fit in any line.  Mutates both 'reversed_chunks'
         *  (the stack of pending chunks, next chunk last) and 'cur_line'.
         */
        // Figure out when indent is larger than the specified width, and make
        // sure at least one character is stripped off on every pass
        const space_left = width < 1 ? 1 : width - cur_len
        const top = reversed_chunks.length - 1

        if (this.break_long_words) {
            // If we're allowed to break long words, then do so: put as much
            // of the next chunk onto the current line as will fit.
            const word = reversed_chunks[top]
            cur_line.push(word.slice(0, space_left))
            reversed_chunks[top] = word.slice(space_left)
        } else if (cur_line.length === 0) {
            // Otherwise, we have to preserve the long word intact.  Only add
            // it to the current line if there's nothing already there --
            // that minimizes how much we violate the width constraint.
            cur_line.push(reversed_chunks.pop())
        }

        // If we're not allowed to break long words, and there's already
        // text on the current line, do nothing.  Next time through the
        // main loop of _wrap_chunks(), we'll wind up here again, but
        // cur_len will be zero, so the next line will be entirely
        // devoted to the long word that we can't handle right now.
    }

    _wrap_chunks(chunks) {
        /*
         *  _wrap_chunks(chunks : [string]) -> [string]
         *
         *  Wrap a sequence of text chunks and return a list of lines of
         *  length 'this.width' or less.  (If 'break_long_words' is false,
         *  some lines may be longer than this.)  Chunks correspond roughly
         *  to words and the whitespace between them: each chunk is
         *  indivisible (modulo 'break_long_words'), but a line break can
         *  come between any two chunks.  Chunks should not have internal
         *  whitespace; ie. a chunk is either all whitespace or a "word".
         *  Whitespace chunks will be removed from the beginning and end of
         *  lines, but apart from that whitespace is preserved.
         *
         *  The 'chunks' array is reversed in place and consumed.
         *
         *  Throws Error if 'width' is not positive, or if 'max_lines' is set
         *  and the placeholder cannot fit on a line.
         */
        const lines = []
        if (this.width <= 0) {
            throw new Error(`invalid width ${this.width} (must be > 0)`)
        }
        const unlimited = this.max_lines == null
        if (!unlimited) {
            // The placeholder lands on the last permitted line; make sure it
            // fits next to whichever indent that line will carry.
            const last_indent = this.max_lines > 1 ? this.subsequent_indent : this.initial_indent
            if (last_indent.length + this.placeholder.trimStart().length > this.width) {
                throw new Error('placeholder too large for max width')
            }
        }

        // Arrange in reverse order so items can be efficiently popped
        // from a stack of chunks.
        chunks.reverse()

        while (chunks.length > 0) {
            // Start the list of chunks that will make up the current line.
            // cur_len is just the length of all the chunks in cur_line.
            const cur_line = []
            let cur_len = 0

            // Figure out which static string will prefix this line.
            const indent = lines.length > 0 ? this.subsequent_indent : this.initial_indent

            // Maximum width for this line.
            const width = this.width - indent.length

            // First chunk on line is whitespace -- drop it, unless this
            // is the very beginning of the text (ie. no lines started yet).
            if (this.drop_whitespace && lines.length > 0 && chunks[chunks.length - 1].trim() === '') {
                chunks.pop()
            }

            while (chunks.length > 0) {
                const l = chunks[chunks.length - 1].length

                // Nope, this line is full.
                if (cur_len + l > width) {
                    break
                }

                // Can at least squeeze this chunk onto the current line.
                cur_line.push(chunks.pop())
                cur_len += l
            }

            // The current line is full, and the next chunk is too big to
            // fit on *any* line (not just this one).
            if (chunks.length > 0 && chunks[chunks.length - 1].length > width) {
                this._handle_long_word(chunks, cur_line, cur_len, width)
                cur_len = cur_line.reduce((total, chunk) => total + chunk.length, 0)
            }

            // If the last chunk on this line is all whitespace, drop it.
            if (this.drop_whitespace && cur_line.length > 0 && cur_line[cur_line.length - 1].trim() === '') {
                cur_len -= cur_line[cur_line.length - 1].length
                cur_line.pop()
            }

            // Nothing ended up on this line (e.g. only whitespace was
            // consumed): do not emit an empty line.
            if (cur_line.length === 0) {
                continue
            }

            const nothing_left = chunks.length === 0 ||
                (this.drop_whitespace && chunks.length === 1 && !chunks[0].trim())

            if (unlimited ||
                lines.length + 1 < this.max_lines ||
                (nothing_left && cur_len <= width)) {
                // Convert current line back to a string and store it in
                // list of all lines (return value).
                lines.push(indent + cur_line.join(''))
                continue
            }

            // This is the last permitted line and text remains: strip chunks
            // off its end until the placeholder fits after a non-blank chunk.
            let placed = false
            while (cur_line.length > 0) {
                const last = cur_line[cur_line.length - 1]
                if (last.trim() && cur_len + this.placeholder.length <= width) {
                    cur_line.push(this.placeholder)
                    lines.push(indent + cur_line.join(''))
                    placed = true
                    break
                }
                cur_len -= last.length
                cur_line.pop()
            }
            if (!placed) {
                // Nothing on this line can host the placeholder; try the end
                // of the previous line, else give it a line of its own.
                if (lines.length > 0) {
                    const prev_line = lines[lines.length - 1].trimEnd()
                    if (prev_line.length + this.placeholder.length <= this.width) {
                        lines[lines.length - 1] = prev_line + this.placeholder
                        break
                    }
                }
                lines.push(indent + this.placeholder.trimStart())
            }
            break
        }

        return lines
    }

    _split_chunks(text) {
        /*
         *  _split_chunks(text : string) -> [string]
         *
         *  Normalize whitespace with _munge_whitespace() and split the
         *  result into chunks with _split().
         */
        return this._split(this._munge_whitespace(text))
    }

    // -- Public interface ----------------------------------------------

    wrap(text) {
        /*
         *  wrap(text : string) -> [string]
         *
         *  Reformat the single paragraph in 'text' so it fits in lines of
         *  no more than 'this.width' columns, and return a list of wrapped
         *  lines.  Tabs in 'text' are expanded (when 'expand_tabs' is set)
         *  and all other whitespace characters (including newline) are
         *  converted to space (when 'replace_whitespace' is set).
         *
         *  'fix_sentence_endings' is not implemented in this port and is
         *  ignored here.
         */
        return this._wrap_chunks(this._split_chunks(text))
    }

    fill(text) {
        /*
         *  fill(text : string) -> string
         *
         *  Reformat the single paragraph in 'text' to fit in lines of no
         *  more than 'this.width' columns, and return a new string
         *  containing the entire wrapped paragraph.
         */
        return this.wrap(text).join('\n')
    }
}
|  | 
 | ||
|  | 
 | ||
|  | // -- Convenience interface ---------------------------------------------
 | ||
|  | 
 | ||
function wrap(text, options = {}) {
    /*
     *  Wrap a single paragraph of text, returning a list of wrapped lines.
     *
     *  Reformat the single paragraph in 'text' so it fits in lines of no
     *  more than 'width' columns (default: 70), and return a list of
     *  wrapped lines.  'options' is passed unchanged to the TextWrapper
     *  constructor; see the TextWrapper class for the available options
     *  to customize wrapping behaviour.
     */
    // TextWrapper's constructor already defaults 'width' to 70, so the
    // options object can be forwarded as-is.
    return new TextWrapper(options).wrap(text)
}
|  | 
 | ||
function fill(text, options = {}) {
    /*
     *  Fill a single paragraph of text, returning a new string.
     *
     *  Reformat the single paragraph in 'text' to fit in lines of no more
     *  than 'width' columns (default: 70), and return a new string
     *  containing the entire wrapped paragraph, with lines joined by '\n'.
     *  'options' is passed unchanged to the TextWrapper constructor; see
     *  the TextWrapper class for the available options to customize
     *  wrapping behaviour.
     */
    // TextWrapper's constructor already defaults 'width' to 70, so the
    // options object can be forwarded as-is.
    return new TextWrapper(options).fill(text)
}
|  | 
 | ||
|  | // -- Loosely related functionality -------------------------------------
 | ||
|  | 
 | ||
// Lines consisting solely of spaces and tabs.
const _whitespace_only_re = /^[ \t]+$/mg
// Leading run of spaces/tabs on a line, plus the first non-blank character
// that follows it (that character is part of the overall match).
const _leading_whitespace_re = /(^[ \t]*)(?:[^ \t\n])/mg

function dedent(text) {
    /*
     *  Remove any common leading whitespace from every line in `text`.
     *
     *  This can be used to make multi-line strings line up with the left
     *  edge of the display, while still presenting them in the source code
     *  in indented form.
     *
     *  Note that tabs and spaces are both treated as whitespace, but they
     *  are not equal: the lines "  hello" and "\thello" are
     *  considered to have no common leading whitespace.
     *
     *  Lines that contain only spaces and tabs are emptied before the
     *  common margin is computed.
     *
     *  dedent(text : string) -> string
     */
    // Look for the longest leading string of spaces and tabs common to
    // all lines.
    let margin
    text = text.replace(_whitespace_only_re, '')
    const matches = text.match(_leading_whitespace_re) || []
    for (const matched of matches) {
        // Each match ends with the first non-blank character of its line;
        // strip it to keep only the indentation.
        const indent = matched.slice(0, -1)

        if (margin === undefined) {
            margin = indent

        // Current line more deeply indented than previous winner:
        // no change (previous winner is still on top).
        } else if (indent.startsWith(margin)) {
            // pass

        // Current line consistent with and no deeper than previous winner:
        // it's the new winner.
        } else if (margin.startsWith(indent)) {
            margin = indent

        // Find the largest common whitespace between current line and previous
        // winner.
        } else {
            for (let i = 0; i < margin.length && i < indent.length; i++) {
                if (margin[i] !== indent[i]) {
                    margin = margin.slice(0, i)
                    break
                }
            }
        }
    }

    // margin only ever contains spaces and tabs, so it is safe to embed in
    // a regular expression without escaping.
    if (margin) {
        text = text.replace(new RegExp('^' + margin, 'mg'), '')
    }
    return text
}
|  | 
 | ||
// Public API: the convenience wrappers and dedent (TextWrapper itself is not exported).
module.exports = { wrap, fill, dedent }