| // Partial port of python's argparse module, version 3.9.0 (only wrap and fill functions): |
| // https://github.com/python/cpython/blob/v3.9.0b4/Lib/textwrap.py |
| |
| 'use strict' |
| |
| /* |
| * Text wrapping and filling. |
| */ |
| |
| // Copyright (C) 1999-2001 Gregory P. Ward. |
| // Copyright (C) 2002, 2003 Python Software Foundation. |
| // Copyright (C) 2020 argparse.js authors |
| // Originally written by Greg Ward <gward@python.net> |
| |
| // Hardcode the recognized whitespace characters to the US-ASCII |
| // whitespace characters. The main reason for doing this is that |
| // some Unicode spaces (like \u00a0) are non-breaking whitespaces. |
| // |
| // This less funky little regex just split on recognized spaces. E.g. |
| // "Hello there -- you goof-ball, use the -b option!" |
| // splits into |
| // Hello/ /there/ /--/ /you/ /goof-ball,/ /use/ /the/ /-b/ /option!/ |
| const wordsep_simple_re = /([\t\n\x0b\x0c\r ]+)/ |
| |
| class TextWrapper { |
| /* |
| * Object for wrapping/filling text. The public interface consists of |
| * the wrap() and fill() methods; the other methods are just there for |
| * subclasses to override in order to tweak the default behaviour. |
| * If you want to completely replace the main wrapping algorithm, |
| * you'll probably have to override _wrap_chunks(). |
| * |
| * Several instance attributes control various aspects of wrapping: |
| * width (default: 70) |
| * the maximum width of wrapped lines (unless break_long_words |
| * is false) |
| * initial_indent (default: "") |
| * string that will be prepended to the first line of wrapped |
| * output. Counts towards the line's width. |
| * subsequent_indent (default: "") |
| * string that will be prepended to all lines save the first |
| * of wrapped output; also counts towards each line's width. |
| * expand_tabs (default: true) |
| * Expand tabs in input text to spaces before further processing. |
| * Each tab will become 0 .. 'tabsize' spaces, depending on its position |
| * in its line. If false, each tab is treated as a single character. |
| * tabsize (default: 8) |
| * Expand tabs in input text to 0 .. 'tabsize' spaces, unless |
| * 'expand_tabs' is false. |
| * replace_whitespace (default: true) |
| * Replace all whitespace characters in the input text by spaces |
| * after tab expansion. Note that if expand_tabs is false and |
| * replace_whitespace is true, every tab will be converted to a |
| * single space! |
| * fix_sentence_endings (default: false) |
| * Ensure that sentence-ending punctuation is always followed |
| * by two spaces. Off by default because the algorithm is |
| * (unavoidably) imperfect. |
| * break_long_words (default: true) |
| * Break words longer than 'width'. If false, those words will not |
| * be broken, and some lines might be longer than 'width'. |
| * break_on_hyphens (default: true) |
| * Allow breaking hyphenated words. If true, wrapping will occur |
| * preferably on whitespaces and right after hyphens part of |
| * compound words. |
| * drop_whitespace (default: true) |
| * Drop leading and trailing whitespace from lines. |
| * max_lines (default: None) |
| * Truncate wrapped lines. |
| * placeholder (default: ' [...]') |
| * Append to the last line of truncated text. |
| */ |
| |
| constructor(options = {}) { |
| let { |
| width = 70, |
| initial_indent = '', |
| subsequent_indent = '', |
| expand_tabs = true, |
| replace_whitespace = true, |
| fix_sentence_endings = false, |
| break_long_words = true, |
| drop_whitespace = true, |
| break_on_hyphens = true, |
| tabsize = 8, |
| max_lines = undefined, |
| placeholder=' [...]' |
| } = options |
| |
| this.width = width |
| this.initial_indent = initial_indent |
| this.subsequent_indent = subsequent_indent |
| this.expand_tabs = expand_tabs |
| this.replace_whitespace = replace_whitespace |
| this.fix_sentence_endings = fix_sentence_endings |
| this.break_long_words = break_long_words |
| this.drop_whitespace = drop_whitespace |
| this.break_on_hyphens = break_on_hyphens |
| this.tabsize = tabsize |
| this.max_lines = max_lines |
| this.placeholder = placeholder |
| } |
| |
| |
| // -- Private methods ----------------------------------------------- |
| // (possibly useful for subclasses to override) |
| |
| _munge_whitespace(text) { |
| /* |
| * _munge_whitespace(text : string) -> string |
| * |
| * Munge whitespace in text: expand tabs and convert all other |
| * whitespace characters to spaces. Eg. " foo\\tbar\\n\\nbaz" |
| * becomes " foo bar baz". |
| */ |
| if (this.expand_tabs) { |
| text = text.replace(/\t/g, ' '.repeat(this.tabsize)) // not strictly correct in js |
| } |
| if (this.replace_whitespace) { |
| text = text.replace(/[\t\n\x0b\x0c\r]/g, ' ') |
| } |
| return text |
| } |
| |
| _split(text) { |
| /* |
| * _split(text : string) -> [string] |
| * |
| * Split the text to wrap into indivisible chunks. Chunks are |
| * not quite the same as words; see _wrap_chunks() for full |
| * details. As an example, the text |
| * Look, goof-ball -- use the -b option! |
| * breaks into the following chunks: |
| * 'Look,', ' ', 'goof-', 'ball', ' ', '--', ' ', |
| * 'use', ' ', 'the', ' ', '-b', ' ', 'option!' |
| * if break_on_hyphens is True, or in: |
| * 'Look,', ' ', 'goof-ball', ' ', '--', ' ', |
| * 'use', ' ', 'the', ' ', '-b', ' ', option!' |
| * otherwise. |
| */ |
| let chunks = text.split(wordsep_simple_re) |
| chunks = chunks.filter(Boolean) |
| return chunks |
| } |
| |
| _handle_long_word(reversed_chunks, cur_line, cur_len, width) { |
| /* |
| * _handle_long_word(chunks : [string], |
| * cur_line : [string], |
| * cur_len : int, width : int) |
| * |
| * Handle a chunk of text (most likely a word, not whitespace) that |
| * is too long to fit in any line. |
| */ |
| // Figure out when indent is larger than the specified width, and make |
| // sure at least one character is stripped off on every pass |
| let space_left |
| if (width < 1) { |
| space_left = 1 |
| } else { |
| space_left = width - cur_len |
| } |
| |
| // If we're allowed to break long words, then do so: put as much |
| // of the next chunk onto the current line as will fit. |
| if (this.break_long_words) { |
| cur_line.push(reversed_chunks[reversed_chunks.length - 1].slice(0, space_left)) |
| reversed_chunks[reversed_chunks.length - 1] = reversed_chunks[reversed_chunks.length - 1].slice(space_left) |
| |
| // Otherwise, we have to preserve the long word intact. Only add |
| // it to the current line if there's nothing already there -- |
| // that minimizes how much we violate the width constraint. |
| } else if (!cur_line) { |
| cur_line.push(...reversed_chunks.pop()) |
| } |
| |
| // If we're not allowed to break long words, and there's already |
| // text on the current line, do nothing. Next time through the |
| // main loop of _wrap_chunks(), we'll wind up here again, but |
| // cur_len will be zero, so the next line will be entirely |
| // devoted to the long word that we can't handle right now. |
| } |
| |
| _wrap_chunks(chunks) { |
| /* |
| * _wrap_chunks(chunks : [string]) -> [string] |
| * |
| * Wrap a sequence of text chunks and return a list of lines of |
| * length 'self.width' or less. (If 'break_long_words' is false, |
| * some lines may be longer than this.) Chunks correspond roughly |
| * to words and the whitespace between them: each chunk is |
| * indivisible (modulo 'break_long_words'), but a line break can |
| * come between any two chunks. Chunks should not have internal |
| * whitespace; ie. a chunk is either all whitespace or a "word". |
| * Whitespace chunks will be removed from the beginning and end of |
| * lines, but apart from that whitespace is preserved. |
| */ |
| let lines = [] |
| let indent |
| if (this.width <= 0) { |
| throw Error(`invalid width ${this.width} (must be > 0)`) |
| } |
| if (this.max_lines !== undefined) { |
| if (this.max_lines > 1) { |
| indent = this.subsequent_indent |
| } else { |
| indent = this.initial_indent |
| } |
| if (indent.length + this.placeholder.trimStart().length > this.width) { |
| throw Error('placeholder too large for max width') |
| } |
| } |
| |
| // Arrange in reverse order so items can be efficiently popped |
| // from a stack of chucks. |
| chunks = chunks.reverse() |
| |
| while (chunks.length > 0) { |
| |
| // Start the list of chunks that will make up the current line. |
| // cur_len is just the length of all the chunks in cur_line. |
| let cur_line = [] |
| let cur_len = 0 |
| |
| // Figure out which static string will prefix this line. |
| let indent |
| if (lines) { |
| indent = this.subsequent_indent |
| } else { |
| indent = this.initial_indent |
| } |
| |
| // Maximum width for this line. |
| let width = this.width - indent.length |
| |
| // First chunk on line is whitespace -- drop it, unless this |
| // is the very beginning of the text (ie. no lines started yet). |
| if (this.drop_whitespace && chunks[chunks.length - 1].trim() === '' && lines.length > 0) { |
| chunks.pop() |
| } |
| |
| while (chunks.length > 0) { |
| let l = chunks[chunks.length - 1].length |
| |
| // Can at least squeeze this chunk onto the current line. |
| if (cur_len + l <= width) { |
| cur_line.push(chunks.pop()) |
| cur_len += l |
| |
| // Nope, this line is full. |
| } else { |
| break |
| } |
| } |
| |
| // The current line is full, and the next chunk is too big to |
| // fit on *any* line (not just this one). |
| if (chunks.length && chunks[chunks.length - 1].length > width) { |
| this._handle_long_word(chunks, cur_line, cur_len, width) |
| cur_len = cur_line.map(l => l.length).reduce((a, b) => a + b, 0) |
| } |
| |
| // If the last chunk on this line is all whitespace, drop it. |
| if (this.drop_whitespace && cur_line.length > 0 && cur_line[cur_line.length - 1].trim() === '') { |
| cur_len -= cur_line[cur_line.length - 1].length |
| cur_line.pop() |
| } |
| |
| if (cur_line) { |
| if (this.max_lines === undefined || |
| lines.length + 1 < this.max_lines || |
| (chunks.length === 0 || |
| this.drop_whitespace && |
| chunks.length === 1 && |
| !chunks[0].trim()) && cur_len <= width) { |
| // Convert current line back to a string and store it in |
| // list of all lines (return value). |
| lines.push(indent + cur_line.join('')) |
| } else { |
| let had_break = false |
| while (cur_line) { |
| if (cur_line[cur_line.length - 1].trim() && |
| cur_len + this.placeholder.length <= width) { |
| cur_line.push(this.placeholder) |
| lines.push(indent + cur_line.join('')) |
| had_break = true |
| break |
| } |
| cur_len -= cur_line[-1].length |
| cur_line.pop() |
| } |
| if (!had_break) { |
| if (lines) { |
| let prev_line = lines[lines.length - 1].trimEnd() |
| if (prev_line.length + this.placeholder.length <= |
| this.width) { |
| lines[lines.length - 1] = prev_line + this.placeholder |
| break |
| } |
| } |
| lines.push(indent + this.placeholder.lstrip()) |
| } |
| break |
| } |
| } |
| } |
| |
| return lines |
| } |
| |
| _split_chunks(text) { |
| text = this._munge_whitespace(text) |
| return this._split(text) |
| } |
| |
| // -- Public interface ---------------------------------------------- |
| |
| wrap(text) { |
| /* |
| * wrap(text : string) -> [string] |
| * |
| * Reformat the single paragraph in 'text' so it fits in lines of |
| * no more than 'self.width' columns, and return a list of wrapped |
| * lines. Tabs in 'text' are expanded with string.expandtabs(), |
| * and all other whitespace characters (including newline) are |
| * converted to space. |
| */ |
| let chunks = this._split_chunks(text) |
| // not implemented in js |
| //if (this.fix_sentence_endings) { |
| // this._fix_sentence_endings(chunks) |
| //} |
| return this._wrap_chunks(chunks) |
| } |
| |
| fill(text) { |
| /* |
| * fill(text : string) -> string |
| * |
| * Reformat the single paragraph in 'text' to fit in lines of no |
| * more than 'self.width' columns, and return a new string |
| * containing the entire wrapped paragraph. |
| */ |
| return this.wrap(text).join('\n') |
| } |
| } |
| |
| |
| // -- Convenience interface --------------------------------------------- |
| |
| function wrap(text, options = {}) { |
| /* |
| * Wrap a single paragraph of text, returning a list of wrapped lines. |
| * |
| * Reformat the single paragraph in 'text' so it fits in lines of no |
| * more than 'width' columns, and return a list of wrapped lines. By |
| * default, tabs in 'text' are expanded with string.expandtabs(), and |
| * all other whitespace characters (including newline) are converted to |
| * space. See TextWrapper class for available keyword args to customize |
| * wrapping behaviour. |
| */ |
| let { width = 70, ...kwargs } = options |
| let w = new TextWrapper(Object.assign({ width }, kwargs)) |
| return w.wrap(text) |
| } |
| |
| function fill(text, options = {}) { |
| /* |
| * Fill a single paragraph of text, returning a new string. |
| * |
| * Reformat the single paragraph in 'text' to fit in lines of no more |
| * than 'width' columns, and return a new string containing the entire |
| * wrapped paragraph. As with wrap(), tabs are expanded and other |
| * whitespace characters converted to space. See TextWrapper class for |
| * available keyword args to customize wrapping behaviour. |
| */ |
| let { width = 70, ...kwargs } = options |
| let w = new TextWrapper(Object.assign({ width }, kwargs)) |
| return w.fill(text) |
| } |
| |
| // -- Loosely related functionality ------------------------------------- |
| |
| let _whitespace_only_re = /^[ \t]+$/mg |
| let _leading_whitespace_re = /(^[ \t]*)(?:[^ \t\n])/mg |
| |
| function dedent(text) { |
| /* |
| * Remove any common leading whitespace from every line in `text`. |
| * |
| * This can be used to make triple-quoted strings line up with the left |
| * edge of the display, while still presenting them in the source code |
| * in indented form. |
| * |
| * Note that tabs and spaces are both treated as whitespace, but they |
| * are not equal: the lines " hello" and "\\thello" are |
| * considered to have no common leading whitespace. |
| * |
| * Entirely blank lines are normalized to a newline character. |
| */ |
| // Look for the longest leading string of spaces and tabs common to |
| // all lines. |
| let margin = undefined |
| text = text.replace(_whitespace_only_re, '') |
| let indents = text.match(_leading_whitespace_re) || [] |
| for (let indent of indents) { |
| indent = indent.slice(0, -1) |
| |
| if (margin === undefined) { |
| margin = indent |
| |
| // Current line more deeply indented than previous winner: |
| // no change (previous winner is still on top). |
| } else if (indent.startsWith(margin)) { |
| // pass |
| |
| // Current line consistent with and no deeper than previous winner: |
| // it's the new winner. |
| } else if (margin.startsWith(indent)) { |
| margin = indent |
| |
| // Find the largest common whitespace between current line and previous |
| // winner. |
| } else { |
| for (let i = 0; i < margin.length && i < indent.length; i++) { |
| if (margin[i] !== indent[i]) { |
| margin = margin.slice(0, i) |
| break |
| } |
| } |
| } |
| } |
| |
| if (margin) { |
| text = text.replace(new RegExp('^' + margin, 'mg'), '') |
| } |
| return text |
| } |
| |
| module.exports = { wrap, fill, dedent } |