| """Format all or a selected region (line slice) of text. |
| |
| Region formatting options: paragraph, comment block, indent, deindent, |
| comment, uncomment, tabify, and untabify. |
| |
| File renamed from paragraph.py with functions added from editor.py. |
| """ |
| import re |
| from tkinter.messagebox import askyesno |
| from tkinter.simpledialog import askinteger |
| from idlelib.config import idleConf |
| |
| |
| class FormatParagraph: |
| """Format a paragraph, comment block, or selection to a max width. |
| |
| Does basic, standard text formatting, and also understands Python |
| comment blocks. Thus, for editing Python source code, this |
| extension is really only suitable for reformatting these comment |
| blocks or triple-quoted strings. |
| |
| Known problems with comment reformatting: |
| * If there is a selection marked, and the first line of the |
| selection is not complete, the block will probably not be detected |
| as comments, and will have the normal "text formatting" rules |
| applied. |
| * If a comment block has leading whitespace that mixes tabs and |
| spaces, they will not be considered part of the same block. |
| * Fancy comments, like this bulleted list, aren't handled :-) |
| """ |
| def __init__(self, editwin): |
| self.editwin = editwin |
| |
| @classmethod |
| def reload(cls): |
| cls.max_width = idleConf.GetOption('extensions', 'FormatParagraph', |
| 'max-width', type='int', default=72) |
| |
| def close(self): |
| self.editwin = None |
| |
| def format_paragraph_event(self, event, limit=None): |
| """Formats paragraph to a max width specified in idleConf. |
| |
| If text is selected, format_paragraph_event will start breaking lines |
| at the max width, starting from the beginning selection. |
| |
| If no text is selected, format_paragraph_event uses the current |
| cursor location to determine the paragraph (lines of text surrounded |
| by blank lines) and formats it. |
| |
| The length limit parameter is for testing with a known value. |
| """ |
| limit = self.max_width if limit is None else limit |
| text = self.editwin.text |
| first, last = self.editwin.get_selection_indices() |
| if first and last: |
| data = text.get(first, last) |
| comment_header = get_comment_header(data) |
| else: |
| first, last, comment_header, data = \ |
| find_paragraph(text, text.index("insert")) |
| if comment_header: |
| newdata = reformat_comment(data, limit, comment_header) |
| else: |
| newdata = reformat_paragraph(data, limit) |
| text.tag_remove("sel", "1.0", "end") |
| |
| if newdata != data: |
| text.mark_set("insert", first) |
| text.undo_block_start() |
| text.delete(first, last) |
| text.insert(first, newdata) |
| text.undo_block_stop() |
| else: |
| text.mark_set("insert", last) |
| text.see("insert") |
| return "break" |
| |
| |
| FormatParagraph.reload() |
| |
| def find_paragraph(text, mark): |
| """Returns the start/stop indices enclosing the paragraph that mark is in. |
| |
| Also returns the comment format string, if any, and paragraph of text |
| between the start/stop indices. |
| """ |
| lineno, col = map(int, mark.split(".")) |
| line = text.get("%d.0" % lineno, "%d.end" % lineno) |
| |
| # Look for start of next paragraph if the index passed in is a blank line |
| while text.compare("%d.0" % lineno, "<", "end") and is_all_white(line): |
| lineno = lineno + 1 |
| line = text.get("%d.0" % lineno, "%d.end" % lineno) |
| first_lineno = lineno |
| comment_header = get_comment_header(line) |
| comment_header_len = len(comment_header) |
| |
| # Once start line found, search for end of paragraph (a blank line) |
| while get_comment_header(line)==comment_header and \ |
| not is_all_white(line[comment_header_len:]): |
| lineno = lineno + 1 |
| line = text.get("%d.0" % lineno, "%d.end" % lineno) |
| last = "%d.0" % lineno |
| |
| # Search back to beginning of paragraph (first blank line before) |
| lineno = first_lineno - 1 |
| line = text.get("%d.0" % lineno, "%d.end" % lineno) |
| while lineno > 0 and \ |
| get_comment_header(line)==comment_header and \ |
| not is_all_white(line[comment_header_len:]): |
| lineno = lineno - 1 |
| line = text.get("%d.0" % lineno, "%d.end" % lineno) |
| first = "%d.0" % (lineno+1) |
| |
| return first, last, comment_header, text.get(first, last) |
| |
| # This should perhaps be replaced with textwrap.wrap |
| def reformat_paragraph(data, limit): |
| """Return data reformatted to specified width (limit).""" |
| lines = data.split("\n") |
| i = 0 |
| n = len(lines) |
| while i < n and is_all_white(lines[i]): |
| i = i+1 |
| if i >= n: |
| return data |
| indent1 = get_indent(lines[i]) |
| if i+1 < n and not is_all_white(lines[i+1]): |
| indent2 = get_indent(lines[i+1]) |
| else: |
| indent2 = indent1 |
| new = lines[:i] |
| partial = indent1 |
| while i < n and not is_all_white(lines[i]): |
| # XXX Should take double space after period (etc.) into account |
| words = re.split(r"(\s+)", lines[i]) |
| for j in range(0, len(words), 2): |
| word = words[j] |
| if not word: |
| continue # Can happen when line ends in whitespace |
| if len((partial + word).expandtabs()) > limit and \ |
| partial != indent1: |
| new.append(partial.rstrip()) |
| partial = indent2 |
| partial = partial + word + " " |
| if j+1 < len(words) and words[j+1] != " ": |
| partial = partial + " " |
| i = i+1 |
| new.append(partial.rstrip()) |
| # XXX Should reformat remaining paragraphs as well |
| new.extend(lines[i:]) |
| return "\n".join(new) |
| |
| def reformat_comment(data, limit, comment_header): |
| """Return data reformatted to specified width with comment header.""" |
| |
| # Remove header from the comment lines |
| lc = len(comment_header) |
| data = "\n".join(line[lc:] for line in data.split("\n")) |
| # Reformat to maxformatwidth chars or a 20 char width, |
| # whichever is greater. |
| format_width = max(limit - len(comment_header), 20) |
| newdata = reformat_paragraph(data, format_width) |
| # re-split and re-insert the comment header. |
| newdata = newdata.split("\n") |
| # If the block ends in a \n, we don't want the comment prefix |
| # inserted after it. (Im not sure it makes sense to reformat a |
| # comment block that is not made of complete lines, but whatever!) |
| # Can't think of a clean solution, so we hack away |
| block_suffix = "" |
| if not newdata[-1]: |
| block_suffix = "\n" |
| newdata = newdata[:-1] |
| return '\n'.join(comment_header+line for line in newdata) + block_suffix |
| |
| def is_all_white(line): |
| """Return True if line is empty or all whitespace.""" |
| |
| return re.match(r"^\s*$", line) is not None |
| |
| def get_indent(line): |
| """Return the initial space or tab indent of line.""" |
| return re.match(r"^([ \t]*)", line).group() |
| |
| def get_comment_header(line): |
| """Return string with leading whitespace and '#' from line or ''. |
| |
| A null return indicates that the line is not a comment line. A non- |
| null return, such as ' #', will be used to find the other lines of |
| a comment block with the same indent. |
| """ |
| m = re.match(r"^([ \t]*#*)", line) |
| if m is None: return "" |
| return m.group(1) |
| |
| |
| # Copied from editor.py; importing it would cause an import cycle. |
| _line_indent_re = re.compile(r'[ \t]*') |
| |
| def get_line_indent(line, tabwidth): |
| """Return a line's indentation as (# chars, effective # of spaces). |
| |
| The effective # of spaces is the length after properly "expanding" |
| the tabs into spaces, as done by str.expandtabs(tabwidth). |
| """ |
| m = _line_indent_re.match(line) |
| return m.end(), len(m.group().expandtabs(tabwidth)) |
| |
| |
| class FormatRegion: |
| "Format selected text (region)." |
| |
| def __init__(self, editwin): |
| self.editwin = editwin |
| |
| def get_region(self): |
| """Return line information about the selected text region. |
| |
| If text is selected, the first and last indices will be |
| for the selection. If there is no text selected, the |
| indices will be the current cursor location. |
| |
| Return a tuple containing (first index, last index, |
| string representation of text, list of text lines). |
| """ |
| text = self.editwin.text |
| first, last = self.editwin.get_selection_indices() |
| if first and last: |
| head = text.index(first + " linestart") |
| tail = text.index(last + "-1c lineend +1c") |
| else: |
| head = text.index("insert linestart") |
| tail = text.index("insert lineend +1c") |
| chars = text.get(head, tail) |
| lines = chars.split("\n") |
| return head, tail, chars, lines |
| |
| def set_region(self, head, tail, chars, lines): |
| """Replace the text between the given indices. |
| |
| Args: |
| head: Starting index of text to replace. |
| tail: Ending index of text to replace. |
| chars: Expected to be string of current text |
| between head and tail. |
| lines: List of new lines to insert between head |
| and tail. |
| """ |
| text = self.editwin.text |
| newchars = "\n".join(lines) |
| if newchars == chars: |
| text.bell() |
| return |
| text.tag_remove("sel", "1.0", "end") |
| text.mark_set("insert", head) |
| text.undo_block_start() |
| text.delete(head, tail) |
| text.insert(head, newchars) |
| text.undo_block_stop() |
| text.tag_add("sel", head, "insert") |
| |
| def indent_region_event(self, event=None): |
| "Indent region by indentwidth spaces." |
| head, tail, chars, lines = self.get_region() |
| for pos in range(len(lines)): |
| line = lines[pos] |
| if line: |
| raw, effective = get_line_indent(line, self.editwin.tabwidth) |
| effective = effective + self.editwin.indentwidth |
| lines[pos] = self.editwin._make_blanks(effective) + line[raw:] |
| self.set_region(head, tail, chars, lines) |
| return "break" |
| |
| def dedent_region_event(self, event=None): |
| "Dedent region by indentwidth spaces." |
| head, tail, chars, lines = self.get_region() |
| for pos in range(len(lines)): |
| line = lines[pos] |
| if line: |
| raw, effective = get_line_indent(line, self.editwin.tabwidth) |
| effective = max(effective - self.editwin.indentwidth, 0) |
| lines[pos] = self.editwin._make_blanks(effective) + line[raw:] |
| self.set_region(head, tail, chars, lines) |
| return "break" |
| |
| def comment_region_event(self, event=None): |
| """Comment out each line in region. |
| |
| ## is appended to the beginning of each line to comment it out. |
| """ |
| head, tail, chars, lines = self.get_region() |
| for pos in range(len(lines) - 1): |
| line = lines[pos] |
| lines[pos] = '##' + line |
| self.set_region(head, tail, chars, lines) |
| return "break" |
| |
| def uncomment_region_event(self, event=None): |
| """Uncomment each line in region. |
| |
| Remove ## or # in the first positions of a line. If the comment |
| is not in the beginning position, this command will have no effect. |
| """ |
| head, tail, chars, lines = self.get_region() |
| for pos in range(len(lines)): |
| line = lines[pos] |
| if not line: |
| continue |
| if line[:2] == '##': |
| line = line[2:] |
| elif line[:1] == '#': |
| line = line[1:] |
| lines[pos] = line |
| self.set_region(head, tail, chars, lines) |
| return "break" |
| |
| def tabify_region_event(self, event=None): |
| "Convert leading spaces to tabs for each line in selected region." |
| head, tail, chars, lines = self.get_region() |
| tabwidth = self._asktabwidth() |
| if tabwidth is None: |
| return |
| for pos in range(len(lines)): |
| line = lines[pos] |
| if line: |
| raw, effective = get_line_indent(line, tabwidth) |
| ntabs, nspaces = divmod(effective, tabwidth) |
| lines[pos] = '\t' * ntabs + ' ' * nspaces + line[raw:] |
| self.set_region(head, tail, chars, lines) |
| return "break" |
| |
| def untabify_region_event(self, event=None): |
| "Expand tabs to spaces for each line in region." |
| head, tail, chars, lines = self.get_region() |
| tabwidth = self._asktabwidth() |
| if tabwidth is None: |
| return |
| for pos in range(len(lines)): |
| lines[pos] = lines[pos].expandtabs(tabwidth) |
| self.set_region(head, tail, chars, lines) |
| return "break" |
| |
| def _asktabwidth(self): |
| "Return value for tab width." |
| return askinteger( |
| "Tab width", |
| "Columns per tab? (2-16)", |
| parent=self.editwin.text, |
| initialvalue=self.editwin.indentwidth, |
| minvalue=2, |
| maxvalue=16) |
| |
| |
| class Indents: |
| "Change future indents." |
| |
| def __init__(self, editwin): |
| self.editwin = editwin |
| |
| def toggle_tabs_event(self, event): |
| editwin = self.editwin |
| usetabs = editwin.usetabs |
| if askyesno( |
| "Toggle tabs", |
| "Turn tabs " + ("on", "off")[usetabs] + |
| "?\nIndent width " + |
| ("will be", "remains at")[usetabs] + " 8." + |
| "\n Note: a tab is always 8 columns", |
| parent=editwin.text): |
| editwin.usetabs = not usetabs |
| # Try to prevent inconsistent indentation. |
| # User must change indent width manually after using tabs. |
| editwin.indentwidth = 8 |
| return "break" |
| |
| def change_indentwidth_event(self, event): |
| editwin = self.editwin |
| new = askinteger( |
| "Indent width", |
| "New indent width (2-16)\n(Always use 8 when using tabs)", |
| parent=editwin.text, |
| initialvalue=editwin.indentwidth, |
| minvalue=2, |
| maxvalue=16) |
| if new and new != editwin.indentwidth and not editwin.usetabs: |
| editwin.indentwidth = new |
| return "break" |
| |
| |
| class Rstrip: # 'Strip Trailing Whitespace" on "Format" menu. |
| def __init__(self, editwin): |
| self.editwin = editwin |
| |
| def do_rstrip(self, event=None): |
| text = self.editwin.text |
| undo = self.editwin.undo |
| undo.undo_block_start() |
| |
| end_line = int(float(text.index('end'))) |
| for cur in range(1, end_line): |
| txt = text.get('%i.0' % cur, '%i.end' % cur) |
| raw = len(txt) |
| cut = len(txt.rstrip()) |
| # Since text.delete() marks file as changed, even if not, |
| # only call it when needed to actually delete something. |
| if cut < raw: |
| text.delete('%i.%i' % (cur, cut), '%i.end' % cur) |
| |
| if (text.get('end-2c') == '\n' # File ends with at least 1 newline; |
| and not hasattr(self.editwin, 'interp')): # & is not Shell. |
| # Delete extra user endlines. |
| while (text.index('end-1c') > '1.0' # Stop if file empty. |
| and text.get('end-3c') == '\n'): |
| text.delete('end-3c') |
| # Because tk indexes are slice indexes and never raise, |
| # a file with only newlines will be emptied. |
| # patchcheck.py does the same. |
| |
| undo.undo_block_stop() |
| |
| |
| if __name__ == "__main__": |
| from unittest import main |
| main('idlelib.idle_test.test_format', verbosity=2, exit=False) |