358 lines
13 KiB
Python
358 lines
13 KiB
Python
|
"""Format all or a selected region (line slice) of text.
|
||
|
|
||
|
Region formatting options: paragraph, comment block, indent, deindent,
|
||
|
comment, uncomment, tabify, and untabify.
|
||
|
|
||
|
File renamed from paragraph.py with functions added from editor.py.
|
||
|
"""
|
||
|
import re
|
||
|
from tkinter.simpledialog import askinteger
|
||
|
from idlelib.config import idleConf
|
||
|
|
||
|
|
||
|
class FormatParagraph:
    """Rewrap a paragraph, comment block, or selection to a maximum width.

    Plain text is reflowed with simple word wrapping, and blocks of
    Python comments are recognized and rewrapped with their comment
    prefix kept.  When editing Python source this is therefore mostly
    useful for comment blocks and triple-quoted strings.

    Known problems with comment reformatting:
    * If there is a selection and its first line is not complete, the
      block will probably not be detected as comments and the plain
      "text formatting" rules will be applied instead.
    * Lines of a comment block whose leading whitespace mixes tabs and
      spaces are not considered part of the same block.
    * Fancy comments, like this bulleted list, aren't handled :-)
    """

    def __init__(self, editwin):
        """Remember the editor window whose text will be formatted."""
        self.editwin = editwin

    @classmethod
    def reload(cls):
        """Set the class-wide max_width from the IDLE configuration.

        Reads the 'max-width' option of the 'FormatParagraph' section
        of the 'extensions' configuration, defaulting to 72.
        """
        cls.max_width = idleConf.GetOption(
            'extensions', 'FormatParagraph', 'max-width',
            type='int', default=72)

    def close(self):
        """Drop the reference to the editor window."""
        self.editwin = None

    def format_paragraph_event(self, event, limit=None):
        """Reformat the selection or the paragraph at the cursor.

        With a selection, the selected text is rewrapped starting from
        the beginning of the selection.  Without one, the paragraph
        (lines of text surrounded by blank lines) located from the
        insert cursor is rewrapped.

        limit overrides the configured max_width; it exists so tests
        can use a known value.  Always returns "break".
        """
        if limit is None:
            limit = self.max_width
        editwin = self.editwin
        text = editwin.text

        first, last = editwin.get_selection_indices()
        if not (first and last):
            # No selection: locate the paragraph from the cursor.
            first, last, comment_header, data = find_paragraph(
                text, text.index("insert"))
        else:
            data = text.get(first, last)
            comment_header = get_comment_header(data)

        newdata = (reformat_comment(data, limit, comment_header)
                   if comment_header
                   else reformat_paragraph(data, limit))
        text.tag_remove("sel", "1.0", "end")

        if newdata == data:
            # Nothing to rewrite; just move the cursor past the block.
            text.mark_set("insert", last)
        else:
            text.mark_set("insert", first)
            # Group the delete and insert between the undo block markers.
            text.undo_block_start()
            text.delete(first, last)
            text.insert(first, newdata)
            text.undo_block_stop()
        text.see("insert")
        return "break"
|
||
|
|
||
|
|
||
|
# Set FormatParagraph.max_width from the IDLE configuration at import time.
FormatParagraph.reload()
|
||
|
|
||
|
def find_paragraph(text, mark):
    """Locate the paragraph that contains (or follows) index mark.

    text is the text widget and mark a "line.column" index string.

    Return a tuple (first, last, comment_header, data): the start and
    stop indices enclosing the paragraph, the comment header shared by
    its lines (see get_comment_header), and the text between the two
    indices.
    """
    def line_at(number):
        # Contents of line `number`, without its trailing newline.
        return text.get("%d.0" % number, "%d.end" % number)

    def in_paragraph(content):
        # A line belongs to the paragraph when it carries the same
        # comment header and has something other than whitespace after it.
        return (get_comment_header(content) == comment_header
                and not is_all_white(content[header_len:]))

    lineno, _col = map(int, mark.split("."))
    line = line_at(lineno)

    # If mark is on a blank line, move down to the start of the next
    # paragraph (stopping at the end of the text).
    while text.compare("%d.0" % lineno, "<", "end") and is_all_white(line):
        lineno += 1
        line = line_at(lineno)
    first_lineno = lineno
    comment_header = get_comment_header(line)
    header_len = len(comment_header)

    # Scan forward to the line that ends the paragraph.
    while in_paragraph(line):
        lineno += 1
        line = line_at(lineno)
    last = "%d.0" % lineno

    # Scan backward to the line just before the paragraph begins.
    lineno = first_lineno - 1
    line = line_at(lineno)
    while lineno > 0 and in_paragraph(line):
        lineno -= 1
        line = line_at(lineno)
    first = "%d.0" % (lineno + 1)

    return first, last, comment_header, text.get(first, last)
|
||
|
|
||
|
# This should perhaps be replaced with textwrap.wrap
|
||
|
def reformat_paragraph(data, limit):
    """Return data with its first paragraph rewrapped to width limit.

    Leading blank lines are kept.  The first paragraph line keeps its
    own indent; wrapped lines use the indent of the paragraph's second
    line when it has one, otherwise the first line's indent.  Lines
    after the first paragraph are passed through unchanged.  If data
    contains only blank lines it is returned as is.
    """
    lines = data.split("\n")
    total = len(lines)

    # Skip any blank lines before the paragraph.
    pos = 0
    while pos < total and is_all_white(lines[pos]):
        pos += 1
    if pos >= total:
        return data

    first_indent = get_indent(lines[pos])
    has_second_line = pos + 1 < total and not is_all_white(lines[pos + 1])
    rest_indent = get_indent(lines[pos + 1]) if has_second_line else first_indent

    output = lines[:pos]
    current = first_indent
    while pos < total and not is_all_white(lines[pos]):
        # XXX Should take double space after period (etc.) into account
        # The split keeps separators: words sit at even positions and
        # the whitespace between them at odd positions.
        pieces = re.split(r"(\s+)", lines[pos])
        piece_count = len(pieces)
        for idx in range(0, piece_count, 2):
            word = pieces[idx]
            if not word:
                continue  # Can happen when line ends in whitespace
            # Wrap only when the current line already holds a word, so
            # an over-long first word is never preceded by an empty line.
            if (current != first_indent
                    and len((current + word).expandtabs()) > limit):
                output.append(current.rstrip())
                current = rest_indent
            current += word + " "
            # Any separator other than a single space gets a second space.
            if idx + 1 < piece_count and pieces[idx + 1] != " ":
                current += " "
        pos += 1
    output.append(current.rstrip())
    # XXX Should reformat remaining paragraphs as well
    output.extend(lines[pos:])
    return "\n".join(output)
|
||
|
|
||
|
def reformat_comment(data, limit, comment_header):
    """Return comment block data rewrapped to width limit.

    The first len(comment_header) characters are removed from every
    line, the remainder is rewrapped with reformat_paragraph, and
    comment_header is put back in front of each resulting line.
    """
    header_len = len(comment_header)

    # Strip the header from each comment line.
    stripped = "\n".join(row[header_len:] for row in data.split("\n"))

    # Wrap to the space left after the header, but never narrower
    # than 20 characters.
    width = max(limit - header_len, 20)
    wrapped = reformat_paragraph(stripped, width).split("\n")

    # If the block ends in a \n, we don't want the comment prefix
    # inserted after it.  (I'm not sure it makes sense to reformat a
    # comment block that is not made of complete lines, but whatever!)
    # Can't think of a clean solution, so we hack away.
    if wrapped[-1]:
        suffix = ""
    else:
        suffix = "\n"
        wrapped = wrapped[:-1]
    return '\n'.join(comment_header + row for row in wrapped) + suffix
|
||
|
|
||
|
def is_all_white(line):
    """Tell whether line is empty or consists only of whitespace."""
    blank = re.match(r"^\s*$", line)
    return blank is not None
|
||
|
|
||
|
def get_indent(line):
    """Return the run of spaces and tabs that line starts with."""
    # The pattern can match an empty prefix, so a match always exists.
    leading = re.match(r"^([ \t]*)", line)
    return leading.group()
|
||
|
|
||
|
def get_comment_header(line):
    """Return the leading whitespace and '#' characters of line.

    The result is the run of spaces and tabs at the start of line plus
    any '#' characters that immediately follow it, such as '    #' or
    '##'.  A line that starts with neither yields '', and an indented
    line without '#' yields just its indentation.  The result is used
    to find the other lines of a comment block with the same indent.
    """
    # Every part of the pattern is optional, so it matches any string
    # (possibly as an empty prefix); there is no "no match" case.
    return re.match(r"^([ \t]*#*)", line).group(1)
|
||
|
|
||
|
|
||
|
# Copy from editor.py; importing it would cause an import cycle.
_line_indent_re = re.compile(r'[ \t]*')


def get_line_indent(line, tabwidth):
    """Measure the indentation of line.

    Return a tuple (chars, columns): the number of leading space and
    tab characters, and the width of that indentation once its tabs
    are expanded as done by str.expandtabs(tabwidth).
    """
    leading = _line_indent_re.match(line).group()
    return len(leading), len(leading.expandtabs(tabwidth))
|
||
|
|
||
|
|
||
|
class FormatRegion:
    "Apply line-based formatting commands to the selected region."

    def __init__(self, editwin):
        "Remember the editor window whose text will be formatted."
        self.editwin = editwin

    def get_region(self):
        """Return line information about the region to format.

        With a selection, the region runs from the start of the line
        holding the selection start to just past the end of the line
        holding the selection's last character.  Without a selection
        it is the line containing the insert cursor.

        Return a tuple containing (first index, last index,
        string representation of text, list of text lines).
        """
        editwin = self.editwin
        text = editwin.text
        first, last = editwin.get_selection_indices()
        if first and last:
            start_spec = first + " linestart"
            stop_spec = last + "-1c lineend +1c"
        else:
            start_spec = "insert linestart"
            stop_spec = "insert lineend +1c"
        head = text.index(start_spec)
        tail = text.index(stop_spec)
        chars = text.get(head, tail)
        return head, tail, chars, chars.split("\n")

    def set_region(self, head, tail, chars, lines):
        """Replace the text between the given indices.

        If the new text equals chars, the widget's bell is rung and
        nothing is changed.  Otherwise the text is replaced and the
        inserted text is selected.

        Args:
            head: Starting index of text to replace.
            tail: Ending index of text to replace.
            chars: Expected to be string of current text
                between head and tail.
            lines: List of new lines to insert between head
                and tail.
        """
        replacement = "\n".join(lines)
        text = self.editwin.text
        if replacement == chars:
            text.bell()
            return
        text.tag_remove("sel", "1.0", "end")
        text.mark_set("insert", head)
        # Group the delete and insert between the undo block markers.
        text.undo_block_start()
        text.delete(head, tail)
        text.insert(head, replacement)
        text.undo_block_stop()
        text.tag_add("sel", head, "insert")

    def indent_region_event(self, event=None):
        "Indent each non-empty line of the region by indentwidth columns."
        head, tail, chars, lines = self.get_region()
        editwin = self.editwin
        for pos, line in enumerate(lines):
            if not line:
                continue
            raw, effective = get_line_indent(line, editwin.tabwidth)
            width = effective + editwin.indentwidth
            lines[pos] = editwin._make_blanks(width) + line[raw:]
        self.set_region(head, tail, chars, lines)
        return "break"

    def dedent_region_event(self, event=None):
        "Dedent each non-empty line of the region by indentwidth columns."
        head, tail, chars, lines = self.get_region()
        editwin = self.editwin
        for pos, line in enumerate(lines):
            if not line:
                continue
            raw, effective = get_line_indent(line, editwin.tabwidth)
            # Never dedent past the left margin.
            width = max(effective - editwin.indentwidth, 0)
            lines[pos] = editwin._make_blanks(width) + line[raw:]
        self.set_region(head, tail, chars, lines)
        return "break"

    def comment_region_event(self, event=None):
        """Comment out each line in region.

        ## is prepended to each line to comment it out.  The final
        element of the region's line list is left untouched.
        """
        head, tail, chars, lines = self.get_region()
        lines[:-1] = ['##' + line for line in lines[:-1]]
        self.set_region(head, tail, chars, lines)
        return "break"

    def uncomment_region_event(self, event=None):
        """Uncomment each line in region.

        Remove a leading ## or # from each line.  A comment marker
        that is not at the very start of the line is left alone.
        """
        head, tail, chars, lines = self.get_region()
        for pos, line in enumerate(lines):
            if line.startswith('##'):
                lines[pos] = line[2:]
            elif line.startswith('#'):
                lines[pos] = line[1:]
        self.set_region(head, tail, chars, lines)
        return "break"

    def tabify_region_event(self, event=None):
        """Convert leading spaces to tabs for each line in selected region.

        The tab width comes from _asktabwidth; if that returns None,
        nothing is changed and None is returned.
        """
        head, tail, chars, lines = self.get_region()
        tabwidth = self._asktabwidth()
        if tabwidth is None:
            return
        for pos, line in enumerate(lines):
            if not line:
                continue
            raw, effective = get_line_indent(line, tabwidth)
            ntabs, nspaces = divmod(effective, tabwidth)
            lines[pos] = '\t' * ntabs + ' ' * nspaces + line[raw:]
        self.set_region(head, tail, chars, lines)
        return "break"

    def untabify_region_event(self, event=None):
        """Expand tabs to spaces for each line in region.

        The tab width comes from _asktabwidth; if that returns None,
        nothing is changed and None is returned.
        """
        head, tail, chars, lines = self.get_region()
        tabwidth = self._asktabwidth()
        if tabwidth is None:
            return
        lines = [line.expandtabs(tabwidth) for line in lines]
        self.set_region(head, tail, chars, lines)
        return "break"

    def _asktabwidth(self):
        "Ask for the tab width (2-16 columns) and return the answer."
        editwin = self.editwin
        return askinteger(
            "Tab width",
            "Columns per tab? (2-16)",
            parent=editwin.text,
            initialvalue=editwin.indentwidth,
            minvalue=2,
            maxvalue=16)
|
||
|
|
||
|
|
||
|
if __name__ == "__main__":
    # Run this module's unit tests when executed as a script.
    import unittest
    unittest.main('idlelib.idle_test.test_format', verbosity=2, exit=False)
|