Commit 7c64aad9 authored by Terry Jan Reedy's avatar Terry Jan Reedy

Issue #18226: Add docstrings and unittests for idlelib/FormatParagraph.py.

Move comment code to a separate function so it can be separately tested.
Original patches by Todd Rovito and Phil Webster.
parent 056bafe7
# Extension to format a paragraph """Extension to format a paragraph or selection to a max width.
# Does basic, standard text formatting, and also understands Python Does basic, standard text formatting, and also understands Python
# comment blocks. Thus, for editing Python source code, this comment blocks. Thus, for editing Python source code, this
# extension is really only suitable for reformatting these comment extension is really only suitable for reformatting these comment
# blocks or triple-quoted strings. blocks or triple-quoted strings.
# Known problems with comment reformatting: Known problems with comment reformatting:
# * If there is a selection marked, and the first line of the * If there is a selection marked, and the first line of the
# selection is not complete, the block will probably not be detected selection is not complete, the block will probably not be detected
# as comments, and will have the normal "text formatting" rules as comments, and will have the normal "text formatting" rules
# applied. applied.
# * If a comment block has leading whitespace that mixes tabs and * If a comment block has leading whitespace that mixes tabs and
# spaces, they will not be considered part of the same block. spaces, they will not be considered part of the same block.
# * Fancy comments, like this bulleted list, arent handled :-) * Fancy comments, like this bulleted list, aren't handled :-)
"""
import re import re
from idlelib.configHandler import idleConf from idlelib.configHandler import idleConf
...@@ -32,42 +33,31 @@ class FormatParagraph: ...@@ -32,42 +33,31 @@ class FormatParagraph:
self.editwin = None self.editwin = None
def format_paragraph_event(self, event): def format_paragraph_event(self, event):
maxformatwidth = int(idleConf.GetOption('main', 'FormatParagraph', """Formats paragraph to a max width specified in idleConf.
'paragraph', type='int'))
If text is selected, format_paragraph_event will start breaking lines
at the max width, starting from the beginning selection.
If no text is selected, format_paragraph_event uses the current
cursor location to determine the paragraph (lines of text surrounded
by blank lines) and formats it.
"""
maxformatwidth = idleConf.GetOption(
'main', 'FormatParagraph', 'paragraph', type='int')
text = self.editwin.text text = self.editwin.text
first, last = self.editwin.get_selection_indices() first, last = self.editwin.get_selection_indices()
if first and last: if first and last:
data = text.get(first, last) data = text.get(first, last)
comment_header = '' comment_header = get_comment_header(data)
else: else:
first, last, comment_header, data = \ first, last, comment_header, data = \
find_paragraph(text, text.index("insert")) find_paragraph(text, text.index("insert"))
if comment_header: if comment_header:
# Reformat the comment lines - convert to text sans header. newdata = reformat_comment(data, maxformatwidth, comment_header)
lines = data.split("\n")
lines = map(lambda st, l=len(comment_header): st[l:], lines)
data = "\n".join(lines)
# Reformat to maxformatwidth chars or a 20 char width,
# whichever is greater.
format_width = max(maxformatwidth - len(comment_header), 20)
newdata = reformat_paragraph(data, format_width)
# re-split and re-insert the comment header.
newdata = newdata.split("\n")
# If the block ends in a \n, we dont want the comment
# prefix inserted after it. (Im not sure it makes sense to
# reformat a comment block that isnt made of complete
# lines, but whatever!) Can't think of a clean solution,
# so we hack away
block_suffix = ""
if not newdata[-1]:
block_suffix = "\n"
newdata = newdata[:-1]
builder = lambda item, prefix=comment_header: prefix+item
newdata = '\n'.join(map(builder, newdata)) + block_suffix
else: else:
# Just a normal text format
newdata = reformat_paragraph(data, maxformatwidth) newdata = reformat_paragraph(data, maxformatwidth)
text.tag_remove("sel", "1.0", "end") text.tag_remove("sel", "1.0", "end")
if newdata != data: if newdata != data:
text.mark_set("insert", first) text.mark_set("insert", first)
text.undo_block_start() text.undo_block_start()
...@@ -80,31 +70,44 @@ class FormatParagraph: ...@@ -80,31 +70,44 @@ class FormatParagraph:
return "break" return "break"
def find_paragraph(text, mark): def find_paragraph(text, mark):
"""Returns the start/stop indices enclosing the paragraph that mark is in.
Also returns the comment format string, if any, and paragraph of text
between the start/stop indices.
"""
lineno, col = map(int, mark.split(".")) lineno, col = map(int, mark.split("."))
line = text.get("%d.0" % lineno, "%d.0 lineend" % lineno) line = text.get("%d.0" % lineno, "%d.end" % lineno)
# Look for start of next paragraph if the index passed in is a blank line
while text.compare("%d.0" % lineno, "<", "end") and is_all_white(line): while text.compare("%d.0" % lineno, "<", "end") and is_all_white(line):
lineno = lineno + 1 lineno = lineno + 1
line = text.get("%d.0" % lineno, "%d.0 lineend" % lineno) line = text.get("%d.0" % lineno, "%d.end" % lineno)
first_lineno = lineno first_lineno = lineno
comment_header = get_comment_header(line) comment_header = get_comment_header(line)
comment_header_len = len(comment_header) comment_header_len = len(comment_header)
# Once start line found, search for end of paragraph (a blank line)
while get_comment_header(line)==comment_header and \ while get_comment_header(line)==comment_header and \
not is_all_white(line[comment_header_len:]): not is_all_white(line[comment_header_len:]):
lineno = lineno + 1 lineno = lineno + 1
line = text.get("%d.0" % lineno, "%d.0 lineend" % lineno) line = text.get("%d.0" % lineno, "%d.end" % lineno)
last = "%d.0" % lineno last = "%d.0" % lineno
# Search back to beginning of paragraph
# Search back to beginning of paragraph (first blank line before)
lineno = first_lineno - 1 lineno = first_lineno - 1
line = text.get("%d.0" % lineno, "%d.0 lineend" % lineno) line = text.get("%d.0" % lineno, "%d.end" % lineno)
while lineno > 0 and \ while lineno > 0 and \
get_comment_header(line)==comment_header and \ get_comment_header(line)==comment_header and \
not is_all_white(line[comment_header_len:]): not is_all_white(line[comment_header_len:]):
lineno = lineno - 1 lineno = lineno - 1
line = text.get("%d.0" % lineno, "%d.0 lineend" % lineno) line = text.get("%d.0" % lineno, "%d.end" % lineno)
first = "%d.0" % (lineno+1) first = "%d.0" % (lineno+1)
return first, last, comment_header, text.get(first, last) return first, last, comment_header, text.get(first, last)
# This should perhaps be replaced with textwrap.wrap
def reformat_paragraph(data, limit): def reformat_paragraph(data, limit):
"""Return data reformatted to specified width (limit)."""
lines = data.split("\n") lines = data.split("\n")
i = 0 i = 0
n = len(lines) n = len(lines)
...@@ -139,13 +142,50 @@ def reformat_paragraph(data, limit): ...@@ -139,13 +142,50 @@ def reformat_paragraph(data, limit):
new.extend(lines[i:]) new.extend(lines[i:])
return "\n".join(new) return "\n".join(new)
def reformat_comment(data, limit, comment_header):
"""Return data reformatted to specified width with comment header."""
# Remove header from the comment lines
lc = len(comment_header)
data = "\n".join(line[lc:] for line in data.split("\n"))
# Reformat to maxformatwidth chars or a 20 char width,
# whichever is greater.
format_width = max(limit - len(comment_header), 20)
newdata = reformat_paragraph(data, format_width)
# re-split and re-insert the comment header.
newdata = newdata.split("\n")
# If the block ends in a \n, we dont want the comment prefix
# inserted after it. (Im not sure it makes sense to reformat a
# comment block that is not made of complete lines, but whatever!)
# Can't think of a clean solution, so we hack away
block_suffix = ""
if not newdata[-1]:
block_suffix = "\n"
newdata = newdata[:-1]
return '\n'.join(comment_header+line for line in newdata) + block_suffix
def is_all_white(line): def is_all_white(line):
"""Return True if line is empty or all whitespace."""
return re.match(r"^\s*$", line) is not None return re.match(r"^\s*$", line) is not None
def get_indent(line): def get_indent(line):
return re.match(r"^(\s*)", line).group() """Return the initial space or tab indent of line."""
return re.match(r"^([ \t]*)", line).group()
def get_comment_header(line): def get_comment_header(line):
m = re.match(r"^(\s*#*)", line) """Return string with leading whitespace and '#' from line or ''.
A null return indicates that the line is not a comment line. A non-
null return, such as ' #', will be used to find the other lines of
a comment block with the same indent.
"""
m = re.match(r"^([ \t]*#*)", line)
if m is None: return "" if m is None: return ""
return m.group(1) return m.group(1)
if __name__ == "__main__":
from test import support; support.use_resources = ['gui']
import unittest
unittest.main('idlelib.idle_test.test_formatparagraph',
verbosity=2, exit=False)
This diff is collapsed.
...@@ -212,6 +212,9 @@ C API ...@@ -212,6 +212,9 @@ C API
IDLE IDLE
---- ----
- Issue #18226: Add docstrings and unittests for FormatParagraph.py.
Original patches by Todd Rovito and Phil Webster.
- Issue #18279: Format - Strip trailing whitespace no longer marks a file as - Issue #18279: Format - Strip trailing whitespace no longer marks a file as
changed when it has not been changed. This fix followed the addition of a changed when it has not been changed. This fix followed the addition of a
test file originally written by Phil Webster (the issue's main goal). test file originally written by Phil Webster (the issue's main goal).
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment