blob: c1bc769c22eed805ca19a9ae848ac7418cf251c4 [file] [log] [blame]
# Extension to format a paragraph

# Does basic, standard text formatting, and also understands Python
# comment blocks.  Thus, for editing Python source code, this
# extension is really only suitable for reformatting these comment
# blocks or triple-quoted strings.
7
# Known problems with comment reformatting:
# * If there is a selection marked, and the first line of the
#   selection is not complete, the block will probably not be detected
#   as comments, and will have the normal "text formatting" rules
#   applied.
# * If a comment block has leading whitespace that mixes tabs and
#   spaces, they will not be considered part of the same block.
# * Fancy comments, like this bulleted list, aren't handled :-)
16
Guido van Rossum94e82ce1999-01-04 13:04:54 +000017import re
18
class FormatParagraph:
    """Editor extension that re-wraps the paragraph or comment block at the cursor.

    The class-level tables associate the ``<<format-paragraph>>`` virtual
    event with a menu entry and with key sequences.  They are presumably
    read by the host editor's extension loader, which is not part of this
    file.
    """

    # Menu entry: (menu name, [(label, virtual event), ...]).
    menudefs = [
        ('edit', [
            ('Format Paragraph', '<<format-paragraph>>'),
        ])
    ]

    # Default key sequence for the virtual event.
    keydefs = {
        '<<format-paragraph>>': ['<Alt-q>'],
    }

    # Key sequence table named for Unix platforms.
    unix_keydefs = {
        '<<format-paragraph>>': ['<Meta-q>'],
    }

    def __init__(self, editwin):
        """Remember the editor window whose text widget will be reformatted."""
        self.editwin = editwin

    def close(self):
        """Drop the reference to the editor window."""
        self.editwin = None

    def format_paragraph_event(self, event):
        """Re-wrap the selection, or the paragraph at the insert cursor.

        With a selection, the selected text is wrapped as plain text.
        Without one, find_paragraph() locates the paragraph around the
        cursor; if its lines share a comment header (leading whitespace
        plus '#' characters) the header is removed, the text is wrapped
        to max(70 - len(header), 20) columns and the header is put back
        on every line.

        The widget is modified only when the wrapped text differs from
        what is already there; otherwise the cursor just moves to the end
        of the region.  *event* is not used.
        """
        text = self.editwin.text
        first, last = self.editwin.get_selection_indices()
        if first and last:
            data = text.get(first, last)
            comment_header = ''
        else:
            first, last, comment_header, data = \
                    find_paragraph(text, text.index("insert"))
        if comment_header:
            # Reformat the comment lines - convert to text sans header.
            # `data` itself is left untouched so that the change check
            # below compares like with like (header-prefixed text on both
            # sides) and an already-formatted block is not rewritten.
            header_len = len(comment_header)
            stripped = "\n".join(
                [line[header_len:] for line in data.split("\n")])
            # Reformat to 70 chars or a 20 char width, whichever is greater.
            format_width = max(70 - header_len, 20)
            wrapped = reformat_paragraph(stripped, format_width).split("\n")
            # If the block ends in a newline, the split leaves a trailing
            # empty item; the comment prefix must not be inserted after
            # that final newline, so peel it off and re-append it below.
            block_suffix = ""
            if not wrapped[-1]:
                block_suffix = "\n"
                wrapped = wrapped[:-1]
            newdata = "\n".join(
                [comment_header + line for line in wrapped]) + block_suffix
        else:
            # Just a normal text format
            newdata = reformat_paragraph(data)
        text.tag_remove("sel", "1.0", "end")
        if newdata != data:
            text.mark_set("insert", first)
            # Group delete + insert so they undo as a single step.
            text.undo_block_start()
            text.delete(first, last)
            text.insert(first, newdata)
            text.undo_block_stop()
        else:
            text.mark_set("insert", last)
        text.see("insert")
84
def find_paragraph(text, mark):
    """Find the paragraph at or after index *mark* in a Tk-style text widget.

    *mark* is a "line.column" index string; only the line number is used.
    Blank lines at the starting position are skipped forward.  The
    paragraph is then the maximal run of consecutive lines that all have
    the same comment header (see get_comment_header) as the first
    non-blank line and are not blank after that header.

    Returns a tuple (first, last, comment_header, data) where *first* and
    *last* are "N.0" indices delimiting the paragraph (*last* is the start
    of the line following it) and *data* is the text between them.
    """
    lineno, _column = map(int, mark.split("."))

    def fetch(number):
        # Contents of one line, without its trailing newline.
        return text.get("%d.0" % number, "%d.0 lineend" % number)

    # Skip blank lines until some content or the end of the buffer.
    line = fetch(lineno)
    while text.compare("%d.0" % lineno, "<", "end") and is_all_white(line):
        lineno += 1
        line = fetch(lineno)
    first_lineno = lineno

    comment_header = get_comment_header(line)
    comment_header_len = len(comment_header)

    def in_paragraph(candidate):
        # Same header as the first line and something after the header.
        if get_comment_header(candidate) != comment_header:
            return False
        return not is_all_white(candidate[comment_header_len:])

    # Scan forward to the first line that is not part of the paragraph.
    while in_paragraph(line):
        lineno += 1
        line = fetch(lineno)
    last = "%d.0" % lineno

    # Search back to beginning of paragraph
    lineno = first_lineno - 1
    line = fetch(lineno)
    while lineno > 0 and in_paragraph(line):
        lineno -= 1
        line = fetch(lineno)
    first = "%d.0" % (lineno + 1)

    return first, last, comment_header, text.get(first, last)
Guido van Rossum94e82ce1999-01-04 13:04:54 +0000109
def reformat_paragraph(data, limit=70):
    """Return *data* with its first paragraph re-wrapped to *limit* columns.

    Leading blank lines are kept as they are.  The first run of non-blank
    lines is re-flowed: the first output line keeps the indentation of the
    paragraph's first line, and all following output lines use the
    indentation of its second line (or of the first line when there is no
    second one).  Line width is measured after tab expansion.  Everything
    after that paragraph is copied through unchanged.  If *data* holds
    only blank lines it is returned as is.

    Words are joined with one space; when the whitespace that followed a
    word in the input was anything other than a single space, two spaces
    are used instead.
    """
    lines = data.split("\n")
    i = 0
    n = len(lines)
    # Skip leading blank lines.
    while i < n and is_all_white(lines[i]):
        i = i+1
    if i >= n:
        return data
    indent1 = get_indent(lines[i])
    if i+1 < n and not is_all_white(lines[i+1]):
        indent2 = get_indent(lines[i+1])
    else:
        indent2 = indent1
    new = lines[:i]
    partial = indent1
    while i < n and not is_all_white(lines[i]):
        # XXX Should take double space after period (etc.) into account
        # The capturing group keeps the separators, so even indexes hold
        # words and odd indexes hold the whitespace that followed them.
        # Raw string: "\s" in a plain literal is an invalid escape sequence.
        words = re.split(r"(\s+)", lines[i])
        for j in range(0, len(words), 2):
            word = words[j]
            if not word:
                continue # Can happen when line ends in whitespace
            # Start a new output line when the word does not fit, unless
            # the current line holds nothing but the first-line indent.
            if len((partial + word).expandtabs()) > limit and \
               partial != indent1:
                new.append(partial.rstrip())
                partial = indent2
            partial = partial + word + " "
            if j+1 < len(words) and words[j+1] != " ":
                partial = partial + " "
        i = i+1
    new.append(partial.rstrip())
    # XXX Should reformat remaining paragraphs as well
    new.extend(lines[i:])
    return "\n".join(new)
Guido van Rossum94e82ce1999-01-04 13:04:54 +0000144
def is_all_white(line):
    """Return True if *line* is empty or consists only of whitespace."""
    blank = re.match(r"^\s*$", line)
    return blank is not None
147
def get_indent(line):
    """Return the leading whitespace of *line* (possibly the empty string)."""
    leading = re.match(r"^(\s*)", line)
    return leading.group()
Guido van Rossum3dd36891999-06-10 17:48:02 +0000150
def get_comment_header(line):
    """Return the comment header of *line*.

    The header is the leading whitespace followed by any run of '#'
    characters.  For a line with neither, the result is the empty string;
    for an indented non-comment line it is just the indentation.
    """
    # Both parts of the pattern may match zero characters, so the match
    # always succeeds and no "no match" fallback is needed.
    return re.match(r"^(\s*#*)", line).group(1)