blob: c1842561ec40b81170d37c59f36fd621eabf8607 [file] [log] [blame]
Guido van Rossum11e7f621992-01-01 18:38:09 +00001#! /ufs/guido/bin/sgi/python
Guido van Rossum2c4d7e71991-12-26 12:58:17 +00002#! /usr/local/python
3
# Fix Python source files to use the new class definition syntax, i.e.,
# the old form
#     class C() = base(), base(), ...: ...
# is changed to
#     class C(base, base, ...): ...
# The script uses heuristics to find class definitions that usually
# work but occasionally can fail; carefully check the output!
#
# Command line arguments are files or directories to be processed.
# Directories are searched recursively for files whose name looks
# like a python module.
# Symbolic links are always ignored (except as explicit directory
# arguments).  Of course, the original file is kept as a back-up
# (with a "~" attached to its name).
#
# Changes made are reported to stdout in a diff-like format.
#
# Undoubtedly you can do this using find and sed or perl, but this is
# a nice example of Python code that recurses down a directory tree
# and uses regular expressions.  Also note several subtleties like
# preserving the file's mode and not even writing a temp file
# when no changes are needed for a file.
#
# NB: by changing only the function fixline() you can turn this
# into a program for a different change to Python programs...
Guido van Rossum2c4d7e71991-12-26 12:58:17 +000028
29import sys
Guido van Rossum11e7f621992-01-01 18:38:09 +000030import regex
Guido van Rossumb2ac8091992-03-30 11:12:23 +000031import os
Guido van Rossum2c4d7e71991-12-26 12:58:17 +000032from stat import *
33
# Output helpers used throughout the script:
#   rep -- report changes made (stdout)
#   err -- error and warning messages (stderr)
#   dbg -- debugging traces; currently the same destination as err
rep = sys.stdout.write
err = sys.stderr.write
dbg = err
37
def main():
    # Process every command line argument and exit with a status that
    # tells whether anything went wrong:
    #   0 -- all arguments processed without problems
    #   1 -- at least one argument was refused or could not be fixed
    #   2 -- usage error (no arguments given)
    bad = 0
    if not sys.argv[1:]: # No arguments
        # Use sys.argv here: a bare 'argv' is not defined in this
        # module, so the usage message itself would raise NameError.
        err('usage: ' + sys.argv[0] + ' file-or-directory ...\n')
        sys.exit(2)
    for arg in sys.argv[1:]:
        # isdir() is tested before islink(), so an argument that passes
        # isdir() is searched even when islink() would also be true.
        if os.path.isdir(arg):
            if recursedown(arg): bad = 1
        elif os.path.islink(arg):
            err(arg + ': will not process symbolic links\n')
            bad = 1
        else:
            if fix(arg): bad = 1
    sys.exit(bad)
52
# File names that look like a Python module: one or more letters,
# digits or underscores followed by '.py'.
ispythonprog = regex.compile('^[a-zA-Z0-9_]+\.py$')

def ispython(name):
    # Tell whether 'name' (a bare file name, without directory part)
    # looks like a Python module.  match() yields a negative number
    # when the pattern does not match.
    matched = ispythonprog.match(name)
    return matched >= 0
Guido van Rossum2c4d7e71991-12-26 12:58:17 +000056
57def recursedown(dirname):
58 dbg('recursedown(' + `dirname` + ')\n')
59 bad = 0
60 try:
Guido van Rossumb2ac8091992-03-30 11:12:23 +000061 names = os.listdir(dirname)
62 except os.error, msg:
Guido van Rossum2c4d7e71991-12-26 12:58:17 +000063 err(dirname + ': cannot list directory: ' + `msg` + '\n')
64 return 1
Guido van Rossum11e7f621992-01-01 18:38:09 +000065 names.sort()
66 subdirs = []
Guido van Rossum2c4d7e71991-12-26 12:58:17 +000067 for name in names:
Guido van Rossumb2ac8091992-03-30 11:12:23 +000068 if name in (os.curdir, os.pardir): continue
69 fullname = os.path.join(dirname, name)
70 if os.path.islink(fullname): pass
71 elif os.path.isdir(fullname):
Guido van Rossum11e7f621992-01-01 18:38:09 +000072 subdirs.append(fullname)
Guido van Rossum2c4d7e71991-12-26 12:58:17 +000073 elif ispython(name):
74 if fix(fullname): bad = 1
Guido van Rossum11e7f621992-01-01 18:38:09 +000075 for fullname in subdirs:
76 if recursedown(fullname): bad = 1
Guido van Rossum2c4d7e71991-12-26 12:58:17 +000077 return bad
78
Guido van Rossum2c4d7e71991-12-26 12:58:17 +000079def fix(filename):
Guido van Rossum0a60ee11992-01-01 19:22:09 +000080## dbg('fix(' + `filename` + ')\n')
Guido van Rossum2c4d7e71991-12-26 12:58:17 +000081 try:
82 f = open(filename, 'r')
83 except IOError, msg:
84 err(filename + ': cannot open: ' + `msg` + '\n')
85 return 1
Guido van Rossumb2ac8091992-03-30 11:12:23 +000086 head, tail = os.path.split(filename)
87 tempname = os.path.join(head, '@' + tail)
Guido van Rossum11e7f621992-01-01 18:38:09 +000088 g = None
Guido van Rossum2c4d7e71991-12-26 12:58:17 +000089 # If we find a match, we rewind the file and start over but
90 # now copy everything to a temp file.
Guido van Rossum11e7f621992-01-01 18:38:09 +000091 lineno = 0
Guido van Rossum2c4d7e71991-12-26 12:58:17 +000092 while 1:
93 line = f.readline()
94 if not line: break
Guido van Rossum11e7f621992-01-01 18:38:09 +000095 lineno = lineno + 1
96 while line[-2:] == '\\\n':
97 nextline = f.readline()
98 if not nextline: break
99 line = line + nextline
100 lineno = lineno + 1
101 newline = fixline(line)
102 if newline != line:
103 if g is None:
104 try:
105 g = open(tempname, 'w')
106 except IOError, msg:
107 f.close()
108 err(tempname+': cannot create: '+\
109 `msg`+'\n')
110 return 1
111 f.seek(0)
112 lineno = 0
113 rep(filename + ':\n')
114 continue # restart from the beginning
115 rep(`lineno` + '\n')
116 rep('< ' + line)
117 rep('> ' + newline)
118 if g is not None:
119 g.write(newline)
120
121 # End of file
Guido van Rossum2c4d7e71991-12-26 12:58:17 +0000122 f.close()
Guido van Rossum11e7f621992-01-01 18:38:09 +0000123 if not g: return 0 # No changes
124
Guido van Rossum2c4d7e71991-12-26 12:58:17 +0000125 # Finishing touch -- move files
126
127 # First copy the file's mode to the temp file
128 try:
Guido van Rossumb2ac8091992-03-30 11:12:23 +0000129 statbuf = os.stat(filename)
130 os.chmod(tempname, statbuf[ST_MODE] & 07777)
131 except os.error, msg:
Guido van Rossum2c4d7e71991-12-26 12:58:17 +0000132 err(tempname + ': warning: chmod failed (' + `msg` + ')\n')
133 # Then make a backup of the original file as filename~
134 try:
Guido van Rossumb2ac8091992-03-30 11:12:23 +0000135 os.rename(filename, filename + '~')
136 except os.error, msg:
Guido van Rossum2c4d7e71991-12-26 12:58:17 +0000137 err(filename + ': warning: backup failed (' + `msg` + ')\n')
138 # Now move the temp file to the original file
139 try:
Guido van Rossumb2ac8091992-03-30 11:12:23 +0000140 os.rename(tempname, filename)
141 except os.error, msg:
Guido van Rossum2c4d7e71991-12-26 12:58:17 +0000142 err(filename + ': rename failed (' + `msg` + ')\n')
143 return 1
144 # Return succes
145 return 0
146
# Pattern for a class definition header in the old syntax.  It doesn't
# catch *all* class definition headers, but it's pretty darn close.
# The first subexpression covers everything up to and including the
# class name; the second covers the optional '=...' base class part.
classexpr = '^\([ \t]*class +[a-zA-Z0-9_]+\) *( *) *\(\(=.*\)?\):'

# Pattern for a single base class expression followed by '()'; the
# first subexpression is the expression without those parentheses.
baseexpr = '^ *\(.*\) *( *) *$'

# Compiled forms of the patterns above, used by fixline().
classprog = regex.compile(classexpr)
baseprog = regex.compile(baseexpr)
155
156import string
157
def fixline(line):
    # Convert one (logical) source line from the old class definition
    # syntax to the new one.  Lines that are not recognized as a class
    # definition header are returned unchanged.
    if classprog.match(line) < 0: # Not a class header -- no change
        return line

    regs = classprog.regs
    matchend = regs[0][1] # End of the whole match (just past the ':')
    nameend = regs[1][1] # End of first subexpression (the class name)
    basestart, baseend = regs[2] # Second subexpression ('=...')

    head = line[:nameend]
    tail = line[matchend:] # Unmatched rest of line

    if basestart == baseend: # No base classes -- easy case
        return head + ':' + tail

    # Split what follows the leading '=' into the base expressions and
    # strip the trailing '()' from each one that has it
    stripped = []
    for base in string.splitfields(line[basestart+1:baseend], ','):
        if baseprog.match(base) >= 0:
            lo, hi = baseprog.regs[1]
            base = base[lo:hi]
        stripped.append(base)

    # Join the bases back again and build the new line
    return head + '(' + string.joinfields(stripped, ', ') + '):' + tail
188
# Run the program; main() always ends by calling sys.exit().
main()