| #! /usr/bin/env python |
| |
| # Fix Python source files to use the new equality test operator, i.e., |
| # if x = y: ... |
| # is changed to |
| # if x == y: ... |
| # The script correctly tokenizes the Python program to reliably |
| # distinguish between assignments and equality tests. |
| # |
| # Command line arguments are files or directories to be processed. |
| # Directories are searched recursively for files whose name looks |
| # like a python module. |
| # Symbolic links are always ignored (except as explicit directory |
| # arguments). Of course, the original file is kept as a back-up |
| # (with a "~" attached to its name). |
| # It complains about binaries (files containing null bytes) |
| # and about files that are ostensibly not Python files: if the first |
| # line starts with '#!' and does not contain the string 'python'. |
| # |
| # Changes made are reported to stdout in a diff-like format. |
| # |
| # Undoubtedly you can do this using find and sed or perl, but this is |
| # a nice example of Python code that recurses down a directory tree |
| # and uses regular expressions. Also note several subtleties like |
| # preserving the file's mode and avoiding even writing a temp file |
| # when no changes are needed for a file. |
| # |
| # NB: by changing only the function fixline() you can turn this |
| # into a program for a different change to Python programs... |
| |
| import sys |
| import re |
| import os |
| from stat import * |
| import string |
| |
# Output helpers: diagnostics and debug traces are written to stderr,
# the diff-like change report is written to stdout.
err = dbg = sys.stderr.write
rep = sys.stdout.write
| |
def main():
    """Process every command line argument and exit with a status code.

    With no arguments a usage message is written via err() and the
    process exits with status 2.  Otherwise each argument is handled in
    order: directories (tested first, so a symbolic link to a directory
    is still descended into) go to recursedown(), any other symbolic link
    is refused, and everything else goes to fix().  The exit status is 1
    if any argument reported a problem, else 0.
    """
    targets = sys.argv[1:]
    if not targets:  # No arguments
        err('usage: ' + sys.argv[0] + ' file-or-directory ...\n')
        sys.exit(2)

    failed = 0
    for target in targets:
        if os.path.isdir(target):
            status = recursedown(target)
        elif os.path.islink(target):
            err(target + ': will not process symbolic links\n')
            status = 1
        else:
            status = fix(target)
        if status:
            failed = 1
    sys.exit(failed)
| |
# File names that look like a Python module: one or more letters,
# digits or underscores followed by ".py".
ispythonprog = re.compile(r'^[a-zA-Z0-9_]+\.py$')


def ispython(name):
    """Return True if *name* (a bare file name) looks like a Python module.

    re's match() returns a match object or None, never an integer
    position, so the result is tested against None rather than compared
    with 0.
    """
    return ispythonprog.match(name) is not None
| |
def recursedown(dirname):
    """Fix every Python-looking file below *dirname*, recursively.

    Directory entries are visited in sorted order.  Symbolic links are
    skipped, subdirectories are collected, and any other entry whose name
    passes ispython() is handed to fix().  The collected subdirectories
    are descended into only after all entries of this directory have been
    looked at.

    Returns 1 if the directory could not be listed or if any fix() or
    nested recursedown() call reported a failure, otherwise 0.
    """
    dbg('recursedown(%r)\n' % (dirname,))
    bad = 0
    try:
        names = os.listdir(dirname)
    except os.error as msg:
        err('%s: cannot list directory: %r\n' % (dirname, msg))
        return 1
    names.sort()
    subdirs = []
    for name in names:
        if name in (os.curdir, os.pardir):
            continue
        fullname = os.path.join(dirname, name)
        if os.path.islink(fullname):
            # Symbolic links are never followed here.
            continue
        if os.path.isdir(fullname):
            subdirs.append(fullname)
        elif ispython(name):
            if fix(fullname):
                bad = 1
    for fullname in subdirs:
        if recursedown(fullname):
            bad = 1
    return bad
| |
def fix(filename):
    """Apply fixline() to every logical line of *filename*, in place.

    The file is first scanned without writing anything.  Only when
    fixline() changes a line is a temp file ('@' + base name, in the same
    directory) created; the scan then restarts from the top, copying every
    line to the temp file and reporting each changed line through rep().
    A line ending in a backslash is joined with the following line(s)
    before being passed to fixline().

    During the first scan, a file containing a null byte, or a script
    whose '#!' line does not mention python, is reported through err()
    and left untouched.

    When changes were made, the temp file receives the original file's
    permission bits, the original is renamed to filename + '~', and the
    temp file is renamed to *filename*.  Failure of the chmod or of the
    backup rename only produces a warning.

    Returns 0 on success (including "no changes needed"), 1 on failure.
    """
    try:
        f = open(filename, 'r')
    except IOError as msg:
        err('%s: cannot open: %r\n' % (filename, msg))
        return 1
    head, tail = os.path.split(filename)
    tempname = os.path.join(head, '@' + tail)
    g = None
    try:
        # If we find a match, we rewind the file and start over but
        # now copy everything to a temp file.
        lineno = 0
        while 1:
            line = f.readline()
            if not line:
                break
            lineno = lineno + 1
            if g is None and '\0' in line:
                # Check for binary files
                err(filename + ': contains null bytes; not fixed\n')
                return 1
            if lineno == 1 and g is None and line[:2] == '#!':
                # Check for non-Python scripts.  The whole interpreter
                # line is searched, not just its first word, so that
                # "#! /usr/bin/env python" is accepted as Python.
                words = line[2:].split()
                if words and re.search('[pP]ython', line[2:]) is None:
                    complaint = filename + ': ' + words[0]
                    complaint = complaint + ' script; not fixed\n'
                    err(complaint)
                    return 1
            # Join backslash-continued lines into one logical line.
            while line[-2:] == '\\\n':
                nextline = f.readline()
                if not nextline:
                    break
                line = line + nextline
                lineno = lineno + 1
            newline = fixline(line)
            if newline != line:
                if g is None:
                    try:
                        g = open(tempname, 'w')
                    except IOError as msg:
                        err('%s: cannot create: %r\n' % (tempname, msg))
                        return 1
                    f.seek(0)
                    lineno = 0
                    rep(filename + ':\n')
                    continue  # restart from the beginning
                rep(repr(lineno) + '\n')
                rep('< ' + line)
                rep('> ' + newline)
            if g is not None:
                g.write(newline)
    finally:
        # Close both files on every path; in particular the temp file
        # must be flushed and closed before it is chmod'ed and renamed.
        f.close()
        if g is not None:
            g.close()

    if g is None:
        return 0  # No changes

    # Finishing touch -- move files

    # First copy the file's mode to the temp file
    try:
        statbuf = os.stat(filename)
        os.chmod(tempname, statbuf[ST_MODE] & 0o7777)
    except os.error as msg:
        err('%s: warning: chmod failed (%r)\n' % (tempname, msg))
    # Then make a backup of the original file as filename~
    try:
        os.rename(filename, filename + '~')
    except os.error as msg:
        err('%s: warning: backup failed (%r)\n' % (filename, msg))
    # Now move the temp file to the original file
    try:
        os.rename(tempname, filename)
    except os.error as msg:
        err('%s: rename failed (%r)\n' % (filename, msg))
        return 1
    # Return success
    return 0
| |
| |
# Self-contained token pattern.  It does not depend on private names of
# the standard tokenize module.  Each match skips leading blanks,
# backslash-newline continuations and an optional comment, then captures
# exactly one token in the named group 'token'.
_IGNORE = r'[ \f\t]*(?:\\\r?\n[ \f\t]*)*(?:#[^\r\n]*)?'
_STRING = (r"(?:[bBrRuUfF]{1,2})?(?:"
           r"'''(?:\\.|[^\\])*?'''"
           r'|"""(?:\\.|[^\\])*?"""'
           r"|'(?:\\.|[^\\\n'])*'"
           r'|"(?:\\.|[^\\\n"])*"'
           r")")
_NUMBER = (r'0[xX][0-9a-fA-F]+[lL]?|0[oO][0-7]+|0[bB][01]+'
           r'|(?:\d+\.\d*|\.\d+|\d+)(?:[eE][-+]?\d+)?[jJlL]?')
_NAME = r'[^\W\d]\w*'
# Multi-character operators come first so that the '=' inside '==',
# '<=', '!=', ':=' etc. is never seen as a token of its own.
_OPERATOR = (r'\*\*=?|//=?|<<=?|>>=?|->|:=|[=!<>]=|<>'
             r'|[-+*/%&|^@]=|[-+*/%&|^~<>=@]')
_BRACKET = r'[\[\](){}]'
_SPECIAL = r'[:;.,`\n]'

tokenprog = re.compile(
    _IGNORE + '(?P<token>' +
    '|'.join((_STRING, _NUMBER, _NAME, _OPERATOR, _BRACKET, _SPECIAL)) +
    ')',
    re.DOTALL)

# Matches when only ignorable text (blanks, continuation, comment) is left.
_restprog = re.compile(_IGNORE + r'\Z')

# Tokens that open a context in which a bare '=' is taken to be an
# equality test, mapped to the token that closes that context.
match = {'if': ':', 'elif': ':', 'while': ':', 'return': '\n',
         '(': ')', '[': ']', '{': '}', '`': '`'}


def fixline(line):
    """Return *line* with '=' used as an equality test changed to '=='.

    The line is scanned token by token while a stack of expected closing
    tokens is maintained: 'if', 'elif' and 'while' expect ':', 'return'
    expects the end of the line, and each opening bracket or backquote
    expects its closing partner.  A bare '=' seen while the stack is not
    empty is replaced by '=='; a bare '=' at top level is left alone as
    an assignment.

    Note that any '=' inside brackets is rewritten, which includes
    keyword arguments such as f(x=1).

    Two diagnostics are written to stdout, each followed by the line:
    '(Syntax error:)' when a token cannot be recognized (scanning stops
    and the line as fixed so far is returned), and a warning when '=='
    already appears at top level.
    """
    # Quick check for easy case
    if '=' not in line:
        return line

    i, n = 0, len(line)
    stack = []
    while i < n:
        m = tokenprog.match(line, i)
        if m is None:
            if _restprog.match(line, i):
                # Only trailing blanks or a comment remain (e.g. a last
                # line without a newline): nothing more to scan.
                break
            # A bad token; forget about the rest of this line
            sys.stdout.write('(Syntax error:)\n')
            sys.stdout.write(line)
            return line
        a, b = m.span('token')  # Location of the token proper
        token = line[a:b]
        i = m.end()
        if stack and token == stack[-1]:
            del stack[-1]
        elif token in match:
            stack.append(match[token])
        elif token == '=' and stack:
            line = line[:a] + '==' + line[b:]
            # Resume right after the inserted operator; the line grew.
            i, n = a + len('=='), len(line)
        elif token == '==' and not stack:
            sys.stdout.write('(Warning: \'==\' at top level:)\n')
            sys.stdout.write(line)
    return line
| |
# Run the fixer only when this file is executed as a script.
if __name__ == "__main__":
    main()