blob: b3e9dc7361091251bce9e9385b8a0668c89c17f0 [file] [log] [blame]
Benjamin Peterson90f5ba52010-03-11 22:53:45 +00001#!/usr/bin/env python3
Georg Brandl56897312005-08-24 18:32:30 +00002
3"""List all those Python files that require a coding directive
4
Usage: findnocoding.py [-cd] path1 [path2...]
Georg Brandl56897312005-08-24 18:32:30 +00006"""
7
Thomas Wouters89f507f2006-12-13 04:49:30 +00008__author__ = "Oleg Broytmann, Georg Brandl"
Georg Brandl56897312005-08-24 18:32:30 +00009
10import sys, os, re, getopt
11
12# our pysource module finds Python source files
try:
    import pysource
except ImportError:
    # Emulate the module with a simple os.walk-based fallback.
    class pysource:
        """Minimal stand-in used when the ``pysource`` module is missing.

        Only ``walk_python_files`` does real work; it selects files purely
        by their ``.py`` extension.
        """

        # Names the script may look up on the module. This fallback never
        # calls them, so they are plain placeholders.
        has_python_ext = looks_like_python = can_be_compiled = None

        def walk_python_files(self, paths, *args, **kwargs):
            """Yield the path of every ``.py`` file named by or under *paths*.

            Each entry of *paths* may be a file or a directory.  Directories
            are walked recursively.  Entries that are neither are skipped.
            Extra positional and keyword arguments are accepted and ignored.
            """
            for path in paths:
                if os.path.isfile(path):
                    # Yield the path itself (not the result of the
                    # extension test) so callers receive a file name.
                    if path.endswith(".py"):
                        yield path
                elif os.path.isdir(path):
                    for root, dirs, files in os.walk(path):
                        for filename in files:
                            if filename.endswith(".py"):
                                yield os.path.join(root, filename)

    # Replace the class by an instance so that attribute access mirrors
    # ``module.function`` usage.
    pysource = pysource()

    print("The pysource module is not available; "
          "no sophisticated Python source file search will be done.", file=sys.stderr)
Georg Brandl56897312005-08-24 18:32:30 +000033
34
# Encoding declaration as defined by PEP 263: the line must consist of a
# comment only (optionally preceded by a UTF-8 BOM and blanks), and the
# comment must contain "coding:" or "coding=" followed by the codec name.
decl_re = re.compile(rb"^(?:\xef\xbb\xbf)?[ \t\f]*#.*?coding[=:]\s*([-\w.]+)")

def get_declaration(line):
    """Return the codec name declared on *line*, or ``b''`` if there is none.

    *line* is a bytes object holding one source line.  Only comment lines
    count; text such as ``coding: x`` inside ordinary code is ignored.  The
    result is always bytes, so callers get a consistent type and can rely
    on its truthiness.
    """
    match = decl_re.search(line)
    if match:
        return match.group(1)
    return b''
42
def has_correct_encoding(text, codec):
    """Tell whether the bytes *text* can be decoded with *codec*.

    Returns True when decoding succeeds and False when it raises
    UnicodeDecodeError.  Any other exception propagates to the caller.
    """
    try:
        # Only the success or failure of the decode matters; the decoded
        # string is discarded.
        str(text, codec)
        return True
    except UnicodeDecodeError:
        return False
50
def needs_declaration(fullpath):
    """Decide whether the file at *fullpath* lacks a needed coding line.

    Returns:
        None  if the file cannot be opened,
        False if one of its first two lines carries an encoding
              declaration, or if the whole content decodes as UTF-8,
        True  otherwise.
    """
    try:
        source = open(fullpath, 'rb')
    except IOError:
        # The file vanished (or is unreadable) - nothing to report.
        return None

    with source:
        first = source.readline()
        second = source.readline()

        # An explicit declaration is trusted without further checks.
        declared = get_declaration(first) or get_declaration(second)
        if declared:
            return False

        # No declaration: the remainder is needed to validate the content.
        remainder = source.read()

    # Without a declaration the file must be valid UTF-8 as a whole.
    return not has_correct_encoding(first + second + remainder, "utf-8")
72
73
# Help text printed on invalid options or when no path is supplied.
usage = """Usage: %s [-cd] paths...
 -c: recognize Python source files trying to compile them
 -d: debug output""" % sys.argv[0]

if __name__ == '__main__':

    # Parse the command line; any option error ends the run with the
    # error message followed by the usage text.
    try:
        opts, args = getopt.getopt(sys.argv[1:], 'cd')
    except getopt.error as msg:
        for text in (msg, usage):
            print(text, file=sys.stderr)
        sys.exit(1)

    # Defaults, possibly overridden by the options below.
    is_python = pysource.looks_like_python
    debug = False

    for flag, _value in opts:
        if flag == '-d':
            debug = True
        elif flag == '-c':
            is_python = pysource.can_be_compiled

    # At least one path is mandatory.
    if not args:
        print(usage, file=sys.stderr)
        sys.exit(1)

    # Report every candidate file that needs a coding declaration.
    for fullpath in pysource.walk_python_files(args, is_python):
        if debug:
            print("Testing for coding: %s" % fullpath)
        if needs_declaration(fullpath):
            print(fullpath)
105 print(fullpath)