blob: 8e59c78a4c58443dbed01d7a5b642e55592afc8b [file] [log] [blame]
#!/usr/bin/env python3
"""Check proposed changes for common issues."""
import functools
import os.path
import re
import shutil
import subprocess
import sys
import sysconfig

import reindent
import untabify
Christian Heimesada8c3b2008-03-18 18:26:33 +000012
13
# Directories that hold copies of external libraries: their coding style
# is not checked.
EXCLUDE_DIRS = [
    os.path.join('Modules', *parts)
    for parts in (
        ('_ctypes', 'libffi_osx'),
        ('_ctypes', 'libffi_msvc'),
        ('_decimal', 'libmpdec'),
        ('expat',),
        ('zlib',),
    )
]
# Value of the 'srcdir' build configuration variable; used below as the
# base for file paths and as the working directory for git commands.
SRCDIR = sysconfig.get_config_var('srcdir')
22
Victor Stinner4a347ce2017-08-17 16:29:15 +020023
def n_files_str(count):
    """Format *count* as 'N file' when it is 1 and 'N files' otherwise."""
    suffix = "" if count == 1 else "s"
    return f"{count} file{suffix}"
27
Florent Xiclunae4a33802010-08-09 12:24:20 +000028
def status(message, modal=False, info=None):
    """Decorator factory that reports a call's progress on stdout.

    Before the wrapped function runs, ``message + ' ... '`` is written to
    stdout and flushed. After it returns, exactly one line is printed:

    * ``info(result)`` when *info* is given (takes precedence over *modal*);
    * ``"yes"`` or ``"NO"`` depending on the truthiness of the result when
      *modal* is true;
    * ``"done"`` otherwise.

    The wrapped function's return value is passed through unchanged.
    """
    def decorated_fxn(fxn):
        # Preserve the wrapped function's __name__/__doc__ so decorated
        # checks remain introspectable.
        @functools.wraps(fxn)
        def call_fxn(*args, **kwargs):
            sys.stdout.write(message + ' ... ')
            sys.stdout.flush()
            result = fxn(*args, **kwargs)
            if info:
                print(info(result))
            elif modal:
                print("yes" if result else "NO")
            else:
                print("done")
            return result
        return call_fxn
    return decorated_fxn
45
Florent Xiclunae4a33802010-08-09 12:24:20 +000046
def get_git_branch():
    """Get the symbolic name for the current git branch.

    Runs ``git rev-parse --abbrev-ref HEAD`` in SRCDIR and returns its
    output with surrounding whitespace removed, or None if the command
    exits with a non-zero status.
    """
    cmd = "git rev-parse --abbrev-ref HEAD".split()
    try:
        output = subprocess.check_output(cmd,
                                         stderr=subprocess.DEVNULL,
                                         cwd=SRCDIR,
                                         encoding='UTF-8')
    except subprocess.CalledProcessError:
        return None
    # check_output() keeps the trailing newline; strip it so the result
    # can be compared for equality against plain branch names.
    return output.strip()
57
58
def get_git_upstream_remote():
    """Return the name of the remote to use for upstream branches.

    The answer is "upstream" when ``git remote get-url upstream`` succeeds
    in SRCDIR, and "origin" when that command exits with an error.
    """
    probe = "git remote get-url upstream".split()
    try:
        subprocess.check_output(probe,
                                stderr=subprocess.DEVNULL,
                                cwd=SRCDIR,
                                encoding='UTF-8')
    except subprocess.CalledProcessError:
        remote = "origin"
    else:
        remote = "upstream"
    return remote
73
74
def get_git_remote_default_branch(remote_name):
    """Get the name of the default branch for the given remote.

    It is typically called 'main', but may differ.

    Runs ``git remote show <remote_name>`` in SRCDIR and returns the value
    of its "HEAD branch:" line. Returns None if the command exits with an
    error or no such line is present in its output.
    """
    # Pass the remote name as its own argument rather than formatting it
    # into a string that is then split on whitespace.
    cmd = ["git", "remote", "show", remote_name]
    env = os.environ.copy()
    # The "HEAD branch:" label is matched literally below, so git must not
    # translate its output. LC_ALL takes precedence over LC_MESSAGES and
    # LANG, so setting LANG alone is not enough when either is present in
    # the caller's environment.
    env['LANG'] = 'C'
    env['LC_ALL'] = 'C'
    try:
        remote_info = subprocess.check_output(cmd,
                                              stderr=subprocess.DEVNULL,
                                              cwd=SRCDIR,
                                              encoding='UTF-8',
                                              env=env)
    except subprocess.CalledProcessError:
        return None
    marker = "HEAD branch:"
    for line in remote_info.splitlines():
        if marker in line:
            return line.partition(marker)[2].strip()
    return None
96
97
@status("Getting base branch for PR",
        info=lambda x: x if x is not None else "not a PR branch")
def get_base_branch():
    """Return '<remote>/<branch>' to diff a PR branch against, or None.

    None is returned when SRCDIR has no '.git' entry, when the current
    branch cannot be determined, when the current branch is itself the
    base branch, or when the base branch cannot be determined.

    For an alpha interpreter the base branch is the upstream remote's
    default branch; otherwise it is the 'major.minor' maintenance branch
    of the running interpreter.
    """
    if not os.path.exists(os.path.join(SRCDIR, '.git')):
        # Not a git checkout, so there's no base branch
        return None
    upstream_remote = get_git_upstream_remote()
    version = sys.version_info
    if version.releaselevel == 'alpha':
        base_branch = get_git_remote_default_branch(upstream_remote)
    else:
        base_branch = "{0.major}.{0.minor}".format(version)
    this_branch = get_git_branch()
    if this_branch is None or this_branch == base_branch:
        # Not on a git PR branch, so there's no base branch
        return None
    if base_branch is None:
        # The remote's default branch could not be determined; there is
        # nothing to build a ref from (and concatenating None would raise
        # TypeError).
        return None
    return upstream_remote + "/" + base_branch
115
116
@status("Getting the list of files that have been added/changed",
        info=lambda x: n_files_str(len(x)))
def changed_files(base_branch=None):
    """Get the list of changed or added files from git.

    When *base_branch* is given, files are taken from
    ``git diff --name-status <base_branch>``; otherwise from
    ``git status --porcelain``. Only entries whose status contains 'M',
    'A' or 'U' are kept. Returned paths are normalized with
    os.path.normpath(), and files located inside one of EXCLUDE_DIRS are
    dropped.

    Exits the program (sys.exit) if SRCDIR has no '.git' entry.
    """
    # We just use an existence check here as:
    #  directory = normal git checkout/clone
    #  file = git worktree directory
    if not os.path.exists(os.path.join(SRCDIR, '.git')):
        sys.exit('need a git checkout to get modified files')

    if base_branch:
        cmd = 'git diff --name-status ' + base_branch
    else:
        cmd = 'git status --porcelain'
    filenames = []
    with subprocess.Popen(cmd.split(),
                          stdout=subprocess.PIPE,
                          cwd=SRCDIR) as st:
        for line in st.stdout:
            line = line.decode().rstrip()
            status_text, filename = line.split(maxsplit=1)
            # modified, added or unmerged files
            if not set(status_text).intersection('MAU'):
                continue
            if ' -> ' in filename:
                # file is renamed
                filename = filename.split(' -> ', 2)[1].strip()
            filenames.append(filename)

    # Match whole directory components only: a bare startswith() on the
    # directory name would also exclude siblings sharing the prefix, e.g.
    # 'Modules/zlibmodule.c' for the excluded directory 'Modules/zlib'.
    excluded_prefixes = tuple(path + os.sep for path in EXCLUDE_DIRS)
    filenames2 = []
    for filename in filenames:
        # Normalize the path to be able to match using .startswith()
        filename = os.path.normpath(filename)
        if filename in EXCLUDE_DIRS or filename.startswith(excluded_prefixes):
            # Exclude the file
            continue
        filenames2.append(filename)

    return filenames2
157
Christian Heimesada8c3b2008-03-18 18:26:33 +0000158
def report_modified_files(file_paths):
    """Build the status text for a list of modified files.

    With no files, this is just the 'N file(s)' count. Otherwise it is the
    count followed by a colon, then one line per path.
    """
    count = len(file_paths)
    summary = n_files_str(count)
    if count == 0:
        return summary
    entries = [" {}".format(path) for path in file_paths]
    return "\n".join(["{}:".format(summary)] + entries)
168
Florent Xiclunae4a33802010-08-09 12:24:20 +0000169
@status("Fixing Python file whitespace", info=report_modified_files)
def normalize_whitespace(file_paths):
    """Run reindent.check() on each '.py' path and collect the hits.

    Returns the paths (as given, relative to SRCDIR) for which
    reindent.check() returned a true value -- presumably meaning the file
    was rewritten; confirm against the reindent module.
    """
    reindent.makebackup = False  # No need to create backups.
    fixed = []
    for path in file_paths:
        if not path.endswith('.py'):
            continue
        if reindent.check(os.path.join(SRCDIR, path)):
            fixed.append(path)
    return fixed
Christian Heimesada8c3b2008-03-18 18:26:33 +0000177
Florent Xiclunae4a33802010-08-09 12:24:20 +0000178
@status("Fixing C file whitespace", info=report_modified_files)
def normalize_c_whitespace(file_paths):
    """Untabify the given C files and return the paths that contained tabs.

    Each path is resolved relative to SRCDIR. Files without a tab
    character are left untouched; the others are passed to
    untabify.process() with a tab size of 8.
    """
    fixed = []
    for path in file_paths:
        abspath = os.path.join(SRCDIR, path)
        # Read as bytes: only the presence of a tab matters, and this
        # avoids a locale-dependent decode (and possible
        # UnicodeDecodeError) of the whole file just to look for it.
        with open(abspath, 'rb') as f:
            if b'\t' not in f.read():
                continue
        untabify.process(abspath, 8, verbose=False)
        fixed.append(path)
    return fixed
191
192
# Whitespace run directly before the newline that ends a line; group 1
# captures the newline so it can be put back by the substitution.
ws_re = re.compile(br'\s+(\r?\n)$')


@status("Fixing docs whitespace", info=report_modified_files)
def normalize_docs_whitespace(file_paths):
    """Strip trailing whitespace from the given documentation files.

    Each path is resolved relative to SRCDIR and processed as bytes. A
    file that needs changes is first copied to '<name>.bak' and then
    rewritten. Any exception raised while handling a file is reported on
    stdout and that file is skipped.

    Returns the list of paths that were rewritten.
    """
    fixed = []
    for path in file_paths:
        abspath = os.path.join(SRCDIR, path)
        try:
            with open(abspath, 'rb') as f:
                original = f.readlines()
            cleaned = [ws_re.sub(br'\1', raw) for raw in original]
            if cleaned == original:
                continue
            shutil.copyfile(abspath, abspath + '.bak')
            with open(abspath, 'wb') as f:
                f.writelines(cleaned)
            fixed.append(path)
        except Exception as err:
            print('Cannot fix %s: %s' % (path, err))
    return fixed
212
213
@status("Docs modified", modal=True)
def docs_modified(file_paths):
    """Return True when *file_paths* (the changed doc files) is non-empty."""
    return True if file_paths else False
Christian Heimesada8c3b2008-03-18 18:26:33 +0000218
Florent Xiclunae4a33802010-08-09 12:24:20 +0000219
@status("Misc/ACKS updated", modal=True)
def credit_given(file_paths):
    """Return True when the Misc/ACKS path is among *file_paths*."""
    acks_path = os.path.join('Misc', 'ACKS')
    return acks_path in file_paths
Christian Heimesada8c3b2008-03-18 18:26:33 +0000224
Florent Xiclunae4a33802010-08-09 12:24:20 +0000225
@status("Misc/NEWS.d updated with `blurb`", modal=True)
def reported_news(file_paths):
    """Return True when any path starts with the Misc/NEWS.d/next prefix."""
    for path in file_paths:
        if path.startswith(os.path.join('Misc', 'NEWS.d', 'next')):
            return True
    return False
Christian Heimesada8c3b2008-03-18 18:26:33 +0000231
@status("configure regenerated", modal=True, info=str)
def regenerated_configure(file_paths):
    """Report whether 'configure' changed along with 'configure.ac'.

    Returns "not needed" when 'configure.ac' is not in *file_paths*;
    otherwise "yes" or "no" depending on whether 'configure' is.
    """
    if 'configure.ac' not in file_paths:
        return "not needed"
    if 'configure' in file_paths:
        return "yes"
    return "no"
239
@status("pyconfig.h.in regenerated", modal=True, info=str)
def regenerated_pyconfig_h_in(file_paths):
    """Report whether 'pyconfig.h.in' changed along with 'configure.ac'.

    Returns "not needed" when 'configure.ac' is not in *file_paths*;
    otherwise "yes" or "no" depending on whether 'pyconfig.h.in' is.
    """
    if 'configure.ac' not in file_paths:
        return "not needed"
    if 'pyconfig.h.in' in file_paths:
        return "yes"
    return "no"
Christian Heimesada8c3b2008-03-18 18:26:33 +0000247
def travis(pull_request):
    """Pass/fail whitespace check used by the --travis command-line option.

    Does nothing beyond printing a notice when *pull_request* is the
    string 'false'. Otherwise runs the three whitespace normalizers over
    the changed files and exits with status 1 if any file was fixed.
    """
    if pull_request == 'false':
        print('Not a pull request; skipping')
        return
    base_branch = get_base_branch()
    file_paths = changed_files(base_branch)

    # Sort the changed files into the three categories that get checked.
    python_files, c_files, doc_files = [], [], []
    for fn in file_paths:
        if fn.endswith('.py'):
            python_files.append(fn)
        if fn.endswith(('.c', '.h')):
            c_files.append(fn)
        if fn.startswith('Doc') and fn.endswith(('.rst', '.inc')):
            doc_files.append(fn)

    # The elements are evaluated left to right, so the normalizers run
    # (and print their status lines) in this order.
    fixed = [
        *normalize_whitespace(python_files),
        *normalize_c_whitespace(c_files),
        *normalize_docs_whitespace(doc_files),
    ]
    if fixed:
        print(f'Please fix the {len(fixed)} file(s) with whitespace issues')
        print('(on UNIX you can run `make patchcheck` to make the fixes)')
        sys.exit(1)
    else:
        print('No whitespace issues found')
267 sys.exit(1)
268
def main():
    """Run every check on the changed files and print the results.

    Each check prints its own status line. A reminder about running the
    test suite is printed last when any Python or C file changed.
    """
    file_paths = changed_files(get_base_branch())

    # Sort the changed files into the categories the checks operate on.
    python_files = []
    c_files = []
    doc_files = []
    misc_files = set()
    for fn in file_paths:
        if fn.endswith('.py'):
            python_files.append(fn)
        if fn.endswith(('.c', '.h')):
            c_files.append(fn)
        if fn.startswith('Doc') and fn.endswith(('.rst', '.inc')):
            doc_files.append(fn)
        if fn.startswith('Misc'):
            misc_files.add(fn)

    # Whitespace enforcement: Python (PEP 8), then C, then docs.
    normalize_whitespace(python_files)
    normalize_c_whitespace(c_files)
    normalize_docs_whitespace(doc_files)
    # Were the docs, Misc/ACKS and Misc/NEWS.d touched?
    docs_modified(doc_files)
    credit_given(misc_files)
    reported_news(misc_files)
    # Were configure and pyconfig.h.in regenerated, if necessary?
    regenerated_configure(file_paths)
    regenerated_pyconfig_h_in(file_paths)

    # Remind about the test suite when code was changed.
    if not (python_files or c_files):
        return
    if c_files:
        end = " and check for refleaks?"
    else:
        end = "?"
    print()
    print("Did you run the test suite" + end)
Christian Heimesada8c3b2008-03-18 18:26:33 +0000299
300
if __name__ == '__main__':
    # Script entry point: '--travis VALUE' selects the pass/fail mode,
    # anything else runs the full interactive report.
    import argparse
    parser = argparse.ArgumentParser(description=__doc__)
    parser.add_argument('--travis', help='Perform pass/fail checks')
    args = parser.parse_args()
    if not args.travis:
        main()
    else:
        travis(args.travis)
310 main()