blob: 37803656aa20894f880c660cae4fe2c73b4fef3a [file] [log] [blame]
Serge Guelton16228bc2019-01-03 15:44:24 +00001#!/usr/bin/env python
Simon Pilgrim5334a2c2018-04-06 12:36:27 +00002
"""A script to generate FileCheck statements for 'opt' analysis tests.

This script is a utility to update LLVM opt analysis test cases with new
FileCheck patterns. It can either update all of the tests in the file or
a single test function.

Example usage:
$ update_analyze_test_checks.py --opt=../bin/opt test/foo.ll

Workflow:
1. Make a compiler patch that requires updating some number of FileCheck lines
   in regression test files.
2. Save the patch and revert it from your local work area.
3. Update the RUN-lines in the affected regression tests to look canonical.
   Example: "; RUN: opt < %s -analyze -cost-model -S | FileCheck %s"
4. Refresh the FileCheck lines for either the entire file or select functions by
   running this script.
5. Commit the fresh baseline of checks.
6. Apply your patch from step 1 and rebuild your local binaries.
7. Re-run this script on affected regression tests.
8. Check the diffs to ensure the script has done something reasonable.
9. Submit a patch including the regression test diffs for review.

A common pattern is to have the script insert complete checking of every
instruction. Then, edit it down to only check the relevant instructions.
The script is designed to make adding checks to a test case fast; it is *not*
designed to be authoritative about what constitutes a good test!
"""
31
Serge Guelton4a274782019-01-03 14:11:33 +000032from __future__ import print_function
33
Simon Pilgrim5334a2c2018-04-06 12:36:27 +000034import argparse
Simon Pilgrimf509fe42019-03-05 10:44:37 +000035import glob
Simon Pilgrim5334a2c2018-04-06 12:36:27 +000036import itertools
37import os # Used to advertise this file's name ("autogenerated_note").
38import string
39import subprocess
40import sys
41import tempfile
42import re
43
44from UpdateTestChecks import common
45
# Prefix of the first-line note written into every regenerated test file; the
# script's own path is appended to it when the note is emitted.
ADVERT = '; NOTE: Assertions have been autogenerated by '

# RegEx: this is where the magic happens.

# Matches the start of an IR function definition ("define ... @name (") and
# captures the function name (word characters and '-') in group 1. A raw
# string is used so that \s, \w and \( reach the regex engine unchanged
# instead of being treated as (invalid) string escapes.
IR_FUNCTION_RE = re.compile(r'^\s*define\s+(?:internal\s+)?[^@]*@([\w-]+)\s*\(')
51
def main():
  """Regenerate the FileCheck assertions of each test file given on the command line.

  For every path matched by the 'tests' glob patterns this function reads the
  file, gathers its RUN lines, runs the opt binary once per usable RUN line
  (via common.invoke_tool), and rewrites the file in place: the autogenerated
  note goes on the first line and fresh check lines are inserted at the start
  of each function (or only of --function when that option is given).

  Exits with status 1 if the basename of --opt-binary is not "opt".
  """
  parser = argparse.ArgumentParser(
      description=__doc__, formatter_class=argparse.RawTextHelpFormatter)
  parser.add_argument('--opt-binary', default='opt',
                      help='The opt binary used to generate the test case')
  parser.add_argument(
      '--function', help='The function in the test file to update')
  parser.add_argument('tests', nargs='+')
  # args.verbose and args.update_only are read below but not declared here, so
  # they are expected to be added by common.parse_commandline_args.
  args = common.parse_commandline_args(parser)

  script_name = os.path.basename(__file__)
  autogenerated_note = ADVERT + 'utils/' + script_name

  opt_basename = os.path.basename(args.opt_binary)
  if opt_basename != 'opt':
    common.error('Unexpected opt name: ' + opt_basename)
    sys.exit(1)

  test_paths = [test for pattern in args.tests for test in glob.glob(pattern)]
  for test in test_paths:
    if args.verbose:
      print('Scanning for RUN lines in test file: %s' % (test,), file=sys.stderr)
    with open(test) as f:
      input_lines = [line.rstrip() for line in f]

    # Leave alone any file whose first line says it was autogenerated by a
    # different script.
    first_line = input_lines[0] if input_lines else ""
    if 'autogenerated' in first_line and script_name not in first_line:
      common.warn("Skipping test which wasn't autogenerated by " + script_name + ": " + test)
      continue

    if args.update_only:
      if not first_line or 'autogenerated' not in first_line:
        common.warn("Skipping test which isn't autogenerated: " + test)
        continue

    # Collect the RUN lines, joining any line that ends in a backslash with
    # the RUN line that follows it.
    raw_lines = [m.group(1)
                 for m in [common.RUN_LINE_RE.match(line) for line in input_lines] if m]
    run_lines = raw_lines[:1]
    for line in raw_lines[1:]:
      if run_lines[-1].endswith("\\"):
        run_lines[-1] = run_lines[-1].rstrip("\\") + " " + line
      else:
        run_lines.append(line)

    if args.verbose:
      print('Found %d RUN lines:' % (len(run_lines),), file=sys.stderr)
      for line in run_lines:
        print(' RUN: ' + line, file=sys.stderr)

    # Each entry is (FileCheck prefixes, opt arguments) for one usable RUN line.
    prefix_list = []
    for line in run_lines:
      if '|' not in line:
        common.warn('Skipping unparseable RUN line: ' + line)
        continue

      tool_cmd, filecheck_cmd = [cmd.strip() for cmd in line.split('|', 1)]
      common.verify_filecheck_prefixes(filecheck_cmd)

      if not tool_cmd.startswith(opt_basename + ' '):
        common.warn('Skipping non-%s RUN line: %s' % (opt_basename, line))
        continue

      if not filecheck_cmd.startswith('FileCheck '):
        common.warn('Skipping non-FileChecked RUN line: ' + line)
        continue

      # Drop the tool name and the input-file placeholders; the test path is
      # handed to common.invoke_tool separately.
      tool_cmd_args = tool_cmd[len(opt_basename):].strip()
      tool_cmd_args = tool_cmd_args.replace('< %s', '').replace('%s', '').strip()

      check_prefixes = [item for m in common.CHECK_PREFIX_RE.finditer(filecheck_cmd)
                        for item in m.group(1).split(',')]
      if not check_prefixes:
        check_prefixes = ['CHECK']

      # FIXME: We should use multiple check prefixes to common check lines. For
      # now, we just ignore all but the last.
      prefix_list.append((check_prefixes, tool_cmd_args))

    # One (initially empty) dictionary per check prefix, filled in by
    # common.build_function_body_dictionary below.
    func_dict = {}
    for prefixes, _ in prefix_list:
      for prefix in prefixes:
        func_dict[prefix] = {}
    for prefixes, opt_args in prefix_list:
      if args.verbose:
        print('Extracted opt cmd: ' + opt_basename + ' ' + opt_args, file=sys.stderr)
        print('Extracted FileCheck prefixes: ' + str(prefixes), file=sys.stderr)

      raw_tool_outputs = common.invoke_tool(args.opt_binary, opt_args, test)

      # Split analysis outputs by "Printing analysis " declarations.
      for raw_tool_output in re.split(r'Printing analysis ', raw_tool_outputs):
        common.build_function_body_dictionary(
            common.ANALYZE_FUNCTION_RE, common.scrub_body, [],
            raw_tool_output, prefixes, func_dict, args.verbose, False)

    is_in_function = False
    is_in_function_start = False
    prefix_set = {prefix for prefixes, _ in prefix_list for prefix in prefixes}
    if args.verbose:
      print('Rewriting FileCheck prefixes: %s' % (prefix_set,), file=sys.stderr)
    output_lines = [autogenerated_note]

    for input_line in input_lines:
      if is_in_function_start:
        # Right after a 'define' line: drop blank lines and keep comments that
        # are not check lines for one of our prefixes, then emit the new
        # checks before the first remaining line.
        if input_line == '':
          continue
        if input_line.lstrip().startswith(';'):
          m = common.CHECK_RE.match(input_line)
          if not m or m.group(1) not in prefix_set:
            output_lines.append(input_line)
            continue

        # Print out the various check lines here.
        # func_name was bound when the enclosing 'define' line was matched.
        common.add_analyze_checks(output_lines, ';', prefix_list, func_dict, func_name)
        is_in_function_start = False

      if is_in_function:
        if common.should_add_line_to_output(input_line, prefix_set):
          # This input line of the function body will go as-is into the output.
          # Except make leading whitespace uniform: 2 spaces.
          input_line = common.SCRUB_LEADING_WHITESPACE_RE.sub(r'  ', input_line)
          output_lines.append(input_line)
        else:
          continue
        if input_line.strip() == '}':
          is_in_function = False
        continue

      # Discard any previous script advertising.
      if input_line.startswith(ADVERT):
        continue

      # If it's outside a function, it just gets copied to the output.
      output_lines.append(input_line)

      m = IR_FUNCTION_RE.match(input_line)
      if not m:
        continue
      func_name = m.group(1)
      if args.function is not None and func_name != args.function:
        # When filtering on a specific function, skip all others.
        continue
      is_in_function = is_in_function_start = True

    if args.verbose:
      print('Writing %d lines to %s...' % (len(output_lines), test), file=sys.stderr)

    # Written in binary mode as UTF-8 with explicit '\n' line endings.
    with open(test, 'wb') as f:
      f.writelines(['{}\n'.format(line).encode('utf-8') for line in output_lines])
Simon Pilgrim5334a2c2018-04-06 12:36:27 +0000202
203
# Run the updater only when this file is executed as a script.
if __name__ == '__main__':
  main()