blob: 0463bc01982d5dfedb25e6e61cabb0baeb138a11 [file] [log] [blame]
Simon Pilgrim5334a2c2018-04-06 12:36:27 +00001#!/usr/bin/env python2.7
2
3"""A script to generate FileCheck statements for 'opt' analysis tests.
4
5This script is a utility to update LLVM opt analysis test cases with new
6FileCheck patterns. It can either update all of the tests in the file or
7a single test function.
8
9Example usage:
10$ update_analyze_test_checks.py --opt-binary=../bin/opt test/foo.ll
11
12Workflow:
131. Make a compiler patch that requires updating some number of FileCheck lines
14 in regression test files.
152. Save the patch and revert it from your local work area.
163. Update the RUN-lines in the affected regression tests to look canonical.
17 Example: "; RUN: opt < %s -analyze -cost-model -S | FileCheck %s"
184. Refresh the FileCheck lines for either the entire file or select functions by
19 running this script.
205. Commit the fresh baseline of checks.
216. Apply your patch from step 1 and rebuild your local binaries.
227. Re-run this script on affected regression tests.
238. Check the diffs to ensure the script has done something reasonable.
249. Submit a patch including the regression test diffs for review.
25
26A common pattern is to have the script insert complete checking of every
27instruction. Then, edit it down to only check the relevant instructions.
28The script is designed to make adding checks to a test case fast, it is *not*
29designed to be authoritative about what constitutes a good test!
30"""
31
Serge Guelton4a274782019-01-03 14:11:33 +000032from __future__ import print_function
33
Simon Pilgrim5334a2c2018-04-06 12:36:27 +000034import argparse
35import itertools
36import os # Used to advertise this file's name ("autogenerated_note").
37import string
38import subprocess
39import sys
40import tempfile
41import re
42
43from UpdateTestChecks import common
44
# Banner written as the first line of every regenerated test file; the
# script's own path is appended to it in main().
ADVERT = '; NOTE: Assertions have been autogenerated by '

# RegEx: this is where the magic happens.

# Matches the opening of an IR function definition ("define ... @name(") and
# captures the function name in group 1.  Written as a raw string so that
# \s, \w and \( reach the regex engine untouched instead of being treated as
# (invalid) string-literal escape sequences.
IR_FUNCTION_RE = re.compile(r'^\s*define\s+(?:internal\s+)?[^@]*@([\w-]+)\s*\(')
50
51
52
53
54
def main():
    """Regenerate FileCheck assertions for each 'opt' analysis test given.

    Command-line arguments are read from sys.argv: -v/--verbose,
    --opt-binary, --function, and one or more test file paths.  For every
    test file the RUN lines are collected, each usable "opt ... | FileCheck"
    command is executed through common.invoke_tool, and the test file is
    rewritten in place with the freshly generated check lines.

    Exits with status 1 if the basename of --opt-binary is not "opt".
    """
    parser = argparse.ArgumentParser(
        description=__doc__,
        formatter_class=argparse.RawTextHelpFormatter)
    parser.add_argument('-v', '--verbose', action='store_true',
                        help='Show verbose output')
    parser.add_argument('--opt-binary', default='opt',
                        help='The opt binary used to generate the test case')
    parser.add_argument(
        '--function', help='The function in the test file to update')
    parser.add_argument('tests', nargs='+')
    args = parser.parse_args()

    autogenerated_note = ADVERT + 'utils/' + os.path.basename(__file__)

    opt_basename = os.path.basename(args.opt_binary)
    if opt_basename != 'opt':
        print('ERROR: Unexpected opt name: ' + opt_basename, file=sys.stderr)
        sys.exit(1)

    for test in args.tests:
        if args.verbose:
            print('Scanning for RUN lines in test file: %s' % (test,), file=sys.stderr)
        with open(test) as f:
            input_lines = [line.rstrip() for line in f]

        # Collect the RUN lines, folding a line that ends in a backslash
        # together with the RUN line that follows it.
        run_lines = []
        for line in input_lines:
            m = common.RUN_LINE_RE.match(line)
            if not m:
                continue
            if run_lines and run_lines[-1].endswith('\\'):
                run_lines[-1] = run_lines[-1].rstrip('\\') + ' ' + m.group(1)
            else:
                run_lines.append(m.group(1))

        if args.verbose:
            print('Found %d RUN lines:' % (len(run_lines),), file=sys.stderr)
            for run_line in run_lines:
                print(' RUN: ' + run_line, file=sys.stderr)

        # Each entry pairs the FileCheck prefixes of one RUN line with the
        # opt arguments that produce the output those prefixes check.
        prefix_list = []
        for run_line in run_lines:
            # A RUN line without a pipe has no FileCheck half; skip it rather
            # than crash on the two-way unpack below.
            if '|' not in run_line:
                print('WARNING: Skipping unparseable RUN line: ' + run_line, file=sys.stderr)
                continue

            tool_cmd, filecheck_cmd = [cmd.strip() for cmd in run_line.split('|', 1)]

            if not tool_cmd.startswith(opt_basename + ' '):
                print('WARNING: Skipping non-%s RUN line: %s' % (opt_basename, run_line), file=sys.stderr)
                continue

            if not filecheck_cmd.startswith('FileCheck '):
                print('WARNING: Skipping non-FileChecked RUN line: ' + run_line, file=sys.stderr)
                continue

            # Drop the tool name and the input-file placeholders; the test
            # path is handed to common.invoke_tool separately.
            tool_cmd_args = tool_cmd[len(opt_basename):].strip()
            tool_cmd_args = tool_cmd_args.replace('< %s', '').replace('%s', '').strip()

            check_prefixes = [item
                              for m in common.CHECK_PREFIX_RE.finditer(filecheck_cmd)
                              for item in m.group(1).split(',')]
            if not check_prefixes:
                check_prefixes = ['CHECK']

            # FIXME: We should use multiple check prefixes to common check lines. For
            # now, we just ignore all but the last.
            prefix_list.append((check_prefixes, tool_cmd_args))

        # One (initially empty) per-function dictionary for every prefix.
        func_dict = {prefix: {}
                     for prefixes, _ in prefix_list
                     for prefix in prefixes}
        for prefixes, opt_args in prefix_list:
            if args.verbose:
                print('Extracted opt cmd: ' + opt_basename + ' ' + opt_args, file=sys.stderr)
                print('Extracted FileCheck prefixes: ' + str(prefixes), file=sys.stderr)

            raw_tool_outputs = common.invoke_tool(args.opt_binary, opt_args, test)

            # Split analysis outputs by "Printing analysis " declarations.
            for raw_tool_output in re.split(r'Printing analysis ', raw_tool_outputs):
                common.build_function_body_dictionary(
                    common.ANALYZE_FUNCTION_RE, common.scrub_body, [],
                    raw_tool_output, prefixes, func_dict, args.verbose)

        is_in_function = False
        is_in_function_start = False
        # Only assigned once a 'define' line is seen; the check-emitting
        # branch below cannot run before that.
        func_name = None
        prefix_set = {prefix for prefixes, _ in prefix_list for prefix in prefixes}
        if args.verbose:
            print('Rewriting FileCheck prefixes: %s' % (prefix_set,), file=sys.stderr)
        output_lines = [autogenerated_note]

        for input_line in input_lines:
            if is_in_function_start:
                if input_line == '':
                    continue
                if input_line.lstrip().startswith(';'):
                    # Keep comments that are not check lines for one of our
                    # prefixes; they stay ahead of the generated checks.
                    m = common.CHECK_RE.match(input_line)
                    if not m or m.group(1) not in prefix_set:
                        output_lines.append(input_line)
                        continue

                # Print out the various check lines here.
                common.add_analyze_checks(output_lines, ';', prefix_list, func_dict, func_name)
                is_in_function_start = False

            if is_in_function:
                if common.should_add_line_to_output(input_line, prefix_set):
                    # This input line of the function body will go as-is into the output.
                    # Except make leading whitespace uniform: 2 spaces.
                    input_line = common.SCRUB_LEADING_WHITESPACE_RE.sub(r'  ', input_line)
                    output_lines.append(input_line)
                else:
                    continue
                if input_line.strip() == '}':
                    is_in_function = False
                continue

            # Discard any previous script advertising.
            if input_line.startswith(ADVERT):
                continue

            # If it's outside a function, it just gets copied to the output.
            output_lines.append(input_line)

            m = IR_FUNCTION_RE.match(input_line)
            if not m:
                continue
            func_name = m.group(1)
            if args.function is not None and func_name != args.function:
                # When filtering on a specific function, skip all others.
                continue
            is_in_function = is_in_function_start = True

        if args.verbose:
            print('Writing %d lines to %s...' % (len(output_lines), test), file=sys.stderr)

        # The file is opened in binary mode, so it must be given bytes.  On
        # Python 2 the joined text is already a byte string; on Python 3 it
        # has to be encoded first.
        output_text = ''.join(line + '\n' for line in output_lines)
        if not isinstance(output_text, bytes):
            output_text = output_text.encode('utf-8')
        with open(test, 'wb') as f:
            f.write(output_text)
190
191
# Run the updater only when this file is executed as a script, so that
# importing the module has no side effects.
if __name__ == '__main__':
    main()