[llvm-exegesis] [NFC] Fixing typo.
[llvm-complete.git] / utils / update_analyze_test_checks.py
blob4d1d912aba865565c070568c1735b6665d30a6a7
1 #!/usr/bin/env python
3 """A script to generate FileCheck statements for 'opt' analysis tests.
5 This script is a utility to update LLVM opt analysis test cases with new
6 FileCheck patterns. It can either update all of the tests in the file or
7 a single test function.
9 Example usage:
10 $ update_analyze_test_checks.py --opt-binary=../bin/opt test/foo.ll
12 Workflow:
13 1. Make a compiler patch that requires updating some number of FileCheck lines
14 in regression test files.
15 2. Save the patch and revert it from your local work area.
16 3. Update the RUN-lines in the affected regression tests to look canonical.
17 Example: "; RUN: opt < %s -analyze -cost-model -S | FileCheck %s"
18 4. Refresh the FileCheck lines for either the entire file or select functions by
19 running this script.
20 5. Commit the fresh baseline of checks.
21 6. Apply your patch from step 1 and rebuild your local binaries.
22 7. Re-run this script on affected regression tests.
23 8. Check the diffs to ensure the script has done something reasonable.
24 9. Submit a patch including the regression test diffs for review.
26 A common pattern is to have the script insert complete checking of every
27 instruction. Then, edit it down to only check the relevant instructions.
28 The script is designed to make adding checks to a test case fast; it is *not*
29 designed to be authoritative about what constitutes a good test!
30 """
32 from __future__ import print_function
34 import argparse
35 import itertools
36 import os # Used to advertise this file's name ("autogenerated_note").
37 import string
38 import subprocess
39 import sys
40 import tempfile
41 import re
43 from UpdateTestChecks import common
# Prefix of the banner line placed at the top of every regenerated test file.
# Input lines that already start with this prefix are dropped when the file is
# rewritten, so the banner never accumulates.
ADVERT = '; NOTE: Assertions have been autogenerated by '

# RegEx: this is where the magic happens.

# Matches the opening of an IR function definition ("define ... @name(") and
# captures the function name in group 1. Written as a raw string so that the
# regex escapes (\s, \w, \() are not treated as invalid string escapes.
IR_FUNCTION_RE = re.compile(r'^\s*define\s+(?:internal\s+)?[^@]*@([\w-]+)\s*\(')
def _join_continued_lines(raw_lines):
  """Merge every RUN line ending in a backslash with the line that follows it."""
  joined = []
  for line in raw_lines:
    if joined and joined[-1].endswith('\\'):
      joined[-1] = joined[-1].rstrip('\\') + ' ' + line
    else:
      joined.append(line)
  return joined


def _parse_run_line(run_line, opt_basename):
  """Split one RUN line into its FileCheck prefixes and its opt arguments.

  Args:
    run_line: Text of a (possibly joined) RUN line.
    opt_basename: Expected name of the tool at the start of the pipeline.

  Returns:
    A (check_prefixes, tool_cmd_args) tuple, or None when the line is not of
    the form "<opt_basename> ... | FileCheck ...". A warning is printed to
    stderr for every skipped line.
  """
  # A RUN line without a pipe cannot be split into tool and FileCheck halves;
  # skip it instead of failing on the two-way unpacking below.
  if '|' not in run_line:
    print('WARNING: Skipping unparseable RUN line: ' + run_line, file=sys.stderr)
    return None

  tool_cmd, filecheck_cmd = [cmd.strip() for cmd in run_line.split('|', 1)]

  if not tool_cmd.startswith(opt_basename + ' '):
    print('WARNING: Skipping non-%s RUN line: %s' % (opt_basename, run_line), file=sys.stderr)
    return None

  if not filecheck_cmd.startswith('FileCheck '):
    print('WARNING: Skipping non-FileChecked RUN line: ' + run_line, file=sys.stderr)
    return None

  # Drop the tool name and the "%s" input-file placeholder (with or without a
  # "<" redirect); only the remaining text is handed to common.invoke_tool.
  tool_cmd_args = tool_cmd[len(opt_basename):].strip()
  tool_cmd_args = tool_cmd_args.replace('< %s', '').replace('%s', '').strip()

  check_prefixes = [item for m in common.CHECK_PREFIX_RE.finditer(filecheck_cmd)
                    for item in m.group(1).split(',')]
  if not check_prefixes:
    check_prefixes = ['CHECK']

  # FIXME: We should use multiple check prefixes to common check lines. For
  # now, we just ignore all but the last.
  return (check_prefixes, tool_cmd_args)


def main():
  """Regenerate the FileCheck lines of each test file named on the command line.

  For every test file: collect its RUN lines, run the opt binary once per
  usable RUN line, record the per-function output via the `common` helpers,
  and rewrite the file in place with a fresh autogenerated banner and new
  check lines. With --function, only that function's checks are refreshed.

  Exits with status 1 when the basename of --opt-binary is not "opt".
  """
  from argparse import RawTextHelpFormatter
  parser = argparse.ArgumentParser(description=__doc__, formatter_class=RawTextHelpFormatter)
  parser.add_argument('-v', '--verbose', action='store_true',
                      help='Show verbose output')
  parser.add_argument('--opt-binary', default='opt',
                      help='The opt binary used to generate the test case')
  parser.add_argument(
      '--function', help='The function in the test file to update')
  parser.add_argument('tests', nargs='+')
  args = parser.parse_args()

  autogenerated_note = (ADVERT + 'utils/' + os.path.basename(__file__))

  opt_basename = os.path.basename(args.opt_binary)
  if opt_basename != "opt":
    print('ERROR: Unexpected opt name: ' + opt_basename, file=sys.stderr)
    sys.exit(1)

  for test in args.tests:
    if args.verbose:
      print('Scanning for RUN lines in test file: %s' % (test,), file=sys.stderr)
    with open(test) as f:
      input_lines = [l.rstrip() for l in f]

    run_matches = [common.RUN_LINE_RE.match(l) for l in input_lines]
    run_lines = _join_continued_lines([m.group(1) for m in run_matches if m])

    if args.verbose:
      print('Found %d RUN lines:' % (len(run_lines),), file=sys.stderr)
      for l in run_lines:
        print(' RUN: ' + l, file=sys.stderr)

    # One (check_prefixes, opt_args) entry per usable RUN line.
    prefix_list = []
    for l in run_lines:
      parsed = _parse_run_line(l, opt_basename)
      if parsed is not None:
        prefix_list.append(parsed)

    # Seed an empty per-prefix dictionary before any tool output is recorded.
    func_dict = {}
    for prefixes, _ in prefix_list:
      for prefix in prefixes:
        func_dict[prefix] = {}

    for prefixes, opt_args in prefix_list:
      if args.verbose:
        print('Extracted opt cmd: ' + opt_basename + ' ' + opt_args, file=sys.stderr)
        print('Extracted FileCheck prefixes: ' + str(prefixes), file=sys.stderr)

      raw_tool_outputs = common.invoke_tool(args.opt_binary, opt_args, test)

      # Split analysis outputs by "Printing analysis " declarations.
      for raw_tool_output in re.split(r'Printing analysis ', raw_tool_outputs):
        common.build_function_body_dictionary(
            common.ANALYZE_FUNCTION_RE, common.scrub_body, [],
            raw_tool_output, prefixes, func_dict, args.verbose)

    # State for the rewrite pass below:
    #   is_in_function       - currently inside a function selected for update.
    #   is_in_function_start - just past the "define" line; new checks have
    #                          not been emitted for this function yet.
    is_in_function = False
    is_in_function_start = False
    func_name = None
    prefix_set = {prefix for prefixes, _ in prefix_list for prefix in prefixes}
    if args.verbose:
      print('Rewriting FileCheck prefixes: %s' % (prefix_set,), file=sys.stderr)
    output_lines = [autogenerated_note]

    for input_line in input_lines:
      if is_in_function_start:
        if input_line == '':
          continue
        if input_line.lstrip().startswith(';'):
          # Keep comments that are not check lines for one of our prefixes.
          m = common.CHECK_RE.match(input_line)
          if not m or m.group(1) not in prefix_set:
            output_lines.append(input_line)
            continue

        # Print out the various check lines here.
        common.add_analyze_checks(output_lines, ';', prefix_list, func_dict, func_name)
        is_in_function_start = False

      if is_in_function:
        if common.should_add_line_to_output(input_line, prefix_set):
          # This input line of the function body will go as-is into the output.
          # Except make leading whitespace uniform: 2 spaces.
          input_line = common.SCRUB_LEADING_WHITESPACE_RE.sub(r'  ', input_line)
          output_lines.append(input_line)
        else:
          continue
        if input_line.strip() == '}':
          is_in_function = False
        continue

      # Discard any previous script advertising.
      if input_line.startswith(ADVERT):
        continue

      # If it's outside a function, it just gets copied to the output.
      output_lines.append(input_line)

      m = IR_FUNCTION_RE.match(input_line)
      if not m:
        continue
      func_name = m.group(1)
      if args.function is not None and func_name != args.function:
        # When filtering on a specific function, skip all others.
        continue
      is_in_function = is_in_function_start = True

    if args.verbose:
      print('Writing %d lines to %s...' % (len(output_lines), test), file=sys.stderr)

    # Written as UTF-8 bytes with "\n" line endings.
    with open(test, 'wb') as f:
      f.writelines(['{}\n'.format(l).encode('utf-8') for l in output_lines])
# Script entry point: run the updater only when this file is executed
# directly, not when it is imported as a module.
if __name__ == "__main__":
  main()