#===- perf-helper.py - Clang Performance Helper -------------*- python -*--===#
#
#                     The LLVM Compiler Infrastructure
#
# This file is distributed under the University of Illinois Open Source
# License. See LICENSE.TXT for details.
#
#===------------------------------------------------------------------------===#
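"""Helper subcommands for Clang order-file generation and profile-data
collection: clean, merge, dtrace, cc1, and gen-order-file (dispatched from
the `commands` table at the bottom of this file)."""
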
from __future__ import print_function

import argparse
import bisect
import os
import random
import shlex
import subprocess
import sys
import tempfile
import time

test_env = { 'PATH' : os.environ['PATH'] }

def findFilesWithExtension(path, extension):
  # Recursively collect every file under 'path' whose name ends in 'extension'.
  filenames = []
  for root, dirs, files in os.walk(path):
    for filename in files:
      if filename.endswith(extension):
        filenames.append(os.path.join(root, filename))
  return filenames

def clean(args):
  if len(args) != 2:
    print('Usage: %s clean <path> <extension>\n' % __file__ +
          '\tRemoves all files with extension from <path>.')
    return 1
  for filename in findFilesWithExtension(args[0], args[1]):
    os.remove(filename)
  return 0

def merge(args):
  if len(args) != 3:
    print('Usage: %s merge <llvm-profdata> <output> <path>\n' % __file__ +
          '\tMerges all profraw files from path into output.')
    return 1
  cmd = [args[0], 'merge', '-o', args[1]]
  cmd.extend(findFilesWithExtension(args[2], "profraw"))
  subprocess.check_call(cmd)
  return 0

def dtrace(args):
  parser = argparse.ArgumentParser(prog='perf-helper dtrace',
      description='dtrace wrapper for order file generation')
  parser.add_argument('--buffer-size', metavar='size', type=int, required=False,
      default=1, help='dtrace buffer size in MB (default 1)')
  parser.add_argument('--use-oneshot', required=False, action='store_true',
      help='Use dtrace\'s oneshot probes')
  parser.add_argument('--use-ustack', required=False, action='store_true',
      help='Use dtrace\'s ustack to print function names')
  parser.add_argument('--cc1', required=False, action='store_true',
      help='Execute cc1 directly (don\'t profile the driver)')
  parser.add_argument('cmd', nargs='*', help='')

  # Use python's arg parser to handle all leading option arguments, but pass
  # everything else through to dtrace.
  first_cmd = next(arg for arg in args if not arg.startswith("--"))
  last_arg_idx = args.index(first_cmd)

  opts = parser.parse_args(args[:last_arg_idx])
  cmd = args[last_arg_idx:]

  if opts.cc1:
    cmd = get_cc1_command_for_args(cmd, test_env)

  if opts.use_oneshot:
    target = "oneshot$target:::entry"
  else:
    target = "pid$target:::entry"
  predicate = '%s/probemod=="%s"/' % (target, os.path.basename(cmd[0]))
  log_timestamp = 'printf("dtrace-TS: %d\\n", timestamp)'
  if opts.use_ustack:
    action = 'ustack(1);'
  else:
    action = 'printf("dtrace-Symbol: %s\\n", probefunc);'
  dtrace_script = "%s { %s; %s }" % (predicate, log_timestamp, action)

  dtrace_args = []
  if os.geteuid() != 0:
    print(
      'Script must be run as root, or you must add the following to your sudoers:\n'
      + '%admin ALL=(ALL) NOPASSWD: /usr/sbin/dtrace')
    dtrace_args.append("sudo")

  dtrace_args.extend((
      'dtrace', '-xevaltime=exec',
      '-xbufsize=%dm' % (opts.buffer_size),
      '-q', '-n', dtrace_script,
      '-c', ' '.join(cmd)))

  if sys.platform == "darwin":
    dtrace_args.append('-xmangled')

  start_time = time.time()

  with open("%d.dtrace" % os.getpid(), "w") as f:
    f.write("### Command: %s" % dtrace_args)
    subprocess.check_call(dtrace_args, stdout=f, stderr=subprocess.PIPE)

  elapsed = time.time() - start_time
  print("... data collection took %.4fs" % elapsed)

  return 0

def get_cc1_command_for_args(cmd, env):
  # Find the cc1 command used by the compiler. To do this we execute the
  # compiler with '-###' to figure out what it wants to do.
  cmd = cmd + ['-###']
  # Decode to text so the output splits cleanly on Python 3 as well.
  cc_output = subprocess.check_output(cmd, stderr=subprocess.STDOUT, env=env,
                                      universal_newlines=True).strip()
  cc_commands = []
  for ln in cc_output.split('\n'):
    # Filter out known garbage.
    if (ln == 'Using built-in specs.' or
        ln.startswith('Configured with:') or
        ln.startswith('Target:') or
        ln.startswith('Thread model:') or
        ln.startswith('InstalledDir:') or
        ln.startswith('LLVM Profile Note') or
        ' version ' in ln):
      continue
    cc_commands.append(ln)

  if len(cc_commands) != 1:
    print('Fatal error: unable to determine cc1 command: %r' % cc_output)
    sys.exit(1)

  cc1_cmd = shlex.split(cc_commands[0])
  if not cc1_cmd:
    print('Fatal error: unable to determine cc1 command: %r' % cc_output)
    sys.exit(1)

  return cc1_cmd

def cc1(args):
  parser = argparse.ArgumentParser(prog='perf-helper cc1',
      description='cc1 wrapper for order file generation')
  parser.add_argument('cmd', nargs='*', help='')

  # Use python's arg parser to handle all leading option arguments, but pass
  # everything else through to the compiler.
  first_cmd = next(arg for arg in args if not arg.startswith("--"))
  last_arg_idx = args.index(first_cmd)

  opts = parser.parse_args(args[:last_arg_idx])
  cmd = args[last_arg_idx:]

  # Clear the profile file env, so that we don't generate profdata
  # when capturing the cc1 command.
  cc1_env = test_env
  cc1_env["LLVM_PROFILE_FILE"] = os.devnull
  cc1_cmd = get_cc1_command_for_args(cmd, cc1_env)

  subprocess.check_call(cc1_cmd)
  return 0

def parse_dtrace_symbol_file(path, all_symbols, all_symbols_set,
                             missing_symbols, opts):
  def fix_mangling(symbol):
    if sys.platform == "darwin":
      if symbol[0] != '_' and symbol != 'start':
        symbol = '_' + symbol
    return symbol

  def get_symbols_with_prefix(symbol):
    start_index = bisect.bisect_left(all_symbols, symbol)
    for s in all_symbols[start_index:]:
      if not s.startswith(symbol):
        break
      yield s

  # Extract the list of symbols from the given file, which is assumed to be
  # the output of a dtrace run logging either probefunc or ustack(1) and
  # nothing else. The dtrace -xdemangle option needs to be used.
  #
  # This is particular to OS X at the moment, because of the '_' handling.
  with open(path) as f:
    current_timestamp = None
    for ln in f:
      # Drop leading and trailing whitespace.
      ln = ln.strip()
      if not ln.startswith("dtrace-"):
        continue

      # If this is a timestamp specifier, extract it.
      if ln.startswith("dtrace-TS: "):
        _,data = ln.split(': ', 1)
        if not data.isdigit():
          print("warning: unrecognized timestamp line %r, ignoring" % ln,
                file=sys.stderr)
          continue
        current_timestamp = int(data)
        continue
      elif ln.startswith("dtrace-Symbol: "):
        _,ln = ln.split(': ', 1)
        if not ln:
          continue

      # If there is a '`' in the line, assume it is a ustack(1) entry in
      # the form of <modulename>`<modulefunc>, where <modulefunc> is never
      # truncated (but does need the mangling patched).
      if '`' in ln:
        yield (current_timestamp, fix_mangling(ln.split('`',1)[1]))
        continue

      # Otherwise, assume this is a probefunc printout. DTrace on OS X
      # seems to have a bug where it prints the mangled version of symbols
      # which aren't C++ mangled. We just add a '_' to anything but start
      # which doesn't already have a '_'.
      symbol = fix_mangling(ln)

      # If we don't know all the symbols, or the symbol is one of them,
      # just return it.
      if not all_symbols_set or symbol in all_symbols_set:
        yield (current_timestamp, symbol)
        continue

      # Otherwise, we have a symbol name which isn't present in the
      # binary. We assume it is truncated, and try to extend it.

      # Get all the symbols with this prefix.
      possible_symbols = list(get_symbols_with_prefix(symbol))
      if not possible_symbols:
        continue

      # If we found too many possible symbols, ignore this as a prefix.
      if len(possible_symbols) > 100:
        print("warning: ignoring symbol %r " % symbol +
              "(no match and too many possible suffixes)", file=sys.stderr)
        continue

      # Report that we resolved a missing symbol.
      if opts.show_missing_symbols and symbol not in missing_symbols:
        print("warning: resolved missing symbol %r" % symbol, file=sys.stderr)
        missing_symbols.add(symbol)

      # Otherwise, treat all the possible matches as having occurred. This
      # is an over-approximation, but it should be ok in practice.
      for s in possible_symbols:
        yield (current_timestamp, s)

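# Yield the elements of 'items' in first-seen order, dropping duplicates.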
def uniq(items):
  seen = set()
  for item in items:
    if item not in seen:
      yield item
      seen.add(item)

def form_by_call_order(symbol_lists):
  # Simple strategy: just return symbols in order of occurrence, even across
  # multiple runs.
  return uniq(s for symbols in symbol_lists for s in symbols)

def form_by_call_order_fair(symbol_lists):
  # More complicated strategy that tries to respect the call order across all
  # of the test cases, instead of giving a huge preference to the first test
  # case.

  # First, uniq all the lists.
  uniq_lists = [list(uniq(symbols)) for symbols in symbol_lists]

  # Compute the successors for each list.
  succs = {}
  for symbols in uniq_lists:
    for a,b in zip(symbols[:-1], symbols[1:]):
      succs[a] = items = succs.get(a, [])
      if b not in items:
        items.append(b)

  # Emit all the symbols, but make sure to always emit all successors from any
  # call list whenever we see a symbol.
  #
  # There isn't much science here, but this sometimes works better than the
  # more naive strategy. Then again, sometimes it doesn't, so more research is
  # probably needed.
  return uniq(s
    for symbols in symbol_lists
    for node in symbols
    for s in ([node] + succs.get(node,[])))

def form_by_frequency(symbol_lists):
  # Form the order file by just putting the most commonly occurring symbols
  # first. This assumes the data files didn't use the oneshot dtrace method.

  counts = {}
  for symbols in symbol_lists:
    for a in symbols:
      counts[a] = counts.get(a,0) + 1

  by_count = sorted(counts.items(), key=lambda pair: -pair[1])
  return [s for s,n in by_count]

def form_by_random(symbol_lists):
  # Randomize the symbols. Materialize the generator first, since
  # random.shuffle needs a mutable sequence.
  merged_symbols = list(uniq(s for symbols in symbol_lists
                             for s in symbols))
  random.shuffle(merged_symbols)
  return merged_symbols

def form_by_alphabetical(symbol_lists):
  # Alphabetize the symbols.
  merged_symbols = list(set(s for symbols in symbol_lists for s in symbols))
  merged_symbols.sort()
  return merged_symbols

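# Collect the available generation strategies by name: every form_by_<name>
# function above is exposed as the method '<name>' (e.g. 'frequency').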
methods = dict((name[len("form_by_"):],value)
    for name,value in locals().items() if name.startswith("form_by_"))

def genOrderFile(args):
  parser = argparse.ArgumentParser(prog='perf-helper gen-order-file',
      usage='%(prog)s [options] <dtrace data file directories>')
  parser.add_argument('input', nargs='+', help='')
  parser.add_argument("--binary", metavar="PATH", type=str, dest="binary_path",
      help="Path to the binary being ordered (for getting all symbols)",
      default=None)
  parser.add_argument("--output", dest="output_path",
      help="path to output order file to write", default=None, required=True,
      metavar="PATH")
  parser.add_argument("--show-missing-symbols", dest="show_missing_symbols",
      help="show symbols which are 'fixed up' to a valid name (requires --binary)",
      action="store_true", default=None)
  parser.add_argument("--output-unordered-symbols",
      dest="output_unordered_symbols_path",
      help="write a list of the unordered symbols to PATH (requires --binary)",
      default=None, metavar="PATH")
  parser.add_argument("--method", dest="method",
      help="order file generation method to use", choices=methods.keys(),
      default='call_order')
  opts = parser.parse_args(args)

  # If the user gave us a binary, get all the symbols in the binary by
  # snarfing 'nm' output.
  if opts.binary_path is not None:
    output = subprocess.check_output(['nm', '-P', opts.binary_path],
                                     universal_newlines=True)
    lines = output.split("\n")
    all_symbols = [ln.split(' ',1)[0]
                   for ln in lines
                   if ln.strip()]
    print("found %d symbols in binary" % len(all_symbols))
    all_symbols.sort()
  else:
    all_symbols = []
  all_symbols_set = set(all_symbols)

  # Compute the list of input files.
  input_files = []
  for dirname in opts.input:
    input_files.extend(findFilesWithExtension(dirname, "dtrace"))

  # Load all of the input files.
  print("loading from %d data files" % len(input_files))
  missing_symbols = set()
  timestamped_symbol_lists = [
    list(parse_dtrace_symbol_file(path, all_symbols, all_symbols_set,
                                  missing_symbols, opts))
    for path in input_files]

  # Reorder each symbol list.
  symbol_lists = []
  for timestamped_symbols_list in timestamped_symbol_lists:
    timestamped_symbols_list.sort()
    symbol_lists.append([symbol for _,symbol in timestamped_symbols_list])

  # Execute the desired order file generation method.
  method = methods.get(opts.method)
  result = list(method(symbol_lists))

  # Report to the user on what percentage of symbols are present in the order
  # file.
  num_ordered_symbols = len(result)
  if all_symbols:
    print("note: order file contains %d/%d symbols (%.2f%%)" % (
      num_ordered_symbols, len(all_symbols),
      100.*num_ordered_symbols/len(all_symbols)), file=sys.stderr)

  if opts.output_unordered_symbols_path:
    ordered_symbols_set = set(result)
    with open(opts.output_unordered_symbols_path, 'w') as f:
      f.write("\n".join(s for s in all_symbols if s not in ordered_symbols_set))

  # Write the order file.
  with open(opts.output_path, 'w') as f:
    f.write("\n".join(result))
    f.write("\n")

  return 0

commands = {'clean' : clean,
            'merge' : merge,
            'dtrace' : dtrace,
            'cc1' : cc1,
            'gen-order-file' : genOrderFile}

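# Example invocations (the first argument selects a subcommand from the table
# above; the remaining arguments follow each subcommand's usage string):
#   perf-helper.py clean <path> <extension>
#   perf-helper.py merge <llvm-profdata> <output> <path>
#   perf-helper.py gen-order-file --output <order-file> <dtrace-data-dir>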
def main():
  if len(sys.argv) < 2 or sys.argv[1] not in commands:
    print('Usage: %s <%s> ...' % (__file__, '|'.join(sorted(commands))),
          file=sys.stderr)
    sys.exit(1)
  f = commands[sys.argv[1]]
  sys.exit(f(sys.argv[2:]))

if __name__ == '__main__':
  main()