#===- perf-helper.py - Clang Python Bindings -----------------*- python -*--===#
#
#                     The LLVM Compiler Infrastructure
#
# This file is distributed under the University of Illinois Open Source
# License. See LICENSE.TXT for details.
#
#===------------------------------------------------------------------------===#
 | 
						|
 | 
						|
from __future__ import print_function

import argparse
import bisect
import os
import random
import shlex
import subprocess
import sys
import tempfile
import time
 | 
						|
 | 
						|
# Minimal environment handed to compiler sub-processes: only PATH is carried
# over from the invoking environment.
test_env = dict(PATH=os.environ['PATH'])
 | 
						|
 | 
						|
def findFilesWithExtension(path, extension):
  """Recursively collect files under `path` whose name ends with `extension`.

  The match is a plain suffix test on the file name (no '.' is implied), and
  each result is the directory reported by os.walk joined with the file name.
  """
  return [os.path.join(parent, name)
          for parent, _subdirs, names in os.walk(path)
          for name in names
          if name.endswith(extension)]
 | 
						|
 | 
						|
def clean(args):
  """Handle the 'clean' sub-command: delete files matching an extension.

  `args` must be [<path>, <extension>]; every file under <path> whose name
  ends with <extension> is removed. Returns 0 on success, or prints a usage
  message and returns 1 when the argument count is wrong.
  """
  if len(args) == 2:
    root, extension = args
    for victim in findFilesWithExtension(root, extension):
      os.remove(victim)
    return 0

  usage = 'Usage: %s clean <path> <extension>\n' % __file__
  print(usage + '\tRemoves all files with extension from <path>.')
  return 1
 | 
						|
 | 
						|
def merge(args):
  """Handle the 'merge' sub-command: merge raw profiles with llvm-profdata.

  `args` must be [<llvm-profdata>, <output>, <path>]. Every file under <path>
  whose name ends with "profraw" is passed to `<llvm-profdata> merge -o
  <output>`. Returns 0 on success, or prints a usage message and returns 1
  when the argument count is wrong. subprocess.CalledProcessError propagates
  if the tool exits with a non-zero status.
  """
  if len(args) != 3:
    # The usage line previously advertised the 'clean' sub-command here.
    print('Usage: %s merge <llvm-profdata> <output> <path>\n' % __file__ +
      '\tMerges all profraw files from path into output.')
    return 1
  cmd = [args[0], 'merge', '-o', args[1]]
  cmd.extend(findFilesWithExtension(args[2], "profraw"))
  subprocess.check_call(cmd)
  return 0
 | 
						|
 | 
						|
def dtrace(args):
  """Handle the 'dtrace' sub-command: trace a command's function entries.

  Leading arguments that start with "--" are parsed as options of this
  wrapper; everything from the first other argument onwards is the command
  to run under dtrace. Because of that split, an option value has to be
  attached with '=' (e.g. --buffer-size=4): a separate value would be taken
  as the start of the command.

  dtrace's stdout is written to "<pid>.dtrace" in the current directory,
  where <pid> is this process's pid. Returns 0 on success;
  subprocess.CalledProcessError propagates if dtrace fails.
  """
  parser = argparse.ArgumentParser(prog='perf-helper dtrace',
    description='dtrace wrapper for order file generation')
  parser.add_argument('--buffer-size', metavar='size', type=int, required=False,
    default=1, help='dtrace buffer size in MB (default 1)')
  parser.add_argument('--use-oneshot', required=False, action='store_true',
    help='Use dtrace\'s oneshot probes')
  parser.add_argument('--use-ustack', required=False, action='store_true',
    help='Use dtrace\'s ustack to print function names')
  parser.add_argument('--cc1', required=False, action='store_true',
    help='Execute cc1 directly (don\'t profile the driver)')
  parser.add_argument('cmd', nargs='*', help='')

  # Use python's arg parser to handle all leading option arguments, but pass
  # everything else through to dtrace.
  last_arg_idx = next(
    (idx for idx, arg in enumerate(args) if not arg.startswith("--")),
    len(args))

  opts = parser.parse_args(args[:last_arg_idx])
  cmd = args[last_arg_idx:]
  if not cmd:
    # Report a usage error instead of leaking StopIteration/IndexError.
    parser.error('no command given to trace')

  if opts.cc1:
    cmd = get_cc1_command_for_args(cmd, test_env)

  if opts.use_oneshot:
    target = "oneshot$target:::entry"
  else:
    target = "pid$target:::entry"
  # Only fire for probes whose module matches the traced executable's name.
  predicate = '%s/probemod=="%s"/' % (target, os.path.basename(cmd[0]))
  log_timestamp = 'printf("dtrace-TS: %d\\n", timestamp)'
  if opts.use_ustack:
    action = 'ustack(1);'
  else:
    action = 'printf("dtrace-Symbol: %s\\n", probefunc);'
  dtrace_script = "%s { %s; %s }" % (predicate, log_timestamp, action)

  dtrace_args = []
  if not os.geteuid() == 0:
    # This string is not %-formatted, so the sudoers group is spelled with a
    # single '%'; the rule goes on its own line so it can be copied verbatim.
    print(
      'Script must be run as root, or you must add the following to your sudoers:\n'
      + '%admin ALL=(ALL) NOPASSWD: /usr/sbin/dtrace')
    dtrace_args.append("sudo")

  dtrace_args.extend((
      'dtrace', '-xevaltime=exec',
      '-xbufsize=%dm' % (opts.buffer_size),
      '-q', '-n', dtrace_script,
      '-c', ' '.join(cmd)))

  if sys.platform == "darwin":
    dtrace_args.append('-xmangled')

  start_time = time.time()

  with open("%d.dtrace" % os.getpid(), "w") as f, \
       open(os.devnull, "w") as devnull:
    # Terminate and flush the header before the child starts writing to the
    # same file descriptor, so it stays on its own line ahead of the data.
    f.write("### Command: %s\n" % dtrace_args)
    f.flush()
    # stderr is discarded as before, but via the null device: a PIPE that is
    # never read can fill up and block the child.
    subprocess.check_call(dtrace_args, stdout=f, stderr=devnull)

  elapsed = time.time() - start_time
  print("... data collection took %.4fs" % elapsed)

  return 0
 | 
						|
 | 
						|
def get_cc1_command_for_args(cmd, env):
  """Return the single command the compiler driver `cmd` would execute.

  The driver is run with '-###' appended and with `env` as its environment;
  its combined stdout/stderr is scanned, known informational lines are
  dropped, and the one remaining line is split shell-style into an argument
  list. If the output does not reduce to exactly one non-empty command, an
  error is printed and the process exits with status 1.
  subprocess.CalledProcessError propagates if the driver itself fails.
  """
  # Find the cc1 command used by the compiler. To do this we execute the
  # compiler with '-###' to figure out what it wants to do.
  # universal_newlines=True makes check_output return text on Python 3 (it is
  # harmless on Python 2), so the str-based splitting below keeps working.
  cc_output = subprocess.check_output(
    cmd + ['-###'], stderr=subprocess.STDOUT, env=env,
    universal_newlines=True).strip()

  # Filter out known garbage.
  noise_prefixes = ('Configured with:', 'Target:', 'Thread model:',
                    'InstalledDir:', 'LLVM Profile Note')
  cc_commands = [ln for ln in cc_output.split('\n')
                 if not (ln == 'Using built-in specs.' or
                         ln.startswith(noise_prefixes) or
                         ' version ' in ln)]

  if len(cc_commands) != 1:
    print('Fatal error: unable to determine cc1 command: %r' % cc_output)
    # sys.exit rather than the site-provided exit(), which is not guaranteed
    # to exist in every interpreter configuration.
    sys.exit(1)

  cc1_cmd = shlex.split(cc_commands[0])
  if not cc1_cmd:
    print('Fatal error: unable to determine cc1 command: %r' % cc_output)
    sys.exit(1)

  return cc1_cmd
 | 
						|
 | 
						|
def cc1(args):
  """Handle the 'cc1' sub-command: run a compile as its bare cc1 command.

  Leading arguments that start with "--" are handed to argparse (so --help
  works and unknown options are rejected); everything from the first other
  argument onwards is the compiler driver command. The driver is queried for
  the command it would run, and that command is then executed directly.
  Returns 0 on success; subprocess.CalledProcessError propagates on failure.
  """
  parser = argparse.ArgumentParser(prog='perf-helper cc1',
    description='cc1 wrapper for order file generation')
  parser.add_argument('cmd', nargs='*', help='')

  # Use python's arg parser to handle all leading option arguments, but pass
  # everything else through to the compiler.
  last_arg_idx = next(
    (idx for idx, arg in enumerate(args) if not arg.startswith("--")),
    len(args))

  # No options are defined besides --help, so the result is not needed.
  parser.parse_args(args[:last_arg_idx])
  cmd = args[last_arg_idx:]
  if not cmd:
    # Report a usage error instead of leaking StopIteration.
    parser.error('no compiler command given')

  # clear the profile file env, so that we don't generate profdata
  # when capturing the cc1 command. Work on a copy so the module-level
  # test_env is not modified as a side effect.
  cc1_env = dict(test_env)
  cc1_env["LLVM_PROFILE_FILE"] = os.devnull
  cc1_cmd = get_cc1_command_for_args(cmd, cc1_env)

  subprocess.check_call(cc1_cmd)
  return 0
 | 
						|
 | 
						|
def parse_dtrace_symbol_file(path, all_symbols, all_symbols_set,
                             missing_symbols, opts):
  """Yield (timestamp, symbol) pairs parsed from one dtrace log file.

  Only lines starting with "dtrace-" are considered. A "dtrace-TS: <digits>"
  line sets the timestamp attached to the symbols that follow it (None until
  the first valid one is seen); a "dtrace-Symbol: <name>" line produces one
  or more pairs.

  path            -- log file to read.
  all_symbols     -- sorted list of the binary's symbols (searched with
                     bisect); may be empty.
  all_symbols_set -- the same symbols as a set; when empty, every probefunc
                     name is accepted as-is.
  missing_symbols -- set updated with names that had to be resolved by
                     prefix, when opts.show_missing_symbols is set.
  opts            -- object providing the show_missing_symbols attribute.
  """
  def fix_mangling(symbol):
    # On darwin, add the leading '_' to anything but 'start' which doesn't
    # already have one. startswith() keeps this safe for any input.
    if sys.platform == "darwin":
      if not symbol.startswith('_') and symbol != 'start':
        symbol = '_' + symbol
    return symbol

  def get_symbols_with_prefix(symbol):
    # all_symbols is sorted, so every name sharing the prefix is contiguous
    # starting at the bisect insertion point.
    start_index = bisect.bisect_left(all_symbols, symbol)
    for s in all_symbols[start_index:]:
      if not s.startswith(symbol):
        break
      yield s

  # Extract the list of symbols from the given file, which is assumed to be
  # the output of a dtrace run logging either probefunc or ustack(1) and
  # nothing else.
  # NOTE(review): this comment used to say the dtrace -xdemangle option needs
  # to be used, while dtrace() in this file passes -xmangled on darwin --
  # confirm which is intended.
  #
  # This is particular to OS X at the moment, because of the '_' handling.
  with open(path) as f:
    current_timestamp = None
    for ln in f:
      # Drop leading and trailing whitespace.
      ln = ln.strip()
      if not ln.startswith("dtrace-"):
        continue

      # If this is a timestamp specifier, extract it.
      if ln.startswith("dtrace-TS: "):
        _, data = ln.split(': ', 1)
        if not data.isdigit():
          print("warning: unrecognized timestamp line %r, ignoring" % ln,
            file=sys.stderr)
          continue
        current_timestamp = int(data)
        continue

      if not ln.startswith("dtrace-Symbol: "):
        continue

      _, ln = ln.split(': ', 1)
      if not ln:
        continue

      # If there is a '`' in the line, assume it is a ustack(1) entry in
      # the form of <modulename>`<modulefunc>, where <modulefunc> is never
      # truncated (but does need the mangling patched).
      if '`' in ln:
        func = ln.split('`', 1)[1]
        # Nothing after the backtick: there is no symbol to report.
        if not func:
          continue
        yield (current_timestamp, fix_mangling(func))
        continue

      # Otherwise, assume this is a probefunc printout. DTrace on OS X
      # seems to have a bug where it prints the mangled version of symbols
      # which aren't C++ mangled. We just add a '_' to anything but start
      # which doesn't already have a '_'.
      symbol = fix_mangling(ln)

      # If we don't know all the symbols, or the symbol is one of them,
      # just return it.
      if not all_symbols_set or symbol in all_symbols_set:
        yield (current_timestamp, symbol)
        continue

      # Otherwise, we have a symbol name which isn't present in the
      # binary. We assume it is truncated, and try to extend it.

      # Get all the symbols with this prefix.
      possible_symbols = list(get_symbols_with_prefix(symbol))
      if not possible_symbols:
        continue

      # If we found too many possible symbols, ignore this as a prefix.
      if len(possible_symbols) > 100:
        print("warning: ignoring symbol %r " % symbol +
          "(no match and too many possible suffixes)", file=sys.stderr)
        continue

      # Report that we resolved a missing symbol.
      if opts.show_missing_symbols and symbol not in missing_symbols:
        print("warning: resolved missing symbol %r" % symbol, file=sys.stderr)
        missing_symbols.add(symbol)

      # Otherwise, treat all the possible matches as having occurred. This
      # is an over-approximation, but it should be ok in practice.
      for s in possible_symbols:
        yield (current_timestamp, s)
 | 
						|
 | 
						|
def uniq(list):
  """Lazily yield the items of `list` in order, skipping repeats.

  Accepts any iterable of hashable items; the first occurrence of each item
  is the one that is kept.
  """
  emitted = set()
  for candidate in list:
    if candidate in emitted:
      continue
    yield candidate
    emitted.add(candidate)
 | 
						|
 | 
						|
def form_by_call_order(symbol_lists):
  """Order symbols by first occurrence across all runs.

  Simple strategy: the lists are walked one after another and each symbol is
  emitted the first time it is seen. Returns a lazy iterator.
  """
  def every_symbol():
    for run in symbol_lists:
      for name in run:
        yield name

  return uniq(every_symbol())
 | 
						|
 | 
						|
def form_by_call_order_fair(symbol_lists):
  """Order symbols by call order while pulling in each symbol's successors.

  More complicated strategy that tries to respect the call order across all
  of the test cases, instead of giving a huge preference to the first test
  case. Returns a lazy iterator.
  """
  # For every symbol, record which symbols directly follow it in any of the
  # de-duplicated runs, in the order those followers were first observed.
  followers = {}
  for run in symbol_lists:
    deduped = list(uniq(run))
    for here, after in zip(deduped, deduped[1:]):
      bucket = followers.setdefault(here, [])
      if after not in bucket:
        bucket.append(after)

  # Emit all the symbols, but make sure to always emit all successors from any
  # call list whenever we see a symbol.
  #
  # There isn't much science here, but this sometimes works better than the
  # more naive strategy. Then again, sometimes it doesn't so more research is
  # probably needed.
  return uniq(emitted
    for run in symbol_lists
    for node in run
    for emitted in [node] + followers.get(node, []))
 | 
						|
 
 | 
						|
def form_by_frequency(symbol_lists):
  """Return the symbols ordered from most to least frequently seen.

  Form the order file by just putting the most commonly occurring symbols
  first. This assumes the data files didn't use the oneshot dtrace method.
  Symbols with equal counts keep the dictionary's iteration order (the sort
  is stable).
  """
  counts = {}
  for symbols in symbol_lists:
    for a in symbols:
      counts[a] = counts.get(a, 0) + 1

  # sorted() with an index-based key works on both Python 2 and 3; the
  # tuple-unpacking lambda and in-place sort of items() only work on 2.
  by_count = sorted(counts.items(), key=lambda item: -item[1])
  return [s for s, _ in by_count]
 | 
						|
 
 | 
						|
def form_by_random(symbol_lists):
  """Return every distinct symbol once, in random order."""
  # Randomize the symbols. uniq() is a generator, so it is materialised into
  # a list first: random.shuffle needs a mutable sequence to shuffle in place.
  merged_symbols = list(uniq(s for symbols in symbol_lists
                               for s in symbols))
  random.shuffle(merged_symbols)
  return merged_symbols
 | 
						|
 
 | 
						|
def form_by_alphabetical(symbol_lists):
  """Return every distinct symbol once, sorted alphabetically."""
  distinct = set()
  for run in symbol_lists:
    distinct.update(run)
  return sorted(distinct)
 | 
						|
 | 
						|
# Registry of order-file generation strategies: every name bound at this point
# in the module that starts with "form_by_" is registered under the remainder
# of its name (e.g. form_by_call_order -> "call_order"). It must therefore
# stay below the form_by_* definitions it is meant to pick up.
methods = dict((name[len("form_by_"):],value)
  for name,value in locals().items() if name.startswith("form_by_"))
 | 
						|
 | 
						|
def genOrderFile(args):
  """Handle the 'gen-order-file' sub-command: build an order file.

  Reads every file ending in "dtrace" under the given input directories,
  orders the symbols found in them with the strategy chosen by --method, and
  writes one symbol per line to --output. When --binary is given, the
  binary's symbol list (from `nm -P`) is used to validate and complete
  symbol names and to report coverage. Returns 0 on success.
  """
  # Name the program the same way the other sub-commands do; the previous
  # value was an optparse-style "%prog" usage string, which argparse prints
  # verbatim.
  parser = argparse.ArgumentParser(prog='perf-helper gen-order-file',
    description='Generate an order file from dtrace data file directories')
  parser.add_argument('input', nargs='+', help='')
  parser.add_argument("--binary", metavar="PATH", type=str, dest="binary_path",
    help="Path to the binary being ordered (for getting all symbols)",
    default=None)
  parser.add_argument("--output", dest="output_path",
    help="path to output order file to write", default=None, required=True,
    metavar="PATH")
  parser.add_argument("--show-missing-symbols", dest="show_missing_symbols",
    help="show symbols which are 'fixed up' to a valid name (requires --binary)",
    action="store_true", default=None)
  parser.add_argument("--output-unordered-symbols",
    dest="output_unordered_symbols_path",
    help="write a list of the unordered symbols to PATH (requires --binary)",
    default=None, metavar="PATH")
  # sorted() gives the help text a stable order.
  parser.add_argument("--method", dest="method",
    help="order file generation method to use", choices=sorted(methods),
    default='call_order')
  opts = parser.parse_args(args)

  # If the user gave us a binary, get all the symbols in the binary by
  # snarfing 'nm' output.
  if opts.binary_path is not None:
    # universal_newlines=True yields text on Python 3 as well as Python 2.
    output = subprocess.check_output(['nm', '-P', opts.binary_path],
                                     universal_newlines=True)
    lines = output.split("\n")
    # The symbol name is the first space-separated field of each line.
    all_symbols = [ln.split(' ', 1)[0]
                   for ln in lines
                   if ln.strip()]
    print("found %d symbols in binary" % len(all_symbols))
    # parse_dtrace_symbol_file bisects this list, so it must be sorted.
    all_symbols.sort()
  else:
    all_symbols = []
  all_symbols_set = set(all_symbols)

  # Compute the list of input files.
  input_files = []
  for dirname in opts.input:
    input_files.extend(findFilesWithExtension(dirname, "dtrace"))

  # Load all of the input files.
  print("loading from %d data files" % len(input_files))
  missing_symbols = set()
  timestamped_symbol_lists = [
      list(parse_dtrace_symbol_file(path, all_symbols, all_symbols_set,
                                    missing_symbols, opts))
      for path in input_files]

  # Reorder each symbol list by (timestamp, symbol). Entries seen before any
  # timestamp carry None; the key sorts those first (the Python 2 ordering)
  # without comparing None to an int, which Python 3 rejects.
  def timestamp_order(entry):
    timestamp, symbol = entry
    return (timestamp is not None, timestamp or 0, symbol)

  symbol_lists = []
  for timestamped_symbols_list in timestamped_symbol_lists:
    timestamped_symbols_list.sort(key=timestamp_order)
    symbol_lists.append([symbol for _, symbol in timestamped_symbols_list])

  # Execute the desired order file generation method.
  method = methods.get(opts.method)
  result = list(method(symbol_lists))

  # Report to the user on what percentage of symbols are present in the order
  # file.
  num_ordered_symbols = len(result)
  if all_symbols:
    print("note: order file contains %d/%d symbols (%.2f%%)" % (
      num_ordered_symbols, len(all_symbols),
      100.*num_ordered_symbols/len(all_symbols)), file=sys.stderr)

  if opts.output_unordered_symbols_path:
    ordered_symbols_set = set(result)
    with open(opts.output_unordered_symbols_path, 'w') as f:
      f.write("\n".join(s for s in all_symbols if s not in ordered_symbols_set))

  # Write the order file.
  with open(opts.output_path, 'w') as f:
    f.write("\n".join(result))
    f.write("\n")

  return 0
 | 
						|
 | 
						|
# Sub-command name (as given in sys.argv[1]) -> handler. main() calls the
# handler with the remaining command-line arguments and exits with its result.
commands = {
  'clean': clean,
  'merge': merge,
  'dtrace': dtrace,
  'cc1': cc1,
  'gen-order-file': genOrderFile,
}
 | 
						|
 | 
						|
def main():
  """Dispatch to the sub-command named by the first command-line argument.

  The handler receives the remaining arguments and its return value becomes
  the process exit status. A missing or unknown sub-command prints a usage
  message listing the available ones and exits with status 1.
  """
  if len(sys.argv) < 2 or sys.argv[1] not in commands:
    print('Usage: %s <command> [args...]\n' % __file__ +
      '\tAvailable commands: %s' % ', '.join(sorted(commands)),
      file=sys.stderr)
    sys.exit(1)
  f = commands[sys.argv[1]]
  sys.exit(f(sys.argv[2:]))
 | 
						|
 | 
						|
# Run the command dispatcher only when this file is executed as a script, not
# when it is imported as a module.
if __name__ == '__main__':
  main()
 |