aboutsummaryrefslogtreecommitdiff
path: root/binary_search_tool/bisect_driver.py
diff options
context:
space:
mode:
authorCassidy Burden <cburden@google.com>2016-07-25 11:23:13 -0700
committerchrome-bot <chrome-bot@chromium.org>2016-07-29 09:38:04 -0700
commit28683f7dacd94801e9a0d4b28e5aa8a700fc3d6f (patch)
tree2c815155b590dc6779206e44b8965aa877ff234d /binary_search_tool/bisect_driver.py
parentf67b68da6d8ed5e8e84409a1c78be4d457e792b4 (diff)
downloadtoolchain-utils-28683f7dacd94801e9a0d4b28e5aa8a700fc3d6f.tar.gz
binary search tool: Add compiler wrapper for Android bisection
Add compiler wrapper similar to ChromeOS object bisector's compiler wrapper. bisect_driver.py is a modified version of bisect.py from the ChromeOS sysroot_wrapper. compiler_wrapper.py is a simple skeleton script used to invoke bisect_driver, and it is meant to be replaced by a more robust compiler wrapper. TEST=Populated android objects and triaged CQ-DEPEND=CL:*270730 Change-Id: I4dfc676f6b659c2da8dbd01fd858c477ffbdeb9f Reviewed-on: https://chrome-internal-review.googlesource.com/270783 Commit-Ready: Cassidy Burden <cburden@google.com> Tested-by: Cassidy Burden <cburden@google.com> Reviewed-by: Luis Lozano <llozano@chromium.org>
Diffstat (limited to 'binary_search_tool/bisect_driver.py')
-rw-r--r--binary_search_tool/bisect_driver.py266
1 files changed, 266 insertions, 0 deletions
diff --git a/binary_search_tool/bisect_driver.py b/binary_search_tool/bisect_driver.py
new file mode 100644
index 00000000..6c4d406c
--- /dev/null
+++ b/binary_search_tool/bisect_driver.py
@@ -0,0 +1,266 @@
+# Copyright 2016 Google Inc. All Rights Reserved.
+#
+# This script is used to help the compiler wrapper in the Android build system
+# bisect for bad object files.
+
+"""Utilities for bisection of Android object files.
+
+This module contains a set of utilities to allow bisection between
+two sets (good and bad) of object files. Mostly used to find compiler
+bugs.
+
+Design doc:
+https://docs.google.com/document/d/1yDgaUIa2O5w6dc3sSTe1ry-1ehKajTGJGQCbyn0fcEM
+"""
+
+from __future__ import print_function
+
+import os
+import shutil
+import subprocess
+import sys
+
+VALID_MODES = ['POPULATE_GOOD', 'POPULATE_BAD', 'TRIAGE']
+DEP_CACHE = 'dep'
+GOOD_CACHE = 'good'
+BAD_CACHE = 'bad'
+LIST_FILE = os.path.join(GOOD_CACHE, '_LIST')
+
+CONTINUE_ON_MISSING = os.environ.get('BISECT_CONTINUE_ON_MISSING', None) == '1'
+
+
+class Error(Exception):
+ """The general compiler wrapper error class."""
+ pass
+
+
+def log_to_file(path, execargs, link_from=None, link_to=None):
+ """Common logging function.
+
+ Log current working directory, current execargs, and a from-to relationship
+ between files.
+ """
+ with open(path, 'a') as log:
+ log.write('cd: %s; %s\n' % (os.getcwd(), ' '.join(execargs)))
+ if link_from and link_to:
+ log.write('%s -> %s\n' % (link_from, link_to))
+
+
+def exec_and_return(execargs):
+ """Execute process and return.
+
+ Execute according to execargs and return immediately. Don't inspect
+ stderr or stdout.
+ """
+ return subprocess.call(execargs)
+
+
+def in_bad_set(obj_file):
+ """Check if object file is in bad set.
+
+ The binary search tool creates two files for each search iteration listing
+ the full set of bad objects and full set of good objects. We use this to
+ determine where an object file should be linked from (good or bad).
+ """
+ bad_set_file = os.environ.get('BISECT_BAD_SET')
+ ret = subprocess.call(['grep', '-x', '-q', obj_file, bad_set_file])
+ return ret == 0
+
+
+def makedirs(path):
+ """Try to create directories in path."""
+ try:
+ os.makedirs(path)
+ except os.error:
+ if not os.path.isdir(path):
+ raise
+
+
+def get_obj_path(execargs):
+ """Get the object path for the object file in the list of arguments.
+
+ Returns:
+ Tuple of object path from execution args (-o argument) and full object
+ path. If no object being outputted or output doesn't end in ".o" then return
+ empty strings.
+ """
+ try:
+ i = execargs.index('-o')
+ except ValueError:
+ return "", ""
+
+ obj_path = execargs[i+1]
+ if not obj_path.endswith(('.o',)):
+ # TODO: what suffixes do we need to contemplate
+ # TODO: add this as a warning
+ # TODO: need to handle -r compilations
+ return "", ""
+
+ return obj_path, os.path.join(os.getcwd(), obj_path)
+
+
+def get_dep_path(execargs):
+ """Get the dep file path for the dep file in the list of arguments.
+
+ Returns:
+ Tuple of dependency file path from execution args (-o argument) and full
+ dependency file path. If no dependency being outputted then return empty
+ strings.
+ """
+ try:
+ i = execargs.index('-MF')
+ except ValueError:
+ return "", ""
+
+ dep_path = execargs[i+1]
+ return dep_path, os.path.join(os.getcwd(), dep_path)
+
+
+def in_object_list(obj_name, list_filename):
+ """Check if object file name exist in file with object list."""
+ if not obj_name:
+ return False
+
+ with open(list_filename, 'r') as list_file:
+ for line in list_file:
+ if line.strip() == obj_name:
+ return True
+
+ return False
+
+
+def generate_side_effects(execargs, bisect_dir):
+ """Generate compiler side effects.
+
+ Generate and cache side effects so that we can trick make into thinking
+ the compiler is actually called during triaging.
+ """
+ # TODO(cburden): Cache .dwo files
+
+ # Cache dependency files
+ dep_path, _ = get_dep_path(execargs)
+ if not dep_path:
+ return
+
+ bisect_path = os.path.join(bisect_dir, DEP_CACHE, dep_path)
+ bisect_path_dir = os.path.dirname(bisect_path)
+ makedirs(bisect_path_dir)
+ pop_log = os.path.join(bisect_dir, DEP_CACHE, '_POPULATE_LOG')
+ log_to_file(pop_log, execargs, link_from=dep_path, link_to=bisect_path)
+
+ try:
+ if os.path.exists(dep_path):
+ shutil.copy2(dep_path, bisect_path)
+ except Exception:
+ print('Could not get dep file', file=sys.stderr)
+ raise
+
+
+def bisect_populate(execargs, bisect_dir, population_name):
+ """Add necessary information to the bisect cache for the given execution.
+
+ Extract the necessary information for bisection from the compiler
+ execution arguments and put it into the bisection cache. This
+ includes copying the created object file, adding the object
+ file path to the cache list and keeping a log of the execution.
+
+ Args:
+ execargs: compiler execution arguments.
+ bisect_dir: bisection directory.
+ population_name: name of the cache being populated (good/bad).
+ """
+ retval = exec_and_return(execargs)
+ if retval:
+ return retval
+
+ population_dir = os.path.join(bisect_dir, population_name)
+ makedirs(population_dir)
+ pop_log = os.path.join(population_dir, '_POPULATE_LOG')
+ log_to_file(pop_log, execargs)
+
+ obj_path, _ = get_obj_path(execargs)
+ if not obj_path:
+ return
+
+ bisect_path = os.path.join(population_dir, obj_path)
+ bisect_path_dir = os.path.dirname(bisect_path)
+ makedirs(bisect_path_dir)
+
+ try:
+ if os.path.exists(obj_path):
+ shutil.copy2(obj_path, bisect_path)
+ # Set cache object to be read-only so later compilations can't
+ # accidentally overwrite it.
+ os.chmod(bisect_path, 0444)
+ except Exception:
+ print('Could not populate bisect cache', file=sys.stderr)
+ raise
+
+ with open(os.path.join(population_dir, '_LIST'), 'a') as object_list:
+ object_list.write('%s\n' % obj_path)
+
+ # Cache the side effects generated by good compiler
+ if population_name == GOOD_CACHE:
+ generate_side_effects(execargs, bisect_dir)
+
+
+def bisect_triage(execargs, bisect_dir):
+ obj_path, _ = get_obj_path(execargs)
+ obj_list = os.path.join(bisect_dir, LIST_FILE)
+
+ # If the output isn't an object file just call compiler
+ if not obj_path:
+ return exec_and_return(execargs)
+
+ # If this isn't a bisected object just call compiler
+ # This shouldn't happen!
+ if not in_object_list(obj_path, obj_list):
+ if CONTINUE_ON_MISSING:
+ log_file = os.path.join(bisect_dir, '_MISSING_CACHED_OBJ_LOG')
+ log_to_file(log_file, execargs, link_from='? compiler', link_to=obj_path)
+ return exec_and_return(execargs)
+ else:
+ raise Error(('%s is missing from cache! To ignore export '
+ 'BISECT_CONTINUE_ON_MISSING=1. See documentation for more '
+ 'details on this option.' % obj_path))
+
+ # Generate compiler side effects. Trick Make into thinking compiler was
+ # actually executed.
+
+ # If dependency is generated from this call, link it from dependency cache
+ dep_path, full_dep_path = get_dep_path(execargs)
+ if dep_path:
+ cached_dep_path = os.path.join(bisect_dir, DEP_CACHE, dep_path)
+ if os.path.exists(cached_dep_path):
+ if os.path.exists(full_dep_path):
+ os.remove(full_dep_path)
+ os.link(cached_dep_path, full_dep_path)
+ else:
+ raise Error(('%s is missing from dependency cache! Unsure how to '
+ 'proceed. Make will now crash.' % cached_dep_path))
+
+ # If generated object file happened to be pruned/cleaned by Make then link it
+ # over from cache again.
+ if not os.path.exists(obj_path):
+ cache = BAD_CACHE if in_bad_set(obj_path) else GOOD_CACHE
+ cached_obj_path = os.path.join(bisect_dir, cache, obj_path)
+ if os.path.exists(cached_obj_path):
+ os.link(cached_obj_path, obj_path)
+ else:
+ raise Error('%s does not exist in %s cache' % (obj_path, cache))
+
+ # This is just used for debugging and stats gathering
+ log_file = os.path.join(bisect_dir, '_MISSING_OBJ_LOG')
+ log_to_file(log_file, execargs, link_from=cached_obj_path, link_to=obj_path)
+
+
+def bisect_driver(bisect_stage, bisect_dir, execargs):
+ """Call appropriate bisection stage according to value in bisect_stage."""
+ if bisect_stage == 'POPULATE_GOOD':
+ bisect_populate(execargs, bisect_dir, GOOD_CACHE)
+ elif bisect_stage == 'POPULATE_BAD':
+ bisect_populate(execargs, bisect_dir, BAD_CACHE)
+ elif bisect_stage == 'TRIAGE':
+ bisect_triage(execargs, bisect_dir)
+ else:
+ raise ValueError('wrong value for BISECT_STAGE: %s' % bisect_stage)