Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(746)

Unified Diff: tools/findit/findit_for_clusterfuzz.py

Issue 468823003: [Findit] findit algorithms and a cluster-fuzz implementation. (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@master
Patch Set: addressed codereview Created 6 years, 4 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View side-by-side diff with in-line comments
Download patch
Index: tools/findit/findit_for_clusterfuzz.py
diff --git a/tools/findit/findit_for_clusterfuzz.py b/tools/findit/findit_for_clusterfuzz.py
new file mode 100644
index 0000000000000000000000000000000000000000..70c89c540d27842718e3e15b2f136cecf3433710
--- /dev/null
+++ b/tools/findit/findit_for_clusterfuzz.py
@@ -0,0 +1,145 @@
+# Copyright (c) 2014 The Chromium Authors. All rights reserved.
+# Use of this source code is governed by a BSD-style license that can be
+# found in the LICENSE file.
+
+import logging
+
+import chromium_deps
+import crash_utils
+import findit_for_crash as findit
+import stacktrace
+
+
+def SplitStacktrace(stacktrace_string):
+ """Preprocesses stacktrace string into two parts, release and debug.
+
+ Args:
+ stacktrace_string: A string representation of stacktrace,
+ in clusterfuzz format.
+
+ Returns:
+ A tuple of list of strings, release build stacktrace and
+ debug build stacktrace.
+ """
+ # Make sure we only parse release/debug build stacktrace, and ignore
+ # unsymbolised stacktrace.
+ in_release_or_debug_stacktrace = False
+ release_build_stacktrace_lines = None
+ debug_build_stacktrace_lines = None
+ current_stacktrace_lines = []
+
+ # Iterate through all lines in stacktrace.
+ for line in stacktrace_string.splitlines():
+ line = line.strip()
+
+ # If the line starts with +, it signifies the start of new stacktrace.
+ if line.startswith('+'):
+ if 'Release Build Stacktrace' in line:
+ in_release_or_debug_stacktrace = True
+ current_stacktrace_lines = []
+ release_build_stacktrace_lines = current_stacktrace_lines
+
+ elif 'Debug Build Stacktrace' in line:
+ in_release_or_debug_stacktrace = True
+ current_stacktrace_lines = []
+ debug_build_stacktrace_lines = current_stacktrace_lines
+
+ # If the stacktrace is neither release/debug build stacktrace, ignore
+ # all lines after it until we encounter release/debug build stacktrace.
+ else:
+ in_release_or_debug_stacktrace = False
+
+ # This case, it must be that the line is an actual stack frame, so add to
+ # the current stacktrace.
+ elif in_release_or_debug_stacktrace:
+ current_stacktrace_lines.append(line)
+
+ return (release_build_stacktrace_lines, debug_build_stacktrace_lines)
+
+
+def FindCulpritCLs(stacktrace_string,
+ build_type,
+ chrome_regression=None,
+ component_regression=None,
+ chrome_crash_revision=None,
+ component_crash_revision=None,
+ crashing_component=None):
+ """Returns json format of the result, a list of result.Result objects.
stgao 2014/08/18 22:37:07 Seems json format is wrong now?
jeun 2014/08/18 23:52:13 Done.
+
+ Args:
+ stacktrace_string: A string representing stacktrace.
+ build_type: The type of the job.
+ chrome_regression: A string, chrome regression from clusterfuzz, in format
+ '123456:123457'
+ component_regression: A string, component regression in the same format.
+ chrome_crash_revision: A crash revision of chrome, in string.
+ component_crash_revision: A crash revision of the component,
+ if component build.
+ crashing_component: Yet to be decided.
+
+ Returns:
+ A list of result objects, along with the short description on where the
+ result is from.
+ """
+ build_type = build_type.lower()
+ if 'android' in build_type or 'syzyasan' in build_type:
Martin Barbella 2014/08/19 02:51:35 Why are these job types being skipped explicitly?
jeun 2014/08/19 18:30:06 The stacktrace parsing for them is not supported.
+ return ('This build type is currently not supported.', [])
+
+ logging.basicConfig(filename='errors.log', level=logging.WARNING,
stgao 2014/08/18 22:37:07 Findit should not write any log. It is the respon
jeun 2014/08/18 23:52:13 Does this mean anything other than this file shoul
+ filemode='w+')
+
+ crash_revision_dict = {}
+ regression_dict = {}
+
+ # TODO(jeun): Come up with a good way to connect crashing component name to
Martin Barbella 2014/08/19 02:51:35 What work is still needed to be done here? I thoug
jeun 2014/08/19 18:30:05 Since we started parsing DEPS file for regression
+ # its path.
+ if component_regression or component_crash_revision:
+ return ('This feature is not supported.', [])
stgao 2014/08/18 22:37:07 "Component builds are not supported yet."
jeun 2014/08/18 23:52:13 Done.
+
+ # If chrome regression is available, parse DEPS file.
+ chrome_regression = crash_utils.SplitRange(chrome_regression)
+ if chrome_regression:
+ chrome_regression_start = chrome_regression[0]
+ chrome_regression_end = chrome_regression[1]
+
+ # If the regression is not reliable, do not parse regression information.
Martin Barbella 2014/08/19 02:51:35 A regression range starting with 0 has nothing to
jeun 2014/08/19 18:30:05 Done.
+ if chrome_regression_start != '0':
+ regression_dict = chromium_deps.GetChromiumComponentRange(
+ chrome_regression_start, chrome_regression_end)
+
+ # Parse crash revision.
+ if chrome_crash_revision:
+ crash_revision_dict = chromium_deps.GetChromiumComponents(
stgao 2014/08/18 22:37:06 Do we need to verify |chrome_crash_revision| is no
jeun 2014/08/18 23:52:13 Yes, in case we only have component crash revision
+ chrome_crash_revision)
+
+ # Parsed DEPS is used to normalize the stacktrace. Since parsed regression
+ # and parsed crash state essentially contain same information, use either.
+ if regression_dict:
+ parsed_deps = regression_dict
+ elif crash_revision_dict:
+ parsed_deps = crash_revision_dict
+ else:
+ return ('No regression and crash revision information available.', [])
Martin Barbella 2014/08/19 02:51:35 If someone runs into an error, they probably don't
jeun 2014/08/19 18:30:05 Done.
+
+ # Split stacktrace into release build/debug build and parse them.
+ (release_build_stacktrace, debug_build_stacktrace) = SplitStacktrace(
+ stacktrace_string)
+ parsed_release_build_stacktrace = stacktrace.Stacktrace(
+ release_build_stacktrace, build_type, parsed_deps)
+ parsed_debug_build_stacktrace = stacktrace.Stacktrace(
+ debug_build_stacktrace, build_type, parsed_deps)
+
+ # Get a highest priority callstack from stacktrace, with release build
+ # stacktrace in higher priority than debug build stacktace.
+ if parsed_release_build_stacktrace.stack_list:
+ main_stack = parsed_release_build_stacktrace.GetCrashStack()
stgao 2014/08/18 22:37:06 What's main stack? What it is for? Why only handle
jeun 2014/08/18 23:52:13 Done.
+ elif parsed_debug_build_stacktrace.stack_list:
+ main_stack = parsed_debug_build_stacktrace.GetCrashStack()
+ else:
+ return ('Stacktrace is malformed.', [])
+
+ # Run the algorithm on the parsed stacktrace, and return the JSON.
stgao 2014/08/18 22:37:07 We are not returning JSON any more, right?
jeun 2014/08/18 23:52:13 Done.
+ stacktrace_list = [parsed_release_build_stacktrace,
+ parsed_debug_build_stacktrace]
+ return findit.FindItForCrash(
+ stacktrace_list, main_stack, regression_dict, crash_revision_dict)

Powered by Google App Engine
This is Rietveld 408576698