chrome/chrome_watcher/kasko_util.cc - Issue 2086403002: Remove the Kasko based out of process browser hang instrumentation.

Unified Diff: chrome/chrome_watcher/kasko_util.cc

Issue 2086403002: Remove the Kasko based out of process browser hang instrumentation. (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@master

Patch Set: Merge Created 4 years, 6 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

Index: chrome/chrome_watcher/kasko_util.cc

diff --git a/chrome/chrome_watcher/kasko_util.cc b/chrome/chrome_watcher/kasko_util.cc

deleted file mode 100644

index 5102d459a67faf11a2caf97b28122dfbc9ba3943..0000000000000000000000000000000000000000

--- a/chrome/chrome_watcher/kasko_util.cc

+++ /dev/null

@@ -1,399 +0,0 @@

-// Use of this source code is governed by a BSD-style license that can be

-// found in the LICENSE file.

-#include "chrome/chrome_watcher/kasko_util.h"

-#include <sddl.h>

-#include <memory>

-#include <set>

-#include <string>

-#include <utility>

-#include <vector>

-#include "base/base_paths.h"

-#include "base/bind.h"

-#include "base/callback_helpers.h"

-#include "base/environment.h"

-#include "base/files/file_path.h"

-#include "base/format_macros.h"

-#include "base/macros.h"

-#include "base/path_service.h"

-#include "base/strings/string_number_conversions.h"

-#include "base/strings/string_util.h"

-#include "base/strings/stringprintf.h"

-#include "base/strings/utf_string_conversions.h"

-#include "base/win/wait_chain.h"

-#include "base/win/win_util.h"

-#include "chrome/chrome_watcher/chrome_watcher_main_api.h"

-#include "chrome/chrome_watcher/system_load_estimator.h"

-#include "components/crash/content/app/crashpad.h"

-#include "components/memory_pressure/direct_memory_pressure_calculator_win.h"

-#include "components/memory_pressure/memory_pressure_calculator.h"

-#include "syzygy/kasko/api/reporter.h"

-namespace {

-using MemoryPressureLevel =

- memory_pressure::MemoryPressureCalculator::MemoryPressureLevel;

-// Labels a crash report to the server as a hang report.

-const wchar_t kHangReportCrashKey[] = L"hang-report";

-// Helper function for determining the crash server to use. Defaults to the

-// standard crash server, but can be overridden via an environment variable.

-// Enables easy integration testing.

-base::string16 GetKaskoCrashServerUrl() {

- static const char kKaskoCrashServerUrl[] = "KASKO_CRASH_SERVER_URL";

- static const wchar_t kDefaultKaskoCrashServerUrl[] =

- L"https://clients2.google.com/cr/report";

- std::unique_ptr<base::Environment> env(base::Environment::Create());

- std::string env_var;

- if (env->GetVar(kKaskoCrashServerUrl, &env_var)) {

- return base::UTF8ToUTF16(env_var);

- }

- return kDefaultKaskoCrashServerUrl;

-// Helper function for determining the crash reports directory to use. Defaults

-// to the browser data directory, but can be overridden via an environment

-// variable. Enables easy integration testing.

-base::FilePath GetKaskoCrashReportsBaseDir(

- const base::char16* browser_data_directory) {

- static const char kKaskoCrashReportBaseDir[] = "KASKO_CRASH_REPORTS_BASE_DIR";

- std::unique_ptr<base::Environment> env(base::Environment::Create());

- std::string env_var;

- if (env->GetVar(kKaskoCrashReportBaseDir, &env_var)) {

- return base::FilePath(base::UTF8ToUTF16(env_var));

- }

- return base::FilePath(browser_data_directory);

-struct EventSourceDeregisterer {

- using pointer = HANDLE;

- void operator()(HANDLE event_source_handle) const {

- if (!::DeregisterEventSource(event_source_handle))

- DPLOG(ERROR) << "DeregisterEventSource";

- }

-};

-using ScopedEventSourceHandle =

- std::unique_ptr<HANDLE, EventSourceDeregisterer>;

-struct SidDeleter {

- using pointer = PSID;

- void operator()(PSID sid) const {

- if (::LocalFree(sid) != nullptr)

- DPLOG(ERROR) << "LocalFree";

- }

-};

-using ScopedSid = std::unique_ptr<PSID, SidDeleter>;

-void OnCrashReportUpload(void* context,

- const base::char16* report_id,

- const base::char16* minidump_path,

- const base::char16* const* keys,

- const base::char16* const* values) {

- // Open the event source.

- ScopedEventSourceHandle event_source_handle(

- ::RegisterEventSource(nullptr, L"Chrome"));

- if (!event_source_handle) {

- PLOG(ERROR) << "RegisterEventSource";

- return;

- }

- // Get the user's SID for the log record.

- base::string16 sid_string;

- PSID sid = nullptr;

- if (base::win::GetUserSidString(&sid_string) && !sid_string.empty()) {

- if (!::ConvertStringSidToSid(sid_string.c_str(), &sid))

- DPLOG(ERROR) << "ConvertStringSidToSid";

- DCHECK(sid);

- }

- // Ensure cleanup on scope exit.

- ScopedSid scoped_sid;

- if (sid)

- scoped_sid.reset(sid);

- // Generate the message.

- // Note that the format of this message must match the consumer in

- // chrome/browser/crash_upload_list_win.cc.

- base::string16 message =

- L"Crash uploaded. Id=" + base::string16(report_id) + L".";

- // Matches Omaha.

- const int kCrashUploadEventId = 2;

- // Report the event.

- const base::char16* strings[] = {message.c_str()};

- if (!::ReportEvent(event_source_handle.get(), EVENTLOG_INFORMATION_TYPE,

- 0, // category

- kCrashUploadEventId, sid,

- 1, // count

- 0, strings, nullptr)) {

- DPLOG(ERROR);

- }

-void AddCrashKey(const wchar_t *key, const wchar_t *value,

- std::vector<kasko::api::CrashKey> *crash_keys) {

- DCHECK(key);

- DCHECK(value);

- DCHECK(crash_keys);

- crash_keys->resize(crash_keys->size() + 1);

- kasko::api::CrashKey& crash_key = crash_keys->back();

- base::wcslcpy(crash_key.name, key, kasko::api::CrashKey::kNameMaxLength);

- base::wcslcpy(crash_key.value, value, kasko::api::CrashKey::kValueMaxLength);

-// Gets the |process| and |thread_id| of the last node in |wait_chain|

-// that is of type ThreadType and belongs to a process that is valid for the

-// capture of a crash dump. Returns true if such a node was found.

-bool GetLastValidNodeInfo(const base::win::WaitChainNodeVector& wait_chain,

- base::Process* process,

- DWORD* thread_id) {

- // The last thread in the wait chain is nominated as the hung thread.

- base::win::WaitChainNodeVector::const_reverse_iterator it;

- for (it = wait_chain.rbegin(); it != wait_chain.rend(); ++it) {

- if (it->ObjectType != WctThreadType)

- continue;

- auto current_process = base::Process::Open(it->ThreadObject.ProcessId);

- if (EnsureTargetProcessValidForCapture(current_process)) {

- *process = std::move(current_process);

- *thread_id = it->ThreadObject.ThreadId;

- return true;

- }

- return false;

-// Adds the entire wait chain to |crash_keys|.

-//

-// As an example (key : value):

-// hung-process-wait-chain-00 : Thread 10242 in process 4554 with status Blocked

-// hung-process-wait-chain-01 : Lock of type ThreadWait with status Owned

-// hung-process-wait-chain-02 : Thread 77221 in process 4554 with status Blocked

-//

-void AddWaitChainToCrashKeys(const base::win::WaitChainNodeVector& wait_chain,

- std::vector<kasko::api::CrashKey>* crash_keys) {

- for (size_t i = 0; i < wait_chain.size(); i++) {

- AddCrashKey(

- base::StringPrintf(L"hung-process-wait-chain-%02" PRIuS, i).c_str(),

- base::win::WaitChainNodeToString(wait_chain[i]).c_str(), crash_keys);

- }

-base::FilePath GetExeFilePathForProcess(const base::Process& process) {

- wchar_t exe_name[MAX_PATH];

- DWORD exe_name_len = arraysize(exe_name);

- // Note: requesting the Win32 path format.

- if (::QueryFullProcessImageName(process.Handle(), 0, exe_name,

- &exe_name_len) == 0) {

- DPLOG(ERROR) << "Failed to get executable name for process";

- return base::FilePath();

- }

- // QueryFullProcessImageName's documentation does not specify behavior when

- // the buffer is too small, but we know that GetModuleFileNameEx succeeds and

- // truncates the returned name in such a case. Given that paths of arbitrary

- // length may exist, the conservative approach is to reject names when

- // the returned length is that of the buffer.

- if (exe_name_len > 0 && exe_name_len < arraysize(exe_name))

- return base::FilePath(exe_name);

- return base::FilePath();

-// Adds the executable base name for each unique pid found in the |wait_chain|

-// to the |crash_keys|.

-void AddProcessExeNameToCrashKeys(

- const base::win::WaitChainNodeVector& wait_chain,

- std::vector<kasko::api::CrashKey>* crash_keys) {

- std::set<DWORD> unique_pids;

- for (size_t i = 0; i < wait_chain.size(); i += 2)

- unique_pids.insert(wait_chain[i].ThreadObject.ProcessId);

- for (DWORD pid : unique_pids) {

- // This is racy on the pid but for the purposes of this function, some error

- // threshold can be tolerated. Hopefully the race doesn't happen often.

- base::Process process(

- base::Process::OpenWithAccess(pid, PROCESS_QUERY_LIMITED_INFORMATION));

- base::string16 exe_file_path = L"N/A";

- if (process.IsValid())

- exe_file_path = GetExeFilePathForProcess(process).BaseName().value();

- AddCrashKey(

- base::StringPrintf(L"hung-process-wait-chain-pid-%u", pid).c_str(),

- exe_file_path.c_str(), crash_keys);

- }

-void AddSystemLoadInformation(std::vector<kasko::api::CrashKey>* crash_keys) {

- DCHECK(crash_keys);

- // Add memory pressure level.

- memory_pressure::DirectMemoryPressureCalculator memory_calculator;

- const wchar_t* memory_pressure_level = L"";

- switch (memory_calculator.CalculateCurrentPressureLevel()) {

- case MemoryPressureLevel::MEMORY_PRESSURE_LEVEL_NONE:

- memory_pressure_level = L"none-or-unknown";

- break;

- case MemoryPressureLevel::MEMORY_PRESSURE_LEVEL_MODERATE:

- memory_pressure_level = L"moderate";

- break;

- case MemoryPressureLevel::MEMORY_PRESSURE_LEVEL_CRITICAL:

- memory_pressure_level = L"critical";

- break;

- }

- AddCrashKey(L"memory-pressure", memory_pressure_level, crash_keys);

- // Add measures of cpu and disk load.

- chrome_watcher::SystemLoadEstimator::Estimate load_estimate = {};

- if (!chrome_watcher::SystemLoadEstimator::Measure(&load_estimate))

- return;

- AddCrashKey(L"cpu-load-percent",

- base::IntToString16(load_estimate.cpu_load_pct).c_str(),

- crash_keys);

- AddCrashKey(L"disk-idle-percent",

- base::IntToString16(load_estimate.disk_idle_pct).c_str(),

- crash_keys);

- AddCrashKey(L"disk-avg-queue-len",

- base::IntToString16(load_estimate.avg_disk_queue_len).c_str(),

- crash_keys);

-} // namespace

-bool InitializeKaskoReporter(const base::string16& endpoint,

- const base::char16* browser_data_directory) {

- base::string16 crash_server = GetKaskoCrashServerUrl();

- base::FilePath crash_reports_base_dir =

- GetKaskoCrashReportsBaseDir(browser_data_directory);

- return kasko::api::InitializeReporter(

- endpoint.c_str(),

- crash_server.c_str(),

- crash_reports_base_dir.Append(L"Crash Reports").value().c_str(),

- crash_reports_base_dir.Append(kPermanentlyFailedReportsSubdir)

- .value()

- .c_str(),

- &OnCrashReportUpload,

- nullptr);

-void ShutdownKaskoReporter() {

- kasko::api::ShutdownReporter();

-bool EnsureTargetProcessValidForCapture(const base::Process& process) {

- // Ensure the target process's executable is inside the current Chrome

- // directory.

- base::FilePath chrome_dir;

- if (!PathService::Get(base::DIR_EXE, &chrome_dir))

- return false;

- return chrome_dir.IsParent(GetExeFilePathForProcess(process));

-void DumpHungProcess(DWORD main_thread_id, const base::string16& channel,

- const base::char16* hang_type,

- const base::Process& process) {

- // Read the Crashpad module annotations for the process.

- std::vector<kasko::api::CrashKey> annotations;

- crash_reporter::ReadMainModuleAnnotationsForKasko(process, &annotations);

- // Label the report as a hang report.

- AddCrashKey(kHangReportCrashKey, hang_type, &annotations);

- // Note: system load is measured as early as possible, as it is potentially

- // more volatile than wait chain information.

- // TODO(manzagop): consider continuous load observation, instead of punctual

- // observation, which may fail to observe load.

- AddSystemLoadInformation(&annotations);

- // Use the Wait Chain Traversal API to determine the hung thread. Defaults to

- // UI thread on error. The wait chain may point to a different thread in a

- // different process for the hung thread.

- DWORD hung_thread_id = main_thread_id;

- base::Process hung_process = process.Duplicate();

- base::win::WaitChainNodeVector wait_chain;

- bool is_deadlock = false;

- base::string16 thread_chain_failure_reason;

- DWORD thread_chain_last_error = ERROR_SUCCESS;

- if (base::win::GetThreadWaitChain(main_thread_id, &wait_chain, &is_deadlock,

- &thread_chain_failure_reason,

- &thread_chain_last_error)) {

- bool found_valid_node =

- GetLastValidNodeInfo(wait_chain, &hung_process, &hung_thread_id);

- DCHECK(found_valid_node);

- // Add some interesting data about the wait chain to the crash keys.

- AddCrashKey(L"hung-process-is-deadlock", is_deadlock ? L"true" : L"false",

- &annotations);

- AddWaitChainToCrashKeys(wait_chain, &annotations);

- AddProcessExeNameToCrashKeys(wait_chain, &annotations);

- } else {

- // The call to GetThreadWaitChain() failed. Include the reason inside the

- // report using crash keys.

- // TODO(pmonette): Remove this when UMA is added to wait_chain.cc.

- AddCrashKey(L"hung-process-wait-chain-failure-reason",

- thread_chain_failure_reason.c_str(), &annotations);

- AddCrashKey(L"hung-process-wait-chain-last-error",

- base::UintToString16(thread_chain_last_error).c_str(),

- &annotations);

- }

- std::vector<const base::char16*> key_buffers;

- std::vector<const base::char16*> value_buffers;

- for (const auto& crash_key : annotations) {

- key_buffers.push_back(crash_key.name);

- value_buffers.push_back(crash_key.value);

- }

- key_buffers.push_back(nullptr);

- value_buffers.push_back(nullptr);

- // Synthesize an exception for the hung thread. Populate the record with the

- // current context of the thread to get the stack trace bucketed on the crash

- // backend.

- CONTEXT thread_context = {};

- EXCEPTION_RECORD exception_record = {};

- exception_record.ExceptionCode = EXCEPTION_ARRAY_BOUNDS_EXCEEDED;

- EXCEPTION_POINTERS exception_pointers = {&exception_record, &thread_context};

- base::win::ScopedHandle hung_thread(::OpenThread(

- THREAD_SUSPEND_RESUME | THREAD_GET_CONTEXT | THREAD_QUERY_INFORMATION,

- FALSE, hung_thread_id));

- bool have_context = false;

- if (hung_thread.IsValid()) {

- DWORD suspend_count = ::SuspendThread(hung_thread.Get());

- const DWORD kSuspendFailed = static_cast<DWORD>(-1);

- if (suspend_count != kSuspendFailed) {

- // Best effort capture of the context.

- thread_context.ContextFlags = CONTEXT_FLOATING_POINT | CONTEXT_SEGMENTS |

- CONTEXT_INTEGER | CONTEXT_CONTROL;

- if (::GetThreadContext(hung_thread.Get(), &thread_context) == TRUE)

- have_context = true;

- ::ResumeThread(hung_thread.Get());

- }

- // TODO(manzagop): consider making the dump-type channel-dependent.

- if (have_context) {

- kasko::api::SendReportForProcess(

- hung_process.Handle(), hung_thread_id, &exception_pointers,

- kasko::api::LARGER_DUMP_TYPE, key_buffers.data(), value_buffers.data());

- } else {

- kasko::api::SendReportForProcess(hung_process.Handle(), 0, nullptr,

- kasko::api::LARGER_DUMP_TYPE,

- key_buffers.data(), value_buffers.data());

- }

« no previous file with comments | « chrome/chrome_watcher/kasko_util.h ('k') | third_party/kasko/BUILD.gn » ('j') | no next file with comments »