Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(1657)

Side by Side Diff: base/profiler/stack_sampling_profiler_win.cc

Issue 1016563004: Statistical stack profiler for Windows x64 (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@lkcr
Patch Set: record IPs for invalid modules Created 5 years, 9 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch
OLDNEW
(Empty)
1 // Copyright 2015 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
4
5 #include "base/profiler/stack_sampling_profiler.h"
6
7 #include <dbghelp.h>
8 #include <map>
9 #include <utility>
10 #include <windows.h>
11
12 #include "base/logging.h"
13 #include "base/time/time.h"
14 #include "base/win/pe_image.h"
15 #include "base/win/scoped_handle.h"
16
17 namespace base {
18
19 namespace {
20
21 class NativeStackSamplerWin : public StackSamplingProfiler::NativeStackSampler {
22 public:
23 explicit NativeStackSamplerWin(win::ScopedHandle thread_handle);
24 ~NativeStackSamplerWin() override;
25
26 // StackSamplingProfiler::NativeStackSampler:
27 void ProfileRecordingStarting(
28 StackSamplingProfiler::Profile* profile) override;
29 void RecordStackSample(StackSamplingProfiler::Sample* sample) override;
30 void ProfileRecordingStopped() override;
31
32 private:
33 static bool GetModuleInfo(HMODULE module,
34 StackSamplingProfiler::Module* module_info);
35
36 void CopyToSample(const void* const instruction_pointers[],
37 const HMODULE modules[],
38 int stack_depth,
39 StackSamplingProfiler::Sample* sample,
40 std::vector<StackSamplingProfiler::Module>* module_infos);
41
42 win::ScopedHandle thread_handle_;
43 // Weak. Points to the profile being recorded between
44 // ProfileRecordingStarting() and ProfileRecordingStopped().
45 StackSamplingProfiler::Profile* current_profile_;
46 // Maps a module to the module's index within current_profile_->modules.
47 std::map<HMODULE, int> profile_module_index_;
48
49 DISALLOW_COPY_AND_ASSIGN(NativeStackSamplerWin);
50 };
51
52 // Walk the stack represented by |context| from the current frame downwards,
53 // recording the instruction pointers for each frame in |instruction_pointers|.
54 int RecordStack(CONTEXT* context,
55 int max_stack_size,
56 const void* instruction_pointers[],
57 bool* last_frame_is_unknown_function) {
58 #ifdef _WIN64
59 *last_frame_is_unknown_function = false;
60
61 IMAGEHLP_SYMBOL64 sym;
62 sym.SizeOfStruct = sizeof(sym);
63 sym.MaxNameLength = 0;
64
65 for (int i = 0; i < max_stack_size; ++i) {
66 // Try to look up unwind metadata for the current function.
67 ULONG64 image_base;
68 PRUNTIME_FUNCTION runtime_function =
69 RtlLookupFunctionEntry(context->Rip, &image_base, nullptr);
70
71 instruction_pointers[i] = reinterpret_cast<void*>(context->Rip);
72
73 if (runtime_function) {
74 KNONVOLATILE_CONTEXT_POINTERS nvcontext = {0};
75 void* handler_data;
76 ULONG64 establisher_frame;
77 RtlVirtualUnwind(0, image_base, context->Rip, runtime_function, context,
zturner 2015/03/18 23:04:37 Did you consider using RtlCaptureStackBacktrace?
danduong 2015/03/18 23:20:48 As far as I know, RtlCaptureStackBackTrace cannot
78 &handler_data, &establisher_frame, &nvcontext);
79 } else {
80 // If we don't have a RUNTIME_FUNCTION, then we've encountered
81 // a leaf function. Adjust the stack appropriately.
82 context->Rip = *reinterpret_cast<PDWORD64>(context->Rsp);
83 context->Rsp += 8;
84 *last_frame_is_unknown_function = true;
85 }
86
87 if (!context->Rip)
88 return i;
89 }
90 return max_stack_size;
91 #else
92 return 0;
zturner 2015/03/18 23:04:37 Is there any desire to support x86? RtlVirtualUnw
danduong 2015/03/18 23:20:47 We'll focus on x64 for now. StackWalk64, I've hear
93 #endif
94 }
95
96 // Fills in |modules| corresponding to the pointers to code in |addresses|.
97 void FindModulesForAddresses(const void* const addresses[], HMODULE modules[],
98 int stack_depth,
99 bool last_frame_is_unknown_function) {
100 const int module_frames = last_frame_is_unknown_function ? stack_depth - 1 :
101 stack_depth;
102 for (int i = 0; i < module_frames; ++i) {
103 HMODULE module = NULL;
104 if (GetModuleHandleEx(GET_MODULE_HANDLE_EX_FLAG_FROM_ADDRESS |
105 GET_MODULE_HANDLE_EX_FLAG_UNCHANGED_REFCOUNT,
zturner 2015/03/18 23:04:37 Why not increment the module's refcount? You stor
Mike Wittman 2015/03/19 00:15:44 Incrementing the refcount led to deadlock previous
106 reinterpret_cast<LPCTSTR>(addresses[i]),
107 &module)) {
108 // HMODULE is the base address of the module.
109 DCHECK_LT(reinterpret_cast<const void*>(module), addresses[i]);
110 modules[i] = module;
111 }
112 }
113 for (int i = module_frames; i < stack_depth; ++i)
zturner 2015/03/18 23:04:37 Alternatively, you could memset() the entire array
Mike Wittman 2015/03/19 00:15:44 Used a zero initializer.
114 modules[stack_depth - 1] = NULL;
zturner 2015/03/18 23:04:37 What about addresses? You're going to end up with
Mike Wittman 2015/03/19 00:15:44 Done.
115 }
116
117 // Suspends the thread with |thread_handle|, records the stack into
118 // |instruction_pointers| and the corresponding modules into |modules|, then
119 // resumes the thread. Returns the size of the stack.
120 int SuspendThreadAndRecordStack(HANDLE thread_handle, int max_stack_size,
121 const void* instruction_pointers[],
122 HMODULE modules[]) {
123 if (::SuspendThread(thread_handle) == -1) {
zturner 2015/03/18 23:04:37 Just to be certain, this will never be equal to th
Mike Wittman 2015/03/19 00:15:43 Yes, this is only ever called on the profiler thre
124 LOG(ERROR) << "SuspendThread failed: " << GetLastError();
125 return 0;
126 }
127
128 CONTEXT thread_context = {0};
129 thread_context.ContextFlags = CONTEXT_ALL;
zturner 2015/03/18 23:04:37 Do you actually need CONTEXT_ALL? CONTEXT_FULL is
Mike Wittman 2015/03/19 00:15:44 CONTEXT_FULL appears to be sufficient.
130 if (!::GetThreadContext(thread_handle, &thread_context)) {
131 LOG(ERROR) << "GetThreadContext failed: " << GetLastError();
132 }
133
134 bool last_frame_is_unknown_function = false;
135 int stack_depth = RecordStack(&thread_context, max_stack_size,
136 instruction_pointers,
137 &last_frame_is_unknown_function);
138
139 if (::ResumeThread(thread_handle) == -1)
140 LOG(ERROR) << "ResumeThread failed: " << GetLastError();
141
142 FindModulesForAddresses(instruction_pointers, modules, stack_depth,
143 last_frame_is_unknown_function);
144
145 return stack_depth;
146 }
147
148 } // namespace
149
150 scoped_ptr<StackSamplingProfiler::NativeStackSampler>
151 StackSamplingProfiler::NativeStackSampler::Create(PlatformThreadId thread_id) {
152 #if _WIN64
153 // Get the thread's handle.
154 HANDLE thread_handle = ::OpenThread(THREAD_ALL_ACCESS, FALSE, thread_id);
zturner 2015/03/18 23:04:37 THREAD_GET_CONTEXT | THREAD_SUSPEND_RESUME | THREA
Mike Wittman 2015/03/19 00:15:44 Done.
155 DCHECK(thread_handle) << "OpenThread failed";
156
157 return scoped_ptr<NativeStackSampler>(new NativeStackSamplerWin(
158 win::ScopedHandle(thread_handle)));
159 #else
160 return scoped_ptr<NativeStackSampler>();
161 #endif
162 }
163
164 NativeStackSamplerWin::NativeStackSamplerWin(win::ScopedHandle thread_handle)
165 : thread_handle_(thread_handle.Take()) {
166 #ifdef _WIN64
167 if (RtlVirtualUnwind == nullptr && RtlLookupFunctionEntry == nullptr) {
168 const HMODULE nt_dll_handle = ::GetModuleHandle(L"ntdll.dll");
zturner 2015/03/18 23:04:37 You should probably handle the case where nt_dll_h
Mike Wittman 2015/03/19 00:15:44 Done.
169 reinterpret_cast<void*&>(RtlVirtualUnwind) =
170 ::GetProcAddress(nt_dll_handle, "RtlVirtualUnwind");
171 reinterpret_cast<void*&>(RtlLookupFunctionEntry) =
172 ::GetProcAddress(nt_dll_handle, "RtlLookupFunctionEntry");
173 }
174 #endif
175 }
176
177 NativeStackSamplerWin::~NativeStackSamplerWin() {
178 }
179
180 void NativeStackSamplerWin::ProfileRecordingStarting(
181 StackSamplingProfiler::Profile* profile) {
182 current_profile_ = profile;
183 profile_module_index_.clear();
184 }
185
186 void NativeStackSamplerWin::RecordStackSample(
187 StackSamplingProfiler::Sample* sample) {
188 DCHECK(current_profile_);
189
190 const int max_stack_size = 64;
191 const void* instruction_pointers[max_stack_size];
192 HMODULE modules[max_stack_size];
zturner 2015/03/18 23:04:37 If you initialize these two arrays with "= {0}" th
Mike Wittman 2015/03/19 00:15:44 Done.
193
194 int stack_depth = SuspendThreadAndRecordStack(
195 thread_handle_.Get(), max_stack_size, instruction_pointers, modules);
196 CopyToSample(instruction_pointers, modules, stack_depth, sample,
197 &current_profile_->modules);
198 }
199
200 void NativeStackSamplerWin::ProfileRecordingStopped() {
201 current_profile_ = nullptr;
202 }
203
204 // static
205 bool NativeStackSamplerWin::GetModuleInfo(
206 HMODULE module,
207 StackSamplingProfiler::Module* module_info) {
208 wchar_t module_name[MAX_PATH];
209 DWORD result_length =
210 GetModuleFileName(module, module_name, arraysize(module_name));
211 if (result_length == 0)
212 return false;
213
214 module_info->filename = base::FilePath(module_name);
215
216 module_info->base_address = reinterpret_cast<const void*>(module);
217
218 GUID guid;
219 DWORD age;
220 win::PEImage(module).GetDebugId(&guid, &age);
zturner 2015/03/18 23:04:37 Is this present for release / optimized builds?
danduong 2015/03/18 23:20:47 Should be. Minidumps include the debugIds of the m
221 module_info->id.insert(module_info->id.end(),
222 reinterpret_cast<char*>(&guid),
223 reinterpret_cast<char*>(&guid + 1));
224 module_info->id.insert(module_info->id.end(),
225 reinterpret_cast<char*>(&age),
226 reinterpret_cast<char*>(&age + 1));
227
228 return true;
229 }
230
231 void NativeStackSamplerWin::CopyToSample(
232 const void* const instruction_pointers[],
233 const HMODULE modules[],
234 int stack_depth,
235 StackSamplingProfiler::Sample* sample,
236 std::vector<StackSamplingProfiler::Module>* module_infos) {
237 sample->clear();
238 sample->reserve(stack_depth);
239
240 for (int i = 0; i < stack_depth; ++i) {
241 sample->push_back(StackSamplingProfiler::Frame());
242 StackSamplingProfiler::Frame& frame = sample->back();
243
244 frame.instruction_pointer = instruction_pointers[i];
245
246 // Record an invalid module index if we don't have a valid module.
247 if (!modules[i]) {
248 frame.module_index = -1;
249 continue;
250 }
251
252 auto loc = profile_module_index_.find(modules[i]);
253 if (loc == profile_module_index_.end()) {
254 StackSamplingProfiler::Module module_info;
255 // Record an invalid module index if we have a module but can't find
256 // information on it.
257 if (!GetModuleInfo(modules[i], &module_info)) {
258 frame.module_index = -1;
259 continue;
260 }
261 module_infos->push_back(module_info);
262 loc = profile_module_index_.insert(std::make_pair(
263 modules[i], static_cast<int>(module_infos->size() - 1))).first;
264 }
265
266 frame.module_index = loc->second;
267 }
268 }
269
270 } // namespace base
OLDNEW
« base/profiler/stack_sampling_profiler.cc ('K') | « base/profiler/stack_sampling_profiler_unittest.cc ('k') | no next file » | no next file with comments »

Powered by Google App Engine
This is Rietveld 408576698