| OLD | NEW |
| (Empty) |
| 1 // Copyright (c) 2012 The Chromium Authors. All rights reserved. | |
| 2 // Use of this source code is governed by a BSD-style license that can be | |
| 3 // found in the LICENSE file. | |
| 4 | |
| 5 #include "chrome/browser/crash_handler_host_linux.h" | |
| 6 | |
| 7 #include <stdint.h> | |
| 8 #include <stdlib.h> | |
| 9 #include <sys/socket.h> | |
| 10 #include <sys/syscall.h> | |
| 11 #include <unistd.h> | |
| 12 | |
| 13 #include "base/bind.h" | |
| 14 #include "base/bind_helpers.h" | |
| 15 #include "base/files/file_path.h" | |
| 16 #include "base/format_macros.h" | |
| 17 #include "base/linux_util.h" | |
| 18 #include "base/logging.h" | |
| 19 #include "base/memory/singleton.h" | |
| 20 #include "base/message_loop/message_loop.h" | |
| 21 #include "base/path_service.h" | |
| 22 #include "base/posix/eintr_wrapper.h" | |
| 23 #include "base/rand_util.h" | |
| 24 #include "base/strings/string_util.h" | |
| 25 #include "base/strings/stringprintf.h" | |
| 26 #include "base/threading/thread.h" | |
| 27 #include "breakpad/src/client/linux/handler/exception_handler.h" | |
| 28 #include "breakpad/src/client/linux/minidump_writer/linux_dumper.h" | |
| 29 #include "breakpad/src/client/linux/minidump_writer/minidump_writer.h" | |
| 30 #include "chrome/app/breakpad_linux_impl.h" | |
| 31 #include "content/public/browser/browser_thread.h" | |
| 32 | |
| 33 #if defined(OS_ANDROID) | |
| 34 #include <sys/linux-syscalls.h> | |
| 35 | |
| 36 #define SYS_read __NR_read | |
| 37 #endif | |
| 38 | |
| 39 using content::BrowserThread; | |
| 40 using google_breakpad::ExceptionHandler; | |
| 41 | |
| 42 namespace { | |
| 43 | |
| 44 // The length of the control message: | |
| 45 const unsigned kControlMsgSize = | |
| 46 CMSG_SPACE(2*sizeof(int)) + CMSG_SPACE(sizeof(struct ucred)); | |
| 47 // The length of the regular payload: | |
| 48 const unsigned kCrashContextSize = sizeof(ExceptionHandler::CrashContext); | |
| 49 | |
| 50 // Handles the crash dump and frees the allocated BreakpadInfo struct. | |
| 51 void CrashDumpTask(CrashHandlerHostLinux* handler, BreakpadInfo* info) { | |
| 52 if (handler->IsShuttingDown()) | |
| 53 return; | |
| 54 | |
| 55 HandleCrashDump(*info); | |
| 56 delete[] info->filename; | |
| 57 delete[] info->process_type; | |
| 58 delete[] info->distro; | |
| 59 delete info->crash_keys; | |
| 60 delete info; | |
| 61 } | |
| 62 | |
| 63 } // namespace | |
| 64 | |
// Since instances of CrashHandlerHostLinux are leaked, they are only destroyed
// at the end of the process's lifetime, which is longer than the lifetime of
// the IO message loop. Thus, all calls to base::Bind() use non-refcounted
// pointers.
| 69 | |
| 70 CrashHandlerHostLinux::CrashHandlerHostLinux(const std::string& process_type, | |
| 71 const base::FilePath& dumps_path, | |
| 72 bool upload) | |
| 73 : process_type_(process_type), | |
| 74 dumps_path_(dumps_path), | |
| 75 upload_(upload), | |
| 76 shutting_down_(false), | |
| 77 worker_pool_token_(BrowserThread::GetBlockingPool()->GetSequenceToken()) { | |
| 78 int fds[2]; | |
| 79 // We use SOCK_SEQPACKET rather than SOCK_DGRAM to prevent the process from | |
| 80 // sending datagrams to other sockets on the system. The sandbox may prevent | |
| 81 // the process from calling socket() to create new sockets, but it'll still | |
| 82 // inherit some sockets. With PF_UNIX+SOCK_DGRAM, it can call sendmsg to send | |
| 83 // a datagram to any (abstract) socket on the same system. With | |
| 84 // SOCK_SEQPACKET, this is prevented. | |
| 85 CHECK_EQ(socketpair(AF_UNIX, SOCK_SEQPACKET, 0, fds), 0); | |
| 86 static const int on = 1; | |
| 87 | |
| 88 // Enable passcred on the server end of the socket | |
| 89 CHECK_EQ(setsockopt(fds[1], SOL_SOCKET, SO_PASSCRED, &on, sizeof(on)), 0); | |
| 90 | |
| 91 process_socket_ = fds[0]; | |
| 92 browser_socket_ = fds[1]; | |
| 93 | |
| 94 BrowserThread::PostTask( | |
| 95 BrowserThread::IO, FROM_HERE, | |
| 96 base::Bind(&CrashHandlerHostLinux::Init, base::Unretained(this))); | |
| 97 } | |
| 98 | |
| 99 CrashHandlerHostLinux::~CrashHandlerHostLinux() { | |
| 100 (void) HANDLE_EINTR(close(process_socket_)); | |
| 101 (void) HANDLE_EINTR(close(browser_socket_)); | |
| 102 } | |
| 103 | |
| 104 void CrashHandlerHostLinux::StartUploaderThread() { | |
| 105 uploader_thread_.reset( | |
| 106 new base::Thread(std::string(process_type_ + "_crash_uploader").c_str())); | |
| 107 uploader_thread_->Start(); | |
| 108 } | |
| 109 | |
| 110 void CrashHandlerHostLinux::Init() { | |
| 111 base::MessageLoopForIO* ml = base::MessageLoopForIO::current(); | |
| 112 CHECK(ml->WatchFileDescriptor( | |
| 113 browser_socket_, true /* persistent */, | |
| 114 base::MessageLoopForIO::WATCH_READ, | |
| 115 &file_descriptor_watcher_, this)); | |
| 116 ml->AddDestructionObserver(this); | |
| 117 } | |
| 118 | |
| 119 void CrashHandlerHostLinux::OnFileCanWriteWithoutBlocking(int fd) { | |
| 120 NOTREACHED(); | |
| 121 } | |
| 122 | |
| 123 void CrashHandlerHostLinux::OnFileCanReadWithoutBlocking(int fd) { | |
| 124 DCHECK_EQ(fd, browser_socket_); | |
| 125 | |
| 126 // A process has crashed and has signaled us by writing a datagram | |
| 127 // to the death signal socket. The datagram contains the crash context needed | |
| 128 // for writing the minidump as well as a file descriptor and a credentials | |
| 129 // block so that they can't lie about their pid. | |
| 130 // | |
| 131 // The message sender is in chrome/app/breakpad_linux.cc. | |
| 132 | |
| 133 struct msghdr msg = {0}; | |
| 134 struct iovec iov[kCrashIovSize]; | |
| 135 | |
| 136 // Freed in WriteDumpFile(); | |
| 137 char* crash_context = new char[kCrashContextSize]; | |
| 138 // Freed in CrashDumpTask(); | |
| 139 char* distro = new char[kDistroSize + 1]; | |
| 140 #if defined(ADDRESS_SANITIZER) | |
| 141 asan_report_str_ = new char[kMaxAsanReportSize + 1]; | |
| 142 #endif | |
| 143 | |
| 144 // Freed in CrashDumpTask(). | |
| 145 CrashKeyStorage* crash_keys = new CrashKeyStorage; | |
| 146 google_breakpad::SerializedNonAllocatingMap* serialized_crash_keys; | |
| 147 size_t crash_keys_size = crash_keys->Serialize( | |
| 148 const_cast<const google_breakpad::SerializedNonAllocatingMap**>( | |
| 149 &serialized_crash_keys)); | |
| 150 | |
| 151 char* tid_buf_addr = NULL; | |
| 152 int tid_fd = -1; | |
| 153 uint64_t uptime; | |
| 154 size_t oom_size; | |
| 155 char control[kControlMsgSize]; | |
| 156 const ssize_t expected_msg_size = | |
| 157 kCrashContextSize + | |
| 158 kDistroSize + 1 + | |
| 159 sizeof(tid_buf_addr) + sizeof(tid_fd) + | |
| 160 sizeof(uptime) + | |
| 161 #if defined(ADDRESS_SANITIZER) | |
| 162 kMaxAsanReportSize + 1 + | |
| 163 #endif | |
| 164 sizeof(oom_size) + | |
| 165 crash_keys_size; | |
| 166 iov[0].iov_base = crash_context; | |
| 167 iov[0].iov_len = kCrashContextSize; | |
| 168 iov[1].iov_base = distro; | |
| 169 iov[1].iov_len = kDistroSize + 1; | |
| 170 iov[2].iov_base = &tid_buf_addr; | |
| 171 iov[2].iov_len = sizeof(tid_buf_addr); | |
| 172 iov[3].iov_base = &tid_fd; | |
| 173 iov[3].iov_len = sizeof(tid_fd); | |
| 174 iov[4].iov_base = &uptime; | |
| 175 iov[4].iov_len = sizeof(uptime); | |
| 176 iov[5].iov_base = &oom_size; | |
| 177 iov[5].iov_len = sizeof(oom_size); | |
| 178 iov[6].iov_base = serialized_crash_keys; | |
| 179 iov[6].iov_len = crash_keys_size; | |
| 180 #if defined(ADDRESS_SANITIZER) | |
| 181 iov[7].iov_base = asan_report_str_; | |
| 182 iov[7].iov_len = kMaxAsanReportSize + 1; | |
| 183 #endif | |
| 184 msg.msg_iov = iov; | |
| 185 msg.msg_iovlen = kCrashIovSize; | |
| 186 msg.msg_control = control; | |
| 187 msg.msg_controllen = kControlMsgSize; | |
| 188 | |
| 189 const ssize_t msg_size = HANDLE_EINTR(recvmsg(browser_socket_, &msg, 0)); | |
| 190 if (msg_size != expected_msg_size) { | |
| 191 LOG(ERROR) << "Error reading from death signal socket. Crash dumping" | |
| 192 << " is disabled." | |
| 193 << " msg_size:" << msg_size | |
| 194 << " errno:" << errno; | |
| 195 file_descriptor_watcher_.StopWatchingFileDescriptor(); | |
| 196 return; | |
| 197 } | |
| 198 | |
| 199 if (msg.msg_controllen != kControlMsgSize || | |
| 200 msg.msg_flags & ~MSG_TRUNC) { | |
| 201 LOG(ERROR) << "Received death signal message with the wrong size;" | |
| 202 << " msg.msg_controllen:" << msg.msg_controllen | |
| 203 << " msg.msg_flags:" << msg.msg_flags | |
| 204 << " kCrashContextSize:" << kCrashContextSize | |
| 205 << " kControlMsgSize:" << kControlMsgSize; | |
| 206 return; | |
| 207 } | |
| 208 | |
| 209 // Walk the control payload an extract the file descriptor and validated pid. | |
| 210 pid_t crashing_pid = -1; | |
| 211 int partner_fd = -1; | |
| 212 int signal_fd = -1; | |
| 213 for (struct cmsghdr *hdr = CMSG_FIRSTHDR(&msg); hdr; | |
| 214 hdr = CMSG_NXTHDR(&msg, hdr)) { | |
| 215 if (hdr->cmsg_level != SOL_SOCKET) | |
| 216 continue; | |
| 217 if (hdr->cmsg_type == SCM_RIGHTS) { | |
| 218 const unsigned len = hdr->cmsg_len - | |
| 219 (((uint8_t*)CMSG_DATA(hdr)) - (uint8_t*)hdr); | |
| 220 DCHECK_EQ(len % sizeof(int), 0u); | |
| 221 const unsigned num_fds = len / sizeof(int); | |
| 222 if (num_fds != 2) { | |
| 223 // A nasty process could try and send us too many descriptors and | |
| 224 // force a leak. | |
| 225 LOG(ERROR) << "Death signal contained wrong number of descriptors;" | |
| 226 << " num_fds:" << num_fds; | |
| 227 for (unsigned i = 0; i < num_fds; ++i) | |
| 228 (void) HANDLE_EINTR(close(reinterpret_cast<int*>(CMSG_DATA(hdr))[i])); | |
| 229 return; | |
| 230 } else { | |
| 231 partner_fd = reinterpret_cast<int*>(CMSG_DATA(hdr))[0]; | |
| 232 signal_fd = reinterpret_cast<int*>(CMSG_DATA(hdr))[1]; | |
| 233 } | |
| 234 } else if (hdr->cmsg_type == SCM_CREDENTIALS) { | |
| 235 const struct ucred *cred = | |
| 236 reinterpret_cast<struct ucred*>(CMSG_DATA(hdr)); | |
| 237 crashing_pid = cred->pid; | |
| 238 } | |
| 239 } | |
| 240 | |
| 241 if (crashing_pid == -1 || partner_fd == -1 || signal_fd == -1) { | |
| 242 LOG(ERROR) << "Death signal message didn't contain all expected control" | |
| 243 << " messages"; | |
| 244 if (partner_fd >= 0) | |
| 245 (void) HANDLE_EINTR(close(partner_fd)); | |
| 246 if (signal_fd >= 0) | |
| 247 (void) HANDLE_EINTR(close(signal_fd)); | |
| 248 return; | |
| 249 } | |
| 250 | |
| 251 // Kernel bug workaround (broken in 2.6.30 and 2.6.32, working in 2.6.38). | |
| 252 // The kernel doesn't translate PIDs in SCM_CREDENTIALS across PID | |
| 253 // namespaces. Thus |crashing_pid| might be garbage from our point of view. | |
| 254 // In the future we can remove this workaround, but we have to wait a couple | |
| 255 // of years to be sure that it's worked its way out into the world. | |
| 256 // TODO(thestig) Remove the workaround when Ubuntu Lucid is deprecated. | |
| 257 | |
| 258 // The crashing process closes its copy of the signal_fd immediately after | |
| 259 // calling sendmsg(). We can thus not reliably look for with with | |
| 260 // FindProcessHoldingSocket(). But by necessity, it has to keep the | |
| 261 // partner_fd open until the crashdump is complete. | |
| 262 ino_t inode_number; | |
| 263 if (!base::FileDescriptorGetInode(&inode_number, partner_fd)) { | |
| 264 LOG(WARNING) << "Failed to get inode number for passed socket"; | |
| 265 (void) HANDLE_EINTR(close(partner_fd)); | |
| 266 (void) HANDLE_EINTR(close(signal_fd)); | |
| 267 return; | |
| 268 } | |
| 269 (void) HANDLE_EINTR(close(partner_fd)); | |
| 270 | |
| 271 pid_t actual_crashing_pid = -1; | |
| 272 if (!base::FindProcessHoldingSocket(&actual_crashing_pid, inode_number)) { | |
| 273 LOG(WARNING) << "Failed to find process holding other end of crash reply " | |
| 274 "socket"; | |
| 275 (void) HANDLE_EINTR(close(signal_fd)); | |
| 276 return; | |
| 277 } | |
| 278 | |
| 279 crashing_pid = actual_crashing_pid; | |
| 280 | |
| 281 // The crashing TID set inside the compromised context via | |
| 282 // sys_gettid() in ExceptionHandler::HandleSignal might be wrong (if | |
| 283 // the kernel supports PID namespacing) and may need to be | |
| 284 // translated. | |
| 285 // | |
| 286 // We expect the crashing thread to be in sys_read(), waiting for us to | |
| 287 // write to |signal_fd|. Most newer kernels where we have the different pid | |
| 288 // namespaces also have /proc/[pid]/syscall, so we can look through | |
| 289 // |actual_crashing_pid|'s thread group and find the thread that's in the | |
| 290 // read syscall with the right arguments. | |
| 291 | |
| 292 std::string expected_syscall_data; | |
| 293 // /proc/[pid]/syscall is formatted as follows: | |
| 294 // syscall_number arg1 ... arg6 sp pc | |
| 295 // but we just check syscall_number through arg3. | |
| 296 base::StringAppendF(&expected_syscall_data, "%d 0x%x %p 0x1 ", | |
| 297 SYS_read, tid_fd, tid_buf_addr); | |
| 298 bool syscall_supported = false; | |
| 299 pid_t crashing_tid = | |
| 300 base::FindThreadIDWithSyscall(crashing_pid, | |
| 301 expected_syscall_data, | |
| 302 &syscall_supported); | |
| 303 if (crashing_tid == -1) { | |
| 304 // We didn't find the thread we want. Maybe it didn't reach | |
| 305 // sys_read() yet or the thread went away. We'll just take a | |
| 306 // guess here and assume the crashing thread is the thread group | |
| 307 // leader. If procfs syscall is not supported by the kernel, then | |
| 308 // we assume the kernel also does not support TID namespacing and | |
| 309 // trust the TID passed by the crashing process. | |
| 310 LOG(WARNING) << "Could not translate tid - assuming crashing thread is " | |
| 311 "thread group leader; syscall_supported=" << syscall_supported; | |
| 312 crashing_tid = crashing_pid; | |
| 313 } | |
| 314 | |
| 315 ExceptionHandler::CrashContext* bad_context = | |
| 316 reinterpret_cast<ExceptionHandler::CrashContext*>(crash_context); | |
| 317 bad_context->tid = crashing_tid; | |
| 318 | |
| 319 // Freed in CrashDumpTask(); | |
| 320 BreakpadInfo* info = new BreakpadInfo; | |
| 321 | |
| 322 info->fd = -1; | |
| 323 info->process_type_length = process_type_.length(); | |
| 324 char* process_type_str = new char[info->process_type_length + 1]; | |
| 325 process_type_.copy(process_type_str, info->process_type_length); | |
| 326 process_type_str[info->process_type_length] = '\0'; | |
| 327 info->process_type = process_type_str; | |
| 328 | |
| 329 info->distro_length = strlen(distro); | |
| 330 info->distro = distro; | |
| 331 #if defined(OS_ANDROID) | |
| 332 // Nothing gets uploaded in android. | |
| 333 info->upload = false; | |
| 334 #else | |
| 335 info->upload = upload_; | |
| 336 #endif | |
| 337 | |
| 338 info->crash_keys = crash_keys; | |
| 339 | |
| 340 #if defined(ADDRESS_SANITIZER) | |
| 341 info->asan_report_str = asan_report_str_; | |
| 342 info->asan_report_length = strlen(asan_report_str_); | |
| 343 #endif | |
| 344 info->process_start_time = uptime; | |
| 345 info->oom_size = oom_size; | |
| 346 | |
| 347 BrowserThread::GetBlockingPool()->PostSequencedWorkerTask( | |
| 348 worker_pool_token_, | |
| 349 FROM_HERE, | |
| 350 base::Bind(&CrashHandlerHostLinux::WriteDumpFile, | |
| 351 base::Unretained(this), | |
| 352 info, | |
| 353 crashing_pid, | |
| 354 crash_context, | |
| 355 signal_fd)); | |
| 356 } | |
| 357 | |
| 358 void CrashHandlerHostLinux::WriteDumpFile(BreakpadInfo* info, | |
| 359 pid_t crashing_pid, | |
| 360 char* crash_context, | |
| 361 int signal_fd) { | |
| 362 DCHECK(BrowserThread::GetBlockingPool()->IsRunningSequenceOnCurrentThread( | |
| 363 worker_pool_token_)); | |
| 364 | |
| 365 base::FilePath dumps_path("/tmp"); | |
| 366 PathService::Get(base::DIR_TEMP, &dumps_path); | |
| 367 if (!info->upload) | |
| 368 dumps_path = dumps_path_; | |
| 369 const uint64 rand = base::RandUint64(); | |
| 370 const std::string minidump_filename = | |
| 371 base::StringPrintf("%s/chromium-%s-minidump-%016" PRIx64 ".dmp", | |
| 372 dumps_path.value().c_str(), | |
| 373 process_type_.c_str(), | |
| 374 rand); | |
| 375 | |
| 376 if (!google_breakpad::WriteMinidump(minidump_filename.c_str(), | |
| 377 kMaxMinidumpFileSize, | |
| 378 crashing_pid, crash_context, | |
| 379 kCrashContextSize, | |
| 380 google_breakpad::MappingList(), | |
| 381 google_breakpad::AppMemoryList())) { | |
| 382 LOG(ERROR) << "Failed to write crash dump for pid " << crashing_pid; | |
| 383 } | |
| 384 #if defined(ADDRESS_SANITIZER) | |
| 385 // Create a temporary file holding the AddressSanitizer report. | |
| 386 const std::string log_filename = | |
| 387 base::StringPrintf("%s/chromium-%s-minidump-%016" PRIx64 ".log", | |
| 388 dumps_path.value().c_str(), | |
| 389 process_type_.c_str(), | |
| 390 rand); | |
| 391 FILE* logfile = fopen(log_filename.c_str(), "w"); | |
| 392 CHECK(logfile); | |
| 393 fprintf(logfile, "%s", asan_report_str_); | |
| 394 fclose(logfile); | |
| 395 #endif | |
| 396 | |
| 397 delete[] crash_context; | |
| 398 | |
| 399 // Freed in CrashDumpTask(); | |
| 400 char* minidump_filename_str = new char[minidump_filename.length() + 1]; | |
| 401 minidump_filename.copy(minidump_filename_str, minidump_filename.length()); | |
| 402 minidump_filename_str[minidump_filename.length()] = '\0'; | |
| 403 info->filename = minidump_filename_str; | |
| 404 #if defined(ADDRESS_SANITIZER) | |
| 405 char* minidump_log_filename_str = new char[minidump_filename.length() + 1]; | |
| 406 minidump_filename.copy(minidump_log_filename_str, minidump_filename.length()); | |
| 407 memcpy(minidump_log_filename_str + minidump_filename.length() - 3, "log", 3); | |
| 408 minidump_log_filename_str[minidump_filename.length()] = '\0'; | |
| 409 info->log_filename = minidump_log_filename_str; | |
| 410 #endif | |
| 411 info->pid = crashing_pid; | |
| 412 | |
| 413 BrowserThread::PostTask( | |
| 414 BrowserThread::IO, FROM_HERE, | |
| 415 base::Bind(&CrashHandlerHostLinux::QueueCrashDumpTask, | |
| 416 base::Unretained(this), | |
| 417 info, | |
| 418 signal_fd)); | |
| 419 } | |
| 420 | |
| 421 void CrashHandlerHostLinux::QueueCrashDumpTask(BreakpadInfo* info, | |
| 422 int signal_fd) { | |
| 423 DCHECK(BrowserThread::CurrentlyOn(BrowserThread::IO)); | |
| 424 | |
| 425 // Send the done signal to the process: it can exit now. | |
| 426 struct msghdr msg = {0}; | |
| 427 struct iovec done_iov; | |
| 428 done_iov.iov_base = const_cast<char*>("\x42"); | |
| 429 done_iov.iov_len = 1; | |
| 430 msg.msg_iov = &done_iov; | |
| 431 msg.msg_iovlen = 1; | |
| 432 | |
| 433 (void) HANDLE_EINTR(sendmsg(signal_fd, &msg, MSG_DONTWAIT | MSG_NOSIGNAL)); | |
| 434 (void) HANDLE_EINTR(close(signal_fd)); | |
| 435 | |
| 436 uploader_thread_->message_loop()->PostTask( | |
| 437 FROM_HERE, | |
| 438 base::Bind(&CrashDumpTask, base::Unretained(this), info)); | |
| 439 } | |
| 440 | |
| 441 void CrashHandlerHostLinux::WillDestroyCurrentMessageLoop() { | |
| 442 file_descriptor_watcher_.StopWatchingFileDescriptor(); | |
| 443 | |
| 444 // If we are quitting and there are crash dumps in the queue, turn them into | |
| 445 // no-ops. | |
| 446 shutting_down_ = true; | |
| 447 uploader_thread_->Stop(); | |
| 448 } | |
| 449 | |
| 450 bool CrashHandlerHostLinux::IsShuttingDown() const { | |
| 451 return shutting_down_; | |
| 452 } | |
| OLD | NEW |