OLD | NEW |
(Empty) | |
| 1 // Copyright (c) 2012 The Chromium Authors. All rights reserved. |
| 2 // Use of this source code is governed by a BSD-style license that can be |
| 3 // found in the LICENSE file. |
| 4 |
| 5 #include "chrome/app/image_pre_reader_win.h" |
| 6 |
| 7 #include <windows.h> |
| 8 #include <algorithm> |
| 9 #include <limits> |
| 10 #include <vector> |
| 11 |
| 12 #include "base/logging.h" |
| 13 #include "base/memory/scoped_ptr.h" |
| 14 #include "base/threading/thread_restrictions.h" |
| 15 #include "base/win/pe_image.h" |
| 16 #include "base/win/scoped_handle.h" |
| 17 #include "base/win/windows_version.h" |
| 18 |
| 19 namespace { |
| 20 |
| 21 // The minimum buffer size to allocate when reading the PE file headers. |
| 22 // |
| 23 // The PE file headers usually fit into a single 1KB page, and a PE file must |
| 24 // at least contain the initial page with the headers. That said, as long as |
| 25 // we expect at least sizeof(IMAGE_DOS_HEADER) bytes, we're ok. |
| 26 const size_t kMinHeaderBufferSize = 0x400; |
| 27 |
| 28 // A handy symbolic constant. |
| 29 const size_t kOneHundredPercent = 100; |
| 30 |
| 31 static_assert(kMinHeaderBufferSize >= sizeof(IMAGE_DOS_HEADER), |
| 32 "kMinHeaderBufferSize must be at least as big as the dos header"); |
| 33 |
| 34 // This struct provides a deallocation functor for use with scoped_ptr<T> |
| 35 // allocated with ::VirtualAlloc(). |
| 36 struct VirtualFreeDeleter { |
| 37 void operator() (void* ptr) { |
| 38 ::VirtualFree(ptr, 0, MEM_RELEASE); |
| 39 } |
| 40 }; |
| 41 |
| 42 // A wrapper for the Win32 ::SetFilePointer() function with some error checking. |
| 43 bool SetFilePointer(HANDLE file_handle, size_t position) { |
| 44 return position <= static_cast<size_t>(std::numeric_limits<LONG>::max()) && |
| 45 ::SetFilePointer(file_handle, |
| 46 static_cast<LONG>(position), |
| 47 NULL, |
| 48 FILE_BEGIN) != INVALID_SET_FILE_POINTER; |
| 49 } |
| 50 |
| 51 // A helper function to read the next |bytes_to_read| bytes from the file |
| 52 // given by |file_handle| into |buffer|. |
| 53 bool ReadNextBytes(HANDLE file_handle, void* buffer, size_t bytes_to_read) { |
| 54 DCHECK(file_handle != INVALID_HANDLE_VALUE); |
| 55 DCHECK(buffer != NULL); |
| 56 DCHECK(bytes_to_read > 0); |
| 57 |
| 58 DWORD bytes_read = 0; |
| 59 return bytes_to_read <= std::numeric_limits<DWORD>::max() && |
| 60 ::ReadFile(file_handle, |
| 61 buffer, |
| 62 static_cast<DWORD>(bytes_to_read), |
| 63 &bytes_read, |
| 64 NULL) && |
| 65 bytes_read == bytes_to_read; |
| 66 } |
| 67 |
| 68 // A helper function to extend the |current_buffer| of bytes such that it |
| 69 // contains |desired_length| bytes read from the file given by |file_handle|. |
| 70 // |
| 71 // It is assumed that |file_handle| has been used to sequentially populate |
| 72 // |current_buffer| thus far and is already positioned at the appropriate |
| 73 // read location. |
| 74 bool ReadMissingBytes(HANDLE file_handle, |
| 75 std::vector<uint8>* current_buffer, |
| 76 size_t desired_length) { |
| 77 DCHECK(file_handle != INVALID_HANDLE_VALUE); |
| 78 DCHECK(current_buffer != NULL); |
| 79 |
| 80 size_t current_length = current_buffer->size(); |
| 81 if (current_length >= desired_length) |
| 82 return true; |
| 83 |
| 84 size_t bytes_to_read = desired_length - current_length; |
| 85 current_buffer->resize(desired_length); |
| 86 return ReadNextBytes(file_handle, |
| 87 &(current_buffer->at(current_length)), |
| 88 bytes_to_read); |
| 89 } |
| 90 |
| 91 // Return a |percentage| of the number of initialized bytes in the given |
| 92 // |section|. |
| 93 // |
| 94 // This returns a percentage of the lesser of the size of the raw data in |
| 95 // the section and the virtual size of the section. |
| 96 // |
| 97 // Note that sections can have their tails implicitly initialized to zero |
| 98 // (i.e., their virtual size is larger than the raw size) and that raw data |
| 99 // is padded to the PE page size if the entire section is initialized (i.e., |
| 100 // their raw data size will be larger than the virtual size). |
| 101 // |
| 102 // Any data after the initialized portion of the section will be soft-faulted |
| 103 // in (very quickly) as needed, so we don't need to include it in the returned |
| 104 // length. |
| 105 size_t GetPercentageOfSectionLength(const IMAGE_SECTION_HEADER* section, |
| 106 size_t percentage) { |
| 107 DCHECK(section != NULL); |
| 108 DCHECK_GT(percentage, 0u); |
| 109 DCHECK_LE(percentage, kOneHundredPercent); |
| 110 |
| 111 size_t initialized_length = std::min(section->SizeOfRawData, |
| 112 section->Misc.VirtualSize); |
| 113 |
| 114 if (initialized_length == 0) |
| 115 return 0; |
| 116 |
| 117 size_t length = (initialized_length * percentage) / kOneHundredPercent; |
| 118 |
| 119 return std::max<size_t>(length, 1); |
| 120 } |
| 121 |
| 122 // Helper function to read through a |percentage| of the given |section| |
| 123 // of the file denoted by |file_handle|. The |temp_buffer| is (re)used as |
| 124 // a transient storage area as the section is read in chunks of |
| 125 // |temp_buffer_size| bytes. |
| 126 bool ReadThroughSection(HANDLE file_handle, |
| 127 const IMAGE_SECTION_HEADER* section, |
| 128 size_t percentage, |
| 129 void* temp_buffer, |
| 130 size_t temp_buffer_size) { |
| 131 DCHECK(file_handle != INVALID_HANDLE_VALUE); |
| 132 DCHECK(section != NULL); |
| 133 DCHECK_LE(percentage, kOneHundredPercent); |
| 134 DCHECK(temp_buffer != NULL); |
| 135 DCHECK(temp_buffer_size > 0); |
| 136 |
| 137 size_t bytes_to_read = GetPercentageOfSectionLength(section, percentage); |
| 138 if (bytes_to_read == 0) |
| 139 return true; |
| 140 |
| 141 if (!SetFilePointer(file_handle, section->PointerToRawData)) |
| 142 return false; |
| 143 |
| 144 // Read all chunks except the last one. |
| 145 while (bytes_to_read > temp_buffer_size) { |
| 146 if (!ReadNextBytes(file_handle, temp_buffer, temp_buffer_size)) |
| 147 return false; |
| 148 bytes_to_read -= temp_buffer_size; |
| 149 } |
| 150 |
| 151 // Read the last (possibly partial) chunk and return. |
| 152 DCHECK(bytes_to_read > 0); |
| 153 DCHECK(bytes_to_read <= temp_buffer_size); |
| 154 return ReadNextBytes(file_handle, temp_buffer, bytes_to_read); |
| 155 } |
| 156 |
| 157 // A helper function to touch all pages in the range |
| 158 // [base_addr, base_addr + length). |
| 159 void TouchPagesInRange(void* base_addr, size_t length) { |
| 160 DCHECK(base_addr != NULL); |
| 161 DCHECK(length > 0); |
| 162 |
| 163 // Get the system info so we know the page size. Also, make sure we use a |
| 164 // non-zero value for the page size; GetSystemInfo() is hookable/patchable, |
| 165 // and you never know what shenanigans someone could get up to. |
| 166 SYSTEM_INFO system_info = {}; |
| 167 GetSystemInfo(&system_info); |
| 168 if (system_info.dwPageSize == 0) |
| 169 system_info.dwPageSize = 4096; |
| 170 |
| 171 // We don't want to read outside the byte range (which could trigger an |
| 172 // access violation), so let's figure out the exact locations of the first |
| 173 // and final bytes we want to read. |
| 174 volatile uint8* touch_ptr = reinterpret_cast<uint8*>(base_addr); |
| 175 volatile uint8* final_touch_ptr = touch_ptr + length - 1; |
| 176 |
| 177 // Read the memory in the range [touch_ptr, final_touch_ptr] with a stride |
| 178 // of the system page size, to ensure that it's been paged in. |
| 179 uint8 dummy; |
| 180 while (touch_ptr < final_touch_ptr) { |
| 181 dummy = *touch_ptr; |
| 182 touch_ptr += system_info.dwPageSize; |
| 183 } |
| 184 dummy = *final_touch_ptr; |
| 185 } |
| 186 |
| 187 } // namespace |
| 188 |
| 189 bool ImagePreReader::PartialPreReadImageOnDisk(const wchar_t* file_path, |
| 190 size_t percentage, |
| 191 size_t max_chunk_size) { |
| 192 // TODO(rogerm): change this to have the number of bytes pre-read per |
| 193 // section be driven by a static table within the PE file (defaulting to |
| 194 // full read if it's not there?) that's initialized by the optimization |
| 195 // toolchain. |
| 196 DCHECK(file_path != NULL); |
| 197 |
| 198 if (percentage == 0) |
| 199 return true; |
| 200 |
| 201 if (percentage > kOneHundredPercent) |
| 202 percentage = kOneHundredPercent; |
| 203 |
| 204 // Validate/setup max_chunk_size, imposing a 1MB minimum on the chunk size. |
| 205 const size_t kMinChunkSize = 1024 * 1024; |
| 206 max_chunk_size = std::max(max_chunk_size, kMinChunkSize); |
| 207 |
| 208 // Open the file. |
| 209 base::win::ScopedHandle file( |
| 210 CreateFile(file_path, |
| 211 GENERIC_READ, |
| 212 FILE_SHARE_READ | FILE_SHARE_WRITE | FILE_SHARE_DELETE, |
| 213 NULL, |
| 214 OPEN_EXISTING, |
| 215 FILE_FLAG_SEQUENTIAL_SCAN, |
| 216 NULL)); |
| 217 |
| 218 if (!file.IsValid()) |
| 219 return false; |
| 220 |
| 221 // Allocate a resizable buffer for the headers. We initially reserve as much |
| 222 // space as we typically see as the header size for chrome.dll and other |
| 223 // PE images. |
| 224 std::vector<uint8> headers; |
| 225 headers.reserve(kMinHeaderBufferSize); |
| 226 |
| 227 // Read, hopefully, all of the headers. |
| 228 if (!ReadMissingBytes(file.Get(), &headers, kMinHeaderBufferSize)) |
| 229 return false; |
| 230 |
| 231 // The DOS header starts at offset 0 and allows us to get the offset of the |
| 232 // NT headers. Let's ensure we've read enough to capture the NT headers. |
| 233 size_t nt_headers_start = |
| 234 reinterpret_cast<IMAGE_DOS_HEADER*>(&headers[0])->e_lfanew; |
| 235 size_t nt_headers_end = nt_headers_start + sizeof(IMAGE_NT_HEADERS); |
| 236 if (!ReadMissingBytes(file.Get(), &headers, nt_headers_end)) |
| 237 return false; |
| 238 |
| 239 // Now that we've got the NT headers we can get the total header size, |
| 240 // including all of the section headers. Let's ensure we've read enough |
| 241 // to capture all of the header data. |
| 242 size_t size_of_headers = reinterpret_cast<IMAGE_NT_HEADERS*>( |
| 243 &headers[nt_headers_start])->OptionalHeader.SizeOfHeaders; |
| 244 if (!ReadMissingBytes(file.Get(), &headers, size_of_headers)) |
| 245 return false; |
| 246 |
| 247 // Now we have all of the headers. This is enough to let us use the PEImage |
| 248 // wrapper to query the structure of the image. |
| 249 base::win::PEImage pe_image(reinterpret_cast<HMODULE>(&headers[0])); |
| 250 CHECK(pe_image.VerifyMagic()); |
| 251 |
| 252 // Allocate a buffer to hold the pre-read bytes. |
| 253 scoped_ptr<uint8, VirtualFreeDeleter> buffer( |
| 254 static_cast<uint8*>( |
| 255 ::VirtualAlloc(NULL, max_chunk_size, MEM_COMMIT, PAGE_READWRITE))); |
| 256 if (buffer.get() == NULL) |
| 257 return false; |
| 258 |
| 259 // Iterate over each section, reading in a percentage of each. |
| 260 const IMAGE_SECTION_HEADER* section = NULL; |
| 261 for (UINT i = 0; (section = pe_image.GetSectionHeader(i)) != NULL; ++i) { |
| 262 CHECK_LE(reinterpret_cast<const uint8*>(section + 1), |
| 263 &headers[0] + headers.size()); |
| 264 if (!ReadThroughSection(file.Get(), section, percentage, buffer.get(), |
| 265 max_chunk_size)) { |
| 266 return false; |
| 267 } |
| 268 } |
| 269 |
| 270 // We're done. |
| 271 return true; |
| 272 } |
| 273 |
| 274 bool ImagePreReader::PartialPreReadImageInMemory(const wchar_t* file_path, |
| 275 size_t percentage) { |
| 276 // TODO(rogerm): change this to have the number of bytes pre-read per |
| 277 // section be driven by a static table within the PE file (defaulting to |
| 278 // full read if it's not there?) that's initialized by the optimization |
| 279 // toolchain. |
| 280 DCHECK(file_path != NULL); |
| 281 |
| 282 if (percentage == 0) |
| 283 return true; |
| 284 |
| 285 if (percentage > kOneHundredPercent) |
| 286 percentage = kOneHundredPercent; |
| 287 |
| 288 HMODULE dll_module = ::LoadLibraryExW( |
| 289 file_path, |
| 290 NULL, |
| 291 LOAD_WITH_ALTERED_SEARCH_PATH | DONT_RESOLVE_DLL_REFERENCES); |
| 292 |
| 293 if (!dll_module) |
| 294 return false; |
| 295 |
| 296 base::win::PEImage pe_image(dll_module); |
| 297 CHECK(pe_image.VerifyMagic()); |
| 298 |
| 299 // Iterate over each section, stepping through a percentage of each to page |
| 300 // it in off the disk. |
| 301 const IMAGE_SECTION_HEADER* section = NULL; |
| 302 for (UINT i = 0; (section = pe_image.GetSectionHeader(i)) != NULL; ++i) { |
| 303 // Get the extent we want to touch. |
| 304 size_t length = GetPercentageOfSectionLength(section, percentage); |
| 305 if (length == 0) |
| 306 continue; |
| 307 uint8* start = |
| 308 static_cast<uint8*>(pe_image.RVAToAddr(section->VirtualAddress)); |
| 309 |
| 310 // Verify that the extent we're going to touch falls inside the section |
| 311 // we expect it to (and by implication, inside the pe_image). |
| 312 CHECK_EQ(section, |
| 313 pe_image.GetImageSectionFromAddr(start)); |
| 314 CHECK_EQ(section, |
| 315 pe_image.GetImageSectionFromAddr(start + length - 1)); |
| 316 |
| 317 // Page in the section range. |
| 318 TouchPagesInRange(start, length); |
| 319 } |
| 320 |
| 321 FreeLibrary(dll_module); |
| 322 |
| 323 return true; |
| 324 } |
| 325 |
| 326 bool ImagePreReader::PreReadImage(const wchar_t* file_path, |
| 327 size_t size_to_read, |
| 328 size_t step_size) { |
| 329 base::ThreadRestrictions::AssertIOAllowed(); |
| 330 if (base::win::GetVersion() > base::win::VERSION_XP) { |
| 331 // Vista+ branch. On these OSes, the forced reads through the DLL actually |
| 332 // slows warm starts. The solution is to sequentially read file contents |
| 333 // with an optional cap on total amount to read. |
| 334 base::win::ScopedHandle file( |
| 335 CreateFile(file_path, |
| 336 GENERIC_READ, |
| 337 FILE_SHARE_READ | FILE_SHARE_WRITE | FILE_SHARE_DELETE, |
| 338 NULL, |
| 339 OPEN_EXISTING, |
| 340 FILE_FLAG_SEQUENTIAL_SCAN, |
| 341 NULL)); |
| 342 |
| 343 if (!file.IsValid()) |
| 344 return false; |
| 345 |
| 346 // Default to 1MB sequential reads. |
| 347 const DWORD actual_step_size = std::max(static_cast<DWORD>(step_size), |
| 348 static_cast<DWORD>(1024*1024)); |
| 349 LPVOID buffer = ::VirtualAlloc(NULL, |
| 350 actual_step_size, |
| 351 MEM_COMMIT, |
| 352 PAGE_READWRITE); |
| 353 |
| 354 if (buffer == NULL) |
| 355 return false; |
| 356 |
| 357 DWORD len; |
| 358 size_t total_read = 0; |
| 359 while (::ReadFile(file.Get(), buffer, actual_step_size, &len, NULL) && |
| 360 len > 0 && |
| 361 (size_to_read ? total_read < size_to_read : true)) { |
| 362 total_read += static_cast<size_t>(len); |
| 363 } |
| 364 ::VirtualFree(buffer, 0, MEM_RELEASE); |
| 365 } else { |
| 366 // WinXP branch. Here, reading the DLL from disk doesn't do |
| 367 // what we want so instead we pull the pages into memory by loading |
| 368 // the DLL and touching pages at a stride. We use the system's page |
| 369 // size as the stride, ignoring the passed in step_size, to make sure |
| 370 // each page in the range is touched. |
| 371 HMODULE dll_module = ::LoadLibraryExW( |
| 372 file_path, |
| 373 NULL, |
| 374 LOAD_WITH_ALTERED_SEARCH_PATH | DONT_RESOLVE_DLL_REFERENCES); |
| 375 |
| 376 if (!dll_module) |
| 377 return false; |
| 378 |
| 379 base::win::PEImage pe_image(dll_module); |
| 380 CHECK(pe_image.VerifyMagic()); |
| 381 |
| 382 // We don't want to read past the end of the module (which could trigger |
| 383 // an access violation), so make sure to check the image size. |
| 384 PIMAGE_NT_HEADERS nt_headers = pe_image.GetNTHeaders(); |
| 385 size_t dll_module_length = std::min( |
| 386 size_to_read ? size_to_read : ~0, |
| 387 static_cast<size_t>(nt_headers->OptionalHeader.SizeOfImage)); |
| 388 |
| 389 // Page in then release the module. |
| 390 TouchPagesInRange(dll_module, dll_module_length); |
| 391 FreeLibrary(dll_module); |
| 392 } |
| 393 |
| 394 return true; |
| 395 } |
| 396 |
| 397 bool ImagePreReader::PartialPreReadImage(const wchar_t* file_path, |
| 398 size_t percentage, |
| 399 size_t max_chunk_size) { |
| 400 base::ThreadRestrictions::AssertIOAllowed(); |
| 401 |
| 402 if (percentage >= kOneHundredPercent) { |
| 403 // If we're reading the whole image, we don't need to parse headers and |
| 404 // navigate sections, the basic PreReadImage() can be used to just step |
| 405 // blindly through the entire file / address-space. |
| 406 return PreReadImage(file_path, 0, max_chunk_size); |
| 407 } |
| 408 |
| 409 if (base::win::GetVersion() > base::win::VERSION_XP) { |
| 410 // Vista+ branch. On these OSes, we warm up the Image by reading its |
| 411 // file off the disk. |
| 412 return PartialPreReadImageOnDisk(file_path, percentage, max_chunk_size); |
| 413 } |
| 414 |
| 415 // WinXP branch. For XP, reading the image from disk doesn't do what we want |
| 416 // so instead we pull the pages into memory by loading the DLL and touching |
| 417 // initialized pages at a stride. |
| 418 return PartialPreReadImageInMemory(file_path, percentage); |
| 419 } |
OLD | NEW |