// Copyright (c) 2012 The Chromium Authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. #include "chrome/app/image_pre_reader_win.h" #include <windows.h> #include <algorithm> #include <limits> #include <vector> #include "base/logging.h" #include "base/memory/scoped_ptr.h" #include "base/threading/thread_restrictions.h" #include "base/win/pe_image.h" #include "base/win/scoped_handle.h" #include "base/win/windows_version.h" namespace { // The minimum buffer size to allocate when reading the PE file headers. // // The PE file headers usually fit into a single 1KB page, and a PE file must // at least contain the initial page with the headers. That said, as long as // we expect at least sizeof(IMAGE_DOS_HEADER) bytes, we're ok. const size_t kMinHeaderBufferSize = 0x400; // A handy symbolic constant. const size_t kOneHundredPercent = 100; void StaticAssertions() { COMPILE_ASSERT(kMinHeaderBufferSize >= sizeof(IMAGE_DOS_HEADER), min_header_buffer_size_at_least_as_big_as_the_dos_header); } // This struct provides a deallocation functor for use with scoped_ptr<T> // allocated with ::VirtualAlloc(). struct ScopedPtrVirtualFree { void operator() (void* ptr) { ::VirtualFree(ptr, 0, MEM_RELEASE); } }; // A wrapper for the Win32 ::SetFilePointer() function with some error checking. bool SetFilePointer(HANDLE file_handle, size_t position) { return position <= static_cast<size_t>(std::numeric_limits<LONG>::max()) && ::SetFilePointer(file_handle, static_cast<LONG>(position), NULL, FILE_BEGIN) != INVALID_SET_FILE_POINTER; } // A helper function to read the next |bytes_to_read| bytes from the file // given by |file_handle| into |buffer|. bool ReadNextBytes(HANDLE file_handle, void* buffer, size_t bytes_to_read) { DCHECK(file_handle != INVALID_HANDLE_VALUE); DCHECK(buffer != NULL); DCHECK(bytes_to_read > 0); DWORD bytes_read = 0; return bytes_to_read <= std::numeric_limits<DWORD>::max() && ::ReadFile(file_handle, buffer, static_cast<DWORD>(bytes_to_read), &bytes_read, NULL) && bytes_read == bytes_to_read; } // A helper function to extend the |current_buffer| of bytes such that it // contains |desired_length| bytes read from the file given by |file_handle|. // // It is assumed that |file_handle| has been used to sequentially populate // |current_buffer| thus far and is already positioned at the appropriate // read location. bool ReadMissingBytes(HANDLE file_handle, std::vector<uint8>* current_buffer, size_t desired_length) { DCHECK(file_handle != INVALID_HANDLE_VALUE); DCHECK(current_buffer != NULL); size_t current_length = current_buffer->size(); if (current_length >= desired_length) return true; size_t bytes_to_read = desired_length - current_length; current_buffer->resize(desired_length); return ReadNextBytes(file_handle, &(current_buffer->at(current_length)), bytes_to_read); } // Return a |percentage| of the number of initialized bytes in the given // |section|. // // This returns a percentage of the lesser of the size of the raw data in // the section and the virtual size of the section. // // Note that sections can have their tails implicitly initialized to zero // (i.e., their virtual size is larger than the raw size) and that raw data // is padded to the PE page size if the entire section is initialized (i.e., // their raw data size will be larger than the virtual size). // // Any data after the initialized portion of the section will be soft-faulted // in (very quickly) as needed, so we don't need to include it in the returned // length. size_t GetPercentageOfSectionLength(const IMAGE_SECTION_HEADER* section, size_t percentage) { DCHECK(section != NULL); DCHECK_GT(percentage, 0u); DCHECK_LE(percentage, kOneHundredPercent); size_t initialized_length = std::min(section->SizeOfRawData, section->Misc.VirtualSize); if (initialized_length == 0) return 0; size_t length = (initialized_length * percentage) / kOneHundredPercent; return std::max<size_t>(length, 1); } // Helper function to read through a |percentage| of the given |section| // of the file denoted by |file_handle|. The |temp_buffer| is (re)used as // a transient storage area as the section is read in chunks of // |temp_buffer_size| bytes. bool ReadThroughSection(HANDLE file_handle, const IMAGE_SECTION_HEADER* section, size_t percentage, void* temp_buffer, size_t temp_buffer_size) { DCHECK(file_handle != INVALID_HANDLE_VALUE); DCHECK(section != NULL); DCHECK_LE(percentage, kOneHundredPercent); DCHECK(temp_buffer != NULL); DCHECK(temp_buffer_size > 0); size_t bytes_to_read = GetPercentageOfSectionLength(section, percentage); if (bytes_to_read == 0) return true; if (!SetFilePointer(file_handle, section->PointerToRawData)) return false; // Read all chunks except the last one. while (bytes_to_read > temp_buffer_size) { if (!ReadNextBytes(file_handle, temp_buffer, temp_buffer_size)) return false; bytes_to_read -= temp_buffer_size; } // Read the last (possibly partial) chunk and return. DCHECK(bytes_to_read > 0); DCHECK(bytes_to_read <= temp_buffer_size); return ReadNextBytes(file_handle, temp_buffer, bytes_to_read); } // A helper function to touch all pages in the range // [base_addr, base_addr + length). void TouchPagesInRange(void* base_addr, size_t length) { DCHECK(base_addr != NULL); DCHECK(length > 0); // Get the system info so we know the page size. Also, make sure we use a // non-zero value for the page size; GetSystemInfo() is hookable/patchable, // and you never know what shenanigans someone could get up to. SYSTEM_INFO system_info = {}; GetSystemInfo(&system_info); if (system_info.dwPageSize == 0) system_info.dwPageSize = 4096; // We don't want to read outside the byte range (which could trigger an // access violation), so let's figure out the exact locations of the first // and final bytes we want to read. volatile uint8* touch_ptr = reinterpret_cast<uint8*>(base_addr); volatile uint8* final_touch_ptr = touch_ptr + length - 1; // Read the memory in the range [touch_ptr, final_touch_ptr] with a stride // of the system page size, to ensure that it's been paged in. uint8 dummy; while (touch_ptr < final_touch_ptr) { dummy = *touch_ptr; touch_ptr += system_info.dwPageSize; } dummy = *final_touch_ptr; } } // namespace bool ImagePreReader::PartialPreReadImageOnDisk(const wchar_t* file_path, size_t percentage, size_t max_chunk_size) { // TODO(rogerm): change this to have the number of bytes pre-read per // section be driven by a static table within the PE file (defaulting to // full read if it's not there?) that's initialized by the optimization // toolchain. DCHECK(file_path != NULL); if (percentage == 0) return true; if (percentage > kOneHundredPercent) percentage = kOneHundredPercent; // Validate/setup max_chunk_size, imposing a 1MB minimum on the chunk size. const size_t kMinChunkSize = 1024 * 1024; max_chunk_size = std::max(max_chunk_size, kMinChunkSize); // Open the file. base::win::ScopedHandle file( CreateFile(file_path, GENERIC_READ, FILE_SHARE_READ | FILE_SHARE_WRITE | FILE_SHARE_DELETE, NULL, OPEN_EXISTING, FILE_FLAG_SEQUENTIAL_SCAN, NULL)); if (!file.IsValid()) return false; // Allocate a resizable buffer for the headers. We initially reserve as much // space as we typically see as the header size for chrome.dll and other // PE images. std::vector<uint8> headers; headers.reserve(kMinHeaderBufferSize); // Read, hopefully, all of the headers. if (!ReadMissingBytes(file, &headers, kMinHeaderBufferSize)) return false; // The DOS header starts at offset 0 and allows us to get the offset of the // NT headers. Let's ensure we've read enough to capture the NT headers. size_t nt_headers_start = reinterpret_cast<IMAGE_DOS_HEADER*>(&headers[0])->e_lfanew; size_t nt_headers_end = nt_headers_start + sizeof(IMAGE_NT_HEADERS); if (!ReadMissingBytes(file, &headers, nt_headers_end)) return false; // Now that we've got the NT headers we can get the total header size, // including all of the section headers. Let's ensure we've read enough // to capture all of the header data. size_t size_of_headers = reinterpret_cast<IMAGE_NT_HEADERS*>( &headers[nt_headers_start])->OptionalHeader.SizeOfHeaders; if (!ReadMissingBytes(file, &headers, size_of_headers)) return false; // Now we have all of the headers. This is enough to let us use the PEImage // wrapper to query the structure of the image. base::win::PEImage pe_image(reinterpret_cast<HMODULE>(&headers[0])); CHECK(pe_image.VerifyMagic()); // Allocate a buffer to hold the pre-read bytes. scoped_ptr_malloc<uint8, ScopedPtrVirtualFree> buffer( reinterpret_cast<uint8*>( ::VirtualAlloc(NULL, max_chunk_size, MEM_COMMIT, PAGE_READWRITE))); if (buffer.get() == NULL) return false; // Iterate over each section, reading in a percentage of each. const IMAGE_SECTION_HEADER* section = NULL; for (UINT i = 0; (section = pe_image.GetSectionHeader(i)) != NULL; ++i) { CHECK_LE(reinterpret_cast<const uint8*>(section + 1), &headers[0] + headers.size()); if (!ReadThroughSection( file, section, percentage, buffer.get(), max_chunk_size)) return false; } // We're done. return true; } bool ImagePreReader::PartialPreReadImageInMemory(const wchar_t* file_path, size_t percentage) { // TODO(rogerm): change this to have the number of bytes pre-read per // section be driven by a static table within the PE file (defaulting to // full read if it's not there?) that's initialized by the optimization // toolchain. DCHECK(file_path != NULL); if (percentage == 0) return true; if (percentage > kOneHundredPercent) percentage = kOneHundredPercent; HMODULE dll_module = ::LoadLibraryExW( file_path, NULL, LOAD_WITH_ALTERED_SEARCH_PATH | DONT_RESOLVE_DLL_REFERENCES); if (!dll_module) return false; base::win::PEImage pe_image(dll_module); CHECK(pe_image.VerifyMagic()); // Iterate over each section, stepping through a percentage of each to page // it in off the disk. const IMAGE_SECTION_HEADER* section = NULL; for (UINT i = 0; (section = pe_image.GetSectionHeader(i)) != NULL; ++i) { // Get the extent we want to touch. size_t length = GetPercentageOfSectionLength(section, percentage); if (length == 0) continue; uint8* start = static_cast<uint8*>(pe_image.RVAToAddr(section->VirtualAddress)); // Verify that the extent we're going to touch falls inside the section // we expect it to (and by implication, inside the pe_image). CHECK_EQ(section, pe_image.GetImageSectionFromAddr(start)); CHECK_EQ(section, pe_image.GetImageSectionFromAddr(start + length - 1)); // Page in the section range. TouchPagesInRange(start, length); } FreeLibrary(dll_module); return true; } bool ImagePreReader::PreReadImage(const wchar_t* file_path, size_t size_to_read, size_t step_size) { base::ThreadRestrictions::AssertIOAllowed(); if (base::win::GetVersion() > base::win::VERSION_XP) { // Vista+ branch. On these OSes, the forced reads through the DLL actually // slows warm starts. The solution is to sequentially read file contents // with an optional cap on total amount to read. base::win::ScopedHandle file( CreateFile(file_path, GENERIC_READ, FILE_SHARE_READ | FILE_SHARE_WRITE | FILE_SHARE_DELETE, NULL, OPEN_EXISTING, FILE_FLAG_SEQUENTIAL_SCAN, NULL)); if (!file.IsValid()) return false; // Default to 1MB sequential reads. const DWORD actual_step_size = std::max(static_cast<DWORD>(step_size), static_cast<DWORD>(1024*1024)); LPVOID buffer = ::VirtualAlloc(NULL, actual_step_size, MEM_COMMIT, PAGE_READWRITE); if (buffer == NULL) return false; DWORD len; size_t total_read = 0; while (::ReadFile(file, buffer, actual_step_size, &len, NULL) && len > 0 && (size_to_read ? total_read < size_to_read : true)) { total_read += static_cast<size_t>(len); } ::VirtualFree(buffer, 0, MEM_RELEASE); } else { // WinXP branch. Here, reading the DLL from disk doesn't do // what we want so instead we pull the pages into memory by loading // the DLL and touching pages at a stride. We use the system's page // size as the stride, ignoring the passed in step_size, to make sure // each page in the range is touched. HMODULE dll_module = ::LoadLibraryExW( file_path, NULL, LOAD_WITH_ALTERED_SEARCH_PATH | DONT_RESOLVE_DLL_REFERENCES); if (!dll_module) return false; base::win::PEImage pe_image(dll_module); CHECK(pe_image.VerifyMagic()); // We don't want to read past the end of the module (which could trigger // an access violation), so make sure to check the image size. PIMAGE_NT_HEADERS nt_headers = pe_image.GetNTHeaders(); size_t dll_module_length = std::min( size_to_read ? size_to_read : ~0, static_cast<size_t>(nt_headers->OptionalHeader.SizeOfImage)); // Page in then release the module. TouchPagesInRange(dll_module, dll_module_length); FreeLibrary(dll_module); } return true; } bool ImagePreReader::PartialPreReadImage(const wchar_t* file_path, size_t percentage, size_t max_chunk_size) { base::ThreadRestrictions::AssertIOAllowed(); if (percentage >= kOneHundredPercent) { // If we're reading the whole image, we don't need to parse headers and // navigate sections, the basic PreReadImage() can be used to just step // blindly through the entire file / address-space. return PreReadImage(file_path, 0, max_chunk_size); } if (base::win::GetVersion() > base::win::VERSION_XP) { // Vista+ branch. On these OSes, we warm up the Image by reading its // file off the disk. return PartialPreReadImageOnDisk(file_path, percentage, max_chunk_size); } // WinXP branch. For XP, reading the image from disk doesn't do what we want // so instead we pull the pages into memory by loading the DLL and touching // initialized pages at a stride. return PartialPreReadImageInMemory(file_path, percentage); }