1 // Copyright (c) 2012 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
5 #include "chrome/app/image_pre_reader_win.h"
12 #include "base/logging.h"
13 #include "base/memory/scoped_ptr.h"
14 #include "base/threading/thread_restrictions.h"
15 #include "base/win/pe_image.h"
16 #include "base/win/scoped_handle.h"
17 #include "base/win/windows_version.h"
21 // The minimum buffer size to allocate when reading the PE file headers.
23 // The PE file headers usually fit into a single 1KB page, and a PE file must
24 // at least contain the initial page with the headers. That said, as long as
25 // we expect at least sizeof(IMAGE_DOS_HEADER) bytes, we're ok.
26 const size_t kMinHeaderBufferSize
= 0x400;
28 // A handy symbolic constant.
29 const size_t kOneHundredPercent
= 100;
31 void StaticAssertions() {
32 COMPILE_ASSERT(kMinHeaderBufferSize
>= sizeof(IMAGE_DOS_HEADER
),
33 min_header_buffer_size_at_least_as_big_as_the_dos_header
);
36 // This struct provides a deallocation functor for use with scoped_ptr<T>
37 // allocated with ::VirtualAlloc().
38 struct ScopedPtrVirtualFree
{
39 void operator() (void* ptr
) {
40 ::VirtualFree(ptr
, 0, MEM_RELEASE
);
44 // A wrapper for the Win32 ::SetFilePointer() function with some error checking.
45 bool SetFilePointer(HANDLE file_handle
, size_t position
) {
46 return position
<= static_cast<size_t>(std::numeric_limits
<LONG
>::max()) &&
47 ::SetFilePointer(file_handle
,
48 static_cast<LONG
>(position
),
50 FILE_BEGIN
) != INVALID_SET_FILE_POINTER
;
53 // A helper function to read the next |bytes_to_read| bytes from the file
54 // given by |file_handle| into |buffer|.
55 bool ReadNextBytes(HANDLE file_handle
, void* buffer
, size_t bytes_to_read
) {
56 DCHECK(file_handle
!= INVALID_HANDLE_VALUE
);
57 DCHECK(buffer
!= NULL
);
58 DCHECK(bytes_to_read
> 0);
61 return bytes_to_read
<= std::numeric_limits
<DWORD
>::max() &&
62 ::ReadFile(file_handle
,
64 static_cast<DWORD
>(bytes_to_read
),
67 bytes_read
== bytes_to_read
;
70 // A helper function to extend the |current_buffer| of bytes such that it
71 // contains |desired_length| bytes read from the file given by |file_handle|.
73 // It is assumed that |file_handle| has been used to sequentially populate
74 // |current_buffer| thus far and is already positioned at the appropriate
76 bool ReadMissingBytes(HANDLE file_handle
,
77 std::vector
<uint8
>* current_buffer
,
78 size_t desired_length
) {
79 DCHECK(file_handle
!= INVALID_HANDLE_VALUE
);
80 DCHECK(current_buffer
!= NULL
);
82 size_t current_length
= current_buffer
->size();
83 if (current_length
>= desired_length
)
86 size_t bytes_to_read
= desired_length
- current_length
;
87 current_buffer
->resize(desired_length
);
88 return ReadNextBytes(file_handle
,
89 &(current_buffer
->at(current_length
)),
93 // Return a |percentage| of the number of initialized bytes in the given
96 // This returns a percentage of the lesser of the size of the raw data in
97 // the section and the virtual size of the section.
99 // Note that sections can have their tails implicitly initialized to zero
100 // (i.e., their virtual size is larger than the raw size) and that raw data
101 // is padded to the PE page size if the entire section is initialized (i.e.,
102 // their raw data size will be larger than the virtual size).
104 // Any data after the initialized portion of the section will be soft-faulted
105 // in (very quickly) as needed, so we don't need to include it in the returned
107 size_t GetPercentageOfSectionLength(const IMAGE_SECTION_HEADER
* section
,
109 DCHECK(section
!= NULL
);
110 DCHECK_GT(percentage
, 0u);
111 DCHECK_LE(percentage
, kOneHundredPercent
);
113 size_t initialized_length
= std::min(section
->SizeOfRawData
,
114 section
->Misc
.VirtualSize
);
116 if (initialized_length
== 0)
119 size_t length
= (initialized_length
* percentage
) / kOneHundredPercent
;
121 return std::max
<size_t>(length
, 1);
124 // Helper function to read through a |percentage| of the given |section|
125 // of the file denoted by |file_handle|. The |temp_buffer| is (re)used as
126 // a transient storage area as the section is read in chunks of
127 // |temp_buffer_size| bytes.
128 bool ReadThroughSection(HANDLE file_handle
,
129 const IMAGE_SECTION_HEADER
* section
,
132 size_t temp_buffer_size
) {
133 DCHECK(file_handle
!= INVALID_HANDLE_VALUE
);
134 DCHECK(section
!= NULL
);
135 DCHECK_LE(percentage
, kOneHundredPercent
);
136 DCHECK(temp_buffer
!= NULL
);
137 DCHECK(temp_buffer_size
> 0);
139 size_t bytes_to_read
= GetPercentageOfSectionLength(section
, percentage
);
140 if (bytes_to_read
== 0)
143 if (!SetFilePointer(file_handle
, section
->PointerToRawData
))
146 // Read all chunks except the last one.
147 while (bytes_to_read
> temp_buffer_size
) {
148 if (!ReadNextBytes(file_handle
, temp_buffer
, temp_buffer_size
))
150 bytes_to_read
-= temp_buffer_size
;
153 // Read the last (possibly partial) chunk and return.
154 DCHECK(bytes_to_read
> 0);
155 DCHECK(bytes_to_read
<= temp_buffer_size
);
156 return ReadNextBytes(file_handle
, temp_buffer
, bytes_to_read
);
159 // A helper function to touch all pages in the range
160 // [base_addr, base_addr + length).
161 void TouchPagesInRange(void* base_addr
, size_t length
) {
162 DCHECK(base_addr
!= NULL
);
165 // Get the system info so we know the page size. Also, make sure we use a
166 // non-zero value for the page size; GetSystemInfo() is hookable/patchable,
167 // and you never know what shenanigans someone could get up to.
168 SYSTEM_INFO system_info
= {};
169 GetSystemInfo(&system_info
);
170 if (system_info
.dwPageSize
== 0)
171 system_info
.dwPageSize
= 4096;
173 // We don't want to read outside the byte range (which could trigger an
174 // access violation), so let's figure out the exact locations of the first
175 // and final bytes we want to read.
176 volatile uint8
* touch_ptr
= reinterpret_cast<uint8
*>(base_addr
);
177 volatile uint8
* final_touch_ptr
= touch_ptr
+ length
- 1;
179 // Read the memory in the range [touch_ptr, final_touch_ptr] with a stride
180 // of the system page size, to ensure that it's been paged in.
182 while (touch_ptr
< final_touch_ptr
) {
184 touch_ptr
+= system_info
.dwPageSize
;
186 dummy
= *final_touch_ptr
;
191 bool ImagePreReader::PartialPreReadImageOnDisk(const wchar_t* file_path
,
193 size_t max_chunk_size
) {
194 // TODO(rogerm): change this to have the number of bytes pre-read per
195 // section be driven by a static table within the PE file (defaulting to
196 // full read if it's not there?) that's initialized by the optimization
198 DCHECK(file_path
!= NULL
);
203 if (percentage
> kOneHundredPercent
)
204 percentage
= kOneHundredPercent
;
206 // Validate/setup max_chunk_size, imposing a 1MB minimum on the chunk size.
207 const size_t kMinChunkSize
= 1024 * 1024;
208 max_chunk_size
= std::max(max_chunk_size
, kMinChunkSize
);
211 base::win::ScopedHandle
file(
212 CreateFile(file_path
,
214 FILE_SHARE_READ
| FILE_SHARE_WRITE
| FILE_SHARE_DELETE
,
217 FILE_FLAG_SEQUENTIAL_SCAN
,
223 // Allocate a resizable buffer for the headers. We initially reserve as much
224 // space as we typically see as the header size for chrome.dll and other
226 std::vector
<uint8
> headers
;
227 headers
.reserve(kMinHeaderBufferSize
);
229 // Read, hopefully, all of the headers.
230 if (!ReadMissingBytes(file
, &headers
, kMinHeaderBufferSize
))
233 // The DOS header starts at offset 0 and allows us to get the offset of the
234 // NT headers. Let's ensure we've read enough to capture the NT headers.
235 size_t nt_headers_start
=
236 reinterpret_cast<IMAGE_DOS_HEADER
*>(&headers
[0])->e_lfanew
;
237 size_t nt_headers_end
= nt_headers_start
+ sizeof(IMAGE_NT_HEADERS
);
238 if (!ReadMissingBytes(file
, &headers
, nt_headers_end
))
241 // Now that we've got the NT headers we can get the total header size,
242 // including all of the section headers. Let's ensure we've read enough
243 // to capture all of the header data.
244 size_t size_of_headers
= reinterpret_cast<IMAGE_NT_HEADERS
*>(
245 &headers
[nt_headers_start
])->OptionalHeader
.SizeOfHeaders
;
246 if (!ReadMissingBytes(file
, &headers
, size_of_headers
))
249 // Now we have all of the headers. This is enough to let us use the PEImage
250 // wrapper to query the structure of the image.
251 base::win::PEImage
pe_image(reinterpret_cast<HMODULE
>(&headers
[0]));
252 CHECK(pe_image
.VerifyMagic());
254 // Allocate a buffer to hold the pre-read bytes.
255 scoped_ptr_malloc
<uint8
, ScopedPtrVirtualFree
> buffer(
256 reinterpret_cast<uint8
*>(
257 ::VirtualAlloc(NULL
, max_chunk_size
, MEM_COMMIT
, PAGE_READWRITE
)));
258 if (buffer
.get() == NULL
)
261 // Iterate over each section, reading in a percentage of each.
262 const IMAGE_SECTION_HEADER
* section
= NULL
;
263 for (UINT i
= 0; (section
= pe_image
.GetSectionHeader(i
)) != NULL
; ++i
) {
264 CHECK_LE(reinterpret_cast<const uint8
*>(section
+ 1),
265 &headers
[0] + headers
.size());
266 if (!ReadThroughSection(
267 file
, section
, percentage
, buffer
.get(), max_chunk_size
))
275 bool ImagePreReader::PartialPreReadImageInMemory(const wchar_t* file_path
,
277 // TODO(rogerm): change this to have the number of bytes pre-read per
278 // section be driven by a static table within the PE file (defaulting to
279 // full read if it's not there?) that's initialized by the optimization
281 DCHECK(file_path
!= NULL
);
286 if (percentage
> kOneHundredPercent
)
287 percentage
= kOneHundredPercent
;
289 HMODULE dll_module
= ::LoadLibraryExW(
292 LOAD_WITH_ALTERED_SEARCH_PATH
| DONT_RESOLVE_DLL_REFERENCES
);
297 base::win::PEImage
pe_image(dll_module
);
298 CHECK(pe_image
.VerifyMagic());
300 // Iterate over each section, stepping through a percentage of each to page
301 // it in off the disk.
302 const IMAGE_SECTION_HEADER
* section
= NULL
;
303 for (UINT i
= 0; (section
= pe_image
.GetSectionHeader(i
)) != NULL
; ++i
) {
304 // Get the extent we want to touch.
305 size_t length
= GetPercentageOfSectionLength(section
, percentage
);
309 static_cast<uint8
*>(pe_image
.RVAToAddr(section
->VirtualAddress
));
311 // Verify that the extent we're going to touch falls inside the section
312 // we expect it to (and by implication, inside the pe_image).
314 pe_image
.GetImageSectionFromAddr(start
));
316 pe_image
.GetImageSectionFromAddr(start
+ length
- 1));
318 // Page in the section range.
319 TouchPagesInRange(start
, length
);
322 FreeLibrary(dll_module
);
327 bool ImagePreReader::PreReadImage(const wchar_t* file_path
,
330 base::ThreadRestrictions::AssertIOAllowed();
331 if (base::win::GetVersion() > base::win::VERSION_XP
) {
332 // Vista+ branch. On these OSes, the forced reads through the DLL actually
333 // slows warm starts. The solution is to sequentially read file contents
334 // with an optional cap on total amount to read.
335 base::win::ScopedHandle
file(
336 CreateFile(file_path
,
338 FILE_SHARE_READ
| FILE_SHARE_WRITE
| FILE_SHARE_DELETE
,
341 FILE_FLAG_SEQUENTIAL_SCAN
,
347 // Default to 1MB sequential reads.
348 const DWORD actual_step_size
= std::max(static_cast<DWORD
>(step_size
),
349 static_cast<DWORD
>(1024*1024));
350 LPVOID buffer
= ::VirtualAlloc(NULL
,
359 size_t total_read
= 0;
360 while (::ReadFile(file
, buffer
, actual_step_size
, &len
, NULL
) &&
362 (size_to_read
? total_read
< size_to_read
: true)) {
363 total_read
+= static_cast<size_t>(len
);
365 ::VirtualFree(buffer
, 0, MEM_RELEASE
);
367 // WinXP branch. Here, reading the DLL from disk doesn't do
368 // what we want so instead we pull the pages into memory by loading
369 // the DLL and touching pages at a stride. We use the system's page
370 // size as the stride, ignoring the passed in step_size, to make sure
371 // each page in the range is touched.
372 HMODULE dll_module
= ::LoadLibraryExW(
375 LOAD_WITH_ALTERED_SEARCH_PATH
| DONT_RESOLVE_DLL_REFERENCES
);
380 base::win::PEImage
pe_image(dll_module
);
381 CHECK(pe_image
.VerifyMagic());
383 // We don't want to read past the end of the module (which could trigger
384 // an access violation), so make sure to check the image size.
385 PIMAGE_NT_HEADERS nt_headers
= pe_image
.GetNTHeaders();
386 size_t dll_module_length
= std::min(
387 size_to_read
? size_to_read
: ~0,
388 static_cast<size_t>(nt_headers
->OptionalHeader
.SizeOfImage
));
390 // Page in then release the module.
391 TouchPagesInRange(dll_module
, dll_module_length
);
392 FreeLibrary(dll_module
);
398 bool ImagePreReader::PartialPreReadImage(const wchar_t* file_path
,
400 size_t max_chunk_size
) {
401 base::ThreadRestrictions::AssertIOAllowed();
403 if (percentage
>= kOneHundredPercent
) {
404 // If we're reading the whole image, we don't need to parse headers and
405 // navigate sections, the basic PreReadImage() can be used to just step
406 // blindly through the entire file / address-space.
407 return PreReadImage(file_path
, 0, max_chunk_size
);
410 if (base::win::GetVersion() > base::win::VERSION_XP
) {
411 // Vista+ branch. On these OSes, we warm up the Image by reading its
412 // file off the disk.
413 return PartialPreReadImageOnDisk(file_path
, percentage
, max_chunk_size
);
416 // WinXP branch. For XP, reading the image from disk doesn't do what we want
417 // so instead we pull the pages into memory by loading the DLL and touching
418 // initialized pages at a stride.
419 return PartialPreReadImageInMemory(file_path
, percentage
);