OLD | NEW |
---|---|
1 // Copyright (c) 2012 The Chromium Authors. All rights reserved. | 1 // Copyright (c) 2012 The Chromium Authors. All rights reserved. |
2 // Use of this source code is governed by a BSD-style license that can be | 2 // Use of this source code is governed by a BSD-style license that can be |
3 // found in the LICENSE file. | 3 // found in the LICENSE file. |
4 | 4 |
5 #include "content/browser/download/mhtml_generation_manager.h" | 5 #include "content/browser/download/mhtml_generation_manager.h" |
6 | 6 |
7 #include <map> | 7 #include <map> |
8 #include <queue> | 8 #include <queue> |
9 #include <utility> | 9 #include <utility> |
10 | 10 |
11 #include "base/bind.h" | 11 #include "base/bind.h" |
12 #include "base/files/file.h" | 12 #include "base/files/file.h" |
13 #include "base/guid.h" | 13 #include "base/guid.h" |
14 #include "base/macros.h" | 14 #include "base/macros.h" |
15 #include "base/memory/ptr_util.h" | 15 #include "base/memory/ptr_util.h" |
16 #include "base/metrics/histogram_macros.h" | 16 #include "base/metrics/histogram_macros.h" |
17 #include "base/scoped_observer.h" | 17 #include "base/scoped_observer.h" |
18 #include "base/stl_util.h" | 18 #include "base/stl_util.h" |
19 #include "base/strings/string_util.h" | 19 #include "base/strings/string_util.h" |
20 #include "base/strings/stringprintf.h" | 20 #include "base/strings/stringprintf.h" |
21 #include "base/time/time.h" | 21 #include "base/time/time.h" |
22 #include "base/trace_event/trace_event.h" | 22 #include "base/trace_event/trace_event.h" |
23 #include "content/browser/bad_message.h" | 23 #include "content/browser/bad_message.h" |
24 #include "content/browser/download/mhtml_extra_parts_impl.h" | |
24 #include "content/browser/frame_host/frame_tree_node.h" | 25 #include "content/browser/frame_host/frame_tree_node.h" |
25 #include "content/browser/frame_host/render_frame_host_impl.h" | 26 #include "content/browser/frame_host/render_frame_host_impl.h" |
26 #include "content/common/frame_messages.h" | 27 #include "content/common/frame_messages.h" |
27 #include "content/public/browser/browser_thread.h" | 28 #include "content/public/browser/browser_thread.h" |
29 #include "content/public/browser/mhtml_extra_parts.h" | |
28 #include "content/public/browser/render_frame_host.h" | 30 #include "content/public/browser/render_frame_host.h" |
29 #include "content/public/browser/render_process_host.h" | 31 #include "content/public/browser/render_process_host.h" |
30 #include "content/public/browser/render_process_host_observer.h" | 32 #include "content/public/browser/render_process_host_observer.h" |
31 #include "content/public/browser/web_contents.h" | 33 #include "content/public/browser/web_contents.h" |
32 #include "content/public/common/mhtml_generation_params.h" | 34 #include "content/public/common/mhtml_generation_params.h" |
33 #include "net/base/mime_util.h" | 35 #include "net/base/mime_util.h" |
34 | 36 |
37 namespace { | |
38 const char kContentLocation[] = "Content-Location: "; | |
39 const char kContentType[] = "Content-Type: "; | |
40 const char kContentTransferEncodingBinary[] = | |
41 "Content-Transfer-Encoding: binary"; | |
42 int kInvalidFileSize = -1; | |
43 } // namespace | |
44 | |
35 namespace content { | 45 namespace content { |
36 | 46 |
37 // The class and all of its members live on the UI thread. Only static methods | 47 // The class and all of its members live on the UI thread. Only static methods |
38 // are executed on other threads. | 48 // are executed on other threads. |
39 class MHTMLGenerationManager::Job : public RenderProcessHostObserver { | 49 class MHTMLGenerationManager::Job : public RenderProcessHostObserver { |
40 public: | 50 public: |
41 Job(int job_id, | 51 Job(int job_id, |
42 WebContents* web_contents, | 52 WebContents* web_contents, |
43 const MHTMLGenerationParams& params, | 53 const MHTMLGenerationParams& params, |
44 const GenerateMHTMLCallback& callback); | 54 const GenerateMHTMLCallback& callback); |
(...skipping 46 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
91 void MarkAsFinished(); | 101 void MarkAsFinished(); |
92 | 102 |
93 void ReportRendererMainThreadTime(base::TimeDelta renderer_main_thread_time); | 103 void ReportRendererMainThreadTime(base::TimeDelta renderer_main_thread_time); |
94 | 104 |
95 private: | 105 private: |
96 // Writes the MHTML footer to the file and closes it. | 106 // Writes the MHTML footer to the file and closes it. |
97 // | 107 // |
98 // Note: The same |boundary| marker must be used for all "boundaries" -- in | 108 // Note: The same |boundary| marker must be used for all "boundaries" -- in |
99 // the header, parts and footer -- that belong to the same MHTML document (see | 109 // the header, parts and footer -- that belong to the same MHTML document (see |
100 // also rfc1341, section 7.2.1, "boundary" description). | 110 // also rfc1341, section 7.2.1, "boundary" description). |
101 static std::tuple<MhtmlSaveStatus, int64_t> CloseFileOnFileThread( | 111 static std::tuple<MhtmlSaveStatus, int64_t> FinalizeAndCloseFileOnFileThread( |
102 MhtmlSaveStatus save_status, | 112 MhtmlSaveStatus save_status, |
103 const std::string& boundary, | 113 const std::string& boundary, |
104 base::File file); | 114 base::File file, |
115 const MHTMLExtraPartsImpl* extra_parts); | |
105 void AddFrame(RenderFrameHost* render_frame_host); | 116 void AddFrame(RenderFrameHost* render_frame_host); |
106 | 117 |
118 // If we have any extra MHTML parts to write out, write them into the file | |
119 // while on the file thread. Returns true for success, or if there is no data | |
120 // to write. | |
121 static bool WriteExtraDataParts(const std::string& boundary, | |
122 base::File& file, | |
123 const MHTMLExtraPartsImpl* extra_parts); | |
124 | |
125 // Writes the footer into the MHTML file. Returns false for failure. | |
126 static bool WriteFooter(const std::string& boundary, base::File& file); | |
127 | |
128 // Closes the MHTML file if it is valid, storing its length in |file_size|. | |
129 // Returns SUCCESS if it was closed, FILE_CLOSING_ERROR if it was invalid. | |
130 static MhtmlSaveStatus CloseFileIfValid(base::File& file, int64_t& file_size); | |
131 | |
107 // Creates a new map with values (content ids) the same as in | 132 // Creates a new map with values (content ids) the same as in |
108 // |frame_tree_node_to_content_id_| map, but with the keys translated from | 133 // |frame_tree_node_to_content_id_| map, but with the keys translated from |
109 // frame_tree_node_id into a |site_instance|-specific routing_id. | 134 // frame_tree_node_id into a |site_instance|-specific routing_id. |
110 std::map<int, std::string> CreateFrameRoutingIdToContentId( | 135 std::map<int, std::string> CreateFrameRoutingIdToContentId( |
111 SiteInstance* site_instance); | 136 SiteInstance* site_instance); |
112 | 137 |
113 // Id used to map renderer responses to jobs. | 138 // Id used to map renderer responses to jobs. |
114 // See also MHTMLGenerationManager::id_to_job_ map. | 139 // See also MHTMLGenerationManager::id_to_job_ map. |
115 const int job_id_; | 140 const int job_id_; |
116 | 141 |
(...skipping 32 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
149 std::string salt_; | 174 std::string salt_; |
150 | 175 |
151 // The callback to call once generation is complete. | 176 // The callback to call once generation is complete. |
152 const GenerateMHTMLCallback callback_; | 177 const GenerateMHTMLCallback callback_; |
153 | 178 |
154 // Whether the job is finished (set to true only for the short duration of | 179 // Whether the job is finished (set to true only for the short duration of |
155 // time between MHTMLGenerationManager::JobFinished is called and the job is | 180 // time between MHTMLGenerationManager::JobFinished is called and the job is |
156 // destroyed by MHTMLGenerationManager::OnFileClosed). | 181 // destroyed by MHTMLGenerationManager::OnFileClosed). |
157 bool is_finished_; | 182 bool is_finished_; |
158 | 183 |
184 // Any extra data parts that should be emitted into the output MHTML. | |
185 MHTMLExtraPartsImpl* extra_parts_; | |
186 | |
159 // RAII helper for registering this Job as a RenderProcessHost observer. | 187 // RAII helper for registering this Job as a RenderProcessHost observer. |
160 ScopedObserver<RenderProcessHost, MHTMLGenerationManager::Job> | 188 ScopedObserver<RenderProcessHost, MHTMLGenerationManager::Job> |
161 observed_renderer_process_host_; | 189 observed_renderer_process_host_; |
162 | 190 |
163 DISALLOW_COPY_AND_ASSIGN(Job); | 191 DISALLOW_COPY_AND_ASSIGN(Job); |
164 }; | 192 }; |
165 | 193 |
166 MHTMLGenerationManager::Job::Job(int job_id, | 194 MHTMLGenerationManager::Job::Job(int job_id, |
167 WebContents* web_contents, | 195 WebContents* web_contents, |
168 const MHTMLGenerationParams& params, | 196 const MHTMLGenerationParams& params, |
169 const GenerateMHTMLCallback& callback) | 197 const GenerateMHTMLCallback& callback) |
170 : job_id_(job_id), | 198 : job_id_(job_id), |
171 creation_time_(base::TimeTicks::Now()), | 199 creation_time_(base::TimeTicks::Now()), |
172 params_(params), | 200 params_(params), |
173 frame_tree_node_id_of_busy_frame_(FrameTreeNode::kFrameTreeNodeInvalidId), | 201 frame_tree_node_id_of_busy_frame_(FrameTreeNode::kFrameTreeNodeInvalidId), |
174 mhtml_boundary_marker_(net::GenerateMimeMultipartBoundary()), | 202 mhtml_boundary_marker_(net::GenerateMimeMultipartBoundary()), |
175 salt_(base::GenerateGUID()), | 203 salt_(base::GenerateGUID()), |
176 callback_(callback), | 204 callback_(callback), |
177 is_finished_(false), | 205 is_finished_(false), |
178 observed_renderer_process_host_(this) { | 206 observed_renderer_process_host_(this) { |
179 DCHECK_CURRENTLY_ON(BrowserThread::UI); | 207 DCHECK_CURRENTLY_ON(BrowserThread::UI); |
180 web_contents->ForEachFrame(base::Bind( | 208 web_contents->ForEachFrame(base::Bind( |
181 &MHTMLGenerationManager::Job::AddFrame, | 209 &MHTMLGenerationManager::Job::AddFrame, |
182 base::Unretained(this))); // Safe because ForEachFrame is synchronous. | 210 base::Unretained(this))); // Safe because ForEachFrame is synchronous. |
183 | 211 |
184 // Main frame needs to be processed first. | 212 // Main frame needs to be processed first. |
185 DCHECK(!pending_frame_tree_node_ids_.empty()); | 213 DCHECK(!pending_frame_tree_node_ids_.empty()); |
186 DCHECK(FrameTreeNode::GloballyFindByID(pending_frame_tree_node_ids_.front()) | 214 DCHECK(FrameTreeNode::GloballyFindByID(pending_frame_tree_node_ids_.front()) |
187 ->parent() == nullptr); | 215 ->parent() == nullptr); |
216 | |
217 // Save off any extra data. | |
218 extra_parts_ = static_cast<MHTMLExtraPartsImpl*>( | |
219 MHTMLExtraParts::FromWebContents(web_contents)); | |
188 } | 220 } |
189 | 221 |
190 MHTMLGenerationManager::Job::~Job() { | 222 MHTMLGenerationManager::Job::~Job() { |
191 DCHECK_CURRENTLY_ON(BrowserThread::UI); | 223 DCHECK_CURRENTLY_ON(BrowserThread::UI); |
192 } | 224 } |
193 | 225 |
194 std::map<int, std::string> | 226 std::map<int, std::string> |
195 MHTMLGenerationManager::Job::CreateFrameRoutingIdToContentId( | 227 MHTMLGenerationManager::Job::CreateFrameRoutingIdToContentId( |
196 SiteInstance* site_instance) { | 228 SiteInstance* site_instance) { |
197 std::map<int, std::string> result; | 229 std::map<int, std::string> result; |
(...skipping 147 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
345 if (save_status == MhtmlSaveStatus::SUCCESS) | 377 if (save_status == MhtmlSaveStatus::SUCCESS) |
346 save_status = MhtmlSaveStatus::FILE_WRITTING_ERROR; | 378 save_status = MhtmlSaveStatus::FILE_WRITTING_ERROR; |
347 callback.Run(std::make_tuple(save_status, -1)); | 379 callback.Run(std::make_tuple(save_status, -1)); |
348 return; | 380 return; |
349 } | 381 } |
350 | 382 |
351 // If no previous error occurred the boundary should be sent. | 383 // If no previous error occurred the boundary should be sent. |
352 BrowserThread::PostTaskAndReplyWithResult( | 384 BrowserThread::PostTaskAndReplyWithResult( |
353 BrowserThread::FILE, FROM_HERE, | 385 BrowserThread::FILE, FROM_HERE, |
354 base::Bind( | 386 base::Bind( |
355 &MHTMLGenerationManager::Job::CloseFileOnFileThread, save_status, | 387 &MHTMLGenerationManager::Job::FinalizeAndCloseFileOnFileThread, |
388 save_status, | |
356 (save_status == MhtmlSaveStatus::SUCCESS ? mhtml_boundary_marker_ | 389 (save_status == MhtmlSaveStatus::SUCCESS ? mhtml_boundary_marker_ |
357 : std::string()), | 390 : std::string()), |
358 base::Passed(&browser_file_)), | 391 base::Passed(&browser_file_), extra_parts_), |
359 callback); | 392 callback); |
360 } | 393 } |
361 | 394 |
362 bool MHTMLGenerationManager::Job::IsMessageFromFrameExpected( | 395 bool MHTMLGenerationManager::Job::IsMessageFromFrameExpected( |
363 RenderFrameHostImpl* sender) { | 396 RenderFrameHostImpl* sender) { |
364 int sender_id = sender->frame_tree_node()->frame_tree_node_id(); | 397 int sender_id = sender->frame_tree_node()->frame_tree_node_id(); |
365 if (sender_id != frame_tree_node_id_of_busy_frame_) | 398 if (sender_id != frame_tree_node_id_of_busy_frame_) |
366 return false; | 399 return false; |
367 | 400 |
368 // We only expect one message per frame - let's make sure subsequent messages | 401 // We only expect one message per frame - let's make sure subsequent messages |
(...skipping 25 matching lines...) Expand all Loading... | |
394 | 427 |
395 // Report success if all frames have been processed. | 428 // Report success if all frames have been processed. |
396 if (pending_frame_tree_node_ids_.empty()) | 429 if (pending_frame_tree_node_ids_.empty()) |
397 return MhtmlSaveStatus::SUCCESS; | 430 return MhtmlSaveStatus::SUCCESS; |
398 | 431 |
399 return SendToNextRenderFrame(); | 432 return SendToNextRenderFrame(); |
400 } | 433 } |
401 | 434 |
402 // static | 435 // static |
403 std::tuple<MhtmlSaveStatus, int64_t> | 436 std::tuple<MhtmlSaveStatus, int64_t> |
404 MHTMLGenerationManager::Job::CloseFileOnFileThread(MhtmlSaveStatus save_status, | 437 MHTMLGenerationManager::Job::FinalizeAndCloseFileOnFileThread( |
405 const std::string& boundary, | 438 MhtmlSaveStatus save_status, |
406 base::File file) { | 439 const std::string& boundary, |
440 base::File file, | |
441 const MHTMLExtraPartsImpl* extra_parts) { | |
407 DCHECK_CURRENTLY_ON(BrowserThread::FILE); | 442 DCHECK_CURRENTLY_ON(BrowserThread::FILE); |
408 | 443 |
409 // If no previous error occurred the boundary should have been provided. | 444 // If no previous error occurred the boundary should have been provided. |
410 if (save_status == MhtmlSaveStatus::SUCCESS) { | 445 if (save_status == MhtmlSaveStatus::SUCCESS) { |
411 TRACE_EVENT0("page-serialization", | 446 TRACE_EVENT0("page-serialization", |
412 "MHTMLGenerationManager::Job MHTML footer writing"); | 447 "MHTMLGenerationManager::Job MHTML footer writing"); |
413 DCHECK(!boundary.empty()); | 448 DCHECK(!boundary.empty()); |
414 std::string footer = base::StringPrintf("--%s--\r\n", boundary.c_str()); | 449 |
415 DCHECK(base::IsStringASCII(footer)); | 450 // Write the extra data into a part of its own, if we have any. |
416 if (file.WriteAtCurrentPos(footer.data(), footer.size()) < 0) | 451 if (!WriteExtraDataParts(boundary, file, extra_parts)) { |
417 save_status = MhtmlSaveStatus::FILE_WRITTING_ERROR; | 452 save_status = MhtmlSaveStatus::FILE_WRITTING_ERROR; |
453 return std::make_tuple(save_status, kInvalidFileSize); | |
454 } | |
455 | |
456 // Write out the footer at the bottom of the file. | |
457 if (!WriteFooter(boundary, file)) { | |
458 save_status = MhtmlSaveStatus::FILE_WRITTING_ERROR; | |
459 return std::make_tuple(save_status, kInvalidFileSize); | |
460 } | |
418 } | 461 } |
419 | 462 |
420 // If the file is still valid try to close it. Only update the status if that | 463 // If the file is still valid try to close it. Only update the status if that |
421 // won't hide an earlier error. | 464 // won't hide an earlier error. |
422 int64_t file_size = -1; | 465 int64_t file_size = kInvalidFileSize; |
423 if (file.IsValid()) { | 466 MhtmlSaveStatus close_save_status = CloseFileIfValid(file, file_size); |
424 file_size = file.GetLength(); | 467 if (save_status == MhtmlSaveStatus::SUCCESS && |
425 file.Close(); | 468 close_save_status == MhtmlSaveStatus::FILE_WRITTING_ERROR) { |
426 } else if (save_status == MhtmlSaveStatus::SUCCESS) { | 469 save_status = close_save_status; |
427 save_status = MhtmlSaveStatus::FILE_CLOSING_ERROR; | |
428 } | 470 } |
429 | 471 |
430 return std::make_tuple(save_status, file_size); | 472 return std::make_tuple(save_status, file_size); |
431 } | 473 } |
432 | 474 |
475 // static | |
476 bool MHTMLGenerationManager::Job::WriteExtraDataParts( | |
477 const std::string& boundary, | |
478 base::File& file, | |
479 const MHTMLExtraPartsImpl* extra_parts) { | |
480 DCHECK_CURRENTLY_ON(BrowserThread::FILE); | |
481 // Don't write an extra data part if there is none. | |
482 if (extra_parts == nullptr) | |
483 return true; | |
484 | |
485 const std::vector<MHTMLExtraDataPart>& extra_data_parts(extra_parts->parts()); | |
486 if (extra_data_parts.empty()) | |
487 return true; | |
488 | |
489 std::string serialized_extra_data_parts; | |
490 | |
491 // For each extra part, serialize that part and add to our accumulator | |
492 // string. | |
493 for (auto part : extra_data_parts) { | |
494 // Write a boundary (with no preceding newline), a newline, then the content | |
495 // location, another newline, the content type, another newline, the | |
496 // content-transfer-encoding, another newline, the extra data string, and | |
497 // end with a newline. | |
498 std::string serialized_extra_data_part = base::StringPrintf( | |
499 "--%s\r\n%s%s\r\n%s%s\r\n%s\r\n%s\r\n", boundary.c_str(), | |
500 kContentLocation, part.content_location.c_str(), kContentType, | |
501 part.content_type.c_str(), kContentTransferEncodingBinary, | |
Pete Williamson
2017/04/01 01:02:58
Thinking about this just a bit more, I think I'll
| |
502 part.body.c_str()); | |
503 DCHECK(base::IsStringASCII(serialized_extra_data_part)); | |
504 | |
505 serialized_extra_data_parts += serialized_extra_data_part; | |
506 } | |
507 | |
508 // Write the string into the file. Returns false if we failed the write. | |
509 return (file.WriteAtCurrentPos(serialized_extra_data_parts.data(), | |
510 serialized_extra_data_parts.size()) >= 0); | |
511 } | |
512 | |
513 // static | |
514 bool MHTMLGenerationManager::Job::WriteFooter(const std::string& boundary, | |
515 base::File& file) { | |
516 DCHECK_CURRENTLY_ON(BrowserThread::FILE); | |
517 std::string footer = base::StringPrintf("--%s--\r\n", boundary.c_str()); | |
518 DCHECK(base::IsStringASCII(footer)); | |
519 return (file.WriteAtCurrentPos(footer.data(), footer.size()) >= 0); | |
520 } | |
521 | |
522 // static | |
523 MhtmlSaveStatus MHTMLGenerationManager::Job::CloseFileIfValid( | |
524 base::File& file, | |
525 int64_t& file_size) { | |
526 DCHECK_CURRENTLY_ON(BrowserThread::FILE); | |
527 if (file.IsValid()) { | |
528 file_size = file.GetLength(); | |
529 file.Close(); | |
530 return MhtmlSaveStatus::SUCCESS; | |
531 } | |
532 | |
533 return MhtmlSaveStatus::FILE_CLOSING_ERROR; | |
534 } | |
535 | |
433 MHTMLGenerationManager* MHTMLGenerationManager::GetInstance() { | 536 MHTMLGenerationManager* MHTMLGenerationManager::GetInstance() { |
434 return base::Singleton<MHTMLGenerationManager>::get(); | 537 return base::Singleton<MHTMLGenerationManager>::get(); |
435 } | 538 } |
436 | 539 |
437 MHTMLGenerationManager::MHTMLGenerationManager() : next_job_id_(0) {} | 540 MHTMLGenerationManager::MHTMLGenerationManager() : next_job_id_(0) {} |
438 | 541 |
439 MHTMLGenerationManager::~MHTMLGenerationManager() { | 542 MHTMLGenerationManager::~MHTMLGenerationManager() { |
440 } | 543 } |
441 | 544 |
442 void MHTMLGenerationManager::SaveMHTML(WebContents* web_contents, | 545 void MHTMLGenerationManager::SaveMHTML(WebContents* web_contents, |
(...skipping 149 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
592 return iter->second.get(); | 695 return iter->second.get(); |
593 } | 696 } |
594 | 697 |
595 void MHTMLGenerationManager::RenderProcessExited(Job* job) { | 698 void MHTMLGenerationManager::RenderProcessExited(Job* job) { |
596 DCHECK_CURRENTLY_ON(BrowserThread::UI); | 699 DCHECK_CURRENTLY_ON(BrowserThread::UI); |
597 DCHECK(job); | 700 DCHECK(job); |
598 JobFinished(job, MhtmlSaveStatus::RENDER_PROCESS_EXITED); | 701 JobFinished(job, MhtmlSaveStatus::RENDER_PROCESS_EXITED); |
599 } | 702 } |
600 | 703 |
601 } // namespace content | 704 } // namespace content |
OLD | NEW |