Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(59)

Unified Diff: content/browser/download/mhtml_generation_browsertest.cc

Issue 1977303003: Adds a feature to MHTML serialization that omits subframes and subresources marked no-store. (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@no-store
Patch Set: Adds a test that compares actual visible content. Created 4 years, 7 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View side-by-side diff with in-line comments
Download patch
Index: content/browser/download/mhtml_generation_browsertest.cc
diff --git a/content/browser/download/mhtml_generation_browsertest.cc b/content/browser/download/mhtml_generation_browsertest.cc
index 00f3aeb1964ce93c82c864ee176517fb083ec02c..acb7de8bf37c550845e34439734121e9e8b60dc4 100644
--- a/content/browser/download/mhtml_generation_browsertest.cc
+++ b/content/browser/download/mhtml_generation_browsertest.cc
@@ -11,6 +11,7 @@
#include "base/files/scoped_temp_dir.h"
#include "base/macros.h"
#include "base/run_loop.h"
+#include "base/strings/utf_string_conversions.h"
#include "content/public/browser/web_contents.h"
#include "content/public/common/mhtml_generation_params.h"
#include "content/public/test/browser_test_utils.h"
@@ -18,10 +19,12 @@
#include "content/public/test/content_browser_test_utils.h"
#include "content/public/test/test_utils.h"
#include "content/shell/browser/shell.h"
+#include "net/base/filename_util.h"
#include "net/dns/mock_host_resolver.h"
#include "net/test/embedded_test_server/embedded_test_server.h"
#include "testing/gmock/include/gmock/gmock.h"
#include "testing/gtest/include/gtest/gtest.h"
+#include "third_party/WebKit/public/web/WebFindOptions.h"
using testing::ContainsRegex;
using testing::HasSubstr;
@@ -29,6 +32,54 @@ using testing::Not;
namespace content {
+namespace {
+
+int global_request_id = 0;
Łukasz Anforowicz 2016/05/19 17:00:13 Can this be made a static member of FindTrackingDe
dewittj 2016/05/19 18:18:35 Done.
+
+// A dummy WebContentsDelegate which tracks whether CloseContents() has been
+// called. It refuses the actual close but keeps track of whether the renderer
+// requested it.
+class FindTrackingDelegate : public WebContentsDelegate {
+ public:
+ FindTrackingDelegate(const std::string& search)
+ : search_(search), matches_(-1) {}
+
+ // Returns number of result.
+ int Wait(WebContents* web_contents) {
+ WebContentsDelegate* old_delegate = web_contents->GetDelegate();
+ web_contents->SetDelegate(this);
+
+ blink::WebFindOptions options;
+ options.matchCase = false;
+
+ web_contents->Find(global_request_id++, base::UTF8ToUTF16(search_),
+ options);
+ run_loop_.Run();
+
+ web_contents->SetDelegate(old_delegate);
+
+ return matches_;
+ }
+
+ void FindReply(WebContents* web_contents,
+ int request_id,
+ int number_of_matches,
+ const gfx::Rect& selection_rect,
+ int active_match_ordinal,
+ bool final_update) override {
+ matches_ = number_of_matches;
+ run_loop_.Quit();
+ }
+
+ private:
+ std::string search_;
+ int matches_;
+ base::RunLoop run_loop_;
+
+ DISALLOW_COPY_AND_ASSIGN(FindTrackingDelegate);
+};
+}
+
class MHTMLGenerationTest : public ContentBrowserTest {
public:
MHTMLGenerationTest() : has_mhtml_callback_run_(false), file_size_(0) {}
@@ -61,10 +112,81 @@ class MHTMLGenerationTest : public ContentBrowserTest {
int64_t ReadFileSizeFromDisk(base::FilePath path) {
int64_t file_size;
- if (!base::GetFileSize(path, &file_size)) return -1;
+ if (!base::GetFileSize(path, &file_size))
+ return -1;
return file_size;
}
+ void TestOriginalVsSavedPage(
+ const GURL& url,
+ const MHTMLGenerationParams params,
+ int expected_number_of_frames,
+ const std::vector<std::string>& expected_substrings,
+ const std::vector<std::string>& forbidden_substrings_in_saved_page,
+ bool skip_verification_of_original_page = false) {
+ // Navigate to the test page and verify if test expectations
+ // are met (this is mostly a sanity check - a failure to meet
+ // expectations would probably mean that there is a test bug
+ // (i.e. that we got called with wrong expected_foo argument).
+ NavigateToURL(shell(), url);
+ DLOG(INFO) << "Verifying test expectations for original page... : "
+ << shell()->web_contents()->GetLastCommittedURL();
+ if (!skip_verification_of_original_page) {
+ AssertExpectationsAboutCurrentTab(expected_number_of_frames,
+ expected_substrings,
+ std::vector<std::string>());
+ }
+
+ GenerateMHTML(params, url);
+ ASSERT_FALSE(HasFailure());
+
+ // Stop the test server (to make sure the locally saved page
+ // is self-contained / won't try to open original resources).
+ ASSERT_TRUE(embedded_test_server()->ShutdownAndWaitUntilComplete());
+
+ // Open the saved page and verify if test expectations are
+ // met (i.e. if the same expectations are met for "after"
+ // [saved version of the page] as for the "before"
+ // [the original version of the page].
+ NavigateToURL(shell(), GURL(net::FilePathToFileURL(params.file_path)));
+ DLOG(INFO) << "Verifying test expectations for saved page... : "
+ << shell()->web_contents()->GetLastCommittedURL();
+ AssertExpectationsAboutCurrentTab(expected_number_of_frames,
+ expected_substrings,
+ forbidden_substrings_in_saved_page);
+ }
+
+ void AssertExpectationsAboutCurrentTab(
+ int expected_number_of_frames,
+ const std::vector<std::string>& expected_substrings,
+ const std::vector<std::string>& forbidden_substrings) {
+ int actual_number_of_frames = 0;
+ shell()->web_contents()->ForEachFrame(
+ base::Bind(&MHTMLGenerationTest::increment, base::Unretained(this),
+ &actual_number_of_frames));
Łukasz Anforowicz 2016/05/19 17:00:13 This rather ugly code was written before web_conte
dewittj 2016/05/19 18:18:35 Done.
+ EXPECT_EQ(expected_number_of_frames, actual_number_of_frames);
+
+ for (const auto& expected_substring : expected_substrings) {
+ FindTrackingDelegate delegate(expected_substring);
+ int actual_number_of_matches = delegate.Wait(shell()->web_contents());
+ EXPECT_EQ(1, actual_number_of_matches)
+ << "Verifying that \"" << expected_substring << "\" appears "
+ << "exactly once in the text of web contents of "
+ << shell()->web_contents()->GetURL().spec();
+ }
+
+ for (const auto& forbidden_substring : forbidden_substrings) {
+ FindTrackingDelegate delegate(forbidden_substring);
+ int actual_number_of_matches = delegate.Wait(shell()->web_contents());
+ EXPECT_EQ(0, actual_number_of_matches)
+ << "Verifying that \"" << forbidden_substring << "\" doesn't "
+ << "appear in the text of web contents of "
+ << shell()->web_contents()->GetURL().spec();
+ }
+ }
+
+ void increment(int* i, RenderFrameHost* /* unused */) { (*i)++; }
+
bool has_mhtml_callback_run() const { return has_mhtml_callback_run_; }
int64_t file_size() const { return file_size_; }
@@ -199,6 +321,101 @@ IN_PROC_BROWSER_TEST_F(MHTMLGenerationTest, GenerateMHTMLObeyNoStoreMainFrame) {
EXPECT_THAT(mhtml, Not(HasSubstr("test body")));
}
+IN_PROC_BROWSER_TEST_F(MHTMLGenerationTest,
+ GenerateMHTMLIgnoreNoStoreSubFrame) {
+ base::FilePath path(temp_dir_.path());
+ path = path.Append(FILE_PATH_LITERAL("test.mht"));
+
+ GURL url(embedded_test_server()->GetURL("/page_with_nostore_iframe.html"));
+
+ // Generate MHTML, specifying the FAIL_FOR_NO_STORE_MAIN_FRAME policy.
+ MHTMLGenerationParams params(path);
+ params.cache_control_policy =
+ content::MHTMLCacheControlPolicy::FAIL_FOR_NO_STORE_MAIN_FRAME;
+
+ GenerateMHTML(params, url);
+ // We expect that there was no error (file size -1 indicates an error.)
+ EXPECT_LT(0, file_size());
+
+ std::string mhtml;
+ ASSERT_TRUE(base::ReadFileToString(path, &mhtml));
+
+ EXPECT_THAT(mhtml, HasSubstr("Main Frame"));
+ // Make sure that no-store subresources exist in this mode.
+ EXPECT_THAT(mhtml, HasSubstr("no-store test body"));
+ EXPECT_THAT(mhtml, ContainsRegex("Content-Location:.*nostore.jpg"));
+}
+
+IN_PROC_BROWSER_TEST_F(MHTMLGenerationTest, GenerateMHTMLObeyNoStoreSubFrame) {
+ base::FilePath path(temp_dir_.path());
+ path = path.Append(FILE_PATH_LITERAL("test.mht"));
+
+ GURL url(embedded_test_server()->GetURL("/page_with_nostore_iframe.html"));
+
+ // Generate MHTML, specifying the FAIL_FOR_NO_STORE_MAIN_FRAME policy.
+ MHTMLGenerationParams params(path);
+ params.cache_control_policy = content::MHTMLCacheControlPolicy::
+ SKIP_ANY_FRAME_OR_RESOURCE_MARKED_NO_STORE;
+
+ GenerateMHTML(params, url);
+ // We expect that there was no error (file size -1 indicates an error.)
+ EXPECT_LT(0, file_size());
+
+ std::string mhtml;
+ ASSERT_TRUE(base::ReadFileToString(path, &mhtml));
+
+ EXPECT_THAT(mhtml, HasSubstr("Main Frame"));
+ // Make sure the contents are missing.
+ EXPECT_THAT(mhtml, Not(HasSubstr("no-store test body")));
+ // This image comes from a resource marked no-store.
+ EXPECT_THAT(mhtml, Not(ContainsRegex("Content-Location:.*nostore.jpg")));
+}
+
+IN_PROC_BROWSER_TEST_F(
+ MHTMLGenerationTest,
+ ViewedMHTMLContainsNoStoreContentIfNoCacheControlPolicy) {
+ // Generate MHTML, specifying the FAIL_FOR_NO_STORE_MAIN_FRAME policy.
+ base::FilePath path(temp_dir_.path());
+ path = path.Append(FILE_PATH_LITERAL("test.mht"));
+ MHTMLGenerationParams params(path);
+
+ // No special cache control options so we should see both frames.
+ std::vector<std::string> expectations{
+ "Main Frame, normal headers.", "Cache-Control: no-store test body",
+ };
+ std::vector<std::string> forbidden;
+ TestOriginalVsSavedPage(
+ embedded_test_server()->GetURL("/page_with_nostore_iframe.html"), params,
+ 2 /* expected number of frames */, expectations, forbidden);
+
+ std::string mhtml;
+ ASSERT_TRUE(base::ReadFileToString(params.file_path, &mhtml));
+}
+
+IN_PROC_BROWSER_TEST_F(MHTMLGenerationTest,
+ ViewedMHTMLDoesNotContainNoStoreContent) {
+ // Generate MHTML, specifying the FAIL_FOR_NO_STORE_MAIN_FRAME policy.
+ base::FilePath path(temp_dir_.path());
+ path = path.Append(FILE_PATH_LITERAL("test.mht"));
+ MHTMLGenerationParams params(path);
+ params.cache_control_policy = content::MHTMLCacheControlPolicy::
+ SKIP_ANY_FRAME_OR_RESOURCE_MARKED_NO_STORE;
+
+ // No special cache control options so we should see both frames.
+ std::vector<std::string> expectations{
+ "Main Frame, normal headers.",
+ };
+ std::vector<std::string> forbidden{
+ "Cache-Control: no-store test body",
+ };
+ TestOriginalVsSavedPage(
+ embedded_test_server()->GetURL("/page_with_nostore_iframe.html"), params,
+ 2 /* expected number of frames */, expectations, forbidden);
+
+ std::string mhtml;
+ ASSERT_TRUE(base::ReadFileToString(params.file_path, &mhtml));
+}
+
// Test suite that allows testing --site-per-process against cross-site frames.
// See http://dev.chromium.org/developers/design-documents/site-isolation.
class MHTMLGenerationSitePerProcessTest : public MHTMLGenerationTest {

Powered by Google App Engine
This is Rietveld 408576698