content/renderer/dom_serializer_browsertest.cc - Issue 14304004: Convert a bunch of test_shell_tests to content_browsertests. These are tests that depend on loading…

Unified Diff: content/renderer/dom_serializer_browsertest.cc

Issue 14304004: Convert a bunch of test_shell_tests to content_browsertests. These are tests that depend on loading… (Closed) Base URL: svn://chrome-svn/chrome/trunk/src/

Patch Set: sync Created 7 years, 8 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

Index: content/renderer/dom_serializer_browsertest.cc

===================================================================

--- content/renderer/dom_serializer_browsertest.cc (revision 195324)

+++ content/renderer/dom_serializer_browsertest.cc (working copy)

@@ -2,12 +2,21 @@

// Use of this source code is governed by a BSD-style license that can be

// found in the LICENSE file.

+#include "base/bind.h"

+#include "base/command_line.h"

#include "base/compiler_specific.h"

#include "base/file_util.h"

#include "base/files/file_path.h"

#include "base/hash_tables.h"

#include "base/string_util.h"

#include "base/utf_string_conversions.h"

+#include "content/public/common/content_switches.h"

+#include "content/public/renderer/render_view.h"

+#include "content/public/renderer/render_view_observer.h"

+#include "content/public/test/test_utils.h"

+#include "content/shell/shell.h"

+#include "content/test/content_browser_test.h"

+#include "content/test/content_browser_test_utils.h"

#include "net/base/net_util.h"

#include "net/url_request/url_request_context.h"

#include "third_party/WebKit/Source/Platform/chromium/public/WebCString.h"

@@ -26,8 +35,6 @@

#include "third_party/WebKit/Source/WebKit/chromium/public/WebView.h"

#include "webkit/base/file_path_string_conversions.h"

#include "webkit/glue/dom_operations.h"

-#include "webkit/tools/test_shell/simple_resource_loader_bridge.h"

-#include "webkit/tools/test_shell/test_shell_test.h"

using WebKit::WebCString;

using WebKit::WebData;

@@ -45,7 +52,7 @@

using WebKit::WebView;

using WebKit::WebVector;

-namespace {

+namespace content {

// Iterate recursively over sub-frames to find one with with a given url.

WebFrame* FindSubFrameByURL(WebView* web_view, const GURL& url) {

@@ -77,12 +84,93 @@

return NULL;

}

-class DomSerializerTests : public TestShellTest,

+// Helper function that test whether the first node in the doc is a doc type

+// node.

+bool HasDocType(const WebDocument& doc) {

+ WebNode node = doc.firstChild();

+ if (node.isNull())

+ return false;

+ return node.nodeType() == WebNode::DocumentTypeNode;

+ // Helper function for checking whether input node is META tag. Return true

+// means it is META element, otherwise return false. The parameter charset_info

+// return actual charset info if the META tag has charset declaration.

+bool IsMetaElement(const WebNode& node, std::string& charset_info) {

+ if (!node.isElementNode())

+ return false;

+ const WebElement meta = node.toConst<WebElement>();

+ if (!meta.hasTagName("meta"))

+ return false;

+ charset_info.erase(0, charset_info.length());

+ // Check the META charset declaration.

+ WebString httpEquiv = meta.getAttribute("http-equiv");

+ if (LowerCaseEqualsASCII(httpEquiv, "content-type")) {

+ std::string content = meta.getAttribute("content").utf8();

+ int pos = content.find("charset", 0);

+ if (pos > -1) {

+ // Add a dummy charset declaration to charset_info, which indicates this

+ // META tag has charset declaration although we do not get correct value

+ // yet.

+ charset_info.append("has-charset-declaration");

+ int remaining_length = content.length() - pos - 7;

+ if (!remaining_length)

+ return true;

+ int start_pos = pos + 7;

+ // Find "=" symbol.

+ while (remaining_length--)

+ if (content[start_pos++] == L'=')

+ break;

+ // Skip beginning space.

+ while (remaining_length) {

+ if (content[start_pos] > 0x0020)

+ break;

+ ++start_pos;

+ --remaining_length;

+ }

+ if (!remaining_length)

+ return true;

+ int end_pos = start_pos;

+ // Now we find out the start point of charset info. Search the end point.

+ while (remaining_length--) {

+ if (content[end_pos] <= 0x0020 || content[end_pos] == L';')

+ break;

+ ++end_pos;

+ }

+ // Get actual charset info.

+ charset_info = content.substr(start_pos, end_pos - start_pos);

+ return true;

+ }

+ return true;

+class LoadObserver : public RenderViewObserver {

+ public:

+ LoadObserver(RenderView* render_view, const base::Closure& quit_closure)

+ : RenderViewObserver(render_view),

+ quit_closure_(quit_closure) {}

+ virtual void DidFinishLoad(WebKit::WebFrame* frame) {

+ if (frame == render_view()->GetWebView()->mainFrame())

+ quit_closure_.Run();

+ }

+ private:

+ base::Closure quit_closure_;

+};

+class DomSerializerTests : public ContentBrowserTest,

public WebPageSerializerClient {

public:

DomSerializerTests()

- : local_directory_name_(FILE_PATH_LITERAL("./dummy_files/")) { }

+ : serialized_(false),

+ local_directory_name_(FILE_PATH_LITERAL("./dummy_files/")) {}

+ virtual void SetUpCommandLine(CommandLine* command_line) {

+ command_line->AppendSwitch(switches::kSingleProcess);

+ }

// DomSerializerDelegate.

virtual void didSerializeDataForFrame(const WebURL& frame_web_url,

const WebCString& data,

@@ -129,38 +217,45 @@

return serialized_frame_map_[frame_url.spec()];

}

- // Load web page according to specific URL.

- void LoadPageFromURL(const GURL& page_url) {

- // Load the test file.

- test_shell_->ResetTestController();

- test_shell_->LoadURL(page_url);

- test_shell_->WaitTestFinished();

+ RenderView* GetRenderView() {

+ // We could have the test on the UI thread get the WebContent's routing ID,

+ // but we know this will be the first RV so skip that and just hardcode it.

+ return RenderView::FromRoutingID(1);

}

+ WebView* GetWebView() {

+ return GetRenderView()->GetWebView();

+ }

+ WebFrame* GetMainFrame() {

+ return GetWebView()->mainFrame();

+ }

// Load web page according to input content and relative URLs within

// the document.

void LoadContents(const std::string& contents,

const GURL& base_url,

const WebString encoding_info) {

- test_shell_->ResetTestController();

+ scoped_refptr<MessageLoopRunner> runner = new MessageLoopRunner;

+ LoadObserver observer(GetRenderView(), runner->QuitClosure());

// If input encoding is empty, use UTF-8 as default encoding.

if (encoding_info.isEmpty()) {

- test_shell_->webView()->mainFrame()->loadHTMLString(contents, base_url);

+ GetMainFrame()->loadHTMLString(contents, base_url);

} else {

WebData data(contents.data(), contents.length());

// Do not use WebFrame.LoadHTMLString because it assumes that input

// html contents use UTF-8 encoding.

// TODO(darin): This should use WebFrame::loadData.

- WebFrame* web_frame =

- test_shell_->webView()->mainFrame();

+ WebFrame* web_frame = GetMainFrame();

ASSERT_TRUE(web_frame != NULL);

web_frame->loadData(data, "text/html", encoding_info, base_url);

}

- test_shell_->WaitTestFinished();

+ runner->Run();

}

// Serialize page DOM according to specific page URL. The parameter

@@ -169,8 +264,7 @@

void SerializeDomForURL(const GURL& page_url,

bool recursive_serialization) {

// Find corresponding WebFrame according to page_url.

- WebFrame* web_frame = FindSubFrameByURL(test_shell_->webView(),

- page_url);

+ WebFrame* web_frame = FindSubFrameByURL(GetWebView(), page_url);

ASSERT_TRUE(web_frame != NULL);

// Add input file URl to links_.

links_.assign(&page_url,1);

@@ -189,6 +283,475 @@

ASSERT_TRUE(serialized_);

}

+ void SerializeHTMLDOMWithDocTypeOnRenderer(const GURL& file_url) {

+ // Make sure original contents have document type.

+ WebFrame* web_frame = FindSubFrameByURL(GetWebView(), file_url);

+ ASSERT_TRUE(web_frame != NULL);

+ WebDocument doc = web_frame->document();

+ ASSERT_TRUE(HasDocType(doc));

+ // Do serialization.

+ SerializeDomForURL(file_url, false);

+ // Load the serialized contents.

+ ASSERT_TRUE(HasSerializedFrame(file_url));

+ const std::string& serialized_contents =

+ GetSerializedContentForFrame(file_url);

+ LoadContents(serialized_contents, file_url,

+ web_frame->document().encoding());

+ // Make sure serialized contents still have document type.

+ web_frame = GetMainFrame();

+ doc = web_frame->document();

+ ASSERT_TRUE(HasDocType(doc));

+ }

+ void SerializeHTMLDOMWithoutDocTypeOnRenderer(const GURL& file_url) {

+ // Make sure original contents do not have document type.

+ WebFrame* web_frame = FindSubFrameByURL(GetWebView(), file_url);

+ ASSERT_TRUE(web_frame != NULL);

+ WebDocument doc = web_frame->document();

+ ASSERT_TRUE(!HasDocType(doc));

+ // Do serialization.

+ SerializeDomForURL(file_url, false);

+ // Load the serialized contents.

+ ASSERT_TRUE(HasSerializedFrame(file_url));

+ const std::string& serialized_contents =

+ GetSerializedContentForFrame(file_url);

+ LoadContents(serialized_contents, file_url,

+ web_frame->document().encoding());

+ // Make sure serialized contents do not have document type.

+ web_frame = GetMainFrame();

+ doc = web_frame->document();

+ ASSERT_TRUE(!HasDocType(doc));

+ }

+ void SerializeXMLDocWithBuiltInEntitiesOnRenderer(

+ const GURL& xml_file_url, const std::string& original_contents) {

+ // Do serialization.

+ SerializeDomForURL(xml_file_url, false);

+ // Compare the serialized contents with original contents.

+ ASSERT_TRUE(HasSerializedFrame(xml_file_url));

+ const std::string& serialized_contents =

+ GetSerializedContentForFrame(xml_file_url);

+ ASSERT_EQ(original_contents, serialized_contents);

+ }

+ void SerializeHTMLDOMWithAddingMOTWOnRenderer(

+ const GURL& file_url, const std::string& motw_declaration) {

+ // Do serialization.

+ SerializeDomForURL(file_url, false);

+ // Make sure the serialized contents have MOTW ;

+ ASSERT_TRUE(HasSerializedFrame(file_url));

+ const std::string& serialized_contents =

+ GetSerializedContentForFrame(file_url);

+ ASSERT_FALSE(std::string::npos ==

+ serialized_contents.find(motw_declaration));

+ }

+ void SerializeHTMLDOMWithNoMetaCharsetInOriginalDocOnRenderer(

+ const GURL& file_url) {

+ // Make sure there is no META charset declaration in original document.

+ WebFrame* web_frame = FindSubFrameByURL(GetWebView(), file_url);

+ ASSERT_TRUE(web_frame != NULL);

+ WebDocument doc = web_frame->document();

+ ASSERT_TRUE(doc.isHTMLDocument());

+ WebElement head_element = doc.head();

+ ASSERT_TRUE(!head_element.isNull());

+ // Go through all children of HEAD element.

+ for (WebNode child = head_element.firstChild(); !child.isNull();

+ child = child.nextSibling()) {

+ std::string charset_info;

+ if (IsMetaElement(child, charset_info))

+ ASSERT_TRUE(charset_info.empty());

+ }

+ // Do serialization.

+ SerializeDomForURL(file_url, false);

+ // Load the serialized contents.

+ ASSERT_TRUE(HasSerializedFrame(file_url));

+ const std::string& serialized_contents =

+ GetSerializedContentForFrame(file_url);

+ LoadContents(serialized_contents, file_url,

+ web_frame->document().encoding());

+ // Make sure the first child of HEAD element is META which has charset

+ // declaration in serialized contents.

+ web_frame = GetMainFrame();

+ ASSERT_TRUE(web_frame != NULL);

+ doc = web_frame->document();

+ ASSERT_TRUE(doc.isHTMLDocument());

+ head_element = doc.head();

+ ASSERT_TRUE(!head_element.isNull());

+ WebNode meta_node = head_element.firstChild();

+ ASSERT_TRUE(!meta_node.isNull());

+ // Get meta charset info.

+ std::string charset_info2;

+ ASSERT_TRUE(IsMetaElement(meta_node, charset_info2));

+ ASSERT_TRUE(!charset_info2.empty());

+ ASSERT_EQ(charset_info2,

+ std::string(web_frame->document().encoding().utf8()));

+ // Make sure no more additional META tags which have charset declaration.

+ for (WebNode child = meta_node.nextSibling(); !child.isNull();

+ child = child.nextSibling()) {

+ std::string charset_info;

+ if (IsMetaElement(child, charset_info))

+ ASSERT_TRUE(charset_info.empty());

+ }

+ void SerializeHTMLDOMWithMultipleMetaCharsetInOriginalDocOnRenderer(

+ const GURL& file_url) {

+ // Make sure there are multiple META charset declarations in original

+ // document.

+ WebFrame* web_frame = FindSubFrameByURL(GetWebView(), file_url);

+ ASSERT_TRUE(web_frame != NULL);

+ WebDocument doc = web_frame->document();

+ ASSERT_TRUE(doc.isHTMLDocument());

+ WebElement head_ele = doc.head();

+ ASSERT_TRUE(!head_ele.isNull());

+ // Go through all children of HEAD element.

+ int charset_declaration_count = 0;

+ for (WebNode child = head_ele.firstChild(); !child.isNull();

+ child = child.nextSibling()) {

+ std::string charset_info;

+ if (IsMetaElement(child, charset_info) && !charset_info.empty())

+ charset_declaration_count++;

+ }

+ // The original doc has more than META tags which have charset declaration.

+ ASSERT_TRUE(charset_declaration_count > 1);

+ // Do serialization.

+ SerializeDomForURL(file_url, false);

+ // Load the serialized contents.

+ ASSERT_TRUE(HasSerializedFrame(file_url));

+ const std::string& serialized_contents =

+ GetSerializedContentForFrame(file_url);

+ LoadContents(serialized_contents, file_url,

+ web_frame->document().encoding());

+ // Make sure only first child of HEAD element is META which has charset

+ // declaration in serialized contents.

+ web_frame = GetMainFrame();

+ ASSERT_TRUE(web_frame != NULL);

+ doc = web_frame->document();

+ ASSERT_TRUE(doc.isHTMLDocument());

+ head_ele = doc.head();

+ ASSERT_TRUE(!head_ele.isNull());

+ WebNode meta_node = head_ele.firstChild();

+ ASSERT_TRUE(!meta_node.isNull());

+ // Get meta charset info.

+ std::string charset_info2;

+ ASSERT_TRUE(IsMetaElement(meta_node, charset_info2));

+ ASSERT_TRUE(!charset_info2.empty());

+ ASSERT_EQ(charset_info2,

+ std::string(web_frame->document().encoding().utf8()));

+ // Make sure no more additional META tags which have charset declaration.

+ for (WebNode child = meta_node.nextSibling(); !child.isNull();

+ child = child.nextSibling()) {

+ std::string charset_info;

+ if (IsMetaElement(child, charset_info))

+ ASSERT_TRUE(charset_info.empty());

+ }

+ void SerializeHTMLDOMWithEntitiesInTextOnRenderer() {

+ base::FilePath page_file_path = GetTestFilePath(

+ "dom_serializer", "dom_serializer/htmlentities_in_text.htm");

+ // Get file URL. The URL is dummy URL to identify the following loading

+ // actions. The test content is in constant:original_contents.

+ GURL file_url = net::FilePathToFileURL(page_file_path);

+ ASSERT_TRUE(file_url.SchemeIsFile());

+ // Test contents.

+ static const char* const original_contents =

+ "<html><body>&<>\"\'</body></html>";

+ // Load the test contents.

+ LoadContents(original_contents, file_url, WebString());

+ // Get BODY's text content in DOM.

+ WebFrame* web_frame = FindSubFrameByURL(GetWebView(), file_url);

+ ASSERT_TRUE(web_frame != NULL);

+ WebDocument doc = web_frame->document();

+ ASSERT_TRUE(doc.isHTMLDocument());

+ WebElement body_ele = doc.body();

+ ASSERT_TRUE(!body_ele.isNull());

+ WebNode text_node = body_ele.firstChild();

+ ASSERT_TRUE(text_node.isTextNode());

+ ASSERT_TRUE(std::string(text_node.createMarkup().utf8()) ==

+ "&<>\"\'");

+ // Do serialization.

+ SerializeDomForURL(file_url, false);

+ // Compare the serialized contents with original contents.

+ ASSERT_TRUE(HasSerializedFrame(file_url));

+ const std::string& serialized_contents =

+ GetSerializedContentForFrame(file_url);

+ // Compare the serialized contents with original contents to make sure

+ // they are same.

+ // Because we add MOTW when serializing DOM, so before comparison, we also

+ // need to add MOTW to original_contents.

+ std::string original_str =

+ WebPageSerializer::generateMarkOfTheWebDeclaration(file_url).utf8();

+ original_str += original_contents;

+ // Since WebCore now inserts a new HEAD element if there is no HEAD element

+ // when creating BODY element. (Please see

+ // HTMLParser::bodyCreateErrorCheck.) We need to append the HEAD content and

+ // corresponding META content if we find WebCore-generated HEAD element.

+ if (!doc.head().isNull()) {

+ WebString encoding = web_frame->document().encoding();

+ std::string htmlTag("<html>");

+ std::string::size_type pos = original_str.find(htmlTag);

+ ASSERT_NE(std::string::npos, pos);

+ pos += htmlTag.length();

+ std::string head_part("<head>");

+ head_part +=

+ WebPageSerializer::generateMetaCharsetDeclaration(encoding).utf8();

+ head_part += "</head>";

+ original_str.insert(pos, head_part);

+ }

+ ASSERT_EQ(original_str, serialized_contents);

+ }

+ void SerializeHTMLDOMWithEntitiesInAttributeValueOnRenderer() {

+ base::FilePath page_file_path = GetTestFilePath(

+ "dom_serializer", "dom_serializer/htmlentities_in_attribute_value.htm");

+ // Get file URL. The URL is dummy URL to identify the following loading

+ // actions. The test content is in constant:original_contents.

+ GURL file_url = net::FilePathToFileURL(page_file_path);

+ ASSERT_TRUE(file_url.SchemeIsFile());

+ // Test contents.

+ static const char* const original_contents =

+ "<html><body title=\"&<>"'\"></body></html>";

+ // Load the test contents.

+ LoadContents(original_contents, file_url, WebString());

+ // Get value of BODY's title attribute in DOM.

+ WebFrame* web_frame = FindSubFrameByURL(GetWebView(), file_url);

+ ASSERT_TRUE(web_frame != NULL);

+ WebDocument doc = web_frame->document();

+ ASSERT_TRUE(doc.isHTMLDocument());

+ WebElement body_ele = doc.body();

+ ASSERT_TRUE(!body_ele.isNull());

+ WebString value = body_ele.getAttribute("title");

+ ASSERT_TRUE(std::string(value.utf8()) == "&<>\"\'");

+ // Do serialization.

+ SerializeDomForURL(file_url, false);

+ // Compare the serialized contents with original contents.

+ ASSERT_TRUE(HasSerializedFrame(file_url));

+ const std::string& serialized_contents =

+ GetSerializedContentForFrame(file_url);

+ // Compare the serialized contents with original contents to make sure

+ // they are same.

+ std::string original_str =

+ WebPageSerializer::generateMarkOfTheWebDeclaration(file_url).utf8();

+ original_str += original_contents;

+ if (!doc.isNull()) {

+ WebString encoding = web_frame->document().encoding();

+ std::string htmlTag("<html>");

+ std::string::size_type pos = original_str.find(htmlTag);

+ ASSERT_NE(std::string::npos, pos);

+ pos += htmlTag.length();

+ std::string head_part("<head>");

+ head_part +=

+ WebPageSerializer::generateMetaCharsetDeclaration(encoding).utf8();

+ head_part += "</head>";

+ original_str.insert(pos, head_part);

+ }

+ ASSERT_EQ(original_str, serialized_contents);

+ }

+ void SerializeHTMLDOMWithNonStandardEntitiesOnRenderer(const GURL& file_url) {

+ // Get value of BODY's title attribute in DOM.

+ WebFrame* web_frame = FindSubFrameByURL(GetWebView(), file_url);

+ WebDocument doc = web_frame->document();

+ ASSERT_TRUE(doc.isHTMLDocument());

+ WebElement body_element = doc.body();

+ // Unescaped string for "&percnt;&nsup;¹'".

+ static const wchar_t parsed_value[] = {

+ '%', 0x2285, 0x00b9, '\'', 0

+ };

+ WebString value = body_element.getAttribute("title");

+ ASSERT_TRUE(UTF16ToWide(value) == parsed_value);

+ ASSERT_TRUE(UTF16ToWide(body_element.innerText()) == parsed_value);

+ // Do serialization.

+ SerializeDomForURL(file_url, false);

+ // Check the serialized string.

+ ASSERT_TRUE(HasSerializedFrame(file_url));

+ const std::string& serialized_contents =

+ GetSerializedContentForFrame(file_url);

+ // Confirm that the serialized string has no non-standard HTML entities.

+ ASSERT_EQ(std::string::npos, serialized_contents.find("&percnt;"));

+ ASSERT_EQ(std::string::npos, serialized_contents.find("&nsup;"));

+ ASSERT_EQ(std::string::npos, serialized_contents.find("¹"));

+ ASSERT_EQ(std::string::npos, serialized_contents.find("'"));

+ }

+ void SerializeHTMLDOMWithBaseTagOnRenderer(const GURL& file_url,

+ const GURL& path_dir_url) {

+ // There are total 2 available base tags in this test file.

+ const int kTotalBaseTagCountInTestFile = 2;

+ // Since for this test, we assume there is no savable sub-resource links for

+ // this test file, also all links are relative URLs in this test file, so we

+ // need to check those relative URLs and make sure document has BASE tag.

+ WebFrame* web_frame = FindSubFrameByURL(GetWebView(), file_url);

+ ASSERT_TRUE(web_frame != NULL);

+ WebDocument doc = web_frame->document();

+ ASSERT_TRUE(doc.isHTMLDocument());

+ // Go through all descent nodes.

+ WebNodeCollection all = doc.all();

+ int original_base_tag_count = 0;

+ for (WebNode node = all.firstItem(); !node.isNull();

+ node = all.nextItem()) {

+ if (!node.isElementNode())

+ continue;

+ WebElement element = node.to<WebElement>();

+ if (element.hasTagName("base")) {

+ original_base_tag_count++;

+ } else {

+ // Get link.

+ WebString value =

+ webkit_glue::GetSubResourceLinkFromElement(element);

+ if (value.isNull() && element.hasTagName("a")) {

+ value = element.getAttribute("href");

+ if (value.isEmpty())

+ value = WebString();

+ }

+ // Each link is relative link.

+ if (!value.isNull()) {

+ GURL link(value.utf8());

+ ASSERT_TRUE(link.scheme().empty());

+ }

+ ASSERT_EQ(original_base_tag_count, kTotalBaseTagCountInTestFile);

+ // Make sure in original document, the base URL is not equal with the

+ // |path_dir_url|.

+ GURL original_base_url(doc.baseURL());

+ ASSERT_NE(original_base_url, path_dir_url);

+ // Do serialization.

+ SerializeDomForURL(file_url, false);

+ // Load the serialized contents.

+ ASSERT_TRUE(HasSerializedFrame(file_url));

+ const std::string& serialized_contents =

+ GetSerializedContentForFrame(file_url);

+ LoadContents(serialized_contents, file_url,

+ web_frame->document().encoding());

+ // Make sure all links are absolute URLs and doc there are some number of

+ // BASE tags in serialized HTML data. Each of those BASE tags have same base

+ // URL which is as same as URL of current test file.

+ web_frame = GetMainFrame();

+ ASSERT_TRUE(web_frame != NULL);

+ doc = web_frame->document();

+ ASSERT_TRUE(doc.isHTMLDocument());

+ // Go through all descent nodes.

+ all = doc.all();

+ int new_base_tag_count = 0;

+ for (WebNode node = all.firstItem(); !node.isNull();

+ node = all.nextItem()) {

+ if (!node.isElementNode())

+ continue;

+ WebElement element = node.to<WebElement>();

+ if (element.hasTagName("base")) {

+ new_base_tag_count++;

+ } else {

+ // Get link.

+ WebString value =

+ webkit_glue::GetSubResourceLinkFromElement(element);

+ if (value.isNull() && element.hasTagName("a")) {

+ value = element.getAttribute("href");

+ if (value.isEmpty())

+ value = WebString();

+ }

+ // Each link is absolute link.

+ if (!value.isNull()) {

+ GURL link(std::string(value.utf8()));

+ ASSERT_FALSE(link.scheme().empty());

+ }

+ // We have one more added BASE tag which is generated by JavaScript.

+ ASSERT_EQ(new_base_tag_count, original_base_tag_count + 1);

+ // Make sure in new document, the base URL is equal with the |path_dir_url|.

+ GURL new_base_url(doc.baseURL());

+ ASSERT_EQ(new_base_url, path_dir_url);

+ }

+ void SerializeHTMLDOMWithEmptyHeadOnRenderer() {

+ base::FilePath page_file_path = GetTestFilePath(

+ "dom_serializer", "empty_head.htm");

+ GURL file_url = net::FilePathToFileURL(page_file_path);

+ ASSERT_TRUE(file_url.SchemeIsFile());

+ // Load the test html content.

+ static const char* const empty_head_contents =

+ "<html><head></head><body>hello world</body></html>";

+ LoadContents(empty_head_contents, file_url, WebString());

+ // Make sure the head tag is empty.

+ WebFrame* web_frame = GetMainFrame();

+ ASSERT_TRUE(web_frame != NULL);

+ WebDocument doc = web_frame->document();

+ ASSERT_TRUE(doc.isHTMLDocument());

+ WebElement head_element = doc.head();

+ ASSERT_TRUE(!head_element.isNull());

+ ASSERT_TRUE(!head_element.hasChildNodes());

+ ASSERT_TRUE(head_element.childNodes().length() == 0);

+ // Do serialization.

+ SerializeDomForURL(file_url, false);

+ // Make sure the serialized contents have META ;

+ ASSERT_TRUE(HasSerializedFrame(file_url));

+ const std::string& serialized_contents =

+ GetSerializedContentForFrame(file_url);

+ // Reload serialized contents and make sure there is only one META tag.

+ LoadContents(serialized_contents, file_url,

+ web_frame->document().encoding());

+ web_frame = GetMainFrame();

+ ASSERT_TRUE(web_frame != NULL);

+ doc = web_frame->document();

+ ASSERT_TRUE(doc.isHTMLDocument());

+ head_element = doc.head();

+ ASSERT_TRUE(!head_element.isNull());

+ ASSERT_TRUE(head_element.hasChildNodes());

+ ASSERT_TRUE(head_element.childNodes().length() == 1);

+ WebNode meta_node = head_element.firstChild();

+ ASSERT_TRUE(!meta_node.isNull());

+ // Get meta charset info.

+ std::string charset_info;

+ ASSERT_TRUE(IsMetaElement(meta_node, charset_info));

+ ASSERT_TRUE(!charset_info.empty());

+ ASSERT_EQ(charset_info,

+ std::string(web_frame->document().encoding().utf8()));

+ // Check the body's first node is text node and its contents are

+ // "hello world"

+ WebElement body_element = doc.body();

+ ASSERT_TRUE(!body_element.isNull());

+ WebNode text_node = body_element.firstChild();

+ ASSERT_TRUE(text_node.isTextNode());

+ WebString text_node_contents = text_node.nodeValue();

+ ASSERT_TRUE(std::string(text_node_contents.utf8()) == "hello world");

+ }

+ void SerializeDocumentWithDownloadedIFrameOnRenderer(const GURL& file_url) {

+ // Do a recursive serialization. We pass if we don't crash.

+ SerializeDomForURL(file_url, true);

+ }

+ void SubResourceForElementsInNonHTMLNamespaceOnRenderer(

+ const GURL& file_url) {

+ WebFrame* web_frame = FindSubFrameByURL(GetWebView(), file_url);

+ ASSERT_TRUE(web_frame != NULL);

+ WebDocument doc = web_frame->document();

+ WebNode lastNodeInBody = doc.body().lastChild();

+ ASSERT_EQ(WebNode::ElementNode, lastNodeInBody.nodeType());

+ WebString uri = webkit_glue::GetSubResourceLinkFromElement(

+ lastNodeInBody.to<WebElement>());

+ EXPECT_TRUE(uri.isNull());

+ }

private:

// Map frame_url to corresponding serialized_content.

typedef base::hash_map<std::string, std::string> SerializedFrameContentMap;

@@ -206,148 +769,46 @@

// The local_directory_name_ is dummy relative path of directory which

// contain all saved auxiliary files included all sub frames and resources.

const base::FilePath local_directory_name_;

- protected:

- // testing::Test

- virtual void SetUp() {

- TestShellTest::SetUp();

- serialized_ = false;

- }

- virtual void TearDown() {

- TestShellTest::TearDown();

- }

};

-// Helper function that test whether the first node in the doc is a doc type

-// node.

-bool HasDocType(const WebDocument& doc) {

- WebNode node = doc.firstChild();

- if (node.isNull())

- return false;

- return node.nodeType() == WebNode::DocumentTypeNode;

-// Helper function for checking whether input node is META tag. Return true

-// means it is META element, otherwise return false. The parameter charset_info

-// return actual charset info if the META tag has charset declaration.

-bool IsMetaElement(const WebNode& node, std::string& charset_info) {

- if (!node.isElementNode())

- return false;

- const WebElement meta = node.toConst<WebElement>();

- if (!meta.hasTagName("meta"))

- return false;

- charset_info.erase(0, charset_info.length());

- // Check the META charset declaration.

- WebString httpEquiv = meta.getAttribute("http-equiv");

- if (LowerCaseEqualsASCII(httpEquiv, "content-type")) {

- std::string content = meta.getAttribute("content").utf8();

- int pos = content.find("charset", 0);

- if (pos > -1) {

- // Add a dummy charset declaration to charset_info, which indicates this

- // META tag has charset declaration although we do not get correct value

- // yet.

- charset_info.append("has-charset-declaration");

- int remaining_length = content.length() - pos - 7;

- if (!remaining_length)

- return true;

- int start_pos = pos + 7;

- // Find "=" symbol.

- while (remaining_length--)

- if (content[start_pos++] == L'=')

- break;

- // Skip beginning space.

- while (remaining_length) {

- if (content[start_pos] > 0x0020)

- break;

- ++start_pos;

- --remaining_length;

- }

- if (!remaining_length)

- return true;

- int end_pos = start_pos;

- // Now we find out the start point of charset info. Search the end point.

- while (remaining_length--) {

- if (content[end_pos] <= 0x0020 || content[end_pos] == L';')

- break;

- ++end_pos;

- }

- // Get actual charset info.

- charset_info = content.substr(start_pos, end_pos - start_pos);

- return true;

- }

- return true;

// If original contents have document type, the serialized contents also have

// document type.

-TEST_F(DomSerializerTests, SerializeHTMLDOMWithDocType) {

- base::FilePath page_file_path = data_dir_;

- page_file_path = page_file_path.AppendASCII("dom_serializer");

- page_file_path = page_file_path.AppendASCII("youtube_1.htm");

+IN_PROC_BROWSER_TEST_F(DomSerializerTests, SerializeHTMLDOMWithDocType) {

+ base::FilePath page_file_path =

+ GetTestFilePath("dom_serializer", "youtube_1.htm");

GURL file_url = net::FilePathToFileURL(page_file_path);

ASSERT_TRUE(file_url.SchemeIsFile());

// Load the test file.

- LoadPageFromURL(file_url);

- // Make sure original contents have document type.

- WebFrame* web_frame = FindSubFrameByURL(test_shell_->webView(), file_url);

- ASSERT_TRUE(web_frame != NULL);

- WebDocument doc = web_frame->document();

- ASSERT_TRUE(HasDocType(doc));

- // Do serialization.

- SerializeDomForURL(file_url, false);

- // Load the serialized contents.

- ASSERT_TRUE(HasSerializedFrame(file_url));

- const std::string& serialized_contents =

- GetSerializedContentForFrame(file_url);

- LoadContents(serialized_contents, file_url,

- web_frame->document().encoding());

- // Make sure serialized contents still have document type.

- web_frame = test_shell_->webView()->mainFrame();

- doc = web_frame->document();

- ASSERT_TRUE(HasDocType(doc));

+ NavigateToURL(shell(), file_url);

+ PostTaskToInProcessRendererAndWait(

+ base::Bind(&DomSerializerTests::SerializeHTMLDOMWithDocTypeOnRenderer,

+ base::Unretained(this), file_url));

}

// If original contents do not have document type, the serialized contents

// also do not have document type.

-TEST_F(DomSerializerTests, SerializeHTMLDOMWithoutDocType) {

- base::FilePath page_file_path = data_dir_;

- page_file_path = page_file_path.AppendASCII("dom_serializer");

- page_file_path = page_file_path.AppendASCII("youtube_2.htm");

+IN_PROC_BROWSER_TEST_F(DomSerializerTests, SerializeHTMLDOMWithoutDocType) {

+ base::FilePath page_file_path =

+ GetTestFilePath("dom_serializer", "youtube_2.htm");

GURL file_url = net::FilePathToFileURL(page_file_path);

ASSERT_TRUE(file_url.SchemeIsFile());

// Load the test file.

- LoadPageFromURL(file_url);

- // Make sure original contents do not have document type.

- WebFrame* web_frame = FindSubFrameByURL(test_shell_->webView(), file_url);

- ASSERT_TRUE(web_frame != NULL);

- WebDocument doc = web_frame->document();

- ASSERT_TRUE(!HasDocType(doc));

- // Do serialization.

- SerializeDomForURL(file_url, false);

- // Load the serialized contents.

- ASSERT_TRUE(HasSerializedFrame(file_url));

- const std::string& serialized_contents =

- GetSerializedContentForFrame(file_url);

- LoadContents(serialized_contents, file_url,

- web_frame->document().encoding());

- // Make sure serialized contents do not have document type.

- web_frame = test_shell_->webView()->mainFrame();

- doc = web_frame->document();

- ASSERT_TRUE(!HasDocType(doc));

+ NavigateToURL(shell(), file_url);

+ PostTaskToInProcessRendererAndWait(

+ base::Bind(

+ &DomSerializerTests::SerializeHTMLDOMWithoutDocTypeOnRenderer,

+ base::Unretained(this), file_url));

}

// Serialize XML document which has all 5 built-in entities. After

// finishing serialization, the serialized contents should be same

// with original XML document.

-TEST_F(DomSerializerTests, SerializeXMLDocWithBuiltInEntities) {

- base::FilePath page_file_path = data_dir_;

- page_file_path = page_file_path.AppendASCII("dom_serializer");

- page_file_path = page_file_path.AppendASCII("note.html");

- base::FilePath xml_file_path = data_dir_;

- xml_file_path = xml_file_path.AppendASCII("dom_serializer");

- xml_file_path = xml_file_path.AppendASCII("note.xml");

+IN_PROC_BROWSER_TEST_F(DomSerializerTests, SerializeXMLDocWithBuiltInEntities) {

+ base::FilePath page_file_path =

+ GetTestFilePath("dom_serializer", "note.html");

+ base::FilePath xml_file_path = GetTestFilePath("dom_serializer", "note.xml");

// Read original contents for later comparison.

std::string original_contents;

ASSERT_TRUE(file_util::ReadFileToString(xml_file_path, &original_contents));

@@ -356,21 +817,18 @@

GURL xml_file_url = net::FilePathToFileURL(xml_file_path);

ASSERT_TRUE(file_url.SchemeIsFile());

// Load the test file.

- LoadPageFromURL(file_url);

- // Do serialization.

- SerializeDomForURL(xml_file_url, false);

- // Compare the serialized contents with original contents.

- ASSERT_TRUE(HasSerializedFrame(xml_file_url));

- const std::string& serialized_contents =

- GetSerializedContentForFrame(xml_file_url);

- ASSERT_EQ(original_contents, serialized_contents);

+ NavigateToURL(shell(), file_url);

+ PostTaskToInProcessRendererAndWait(

+ base::Bind(

+ &DomSerializerTests::SerializeXMLDocWithBuiltInEntitiesOnRenderer,

+ base::Unretained(this), xml_file_url, original_contents));

}

// When serializing DOM, we add MOTW declaration before html tag.

-TEST_F(DomSerializerTests, SerializeHTMLDOMWithAddingMOTW) {

- base::FilePath page_file_path = data_dir_;

- page_file_path = page_file_path.AppendASCII("dom_serializer");

- page_file_path = page_file_path.AppendASCII("youtube_2.htm");

+IN_PROC_BROWSER_TEST_F(DomSerializerTests, SerializeHTMLDOMWithAddingMOTW) {

+ base::FilePath page_file_path =

+ GetTestFilePath("dom_serializer", "youtube_2.htm");

// Read original contents for later comparison .

std::string original_contents;

ASSERT_TRUE(file_util::ReadFileToString(page_file_path, &original_contents));

@@ -383,494 +841,173 @@

ASSERT_FALSE(motw_declaration.empty());

// The encoding of original contents is ISO-8859-1, so we convert the MOTW

// declaration to ASCII and search whether original contents has it or not.

- ASSERT_TRUE(std::string::npos ==

- original_contents.find(motw_declaration));

+ ASSERT_TRUE(std::string::npos == original_contents.find(motw_declaration));

// Load the test file.

- LoadPageFromURL(file_url);

- // Do serialization.

- SerializeDomForURL(file_url, false);

- // Make sure the serialized contents have MOTW ;

- ASSERT_TRUE(HasSerializedFrame(file_url));

- const std::string& serialized_contents =

- GetSerializedContentForFrame(file_url);

- ASSERT_FALSE(std::string::npos ==

- serialized_contents.find(motw_declaration));

+ NavigateToURL(shell(), file_url);

+ PostTaskToInProcessRendererAndWait(

+ base::Bind(

+ &DomSerializerTests::SerializeHTMLDOMWithAddingMOTWOnRenderer,

+ base::Unretained(this), file_url, motw_declaration));

}

// When serializing DOM, we will add the META which have correct charset

// declaration as first child of HEAD element for resolving WebKit bug:

// http://bugs.webkit.org/show_bug.cgi?id=16621 even the original document

// does not have META charset declaration.

-TEST_F(DomSerializerTests, SerializeHTMLDOMWithNoMetaCharsetInOriginalDoc) {

- base::FilePath page_file_path = data_dir_;

- page_file_path = page_file_path.AppendASCII("dom_serializer");

- page_file_path = page_file_path.AppendASCII("youtube_1.htm");

+IN_PROC_BROWSER_TEST_F(DomSerializerTests,

+ SerializeHTMLDOMWithNoMetaCharsetInOriginalDoc) {

+ base::FilePath page_file_path =

+ GetTestFilePath("dom_serializer", "youtube_1.htm");

// Get file URL.

GURL file_url = net::FilePathToFileURL(page_file_path);

ASSERT_TRUE(file_url.SchemeIsFile());

// Load the test file.

- LoadPageFromURL(file_url);

+ NavigateToURL(shell(), file_url);

- // Make sure there is no META charset declaration in original document.

- WebFrame* web_frame = FindSubFrameByURL(test_shell_->webView(), file_url);

- ASSERT_TRUE(web_frame != NULL);

- WebDocument doc = web_frame->document();

- ASSERT_TRUE(doc.isHTMLDocument());

- WebElement head_element = doc.head();

- ASSERT_TRUE(!head_element.isNull());

- // Go through all children of HEAD element.

- for (WebNode child = head_element.firstChild(); !child.isNull();

- child = child.nextSibling()) {

- std::string charset_info;

- if (IsMetaElement(child, charset_info))

- ASSERT_TRUE(charset_info.empty());

- }

- // Do serialization.

- SerializeDomForURL(file_url, false);

- // Load the serialized contents.

- ASSERT_TRUE(HasSerializedFrame(file_url));

- const std::string& serialized_contents =

- GetSerializedContentForFrame(file_url);

- LoadContents(serialized_contents, file_url,

- web_frame->document().encoding());

- // Make sure the first child of HEAD element is META which has charset

- // declaration in serialized contents.

- web_frame = test_shell_->webView()->mainFrame();

- ASSERT_TRUE(web_frame != NULL);

- doc = web_frame->document();

- ASSERT_TRUE(doc.isHTMLDocument());

- head_element = doc.head();

- ASSERT_TRUE(!head_element.isNull());

- WebNode meta_node = head_element.firstChild();

- ASSERT_TRUE(!meta_node.isNull());

- // Get meta charset info.

- std::string charset_info2;

- ASSERT_TRUE(IsMetaElement(meta_node, charset_info2));

- ASSERT_TRUE(!charset_info2.empty());

- ASSERT_EQ(charset_info2,

- std::string(web_frame->document().encoding().utf8()));

- // Make sure no more additional META tags which have charset declaration.

- for (WebNode child = meta_node.nextSibling(); !child.isNull();

- child = child.nextSibling()) {

- std::string charset_info;

- if (IsMetaElement(child, charset_info))

- ASSERT_TRUE(charset_info.empty());

- }

+ PostTaskToInProcessRendererAndWait(

+ base::Bind(

+ &DomSerializerTests::

+ SerializeHTMLDOMWithNoMetaCharsetInOriginalDocOnRenderer,

+ base::Unretained(this), file_url));

}

// When serializing DOM, if the original document has multiple META charset

// declaration, we will add the META which have correct charset declaration

// as first child of HEAD element and remove all original META charset

// declarations.

-TEST_F(DomSerializerTests,

- SerializeHTMLDOMWithMultipleMetaCharsetInOriginalDoc) {

- base::FilePath page_file_path = data_dir_;

- page_file_path = page_file_path.AppendASCII("dom_serializer");

- page_file_path = page_file_path.AppendASCII("youtube_2.htm");

+IN_PROC_BROWSER_TEST_F(DomSerializerTests,

+ SerializeHTMLDOMWithMultipleMetaCharsetInOriginalDoc) {

+ base::FilePath page_file_path =

+ GetTestFilePath("dom_serializer", "youtube_2.htm");

// Get file URL.

GURL file_url = net::FilePathToFileURL(page_file_path);

ASSERT_TRUE(file_url.SchemeIsFile());

// Load the test file.

- LoadPageFromURL(file_url);

+ NavigateToURL(shell(), file_url);

- // Make sure there are multiple META charset declarations in original

- // document.

- WebFrame* web_frame = FindSubFrameByURL(test_shell_->webView(), file_url);

- ASSERT_TRUE(web_frame != NULL);

- WebDocument doc = web_frame->document();

- ASSERT_TRUE(doc.isHTMLDocument());

- WebElement head_ele = doc.head();

- ASSERT_TRUE(!head_ele.isNull());

- // Go through all children of HEAD element.

- int charset_declaration_count = 0;

- for (WebNode child = head_ele.firstChild(); !child.isNull();

- child = child.nextSibling()) {

- std::string charset_info;

- if (IsMetaElement(child, charset_info) && !charset_info.empty())

- charset_declaration_count++;

- }

- // The original doc has more than META tags which have charset declaration.

- ASSERT_TRUE(charset_declaration_count > 1);

- // Do serialization.

- SerializeDomForURL(file_url, false);

- // Load the serialized contents.

- ASSERT_TRUE(HasSerializedFrame(file_url));

- const std::string& serialized_contents =

- GetSerializedContentForFrame(file_url);

- LoadContents(serialized_contents, file_url,

- web_frame->document().encoding());

- // Make sure only first child of HEAD element is META which has charset

- // declaration in serialized contents.

- web_frame = test_shell_->webView()->mainFrame();

- ASSERT_TRUE(web_frame != NULL);

- doc = web_frame->document();

- ASSERT_TRUE(doc.isHTMLDocument());

- head_ele = doc.head();

- ASSERT_TRUE(!head_ele.isNull());

- WebNode meta_node = head_ele.firstChild();

- ASSERT_TRUE(!meta_node.isNull());

- // Get meta charset info.

- std::string charset_info2;

- ASSERT_TRUE(IsMetaElement(meta_node, charset_info2));

- ASSERT_TRUE(!charset_info2.empty());

- ASSERT_EQ(charset_info2,

- std::string(web_frame->document().encoding().utf8()));

- // Make sure no more additional META tags which have charset declaration.

- for (WebNode child = meta_node.nextSibling(); !child.isNull();

- child = child.nextSibling()) {

- std::string charset_info;

- if (IsMetaElement(child, charset_info))

- ASSERT_TRUE(charset_info.empty());

- }

+ PostTaskToInProcessRendererAndWait(

+ base::Bind(

+ &DomSerializerTests::

+ SerializeHTMLDOMWithMultipleMetaCharsetInOriginalDocOnRenderer,

+ base::Unretained(this), file_url));

}

// Test situation of html entities in text when serializing HTML DOM.

-TEST_F(DomSerializerTests, SerializeHTMLDOMWithEntitiesInText) {

- base::FilePath page_file_path = data_dir_;

- page_file_path = page_file_path.AppendASCII(

- "dom_serializer/htmlentities_in_text.htm");

- // Get file URL. The URL is dummy URL to identify the following loading

- // actions. The test content is in constant:original_contents.

- GURL file_url = net::FilePathToFileURL(page_file_path);

- ASSERT_TRUE(file_url.SchemeIsFile());

- // Test contents.

- static const char* const original_contents =

- "<html><body>&<>\"\'</body></html>";

- // Load the test contents.

- LoadContents(original_contents, file_url, WebString());

+IN_PROC_BROWSER_TEST_F(DomSerializerTests, SerializeHTMLDOMWithEntitiesInText) {

+ // Need to spin up the renderer and also navigate to a file url so that the

+ // renderer code doesn't attempt a fork when it sees a load to file scheme

+ // from non-file scheme.

+ NavigateToURL(shell(), GetTestUrl(".", "simple_page.html"));

- // Get BODY's text content in DOM.

- WebFrame* web_frame = FindSubFrameByURL(test_shell_->webView(), file_url);

- ASSERT_TRUE(web_frame != NULL);

- WebDocument doc = web_frame->document();

- ASSERT_TRUE(doc.isHTMLDocument());

- WebElement body_ele = doc.body();

- ASSERT_TRUE(!body_ele.isNull());

- WebNode text_node = body_ele.firstChild();

- ASSERT_TRUE(text_node.isTextNode());

- ASSERT_TRUE(std::string(text_node.createMarkup().utf8()) ==

- "&<>\"\'");

- // Do serialization.

- SerializeDomForURL(file_url, false);

- // Compare the serialized contents with original contents.

- ASSERT_TRUE(HasSerializedFrame(file_url));

- const std::string& serialized_contents =

- GetSerializedContentForFrame(file_url);

- // Compare the serialized contents with original contents to make sure

- // they are same.

- // Because we add MOTW when serializing DOM, so before comparison, we also

- // need to add MOTW to original_contents.

- std::string original_str =

- WebPageSerializer::generateMarkOfTheWebDeclaration(file_url).utf8();

- original_str += original_contents;

- // Since WebCore now inserts a new HEAD element if there is no HEAD element

- // when creating BODY element. (Please see HTMLParser::bodyCreateErrorCheck.)

- // We need to append the HEAD content and corresponding META content if we

- // find WebCore-generated HEAD element.

- if (!doc.head().isNull()) {

- WebString encoding = web_frame->document().encoding();

- std::string htmlTag("<html>");

- std::string::size_type pos = original_str.find(htmlTag);

- ASSERT_NE(std::string::npos, pos);

- pos += htmlTag.length();

- std::string head_part("<head>");

- head_part +=

- WebPageSerializer::generateMetaCharsetDeclaration(encoding).utf8();

- head_part += "</head>";

- original_str.insert(pos, head_part);

- }

- ASSERT_EQ(original_str, serialized_contents);

+ PostTaskToInProcessRendererAndWait(

+ base::Bind(

+ &DomSerializerTests::SerializeHTMLDOMWithEntitiesInTextOnRenderer,

+ base::Unretained(this)));

}

// Test situation of html entities in attribute value when serializing

// HTML DOM.

// This test started to fail at WebKit r65388. See http://crbug.com/52279.

-TEST_F(DomSerializerTests, SerializeHTMLDOMWithEntitiesInAttributeValue) {

- base::FilePath page_file_path = data_dir_;

- page_file_path = page_file_path.AppendASCII(

- "dom_serializer/htmlentities_in_attribute_value.htm");

- // Get file URL. The URL is dummy URL to identify the following loading

- // actions. The test content is in constant:original_contents.

- GURL file_url = net::FilePathToFileURL(page_file_path);

- ASSERT_TRUE(file_url.SchemeIsFile());

- // Test contents.

- static const char* const original_contents =

- "<html><body title=\"&<>"'\"></body></html>";

- // Load the test contents.

- LoadContents(original_contents, file_url, WebString());

- // Get value of BODY's title attribute in DOM.

- WebFrame* web_frame = FindSubFrameByURL(test_shell_->webView(), file_url);

- ASSERT_TRUE(web_frame != NULL);

- WebDocument doc = web_frame->document();

- ASSERT_TRUE(doc.isHTMLDocument());

- WebElement body_ele = doc.body();

- ASSERT_TRUE(!body_ele.isNull());

- WebString value = body_ele.getAttribute("title");

- ASSERT_TRUE(std::string(value.utf8()) == "&<>\"\'");

- // Do serialization.

- SerializeDomForURL(file_url, false);

- // Compare the serialized contents with original contents.

- ASSERT_TRUE(HasSerializedFrame(file_url));

- const std::string& serialized_contents =

- GetSerializedContentForFrame(file_url);

- // Compare the serialized contents with original contents to make sure

- // they are same.

- std::string original_str =

- WebPageSerializer::generateMarkOfTheWebDeclaration(file_url).utf8();

- original_str += original_contents;

- if (!doc.isNull()) {

- WebString encoding = web_frame->document().encoding();

- std::string htmlTag("<html>");

- std::string::size_type pos = original_str.find(htmlTag);

- ASSERT_NE(std::string::npos, pos);

- pos += htmlTag.length();

- std::string head_part("<head>");

- head_part +=

- WebPageSerializer::generateMetaCharsetDeclaration(encoding).utf8();

- head_part += "</head>";

- original_str.insert(pos, head_part);

- }

- ASSERT_EQ(original_str, serialized_contents);

+IN_PROC_BROWSER_TEST_F(DomSerializerTests,

+ SerializeHTMLDOMWithEntitiesInAttributeValue) {

+ // Need to spin up the renderer and also navigate to a file url so that the

+ // renderer code doesn't attempt a fork when it sees a load to file scheme

+ // from non-file scheme.

+ NavigateToURL(shell(), GetTestUrl(".", "simple_page.html"));

+ PostTaskToInProcessRendererAndWait(

+ base::Bind(

+ &DomSerializerTests::

+ SerializeHTMLDOMWithEntitiesInAttributeValueOnRenderer,

+ base::Unretained(this)));

}

// Test situation of non-standard HTML entities when serializing HTML DOM.

// This test started to fail at WebKit r65351. See http://crbug.com/52279.

-TEST_F(DomSerializerTests, SerializeHTMLDOMWithNonStandardEntities) {

+IN_PROC_BROWSER_TEST_F(DomSerializerTests,

+ SerializeHTMLDOMWithNonStandardEntities) {

// Make a test file URL and load it.

- base::FilePath page_file_path = data_dir_;

- page_file_path = page_file_path.AppendASCII("dom_serializer");

- page_file_path = page_file_path.AppendASCII("nonstandard_htmlentities.htm");

+ base::FilePath page_file_path = GetTestFilePath(

+ "dom_serializer", "nonstandard_htmlentities.htm");

GURL file_url = net::FilePathToFileURL(page_file_path);

- LoadPageFromURL(file_url);

+ NavigateToURL(shell(), file_url);

- // Get value of BODY's title attribute in DOM.

- WebFrame* web_frame = FindSubFrameByURL(test_shell_->webView(), file_url);

- WebDocument doc = web_frame->document();

- ASSERT_TRUE(doc.isHTMLDocument());

- WebElement body_element = doc.body();

- // Unescaped string for "&percnt;&nsup;¹'".

- static const wchar_t parsed_value[] = {

- '%', 0x2285, 0x00b9, '\'', 0

- };

- WebString value = body_element.getAttribute("title");

- ASSERT_TRUE(UTF16ToWide(value) == parsed_value);

- ASSERT_TRUE(UTF16ToWide(body_element.innerText()) == parsed_value);

- // Do serialization.

- SerializeDomForURL(file_url, false);

- // Check the serialized string.

- ASSERT_TRUE(HasSerializedFrame(file_url));

- const std::string& serialized_contents =

- GetSerializedContentForFrame(file_url);

- // Confirm that the serialized string has no non-standard HTML entities.

- ASSERT_EQ(std::string::npos, serialized_contents.find("&percnt;"));

- ASSERT_EQ(std::string::npos, serialized_contents.find("&nsup;"));

- ASSERT_EQ(std::string::npos, serialized_contents.find("¹"));

- ASSERT_EQ(std::string::npos, serialized_contents.find("'"));

+ PostTaskToInProcessRendererAndWait(

+ base::Bind(

+ &DomSerializerTests::

+ SerializeHTMLDOMWithNonStandardEntitiesOnRenderer,

+ base::Unretained(this), file_url));

}

// Test situation of BASE tag in original document when serializing HTML DOM.

// When serializing, we should comment the BASE tag, append a new BASE tag.

// rewrite all the savable URLs to relative local path, and change other URLs

// to absolute URLs.

-TEST_F(DomSerializerTests, SerializeHTMLDOMWithBaseTag) {

- // There are total 2 available base tags in this test file.

- const int kTotalBaseTagCountInTestFile = 2;

+IN_PROC_BROWSER_TEST_F(DomSerializerTests, SerializeHTMLDOMWithBaseTag) {

+ base::FilePath page_file_path = GetTestFilePath(

+ "dom_serializer", "html_doc_has_base_tag.htm");

- base::FilePath page_file_path =

- data_dir_.AppendASCII("dom_serializer").AsEndingWithSeparator();

+ // Get page dir URL which is base URL of this file.

+ base::FilePath dir_name = page_file_path.DirName();

+ dir_name = dir_name.Append(

+ base::FilePath::StringType(base::FilePath::kSeparators[0], 1));

+ GURL path_dir_url = net::FilePathToFileURL(dir_name);

- // Get page dir URL which is base URL of this file.

- GURL path_dir_url = net::FilePathToFileURL(page_file_path);

- // Get file path.

- page_file_path =

- page_file_path.AppendASCII("html_doc_has_base_tag.htm");

// Get file URL.

GURL file_url = net::FilePathToFileURL(page_file_path);

ASSERT_TRUE(file_url.SchemeIsFile());

// Load the test file.

- LoadPageFromURL(file_url);

- // Since for this test, we assume there is no savable sub-resource links for

- // this test file, also all links are relative URLs in this test file, so we

- // need to check those relative URLs and make sure document has BASE tag.

- WebFrame* web_frame = FindSubFrameByURL(test_shell_->webView(), file_url);

- ASSERT_TRUE(web_frame != NULL);

- WebDocument doc = web_frame->document();

- ASSERT_TRUE(doc.isHTMLDocument());

- // Go through all descent nodes.

- WebNodeCollection all = doc.all();

- int original_base_tag_count = 0;

- for (WebNode node = all.firstItem(); !node.isNull();

- node = all.nextItem()) {

- if (!node.isElementNode())

- continue;

- WebElement element = node.to<WebElement>();

- if (element.hasTagName("base")) {

- original_base_tag_count++;

- } else {

- // Get link.

- WebString value =

- webkit_glue::GetSubResourceLinkFromElement(element);

- if (value.isNull() && element.hasTagName("a")) {

- value = element.getAttribute("href");

- if (value.isEmpty())

- value = WebString();

- }

- // Each link is relative link.

- if (!value.isNull()) {

- GURL link(value.utf8());

- ASSERT_TRUE(link.scheme().empty());

- }

- ASSERT_EQ(original_base_tag_count, kTotalBaseTagCountInTestFile);

- // Make sure in original document, the base URL is not equal with the

- // |path_dir_url|.

- GURL original_base_url(doc.baseURL());

- ASSERT_NE(original_base_url, path_dir_url);

+ NavigateToURL(shell(), file_url);

- // Do serialization.

- SerializeDomForURL(file_url, false);

- // Load the serialized contents.

- ASSERT_TRUE(HasSerializedFrame(file_url));

- const std::string& serialized_contents =

- GetSerializedContentForFrame(file_url);

- LoadContents(serialized_contents, file_url,

- web_frame->document().encoding());

- // Make sure all links are absolute URLs and doc there are some number of

- // BASE tags in serialized HTML data. Each of those BASE tags have same base

- // URL which is as same as URL of current test file.

- web_frame = test_shell_->webView()->mainFrame();

- ASSERT_TRUE(web_frame != NULL);

- doc = web_frame->document();

- ASSERT_TRUE(doc.isHTMLDocument());

- // Go through all descent nodes.

- all = doc.all();

- int new_base_tag_count = 0;

- for (WebNode node = all.firstItem(); !node.isNull();

- node = all.nextItem()) {

- if (!node.isElementNode())

- continue;

- WebElement element = node.to<WebElement>();

- if (element.hasTagName("base")) {

- new_base_tag_count++;

- } else {

- // Get link.

- WebString value =

- webkit_glue::GetSubResourceLinkFromElement(element);

- if (value.isNull() && element.hasTagName("a")) {

- value = element.getAttribute("href");

- if (value.isEmpty())

- value = WebString();

- }

- // Each link is absolute link.

- if (!value.isNull()) {

- GURL link(std::string(value.utf8()));

- ASSERT_FALSE(link.scheme().empty());

- }

- // We have one more added BASE tag which is generated by JavaScript.

- ASSERT_EQ(new_base_tag_count, original_base_tag_count + 1);

- // Make sure in new document, the base URL is equal with the |path_dir_url|.

- GURL new_base_url(doc.baseURL());

- ASSERT_EQ(new_base_url, path_dir_url);

+ PostTaskToInProcessRendererAndWait(

+ base::Bind(

+ &DomSerializerTests::SerializeHTMLDOMWithBaseTagOnRenderer,

+ base::Unretained(this), file_url, path_dir_url));

}

// Serializing page which has an empty HEAD tag.

-TEST_F(DomSerializerTests, SerializeHTMLDOMWithEmptyHead) {

- base::FilePath page_file_path = data_dir_;

- page_file_path = page_file_path.AppendASCII("dom_serializer");

- page_file_path = page_file_path.AppendASCII("empty_head.htm");

- GURL file_url = net::FilePathToFileURL(page_file_path);

- ASSERT_TRUE(file_url.SchemeIsFile());

+IN_PROC_BROWSER_TEST_F(DomSerializerTests, SerializeHTMLDOMWithEmptyHead) {

+ // Need to spin up the renderer and also navigate to a file url so that the

+ // renderer code doesn't attempt a fork when it sees a load to file scheme

+ // from non-file scheme.

+ NavigateToURL(shell(), GetTestUrl(".", "simple_page.html"));

- // Load the test html content.

- static const char* const empty_head_contents =

- "<html><head></head><body>hello world</body></html>";

- LoadContents(empty_head_contents, file_url, WebString());

- // Make sure the head tag is empty.

- WebFrame* web_frame = test_shell_->webView()->mainFrame();

- ASSERT_TRUE(web_frame != NULL);

- WebDocument doc = web_frame->document();

- ASSERT_TRUE(doc.isHTMLDocument());

- WebElement head_element = doc.head();

- ASSERT_TRUE(!head_element.isNull());

- ASSERT_TRUE(!head_element.hasChildNodes());

- ASSERT_TRUE(head_element.childNodes().length() == 0);

- // Do serialization.

- SerializeDomForURL(file_url, false);

- // Make sure the serialized contents have META ;

- ASSERT_TRUE(HasSerializedFrame(file_url));

- const std::string& serialized_contents =

- GetSerializedContentForFrame(file_url);

- // Reload serialized contents and make sure there is only one META tag.

- LoadContents(serialized_contents, file_url, web_frame->document().encoding());

- web_frame = test_shell_->webView()->mainFrame();

- ASSERT_TRUE(web_frame != NULL);

- doc = web_frame->document();

- ASSERT_TRUE(doc.isHTMLDocument());

- head_element = doc.head();

- ASSERT_TRUE(!head_element.isNull());

- ASSERT_TRUE(head_element.hasChildNodes());

- ASSERT_TRUE(head_element.childNodes().length() == 1);

- WebNode meta_node = head_element.firstChild();

- ASSERT_TRUE(!meta_node.isNull());

- // Get meta charset info.

- std::string charset_info;

- ASSERT_TRUE(IsMetaElement(meta_node, charset_info));

- ASSERT_TRUE(!charset_info.empty());

- ASSERT_EQ(charset_info,

- std::string(web_frame->document().encoding().utf8()));

- // Check the body's first node is text node and its contents are

- // "hello world"

- WebElement body_element = doc.body();

- ASSERT_TRUE(!body_element.isNull());

- WebNode text_node = body_element.firstChild();

- ASSERT_TRUE(text_node.isTextNode());

- WebString text_node_contents = text_node.nodeValue();

- ASSERT_TRUE(std::string(text_node_contents.utf8()) == "hello world");

+ PostTaskToInProcessRendererAndWait(

+ base::Bind(&DomSerializerTests::SerializeHTMLDOMWithEmptyHeadOnRenderer,

+ base::Unretained(this)));

}

// Test that we don't crash when the page contains an iframe that

// was handled as a download (http://crbug.com/42212).

-TEST_F(DomSerializerTests, SerializeDocumentWithDownloadedIFrame) {

- base::FilePath page_file_path = data_dir_;

- page_file_path = page_file_path.AppendASCII("dom_serializer");

- page_file_path = page_file_path.AppendASCII("iframe-src-is-exe.htm");

+IN_PROC_BROWSER_TEST_F(DomSerializerTests,

+ SerializeDocumentWithDownloadedIFrame) {

+ base::FilePath page_file_path = GetTestFilePath(

+ "dom_serializer", "iframe-src-is-exe.htm");

GURL file_url = net::FilePathToFileURL(page_file_path);

ASSERT_TRUE(file_url.SchemeIsFile());

// Load the test file.

- LoadPageFromURL(file_url);

- // Do a recursive serialization. We pass if we don't crash.

- SerializeDomForURL(file_url, true);

+ NavigateToURL(shell(), file_url);

+ PostTaskToInProcessRendererAndWait(

+ base::Bind(

+ &DomSerializerTests::

+ SerializeDocumentWithDownloadedIFrameOnRenderer,

+ base::Unretained(this), file_url));

}

-TEST_F(DomSerializerTests, SubResourceForElementsInNonHTMLNamespace) {

- base::FilePath page_file_path = data_dir_;

- page_file_path = page_file_path.AppendASCII("dom_serializer");

- page_file_path = page_file_path.AppendASCII("non_html_namespace.htm");

+IN_PROC_BROWSER_TEST_F(DomSerializerTests,

+ SubResourceForElementsInNonHTMLNamespace) {

+ base::FilePath page_file_path = GetTestFilePath(

+ "dom_serializer", "non_html_namespace.htm");

GURL file_url = net::FilePathToFileURL(page_file_path);

- LoadPageFromURL(file_url);

- WebFrame* web_frame = FindSubFrameByURL(test_shell_->webView(), file_url);

- ASSERT_TRUE(web_frame != NULL);

- WebDocument doc = web_frame->document();

- WebNode lastNodeInBody = doc.body().lastChild();

- ASSERT_EQ(WebNode::ElementNode, lastNodeInBody.nodeType());

- WebString uri = webkit_glue::GetSubResourceLinkFromElement(

- lastNodeInBody.to<WebElement>());

- EXPECT_TRUE(uri.isNull());

+ NavigateToURL(shell(), file_url);

+ PostTaskToInProcessRendererAndWait(

+ base::Bind(

+ &DomSerializerTests::

+ SubResourceForElementsInNonHTMLNamespaceOnRenderer,

+ base::Unretained(this), file_url));

}

-} // namespace

+} // namespace content

« no previous file with comments | « content/renderer/dom_operations_browsertest.cc ('k') | content/renderer/resource_fetcher_browsertest.cc » ('j') | no next file with comments »