Source/core/html/parser/HTMLParserIdioms.cpp - Issue 74513003: Moved text decoding to the parser thread

Unified Diff: Source/core/html/parser/HTMLParserIdioms.cpp

Issue 74513003: Moved text decoding to the parser thread (Closed) Base URL: https://chromium.googlesource.com/chromium/blink.git@parserthread_step25

Patch Set: Rebase Created 7 years ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

Index: Source/core/html/parser/HTMLParserIdioms.cpp

diff --git a/Source/core/html/parser/HTMLParserIdioms.cpp b/Source/core/html/parser/HTMLParserIdioms.cpp

index f538c54cc5bfc600db038025427f6b21559c110a..5d24c6acf16ef6b361e52fcc446a452ca58fad8f 100644

--- a/Source/core/html/parser/HTMLParserIdioms.cpp

+++ b/Source/core/html/parser/HTMLParserIdioms.cpp

@@ -25,14 +25,18 @@

#include "config.h"

#include "core/html/parser/HTMLParserIdioms.h"

+#include "HTMLNames.h"

#include <limits>

#include "wtf/MathExtras.h"

#include "wtf/text/AtomicString.h"

#include "wtf/text/StringBuilder.h"

#include "wtf/text/StringHash.h"

+#include "wtf/text/TextEncoding.h"

namespace WebCore {

+using namespace HTMLNames;

template <typename CharType>

static String stripLeadingAndTrailingHTMLSpaces(String string, const CharType* characters, unsigned length)

{

@@ -265,6 +269,92 @@ bool parseHTMLNonNegativeInteger(const String& input, unsigned& value)

return parseHTMLNonNegativeIntegerInternal(start, start + length, value);

}

+static const char charsetString[] = "charset";

+static const size_t charsetLength = sizeof("charset") - 1;

+String extractCharset(const String& value)

+ size_t pos = 0;

+ unsigned length = value.length();

+ while (pos < length) {

+ pos = value.find(charsetString, pos, false);

+ if (pos == kNotFound)

+ break;

+ pos += charsetLength;

+ // Skip whitespace.

+ while (pos < length && value[pos] <= ' ')

+ ++pos;

+ if (value[pos] != '=')

+ continue;

+ ++pos;

+ while (pos < length && value[pos] <= ' ')

+ ++pos;

+ char quoteMark = 0;

+ if (pos < length && (value[pos] == '"' || value[pos] == '\'')) {

+ quoteMark = static_cast<char>(value[pos++]);

+ ASSERT(!(quoteMark & 0x80));

+ }

+ if (pos == length)

+ break;

+ unsigned end = pos;

+ while (end < length && ((quoteMark && value[end] != quoteMark) || (!quoteMark && value[end] > ' ' && value[end] != '"' && value[end] != '\'' && value[end] != ';')))

+ ++end;

+ if (quoteMark && (end == length))

+ break; // Close quote not found.

+ return value.substring(pos, end - pos);

+ }

+ return "";

+enum Mode {

+ None,

+ Charset,

+ Pragma,

+};

+WTF::TextEncoding encodingFromMetaAttributes(const HTMLAttributeList& attributes)

+ bool gotPragma = false;

+ Mode mode = None;

+ String charset;

+ for (HTMLAttributeList::const_iterator iter = attributes.begin(); iter != attributes.end(); ++iter) {

+ const String& attributeName = iter->first;

+ const String& attributeValue = iter->second;

+ if (threadSafeMatch(attributeName, http_equivAttr)) {

+ if (equalIgnoringCase(attributeValue, "content-type"))

+ gotPragma = true;

+ } else if (charset.isEmpty()) {

+ if (threadSafeMatch(attributeName, charsetAttr)) {

+ charset = attributeValue;

+ mode = Charset;

+ } else if (threadSafeMatch(attributeName, contentAttr)) {

+ charset = extractCharset(attributeValue);

+ if (charset.length())

+ mode = Pragma;

+ }

+ if (mode == Charset || (mode == Pragma && gotPragma))

+ return WTF::TextEncoding(stripLeadingAndTrailingHTMLSpaces(charset));

+ return WTF::TextEncoding();

static bool threadSafeEqual(const StringImpl* a, const StringImpl* b)

{

if (a == b)

« no previous file with comments | « Source/core/html/parser/HTMLParserIdioms.h ('k') | Source/core/html/parser/HTMLPreloadScanner.cpp » ('j') | no next file with comments »