| OLD | NEW |
| 1 /* | 1 /* |
| 2 * Copyright (C) 2013 Google, Inc. All Rights Reserved. | 2 * Copyright (C) 2013 Google, Inc. All Rights Reserved. |
| 3 * | 3 * |
| 4 * Redistribution and use in source and binary forms, with or without | 4 * Redistribution and use in source and binary forms, with or without |
| 5 * modification, are permitted provided that the following conditions | 5 * modification, are permitted provided that the following conditions |
| 6 * are met: | 6 * are met: |
| 7 * 1. Redistributions of source code must retain the above copyright | 7 * 1. Redistributions of source code must retain the above copyright |
| 8 * notice, this list of conditions and the following disclaimer. | 8 * notice, this list of conditions and the following disclaimer. |
| 9 * 2. Redistributions in binary form must reproduce the above copyright | 9 * 2. Redistributions in binary form must reproduce the above copyright |
| 10 * notice, this list of conditions and the following disclaimer in the | 10 * notice, this list of conditions and the following disclaimer in the |
| (...skipping 74 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 85 // FIXME: This is copied from HTMLElementStack::isMathMLTextIntegrationPoint | 85 // FIXME: This is copied from HTMLElementStack::isMathMLTextIntegrationPoint |
| 86 // and changed to use threadSafeMatch. | 86 // and changed to use threadSafeMatch. |
| 87 const String& tagName = token.data(); | 87 const String& tagName = token.data(); |
| 88 return threadSafeMatch(tagName, MathMLNames::miTag) || | 88 return threadSafeMatch(tagName, MathMLNames::miTag) || |
| 89 threadSafeMatch(tagName, MathMLNames::moTag) || | 89 threadSafeMatch(tagName, MathMLNames::moTag) || |
| 90 threadSafeMatch(tagName, MathMLNames::mnTag) || | 90 threadSafeMatch(tagName, MathMLNames::mnTag) || |
| 91 threadSafeMatch(tagName, MathMLNames::msTag) || | 91 threadSafeMatch(tagName, MathMLNames::msTag) || |
| 92 threadSafeMatch(tagName, MathMLNames::mtextTag); | 92 threadSafeMatch(tagName, MathMLNames::mtextTag); |
| 93 } | 93 } |
| 94 | 94 |
| 95 static bool tokenExitsInSelect(const CompactHTMLToken& token) { |
| 96 // https://html.spec.whatwg.org/#parsing-main-inselect |
| 97 const String& tagName = token.data(); |
| 98 return threadSafeMatch(tagName, inputTag) || |
| 99 threadSafeMatch(tagName, keygenTag) || |
| 100 threadSafeMatch(tagName, textareaTag); |
| 101 } |
| 102 |
| 95 HTMLTreeBuilderSimulator::HTMLTreeBuilderSimulator( | 103 HTMLTreeBuilderSimulator::HTMLTreeBuilderSimulator( |
| 96 const HTMLParserOptions& options) | 104 const HTMLParserOptions& options) |
| 97 : m_options(options) { | 105 : m_options(options), m_inSelectInsertionMode(false) { |
| 98 m_namespaceStack.append(HTML); | 106 m_namespaceStack.append(HTML); |
| 99 } | 107 } |
| 100 | 108 |
| 101 HTMLTreeBuilderSimulator::State HTMLTreeBuilderSimulator::stateFor( | 109 HTMLTreeBuilderSimulator::State HTMLTreeBuilderSimulator::stateFor( |
| 102 HTMLTreeBuilder* treeBuilder) { | 110 HTMLTreeBuilder* treeBuilder) { |
| 103 ASSERT(isMainThread()); | 111 ASSERT(isMainThread()); |
| 104 State namespaceStack; | 112 State namespaceStack; |
| 105 for (HTMLElementStack::ElementRecord* record = | 113 for (HTMLElementStack::ElementRecord* record = |
| 106 treeBuilder->openElements()->topRecord(); | 114 treeBuilder->openElements()->topRecord(); |
| 107 record; record = record->next()) { | 115 record; record = record->next()) { |
| (...skipping 25 matching lines...) Expand all Loading... |
| 133 m_namespaceStack.pop_back(); | 141 m_namespaceStack.pop_back(); |
| 134 if ((m_namespaceStack.last() == SVG && tokenExitsSVG(token)) || | 142 if ((m_namespaceStack.last() == SVG && tokenExitsSVG(token)) || |
| 135 (m_namespaceStack.last() == MathML && tokenExitsMath(token))) | 143 (m_namespaceStack.last() == MathML && tokenExitsMath(token))) |
| 136 m_namespaceStack.append(HTML); | 144 m_namespaceStack.append(HTML); |
| 137 if (!inForeignContent()) { | 145 if (!inForeignContent()) { |
| 138 // FIXME: This is just a copy of Tokenizer::updateStateFor which uses | 146 // FIXME: This is just a copy of Tokenizer::updateStateFor which uses |
| 139 // threadSafeMatches. | 147 // threadSafeMatches. |
| 140 if (threadSafeMatch(tagName, textareaTag) || | 148 if (threadSafeMatch(tagName, textareaTag) || |
| 141 threadSafeMatch(tagName, titleTag)) { | 149 threadSafeMatch(tagName, titleTag)) { |
| 142 tokenizer->setState(HTMLTokenizer::RCDATAState); | 150 tokenizer->setState(HTMLTokenizer::RCDATAState); |
| 143 } else if (threadSafeMatch(tagName, plaintextTag)) { | |
| 144 tokenizer->setState(HTMLTokenizer::PLAINTEXTState); | |
| 145 } else if (threadSafeMatch(tagName, scriptTag)) { | 151 } else if (threadSafeMatch(tagName, scriptTag)) { |
| 146 tokenizer->setState(HTMLTokenizer::ScriptDataState); | 152 tokenizer->setState(HTMLTokenizer::ScriptDataState); |
| 147 simulatedToken = ScriptStart; | 153 simulatedToken = ScriptStart; |
| 148 } else if (threadSafeMatch(tagName, styleTag) || | 154 } else if (!m_inSelectInsertionMode) { |
| 149 threadSafeMatch(tagName, iframeTag) || | 155 // If we're in the "in select" insertion mode, all of these tags are |
| 150 threadSafeMatch(tagName, xmpTag) || | 156 // ignored, so we shouldn't change the tokenizer state: |
| 151 (threadSafeMatch(tagName, noembedTag) && | 157 // https://html.spec.whatwg.org/#parsing-main-inselect |
| 152 m_options.pluginsEnabled) || | 158 if (threadSafeMatch(tagName, plaintextTag) && |
| 153 threadSafeMatch(tagName, noframesTag) || | 159 !m_inSelectInsertionMode) { |
| 154 (threadSafeMatch(tagName, noscriptTag) && | 160 tokenizer->setState(HTMLTokenizer::PLAINTEXTState); |
| 155 m_options.scriptEnabled)) { | 161 } else if (threadSafeMatch(tagName, styleTag) || |
| 156 tokenizer->setState(HTMLTokenizer::RAWTEXTState); | 162 threadSafeMatch(tagName, iframeTag) || |
| 163 threadSafeMatch(tagName, xmpTag) || |
| 164 (threadSafeMatch(tagName, noembedTag) && |
| 165 m_options.pluginsEnabled) || |
| 166 threadSafeMatch(tagName, noframesTag) || |
| 167 (threadSafeMatch(tagName, noscriptTag) && |
| 168 m_options.scriptEnabled)) { |
| 169 tokenizer->setState(HTMLTokenizer::RAWTEXTState); |
| 170 } |
| 171 } |
| 172 |
| 173 // We need to track whether we're in the "in select" insertion mode |
| 174 // in order to determine whether '<plaintext>' will put the tokenizer |
| 175 // into PLAINTEXTState, and whether '<xmp>' and others will consume |
| 176 // textual content. |
| 177 // |
| 178 // https://html.spec.whatwg.org/#parsing-main-inselect |
| 179 if (threadSafeMatch(tagName, selectTag)) { |
| 180 m_inSelectInsertionMode = true; |
| 181 } else if (m_inSelectInsertionMode && tokenExitsInSelect(token)) { |
| 182 m_inSelectInsertionMode = false; |
| 157 } | 183 } |
| 158 } | 184 } |
| 159 } | 185 } |
| 160 | 186 |
| 161 if (token.type() == HTMLToken::EndTag) { | 187 if (token.type() == HTMLToken::EndTag) { |
| 162 const String& tagName = token.data(); | 188 const String& tagName = token.data(); |
| 163 if ((m_namespaceStack.last() == SVG && | 189 if ((m_namespaceStack.last() == SVG && |
| 164 threadSafeMatch(tagName, SVGNames::svgTag)) || | 190 threadSafeMatch(tagName, SVGNames::svgTag)) || |
| 165 (m_namespaceStack.last() == MathML && | 191 (m_namespaceStack.last() == MathML && |
| 166 threadSafeMatch(tagName, MathMLNames::mathTag)) || | 192 threadSafeMatch(tagName, MathMLNames::mathTag)) || |
| 167 (m_namespaceStack.contains(SVG) && m_namespaceStack.last() == HTML && | 193 (m_namespaceStack.contains(SVG) && m_namespaceStack.last() == HTML && |
| 168 tokenExitsSVG(token)) || | 194 tokenExitsSVG(token)) || |
| 169 (m_namespaceStack.contains(MathML) && m_namespaceStack.last() == HTML && | 195 (m_namespaceStack.contains(MathML) && m_namespaceStack.last() == HTML && |
| 170 tokenExitsMath(token))) | 196 tokenExitsMath(token))) { |
| 171 m_namespaceStack.pop_back(); | 197 m_namespaceStack.pop_back(); |
| 198 } |
| 172 if (threadSafeMatch(tagName, scriptTag)) { | 199 if (threadSafeMatch(tagName, scriptTag)) { |
| 173 if (!inForeignContent()) | 200 if (!inForeignContent()) |
| 174 tokenizer->setState(HTMLTokenizer::DataState); | 201 tokenizer->setState(HTMLTokenizer::DataState); |
| 175 return ScriptEnd; | 202 return ScriptEnd; |
| 203 } else if (threadSafeMatch(tagName, selectTag)) { |
| 204 m_inSelectInsertionMode = false; |
| 176 } | 205 } |
| 177 } | 206 } |
| 178 | 207 |
| 179 // FIXME: Also setForceNullCharacterReplacement when in text mode. | 208 // FIXME: Also setForceNullCharacterReplacement when in text mode. |
| 180 tokenizer->setForceNullCharacterReplacement(inForeignContent()); | 209 tokenizer->setForceNullCharacterReplacement(inForeignContent()); |
| 181 tokenizer->setShouldAllowCDATA(inForeignContent()); | 210 tokenizer->setShouldAllowCDATA(inForeignContent()); |
| 182 return simulatedToken; | 211 return simulatedToken; |
| 183 } | 212 } |
| 184 | 213 |
| 185 } // namespace blink | 214 } // namespace blink |
| OLD | NEW |