OLD | NEW |
1 // Copyright 2006-2008 the V8 project authors. All rights reserved. | 1 // Copyright 2006-2008 the V8 project authors. All rights reserved. |
2 // Redistribution and use in source and binary forms, with or without | 2 // Redistribution and use in source and binary forms, with or without |
3 // modification, are permitted provided that the following conditions are | 3 // modification, are permitted provided that the following conditions are |
4 // met: | 4 // met: |
5 // | 5 // |
6 // * Redistributions of source code must retain the above copyright | 6 // * Redistributions of source code must retain the above copyright |
7 // notice, this list of conditions and the following disclaimer. | 7 // notice, this list of conditions and the following disclaimer. |
8 // * Redistributions in binary form must reproduce the above | 8 // * Redistributions in binary form must reproduce the above |
9 // copyright notice, this list of conditions and the following | 9 // copyright notice, this list of conditions and the following |
10 // disclaimer in the documentation and/or other materials provided | 10 // disclaimer in the documentation and/or other materials provided |
(...skipping 10 matching lines...) Expand all Loading... |
21 // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT | 21 // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT |
22 // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, | 22 // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, |
23 // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY | 23 // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY |
24 // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | 24 // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
25 // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE | 25 // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |
26 // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | 26 // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
27 | 27 |
28 #include "v8.h" | 28 #include "v8.h" |
29 | 29 |
30 #include "ast.h" | 30 #include "ast.h" |
| 31 #include "handles.h" |
31 #include "scanner.h" | 32 #include "scanner.h" |
32 | 33 |
33 namespace v8 { | 34 namespace v8 { |
34 namespace internal { | 35 namespace internal { |
35 | 36 |
36 // ---------------------------------------------------------------------------- | 37 // ---------------------------------------------------------------------------- |
37 // Character predicates | 38 // Character predicates |
38 | 39 |
39 | 40 |
40 unibrow::Predicate<IdentifierStart, 128> Scanner::kIsIdentifierStart; | 41 unibrow::Predicate<IdentifierStart, 128> Scanner::kIsIdentifierStart; |
(...skipping 38 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
79 } | 80 } |
80 ASSERT(pos() <= Capacity()); | 81 ASSERT(pos() <= Capacity()); |
81 } | 82 } |
82 | 83 |
83 | 84 |
84 // ---------------------------------------------------------------------------- | 85 // ---------------------------------------------------------------------------- |
85 // UTF16Buffer | 86 // UTF16Buffer |
86 | 87 |
87 | 88 |
88 UTF16Buffer::UTF16Buffer() | 89 UTF16Buffer::UTF16Buffer() |
89 : pos_(0), size_(0) { } | 90 : pos_(0), end_(Scanner::kNoEndPosition) { } |
90 | |
91 | |
92 Handle<String> UTF16Buffer::SubString(int start, int end) { | |
93 return internal::SubString(data_, start, end); | |
94 } | |
95 | 91 |
96 | 92 |
97 // CharacterStreamUTF16Buffer | 93 // CharacterStreamUTF16Buffer |
98 CharacterStreamUTF16Buffer::CharacterStreamUTF16Buffer() | 94 CharacterStreamUTF16Buffer::CharacterStreamUTF16Buffer() |
99 : pushback_buffer_(0), last_(0), stream_(NULL) { } | 95 : pushback_buffer_(0), last_(0), stream_(NULL) { } |
100 | 96 |
101 | 97 |
102 void CharacterStreamUTF16Buffer::Initialize(Handle<String> data, | 98 void CharacterStreamUTF16Buffer::Initialize(Handle<String> data, |
103 unibrow::CharacterStream* input) { | 99 unibrow::CharacterStream* input, |
104 data_ = data; | 100 int start_position, |
105 pos_ = 0; | 101 int end_position) { |
106 stream_ = input; | 102 stream_ = input; |
| 103 if (start_position > 0) { |
| 104 SeekForward(start_position); |
| 105 } |
| 106 end_ = end_position != Scanner::kNoEndPosition ? end_position : kMaxInt; |
107 } | 107 } |
108 | 108 |
109 | 109 |
110 void CharacterStreamUTF16Buffer::PushBack(uc32 ch) { | 110 void CharacterStreamUTF16Buffer::PushBack(uc32 ch) { |
111 pushback_buffer()->Add(last_); | 111 pushback_buffer()->Add(last_); |
112 last_ = ch; | 112 last_ = ch; |
113 pos_--; | 113 pos_--; |
114 } | 114 } |
115 | 115 |
116 | 116 |
117 uc32 CharacterStreamUTF16Buffer::Advance() { | 117 uc32 CharacterStreamUTF16Buffer::Advance() { |
| 118 ASSERT(end_ != Scanner::kNoEndPosition); |
| 119 ASSERT(end_ >= 0); |
118 // NOTE: It is of importance to Persian / Farsi resources that we do | 120 // NOTE: It is of importance to Persian / Farsi resources that we do |
119 // *not* strip format control characters in the scanner; see | 121 // *not* strip format control characters in the scanner; see |
120 // | 122 // |
121 // https://bugzilla.mozilla.org/show_bug.cgi?id=274152 | 123 // https://bugzilla.mozilla.org/show_bug.cgi?id=274152 |
122 // | 124 // |
123 // So, even though ECMA-262, section 7.1, page 11, dictates that we | 125 // So, even though ECMA-262, section 7.1, page 11, dictates that we |
124 // must remove Unicode format-control characters, we do not. This is | 126 // must remove Unicode format-control characters, we do not. This is |
125 // in line with how IE and SpiderMonkey handles it. | 127 // in line with how IE and SpiderMonkey handles it. |
126 if (!pushback_buffer()->is_empty()) { | 128 if (!pushback_buffer()->is_empty()) { |
127 pos_++; | 129 pos_++; |
128 return last_ = pushback_buffer()->RemoveLast(); | 130 return last_ = pushback_buffer()->RemoveLast(); |
129 } else if (stream_->has_more()) { | 131 } else if (stream_->has_more() && pos_ < end_) { |
130 pos_++; | 132 pos_++; |
131 uc32 next = stream_->GetNext(); | 133 uc32 next = stream_->GetNext(); |
132 return last_ = next; | 134 return last_ = next; |
133 } else { | 135 } else { |
134 // Note: currently the following increment is necessary to avoid a | 136 // Note: currently the following increment is necessary to avoid a |
135 // test-parser problem! | 137 // test-parser problem! |
136 pos_++; | 138 pos_++; |
137 return last_ = static_cast<uc32>(-1); | 139 return last_ = static_cast<uc32>(-1); |
138 } | 140 } |
139 } | 141 } |
140 | 142 |
141 | 143 |
142 void CharacterStreamUTF16Buffer::SeekForward(int pos) { | 144 void CharacterStreamUTF16Buffer::SeekForward(int pos) { |
143 pos_ = pos; | 145 pos_ = pos; |
144 ASSERT(pushback_buffer()->is_empty()); | 146 ASSERT(pushback_buffer()->is_empty()); |
145 stream_->Seek(pos); | 147 stream_->Seek(pos); |
146 } | 148 } |
147 | 149 |
148 | 150 |
149 // TwoByteStringUTF16Buffer | 151 // ExternalStringUTF16Buffer |
150 TwoByteStringUTF16Buffer::TwoByteStringUTF16Buffer() | 152 template <typename StringType, typename CharType> |
| 153 ExternalStringUTF16Buffer<StringType, CharType>::ExternalStringUTF16Buffer() |
151 : raw_data_(NULL) { } | 154 : raw_data_(NULL) { } |
152 | 155 |
153 | 156 |
154 void TwoByteStringUTF16Buffer::Initialize( | 157 template <typename StringType, typename CharType> |
155 Handle<ExternalTwoByteString> data) { | 158 void ExternalStringUTF16Buffer<StringType, CharType>::Initialize( |
| 159 Handle<StringType> data, |
| 160 int start_position, |
| 161 int end_position) { |
156 ASSERT(!data.is_null()); | 162 ASSERT(!data.is_null()); |
| 163 raw_data_ = data->resource()->data(); |
157 | 164 |
158 data_ = data; | 165 ASSERT(end_position <= data->length()); |
159 pos_ = 0; | 166 if (start_position > 0) { |
160 | 167 SeekForward(start_position); |
161 raw_data_ = data->resource()->data(); | 168 } |
162 size_ = data->length(); | 169 end_ = |
| 170 end_position != Scanner::kNoEndPosition ? end_position : data->length(); |
163 } | 171 } |
164 | 172 |
165 | 173 |
166 uc32 TwoByteStringUTF16Buffer::Advance() { | 174 template <typename StringType, typename CharType> |
167 if (pos_ < size_) { | 175 uc32 ExternalStringUTF16Buffer<StringType, CharType>::Advance() { |
| 176 if (pos_ < end_) { |
168 return raw_data_[pos_++]; | 177 return raw_data_[pos_++]; |
169 } else { | 178 } else { |
170 // note: currently the following increment is necessary to avoid a | 179 // note: currently the following increment is necessary to avoid a |
171 // test-parser problem! | 180 // test-parser problem! |
172 pos_++; | 181 pos_++; |
173 return static_cast<uc32>(-1); | 182 return static_cast<uc32>(-1); |
174 } | 183 } |
175 } | 184 } |
176 | 185 |
177 | 186 |
178 void TwoByteStringUTF16Buffer::PushBack(uc32 ch) { | 187 template <typename StringType, typename CharType> |
| 188 void ExternalStringUTF16Buffer<StringType, CharType>::PushBack(uc32 ch) { |
179 pos_--; | 189 pos_--; |
180 ASSERT(pos_ >= Scanner::kCharacterLookaheadBufferSize); | 190 ASSERT(pos_ >= Scanner::kCharacterLookaheadBufferSize); |
181 ASSERT(raw_data_[pos_ - Scanner::kCharacterLookaheadBufferSize] == ch); | 191 ASSERT(raw_data_[pos_ - Scanner::kCharacterLookaheadBufferSize] == ch); |
182 } | 192 } |
183 | 193 |
184 | 194 |
185 void TwoByteStringUTF16Buffer::SeekForward(int pos) { | 195 template <typename StringType, typename CharType> |
| 196 void ExternalStringUTF16Buffer<StringType, CharType>::SeekForward(int pos) { |
186 pos_ = pos; | 197 pos_ = pos; |
187 } | 198 } |
188 | 199 |
189 | 200 |
190 // ---------------------------------------------------------------------------- | 201 // ---------------------------------------------------------------------------- |
191 // Keyword Matcher | 202 // Keyword Matcher |
192 KeywordMatcher::FirstState KeywordMatcher::first_states_[] = { | 203 KeywordMatcher::FirstState KeywordMatcher::first_states_[] = { |
193 { "break", KEYWORD_PREFIX, Token::BREAK }, | 204 { "break", KEYWORD_PREFIX, Token::BREAK }, |
194 { NULL, C, Token::ILLEGAL }, | 205 { NULL, C, Token::ILLEGAL }, |
195 { NULL, D, Token::ILLEGAL }, | 206 { NULL, D, Token::ILLEGAL }, |
(...skipping 124 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
320 } | 331 } |
321 | 332 |
322 | 333 |
323 // ---------------------------------------------------------------------------- | 334 // ---------------------------------------------------------------------------- |
324 // Scanner | 335 // Scanner |
325 | 336 |
326 Scanner::Scanner(ParserMode pre) | 337 Scanner::Scanner(ParserMode pre) |
327 : stack_overflow_(false), is_pre_parsing_(pre == PREPARSE) { } | 338 : stack_overflow_(false), is_pre_parsing_(pre == PREPARSE) { } |
328 | 339 |
329 | 340 |
| 341 void Scanner::Initialize(Handle<String> source, |
| 342 ParserLanguage language) { |
| 343 safe_string_input_buffer_.Reset(source.location()); |
| 344 Init(source, &safe_string_input_buffer_, 0, source->length(), language); |
| 345 } |
| 346 |
| 347 |
| 348 void Scanner::Initialize(Handle<String> source, |
| 349 unibrow::CharacterStream* stream, |
| 350 ParserLanguage language) { |
| 351 Init(source, stream, 0, kNoEndPosition, language); |
| 352 } |
| 353 |
| 354 |
| 355 void Scanner::Initialize(Handle<String> source, |
| 356 int start_position, |
| 357 int end_position, |
| 358 ParserLanguage language) { |
| 359 safe_string_input_buffer_.Reset(source.location()); |
| 360 Init(source, &safe_string_input_buffer_, |
| 361 start_position, end_position, language); |
| 362 } |
| 363 |
| 364 |
330 void Scanner::Init(Handle<String> source, | 365 void Scanner::Init(Handle<String> source, |
331 unibrow::CharacterStream* stream, | 366 unibrow::CharacterStream* stream, |
332 int position, | 367 int start_position, |
| 368 int end_position, |
333 ParserLanguage language) { | 369 ParserLanguage language) { |
334 // Initialize the source buffer. | 370 // Initialize the source buffer. |
335 if (!source.is_null() && StringShape(*source).IsExternalTwoByte()) { | 371 if (!source.is_null() && StringShape(*source).IsExternalTwoByte()) { |
336 two_byte_string_buffer_.Initialize( | 372 two_byte_string_buffer_.Initialize( |
337 Handle<ExternalTwoByteString>::cast(source)); | 373 Handle<ExternalTwoByteString>::cast(source), |
| 374 start_position, |
| 375 end_position); |
338 source_ = &two_byte_string_buffer_; | 376 source_ = &two_byte_string_buffer_; |
| 377 } else if (!source.is_null() && StringShape(*source).IsExternalAscii()) { |
| 378 ascii_string_buffer_.Initialize( |
| 379 Handle<ExternalAsciiString>::cast(source), |
| 380 start_position, |
| 381 end_position); |
| 382 source_ = &ascii_string_buffer_; |
339 } else { | 383 } else { |
340 char_stream_buffer_.Initialize(source, stream); | 384 char_stream_buffer_.Initialize(source, |
| 385 stream, |
| 386 start_position, |
| 387 end_position); |
341 source_ = &char_stream_buffer_; | 388 source_ = &char_stream_buffer_; |
342 } | 389 } |
343 | 390 |
344 position_ = position; | |
345 is_parsing_json_ = (language == JSON); | 391 is_parsing_json_ = (language == JSON); |
346 | 392 |
347 // Set c0_ (one character ahead) | 393 // Set c0_ (one character ahead) |
348 ASSERT(kCharacterLookaheadBufferSize == 1); | 394 ASSERT(kCharacterLookaheadBufferSize == 1); |
349 Advance(); | 395 Advance(); |
350 // Initializer current_ to not refer to a literal buffer. | 396 // Initializer current_ to not refer to a literal buffer. |
351 current_.literal_buffer = NULL; | 397 current_.literal_buffer = NULL; |
352 | 398 |
353 // Skip initial whitespace allowing HTML comment ends just like | 399 // Skip initial whitespace allowing HTML comment ends just like |
354 // after a newline and scan first token. | 400 // after a newline and scan first token. |
355 has_line_terminator_before_next_ = true; | 401 has_line_terminator_before_next_ = true; |
356 SkipWhiteSpace(); | 402 SkipWhiteSpace(); |
357 Scan(); | 403 Scan(); |
358 } | 404 } |
359 | 405 |
360 | 406 |
361 Handle<String> Scanner::SubString(int start, int end) { | |
362 return source_->SubString(start - position_, end - position_); | |
363 } | |
364 | |
365 | |
366 Token::Value Scanner::Next() { | 407 Token::Value Scanner::Next() { |
367 // BUG 1215673: Find a thread safe way to set a stack limit in | 408 // BUG 1215673: Find a thread safe way to set a stack limit in |
368 // pre-parse mode. Otherwise, we cannot safely pre-parse from other | 409 // pre-parse mode. Otherwise, we cannot safely pre-parse from other |
369 // threads. | 410 // threads. |
370 current_ = next_; | 411 current_ = next_; |
371 // Check for stack-overflow before returning any tokens. | 412 // Check for stack-overflow before returning any tokens. |
372 StackLimitCheck check; | 413 StackLimitCheck check; |
373 if (check.HasOverflowed()) { | 414 if (check.HasOverflowed()) { |
374 stack_overflow_ = true; | 415 stack_overflow_ = true; |
375 next_.token = Token::ILLEGAL; | 416 next_.token = Token::ILLEGAL; |
(...skipping 914 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
1290 } | 1331 } |
1291 AddCharAdvance(); | 1332 AddCharAdvance(); |
1292 } | 1333 } |
1293 TerminateLiteral(); | 1334 TerminateLiteral(); |
1294 | 1335 |
1295 next_.location.end_pos = source_pos() - 1; | 1336 next_.location.end_pos = source_pos() - 1; |
1296 return true; | 1337 return true; |
1297 } | 1338 } |
1298 | 1339 |
1299 } } // namespace v8::internal | 1340 } } // namespace v8::internal |
OLD | NEW |