| OLD | NEW |
| 1 // Copyright 2011 the V8 project authors. All rights reserved. | 1 // Copyright 2016 the V8 project authors. All rights reserved. |
| 2 // Use of this source code is governed by a BSD-style license that can be | 2 // Use of this source code is governed by a BSD-style license that can be |
| 3 // found in the LICENSE file. | 3 // found in the LICENSE file. |
| 4 | 4 |
| 5 #ifndef V8_JSON_PARSER_H_ | 5 #include "src/json-parser.h" |
| 6 #define V8_JSON_PARSER_H_ | |
| 7 | 6 |
| 8 #include "src/char-predicates.h" | 7 #include "src/char-predicates-inl.h" |
| 9 #include "src/conversions.h" | 8 #include "src/conversions.h" |
| 10 #include "src/debug/debug.h" | 9 #include "src/debug/debug.h" |
| 11 #include "src/factory.h" | 10 #include "src/factory.h" |
| 12 #include "src/field-type.h" | 11 #include "src/field-type.h" |
| 13 #include "src/messages.h" | 12 #include "src/messages.h" |
| 13 #include "src/objects-inl.h" |
| 14 #include "src/parsing/scanner.h" | 14 #include "src/parsing/scanner.h" |
| 15 #include "src/parsing/token.h" | 15 #include "src/parsing/token.h" |
| 16 #include "src/transitions.h" | 16 #include "src/transitions.h" |
| 17 | 17 |
| 18 namespace v8 { | 18 namespace v8 { |
| 19 namespace internal { | 19 namespace internal { |
| 20 | 20 |
| 21 enum ParseElementResult { kElementFound, kElementNotFound, kNullHandle }; | 21 template <bool seq_one_byte> |
| 22 JsonParser<seq_one_byte>::JsonParser(Handle<String> source) |
| 23 : source_(source), |
| 24 source_length_(source->length()), |
| 25 isolate_(source->map()->GetHeap()->isolate()), |
| 26 factory_(isolate_->factory()), |
| 27 zone_(isolate_->allocator()), |
| 28 object_constructor_(isolate_->native_context()->object_function(), |
| 29 isolate_), |
| 30 position_(-1) { |
| 31 source_ = String::Flatten(source_); |
| 32 pretenure_ = (source_length_ >= kPretenureTreshold) ? TENURED : NOT_TENURED; |
| 22 | 33 |
| 23 | 34 // Optimized fast case where we only have Latin1 characters. |
| 24 // A simple json parser. | 35 if (seq_one_byte) { |
| 25 template <bool seq_one_byte> | 36 seq_source_ = Handle<SeqOneByteString>::cast(source_); |
| 26 class JsonParser BASE_EMBEDDED { | |
| 27 public: | |
| 28 MUST_USE_RESULT static MaybeHandle<Object> Parse(Handle<String> source) { | |
| 29 return JsonParser(source).ParseJson(); | |
| 30 } | 37 } |
| 31 | 38 } |
| 32 static const int kEndOfString = -1; | |
| 33 | |
| 34 private: | |
| 35 explicit JsonParser(Handle<String> source) | |
| 36 : source_(source), | |
| 37 source_length_(source->length()), | |
| 38 isolate_(source->map()->GetHeap()->isolate()), | |
| 39 factory_(isolate_->factory()), | |
| 40 zone_(isolate_->allocator()), | |
| 41 object_constructor_(isolate_->native_context()->object_function(), | |
| 42 isolate_), | |
| 43 position_(-1) { | |
| 44 source_ = String::Flatten(source_); | |
| 45 pretenure_ = (source_length_ >= kPretenureTreshold) ? TENURED : NOT_TENURED; | |
| 46 | |
| 47 // Optimized fast case where we only have Latin1 characters. | |
| 48 if (seq_one_byte) { | |
| 49 seq_source_ = Handle<SeqOneByteString>::cast(source_); | |
| 50 } | |
| 51 } | |
| 52 | |
| 53 // Parse a string containing a single JSON value. | |
| 54 MaybeHandle<Object> ParseJson(); | |
| 55 | |
| 56 inline void Advance() { | |
| 57 position_++; | |
| 58 if (position_ >= source_length_) { | |
| 59 c0_ = kEndOfString; | |
| 60 } else if (seq_one_byte) { | |
| 61 c0_ = seq_source_->SeqOneByteStringGet(position_); | |
| 62 } else { | |
| 63 c0_ = source_->Get(position_); | |
| 64 } | |
| 65 } | |
| 66 | |
| 67 // The JSON lexical grammar is specified in the ECMAScript 5 standard, | |
| 68 // section 15.12.1.1. The only allowed whitespace characters between tokens | |
| 69 // are tab, carriage-return, newline and space. | |
| 70 | |
| 71 inline void AdvanceSkipWhitespace() { | |
| 72 do { | |
| 73 Advance(); | |
| 74 } while (c0_ == ' ' || c0_ == '\t' || c0_ == '\n' || c0_ == '\r'); | |
| 75 } | |
| 76 | |
| 77 inline void SkipWhitespace() { | |
| 78 while (c0_ == ' ' || c0_ == '\t' || c0_ == '\n' || c0_ == '\r') { | |
| 79 Advance(); | |
| 80 } | |
| 81 } | |
| 82 | |
| 83 inline uc32 AdvanceGetChar() { | |
| 84 Advance(); | |
| 85 return c0_; | |
| 86 } | |
| 87 | |
| 88 // Checks that the current character is c. | |
| 89 // If so, then consume c and skip whitespace. | |
| 90 inline bool MatchSkipWhiteSpace(uc32 c) { | |
| 91 if (c0_ == c) { | |
| 92 AdvanceSkipWhitespace(); | |
| 93 return true; | |
| 94 } | |
| 95 return false; | |
| 96 } | |
| 97 | |
| 98 // A JSON string (production JSONString) is a subset of valid JavaScript string | |
| 99 // literals. The string must only be double-quoted (not single-quoted), and | |
| 100 // the only allowed backslash-escapes are ", /, \, b, f, n, r, t and | |
| 101 // four-digit hex escapes (uXXXX). Any other use of backslashes is invalid. | |
| 102 Handle<String> ParseJsonString() { | |
| 103 return ScanJsonString<false>(); | |
| 104 } | |
| 105 | |
| 106 bool ParseJsonString(Handle<String> expected) { | |
| 107 int length = expected->length(); | |
| 108 if (source_->length() - position_ - 1 > length) { | |
| 109 DisallowHeapAllocation no_gc; | |
| 110 String::FlatContent content = expected->GetFlatContent(); | |
| 111 if (content.IsOneByte()) { | |
| 112 DCHECK_EQ('"', c0_); | |
| 113 const uint8_t* input_chars = seq_source_->GetChars() + position_ + 1; | |
| 114 const uint8_t* expected_chars = content.ToOneByteVector().start(); | |
| 115 for (int i = 0; i < length; i++) { | |
| 116 uint8_t c0 = input_chars[i]; | |
| 117 if (c0 != expected_chars[i] || c0 == '"' || c0 < 0x20 || c0 == '\\') { | |
| 118 return false; | |
| 119 } | |
| 120 } | |
| 121 if (input_chars[length] == '"') { | |
| 122 position_ = position_ + length + 1; | |
| 123 AdvanceSkipWhitespace(); | |
| 124 return true; | |
| 125 } | |
| 126 } | |
| 127 } | |
| 128 return false; | |
| 129 } | |
| 130 | |
| 131 Handle<String> ParseJsonInternalizedString() { | |
| 132 Handle<String> result = ScanJsonString<true>(); | |
| 133 if (result.is_null()) return result; | |
| 134 return factory()->InternalizeString(result); | |
| 135 } | |
| 136 | |
| 137 template <bool is_internalized> | |
| 138 Handle<String> ScanJsonString(); | |
| 139 // Creates a new string and copies prefix[start..end] into the beginning | |
| 140 // of it. Then scans the rest of the string, adding characters after the | |
| 141 // prefix. Called by ScanJsonString when reaching a '\' or non-Latin1 char. | |
| 142 template <typename StringType, typename SinkChar> | |
| 143 Handle<String> SlowScanJsonString(Handle<String> prefix, int start, int end); | |
| 144 | |
| 145 // A JSON number (production JSONNumber) is a subset of the valid JavaScript | |
| 146 // decimal number literals. | |
| 147 // It includes an optional minus sign, must have at least one | |
| 148 // digit before and after a decimal point, may not have prefixed zeros (unless | |
| 149 // the integer part is zero), and may include an exponent part (e.g., "e-10"). | |
| 150 // Hexadecimal and octal numbers are not allowed. | |
| 151 Handle<Object> ParseJsonNumber(); | |
| 152 | |
| 153 // Parse a single JSON value from input (grammar production JSONValue). | |
| 154 // A JSON value is either a (double-quoted) string literal, a number literal, | |
| 155 // one of "true", "false", or "null", or an object or array literal. | |
| 156 Handle<Object> ParseJsonValue(); | |
| 157 | |
| 158 // Parse a JSON object literal (grammar production JSONObject). | |
| 159 // An object literal is a squiggly-braced and comma separated sequence | |
| 160 // (possibly empty) of key/value pairs, where the key is a JSON string | |
| 161 // literal, the value is a JSON value, and the two are separated by a colon. | |
| 162 // A JSON object doesn't allow numbers and identifiers as keys, like a | |
| 163 // JavaScript object does. | |
| 164 Handle<Object> ParseJsonObject(); | |
| 165 | |
| 166 // Helper for ParseJsonObject. Parses the form "123": obj, which is recorded | |
| 167 // as an element, not a property. | |
| 168 ParseElementResult ParseElement(Handle<JSObject> json_object); | |
| 169 | |
| 170 // Parses a JSON array literal (grammar production JSONArray). An array | |
| 171 // literal is a square-bracketed and comma separated sequence (possibly empty) | |
| 172 // of JSON values. | |
| 173 // A JSON array doesn't allow leaving out values from the sequence, nor does | |
| 174 // it allow a terminal comma, like a JavaScript array does. | |
| 175 Handle<Object> ParseJsonArray(); | |
| 176 | |
| 177 | |
| 178 // Mark that a parsing error has happened at the current token, and | |
| 179 // return a null handle. Primarily for readability. | |
| 180 inline Handle<Object> ReportUnexpectedCharacter() { | |
| 181 return Handle<Object>::null(); | |
| 182 } | |
| 183 | |
| 184 inline Isolate* isolate() { return isolate_; } | |
| 185 inline Factory* factory() { return factory_; } | |
| 186 inline Handle<JSFunction> object_constructor() { return object_constructor_; } | |
| 187 | |
| 188 static const int kInitialSpecialStringLength = 32; | |
| 189 static const int kPretenureTreshold = 100 * 1024; | |
| 190 | |
| 191 | |
| 192 private: | |
| 193 Zone* zone() { return &zone_; } | |
| 194 | |
| 195 void CommitStateToJsonObject(Handle<JSObject> json_object, Handle<Map> map, | |
| 196 ZoneList<Handle<Object> >* properties); | |
| 197 | |
| 198 Handle<String> source_; | |
| 199 int source_length_; | |
| 200 Handle<SeqOneByteString> seq_source_; | |
| 201 | |
| 202 PretenureFlag pretenure_; | |
| 203 Isolate* isolate_; | |
| 204 Factory* factory_; | |
| 205 Zone zone_; | |
| 206 Handle<JSFunction> object_constructor_; | |
| 207 uc32 c0_; | |
| 208 int position_; | |
| 209 }; | |
| 210 | 39 |
| 211 template <bool seq_one_byte> | 40 template <bool seq_one_byte> |
| 212 MaybeHandle<Object> JsonParser<seq_one_byte>::ParseJson() { | 41 MaybeHandle<Object> JsonParser<seq_one_byte>::ParseJson() { |
| 213 // Advance to the first character (possibly EOS) | 42 // Advance to the first character (possibly EOS) |
| 214 AdvanceSkipWhitespace(); | 43 AdvanceSkipWhitespace(); |
| 215 Handle<Object> result = ParseJsonValue(); | 44 Handle<Object> result = ParseJsonValue(); |
| 216 if (result.is_null() || c0_ != kEndOfString) { | 45 if (result.is_null() || c0_ != kEndOfString) { |
| 217 // Some exception (for example stack overflow) is already pending. | 46 // Some exception (for example stack overflow) is already pending. |
| 218 if (isolate_->has_pending_exception()) return Handle<Object>::null(); | 47 if (isolate_->has_pending_exception()) return Handle<Object>::null(); |
| 219 | 48 |
| (...skipping 34 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 254 // We should send a compile error event because we compile the JSON object in | 83 // We should send a compile error event because we compile the JSON object in |
| 255 // a separate source file. | 84 // a separate source file. |
| 256 isolate()->debug()->OnCompileError(script); | 85 isolate()->debug()->OnCompileError(script); |
| 257 MessageLocation location(script, position_, position_ + 1); | 86 MessageLocation location(script, position_, position_ + 1); |
| 258 Handle<Object> error = factory->NewSyntaxError(message, arg1, arg2); | 87 Handle<Object> error = factory->NewSyntaxError(message, arg1, arg2); |
| 259 return isolate()->template Throw<Object>(error, &location); | 88 return isolate()->template Throw<Object>(error, &location); |
| 260 } | 89 } |
| 261 return result; | 90 return result; |
| 262 } | 91 } |
| 263 | 92 |
| 93 template <bool seq_one_byte> |
| 94 void JsonParser<seq_one_byte>::Advance() { |
| 95 position_++; |
| 96 if (position_ >= source_length_) { |
| 97 c0_ = kEndOfString; |
| 98 } else if (seq_one_byte) { |
| 99 c0_ = seq_source_->SeqOneByteStringGet(position_); |
| 100 } else { |
| 101 c0_ = source_->Get(position_); |
| 102 } |
| 103 } |
| 104 |
| 105 template <bool seq_one_byte> |
| 106 void JsonParser<seq_one_byte>::AdvanceSkipWhitespace() { |
| 107 do { |
| 108 Advance(); |
| 109 } while (c0_ == ' ' || c0_ == '\t' || c0_ == '\n' || c0_ == '\r'); |
| 110 } |
| 111 |
| 112 template <bool seq_one_byte> |
| 113 void JsonParser<seq_one_byte>::SkipWhitespace() { |
| 114 while (c0_ == ' ' || c0_ == '\t' || c0_ == '\n' || c0_ == '\r') { |
| 115 Advance(); |
| 116 } |
| 117 } |
| 118 |
| 119 template <bool seq_one_byte> |
| 120 uc32 JsonParser<seq_one_byte>::AdvanceGetChar() { |
| 121 Advance(); |
| 122 return c0_; |
| 123 } |
| 124 |
| 125 template <bool seq_one_byte> |
| 126 bool JsonParser<seq_one_byte>::MatchSkipWhiteSpace(uc32 c) { |
| 127 if (c0_ == c) { |
| 128 AdvanceSkipWhitespace(); |
| 129 return true; |
| 130 } |
| 131 return false; |
| 132 } |
| 133 |
| 134 template <bool seq_one_byte> |
| 135 bool JsonParser<seq_one_byte>::ParseJsonString(Handle<String> expected) { |
| 136 int length = expected->length(); |
| 137 if (source_->length() - position_ - 1 > length) { |
| 138 DisallowHeapAllocation no_gc; |
| 139 String::FlatContent content = expected->GetFlatContent(); |
| 140 if (content.IsOneByte()) { |
| 141 DCHECK_EQ('"', c0_); |
| 142 const uint8_t* input_chars = seq_source_->GetChars() + position_ + 1; |
| 143 const uint8_t* expected_chars = content.ToOneByteVector().start(); |
| 144 for (int i = 0; i < length; i++) { |
| 145 uint8_t c0 = input_chars[i]; |
| 146 if (c0 != expected_chars[i] || c0 == '"' || c0 < 0x20 || c0 == '\\') { |
| 147 return false; |
| 148 } |
| 149 } |
| 150 if (input_chars[length] == '"') { |
| 151 position_ = position_ + length + 1; |
| 152 AdvanceSkipWhitespace(); |
| 153 return true; |
| 154 } |
| 155 } |
| 156 } |
| 157 return false; |
| 158 } |
| 264 | 159 |
| 265 // Parse any JSON value. | 160 // Parse any JSON value. |
| 266 template <bool seq_one_byte> | 161 template <bool seq_one_byte> |
| 267 Handle<Object> JsonParser<seq_one_byte>::ParseJsonValue() { | 162 Handle<Object> JsonParser<seq_one_byte>::ParseJsonValue() { |
| 268 StackLimitCheck stack_check(isolate_); | 163 StackLimitCheck stack_check(isolate_); |
| 269 if (stack_check.HasOverflowed()) { | 164 if (stack_check.HasOverflowed()) { |
| 270 isolate_->StackOverflow(); | 165 isolate_->StackOverflow(); |
| 271 return Handle<Object>::null(); | 166 return Handle<Object>::null(); |
| 272 } | 167 } |
| 273 | 168 |
| (...skipping 27 matching lines...) Expand all Loading... |
| 301 if (AdvanceGetChar() == 'u' && AdvanceGetChar() == 'l' && | 196 if (AdvanceGetChar() == 'u' && AdvanceGetChar() == 'l' && |
| 302 AdvanceGetChar() == 'l') { | 197 AdvanceGetChar() == 'l') { |
| 303 AdvanceSkipWhitespace(); | 198 AdvanceSkipWhitespace(); |
| 304 return factory()->null_value(); | 199 return factory()->null_value(); |
| 305 } | 200 } |
| 306 return ReportUnexpectedCharacter(); | 201 return ReportUnexpectedCharacter(); |
| 307 } | 202 } |
| 308 return ReportUnexpectedCharacter(); | 203 return ReportUnexpectedCharacter(); |
| 309 } | 204 } |
| 310 | 205 |
| 311 | |
| 312 template <bool seq_one_byte> | 206 template <bool seq_one_byte> |
| 313 ParseElementResult JsonParser<seq_one_byte>::ParseElement( | 207 ParseElementResult JsonParser<seq_one_byte>::ParseElement( |
| 314 Handle<JSObject> json_object) { | 208 Handle<JSObject> json_object) { |
| 315 uint32_t index = 0; | 209 uint32_t index = 0; |
| 316 // Maybe an array index, try to parse it. | 210 // Maybe an array index, try to parse it. |
| 317 if (c0_ == '0') { | 211 if (c0_ == '0') { |
| 318 // With a leading zero, the string has to be "0" only to be an index. | 212 // With a leading zero, the string has to be "0" only to be an index. |
| 319 Advance(); | 213 Advance(); |
| 320 } else { | 214 } else { |
| 321 do { | 215 do { |
| (...skipping 152 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 474 Handle<Object> value; | 368 Handle<Object> value; |
| 475 | 369 |
| 476 key = ParseJsonInternalizedString(); | 370 key = ParseJsonInternalizedString(); |
| 477 if (key.is_null() || c0_ != ':') return ReportUnexpectedCharacter(); | 371 if (key.is_null() || c0_ != ':') return ReportUnexpectedCharacter(); |
| 478 | 372 |
| 479 AdvanceSkipWhitespace(); | 373 AdvanceSkipWhitespace(); |
| 480 value = ParseJsonValue(); | 374 value = ParseJsonValue(); |
| 481 if (value.is_null()) return ReportUnexpectedCharacter(); | 375 if (value.is_null()) return ReportUnexpectedCharacter(); |
| 482 | 376 |
| 483 JSObject::DefinePropertyOrElementIgnoreAttributes(json_object, key, | 377 JSObject::DefinePropertyOrElementIgnoreAttributes(json_object, key, |
| 484 value).Check(); | 378 value) |
| 379 .Check(); |
| 485 } | 380 } |
| 486 } | 381 } |
| 487 | 382 |
| 488 if (c0_ != '}') { | 383 if (c0_ != '}') { |
| 489 return ReportUnexpectedCharacter(); | 384 return ReportUnexpectedCharacter(); |
| 490 } | 385 } |
| 491 } | 386 } |
| 492 AdvanceSkipWhitespace(); | 387 AdvanceSkipWhitespace(); |
| 493 return scope.CloseAndEscape(json_object); | 388 return scope.CloseAndEscape(json_object); |
| 494 } | 389 } |
| 495 | 390 |
| 496 | |
| 497 template <bool seq_one_byte> | 391 template <bool seq_one_byte> |
| 498 void JsonParser<seq_one_byte>::CommitStateToJsonObject( | 392 void JsonParser<seq_one_byte>::CommitStateToJsonObject( |
| 499 Handle<JSObject> json_object, Handle<Map> map, | 393 Handle<JSObject> json_object, Handle<Map> map, |
| 500 ZoneList<Handle<Object> >* properties) { | 394 ZoneList<Handle<Object> >* properties) { |
| 501 JSObject::AllocateStorageForMap(json_object, map); | 395 JSObject::AllocateStorageForMap(json_object, map); |
| 502 DCHECK(!json_object->map()->is_dictionary_map()); | 396 DCHECK(!json_object->map()->is_dictionary_map()); |
| 503 | 397 |
| 504 DisallowHeapAllocation no_gc; | 398 DisallowHeapAllocation no_gc; |
| 505 | 399 |
| 506 int length = properties->length(); | 400 int length = properties->length(); |
| 507 for (int i = 0; i < length; i++) { | 401 for (int i = 0; i < length; i++) { |
| 508 Handle<Object> value = (*properties)[i]; | 402 Handle<Object> value = (*properties)[i]; |
| 509 json_object->WriteToField(i, *value); | 403 json_object->WriteToField(i, *value); |
| 510 } | 404 } |
| 511 } | 405 } |
| 512 | 406 |
| 513 | |
| 514 // Parse a JSON array. Position must be right at '['. | 407 // Parse a JSON array. Position must be right at '['. |
| 515 template <bool seq_one_byte> | 408 template <bool seq_one_byte> |
| 516 Handle<Object> JsonParser<seq_one_byte>::ParseJsonArray() { | 409 Handle<Object> JsonParser<seq_one_byte>::ParseJsonArray() { |
| 517 HandleScope scope(isolate()); | 410 HandleScope scope(isolate()); |
| 518 ZoneList<Handle<Object> > elements(4, zone()); | 411 ZoneList<Handle<Object> > elements(4, zone()); |
| 519 DCHECK_EQ(c0_, '['); | 412 DCHECK_EQ(c0_, '['); |
| 520 | 413 |
| 521 AdvanceSkipWhitespace(); | 414 AdvanceSkipWhitespace(); |
| 522 if (c0_ != ']') { | 415 if (c0_ != ']') { |
| 523 do { | 416 do { |
| (...skipping 10 matching lines...) Expand all Loading... |
| 534 Handle<FixedArray> fast_elements = | 427 Handle<FixedArray> fast_elements = |
| 535 factory()->NewFixedArray(elements.length(), pretenure_); | 428 factory()->NewFixedArray(elements.length(), pretenure_); |
| 536 for (int i = 0, n = elements.length(); i < n; i++) { | 429 for (int i = 0, n = elements.length(); i < n; i++) { |
| 537 fast_elements->set(i, *elements[i]); | 430 fast_elements->set(i, *elements[i]); |
| 538 } | 431 } |
| 539 Handle<Object> json_array = factory()->NewJSArrayWithElements( | 432 Handle<Object> json_array = factory()->NewJSArrayWithElements( |
| 540 fast_elements, FAST_ELEMENTS, pretenure_); | 433 fast_elements, FAST_ELEMENTS, pretenure_); |
| 541 return scope.CloseAndEscape(json_array); | 434 return scope.CloseAndEscape(json_array); |
| 542 } | 435 } |
| 543 | 436 |
| 544 | |
| 545 template <bool seq_one_byte> | 437 template <bool seq_one_byte> |
| 546 Handle<Object> JsonParser<seq_one_byte>::ParseJsonNumber() { | 438 Handle<Object> JsonParser<seq_one_byte>::ParseJsonNumber() { |
| 547 bool negative = false; | 439 bool negative = false; |
| 548 int beg_pos = position_; | 440 int beg_pos = position_; |
| 549 if (c0_ == '-') { | 441 if (c0_ == '-') { |
| 550 Advance(); | 442 Advance(); |
| 551 negative = true; | 443 negative = true; |
| 552 } | 444 } |
| 553 if (c0_ == '0') { | 445 if (c0_ == '0') { |
| 554 Advance(); | 446 Advance(); |
| (...skipping 25 matching lines...) Expand all Loading... |
| 580 Advance(); | 472 Advance(); |
| 581 if (c0_ == '-' || c0_ == '+') Advance(); | 473 if (c0_ == '-' || c0_ == '+') Advance(); |
| 582 if (!IsDecimalDigit(c0_)) return ReportUnexpectedCharacter(); | 474 if (!IsDecimalDigit(c0_)) return ReportUnexpectedCharacter(); |
| 583 do { | 475 do { |
| 584 Advance(); | 476 Advance(); |
| 585 } while (IsDecimalDigit(c0_)); | 477 } while (IsDecimalDigit(c0_)); |
| 586 } | 478 } |
| 587 int length = position_ - beg_pos; | 479 int length = position_ - beg_pos; |
| 588 double number; | 480 double number; |
| 589 if (seq_one_byte) { | 481 if (seq_one_byte) { |
| 590 Vector<const uint8_t> chars(seq_source_->GetChars() + beg_pos, length); | 482 Vector<const uint8_t> chars(seq_source_->GetChars() + beg_pos, length); |
| 591 number = StringToDouble(isolate()->unicode_cache(), chars, | 483 number = StringToDouble(isolate()->unicode_cache(), chars, |
| 592 NO_FLAGS, // Hex, octal or trailing junk. | 484 NO_FLAGS, // Hex, octal or trailing junk. |
| 593 std::numeric_limits<double>::quiet_NaN()); | 485 std::numeric_limits<double>::quiet_NaN()); |
| 594 } else { | 486 } else { |
| 595 Vector<uint8_t> buffer = Vector<uint8_t>::New(length); | 487 Vector<uint8_t> buffer = Vector<uint8_t>::New(length); |
| 596 String::WriteToFlat(*source_, buffer.start(), beg_pos, position_); | 488 String::WriteToFlat(*source_, buffer.start(), beg_pos, position_); |
| 597 Vector<const uint8_t> result = | 489 Vector<const uint8_t> result = |
| 598 Vector<const uint8_t>(buffer.start(), length); | 490 Vector<const uint8_t>(buffer.start(), length); |
| 599 number = StringToDouble(isolate()->unicode_cache(), | 491 number = StringToDouble(isolate()->unicode_cache(), result, |
| 600 result, | |
| 601 NO_FLAGS, // Hex, octal or trailing junk. | 492 NO_FLAGS, // Hex, octal or trailing junk. |
| 602 0.0); | 493 0.0); |
| 603 buffer.Dispose(); | 494 buffer.Dispose(); |
| 604 } | 495 } |
| 605 SkipWhitespace(); | 496 SkipWhitespace(); |
| 606 return factory()->NewNumber(number, pretenure_); | 497 return factory()->NewNumber(number, pretenure_); |
| 607 } | 498 } |
| 608 | 499 |
| 609 | |
| 610 template <typename StringType> | 500 template <typename StringType> |
| 611 inline void SeqStringSet(Handle<StringType> seq_str, int i, uc32 c); | 501 inline void SeqStringSet(Handle<StringType> seq_str, int i, uc32 c); |
| 612 | 502 |
| 613 template <> | 503 template <> |
| 614 inline void SeqStringSet(Handle<SeqTwoByteString> seq_str, int i, uc32 c) { | 504 inline void SeqStringSet(Handle<SeqTwoByteString> seq_str, int i, uc32 c) { |
| 615 seq_str->SeqTwoByteStringSet(i, c); | 505 seq_str->SeqTwoByteStringSet(i, c); |
| 616 } | 506 } |
| 617 | 507 |
| 618 template <> | 508 template <> |
| 619 inline void SeqStringSet(Handle<SeqOneByteString> seq_str, int i, uc32 c) { | 509 inline void SeqStringSet(Handle<SeqOneByteString> seq_str, int i, uc32 c) { |
| 620 seq_str->SeqOneByteStringSet(i, c); | 510 seq_str->SeqOneByteStringSet(i, c); |
| 621 } | 511 } |
| 622 | 512 |
| 623 template <typename StringType> | 513 template <typename StringType> |
| 624 inline Handle<StringType> NewRawString(Factory* factory, | 514 inline Handle<StringType> NewRawString(Factory* factory, int length, |
| 625 int length, | |
| 626 PretenureFlag pretenure); | 515 PretenureFlag pretenure); |
| 627 | 516 |
| 628 template <> | 517 template <> |
| 629 inline Handle<SeqTwoByteString> NewRawString(Factory* factory, | 518 inline Handle<SeqTwoByteString> NewRawString(Factory* factory, int length, |
| 630 int length, | |
| 631 PretenureFlag pretenure) { | 519 PretenureFlag pretenure) { |
| 632 return factory->NewRawTwoByteString(length, pretenure).ToHandleChecked(); | 520 return factory->NewRawTwoByteString(length, pretenure).ToHandleChecked(); |
| 633 } | 521 } |
| 634 | 522 |
| 635 template <> | 523 template <> |
| 636 inline Handle<SeqOneByteString> NewRawString(Factory* factory, | 524 inline Handle<SeqOneByteString> NewRawString(Factory* factory, int length, |
| 637 int length, | 525 PretenureFlag pretenure) { |
| 638 PretenureFlag pretenure) { | |
| 639 return factory->NewRawOneByteString(length, pretenure).ToHandleChecked(); | 526 return factory->NewRawOneByteString(length, pretenure).ToHandleChecked(); |
| 640 } | 527 } |
| 641 | 528 |
| 642 | |
| 643 // Scans the rest of a JSON string starting from position_ and writes | 529 // Scans the rest of a JSON string starting from position_ and writes |
| 644 // prefix[start..end] along with the scanned characters into a | 530 // prefix[start..end] along with the scanned characters into a |
| 645 // sequential string of type StringType. | 531 // sequential string of type StringType. |
| 646 template <bool seq_one_byte> | 532 template <bool seq_one_byte> |
| 647 template <typename StringType, typename SinkChar> | 533 template <typename StringType, typename SinkChar> |
| 648 Handle<String> JsonParser<seq_one_byte>::SlowScanJsonString( | 534 Handle<String> JsonParser<seq_one_byte>::SlowScanJsonString( |
| 649 Handle<String> prefix, int start, int end) { | 535 Handle<String> prefix, int start, int end) { |
| 650 int count = end - start; | 536 int count = end - start; |
| 651 int max_length = count + source_length_ - position_; | 537 int max_length = count + source_length_ - position_; |
| 652 int length = Min(max_length, Max(kInitialSpecialStringLength, 2 * count)); | 538 int length = Min(max_length, Max(kInitialSpecialStringLength, 2 * count)); |
| (...skipping 58 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 711 } | 597 } |
| 712 if (sizeof(SinkChar) == kUC16Size || | 598 if (sizeof(SinkChar) == kUC16Size || |
| 713 value <= String::kMaxOneByteCharCode) { | 599 value <= String::kMaxOneByteCharCode) { |
| 714 SeqStringSet(seq_string, count++, value); | 600 SeqStringSet(seq_string, count++, value); |
| 715 break; | 601 break; |
| 716 } else { | 602 } else { |
| 717 // StringType is SeqOneByteString and we just read a non-Latin1 | 603 // StringType is SeqOneByteString and we just read a non-Latin1 |
| 718 // char. | 604 // char. |
| 719 position_ -= 6; // Rewind position_ to \ in \uxxxx. | 605 position_ -= 6; // Rewind position_ to \ in \uxxxx. |
| 720 Advance(); | 606 Advance(); |
| 721 return SlowScanJsonString<SeqTwoByteString, uc16>(seq_string, | 607 return SlowScanJsonString<SeqTwoByteString, uc16>(seq_string, 0, |
| 722 0, | |
| 723 count); | 608 count); |
| 724 } | 609 } |
| 725 } | 610 } |
| 726 default: | 611 default: |
| 727 return Handle<String>::null(); | 612 return Handle<String>::null(); |
| 728 } | 613 } |
| 729 Advance(); | 614 Advance(); |
| 730 } | 615 } |
| 731 } | 616 } |
| 732 | 617 |
| 733 DCHECK_EQ('"', c0_); | 618 DCHECK_EQ('"', c0_); |
| 734 // Advance past the last '"'. | 619 // Advance past the last '"'. |
| 735 AdvanceSkipWhitespace(); | 620 AdvanceSkipWhitespace(); |
| 736 | 621 |
| 737 // Shrink seq_string length to count and return. | 622 // Shrink seq_string length to count and return. |
| 738 return SeqString::Truncate(seq_string, count); | 623 return SeqString::Truncate(seq_string, count); |
| 739 } | 624 } |
| 740 | 625 |
| 741 | |
| 742 template <bool seq_one_byte> | 626 template <bool seq_one_byte> |
| 743 template <bool is_internalized> | 627 template <bool is_internalized> |
| 744 Handle<String> JsonParser<seq_one_byte>::ScanJsonString() { | 628 Handle<String> JsonParser<seq_one_byte>::ScanJsonString() { |
| 745 DCHECK_EQ('"', c0_); | 629 DCHECK_EQ('"', c0_); |
| 746 Advance(); | 630 Advance(); |
| 747 if (c0_ == '"') { | 631 if (c0_ == '"') { |
| 748 AdvanceSkipWhitespace(); | 632 AdvanceSkipWhitespace(); |
| 749 return factory()->empty_string(); | 633 return factory()->empty_string(); |
| 750 } | 634 } |
| 751 | 635 |
| 752 if (seq_one_byte && is_internalized) { | 636 if (seq_one_byte && is_internalized) { |
| 753 // Fast path for existing internalized strings. If the string being | 637 // Fast path for existing internalized strings. If the string being |
| 754 // parsed is not a known internalized string, contains backslashes or | 638 // parsed is not a known internalized string, contains backslashes or |
| 755 // unexpectedly reaches the end of string, return with an empty handle. | 639 // unexpectedly reaches the end of string, return with an empty handle. |
| 756 uint32_t running_hash = isolate()->heap()->HashSeed(); | 640 uint32_t running_hash = isolate()->heap()->HashSeed(); |
| 757 int position = position_; | 641 int position = position_; |
| 758 uc32 c0 = c0_; | 642 uc32 c0 = c0_; |
| 759 do { | 643 do { |
| 760 if (c0 == '\\') { | 644 if (c0 == '\\') { |
| 761 c0_ = c0; | 645 c0_ = c0; |
| 762 int beg_pos = position_; | 646 int beg_pos = position_; |
| 763 position_ = position; | 647 position_ = position; |
| 764 return SlowScanJsonString<SeqOneByteString, uint8_t>(source_, | 648 return SlowScanJsonString<SeqOneByteString, uint8_t>(source_, beg_pos, |
| 765 beg_pos, | |
| 766 position_); | 649 position_); |
| 767 } | 650 } |
| 768 if (c0 < 0x20) return Handle<String>::null(); | 651 if (c0 < 0x20) return Handle<String>::null(); |
| 769 running_hash = StringHasher::AddCharacterCore(running_hash, | 652 running_hash = StringHasher::AddCharacterCore(running_hash, |
| 770 static_cast<uint16_t>(c0)); | 653 static_cast<uint16_t>(c0)); |
| 771 position++; | 654 position++; |
| 772 if (position >= source_length_) return Handle<String>::null(); | 655 if (position >= source_length_) return Handle<String>::null(); |
| 773 c0 = seq_source_->SeqOneByteStringGet(position); | 656 c0 = seq_source_->SeqOneByteStringGet(position); |
| 774 } while (c0 != '"'); | 657 } while (c0 != '"'); |
| 775 int length = position - position_; | 658 int length = position - position_; |
| 776 uint32_t hash = (length <= String::kMaxHashCalcLength) | 659 uint32_t hash = (length <= String::kMaxHashCalcLength) |
| 777 ? StringHasher::GetHashCore(running_hash) | 660 ? StringHasher::GetHashCore(running_hash) |
| 778 : static_cast<uint32_t>(length); | 661 : static_cast<uint32_t>(length); |
| 779 Vector<const uint8_t> string_vector( | 662 Vector<const uint8_t> string_vector(seq_source_->GetChars() + position_, |
| 780 seq_source_->GetChars() + position_, length); | 663 length); |
| 781 StringTable* string_table = isolate()->heap()->string_table(); | 664 StringTable* string_table = isolate()->heap()->string_table(); |
| 782 uint32_t capacity = string_table->Capacity(); | 665 uint32_t capacity = string_table->Capacity(); |
| 783 uint32_t entry = StringTable::FirstProbe(hash, capacity); | 666 uint32_t entry = StringTable::FirstProbe(hash, capacity); |
| 784 uint32_t count = 1; | 667 uint32_t count = 1; |
| 785 Handle<String> result; | 668 Handle<String> result; |
| 786 while (true) { | 669 while (true) { |
| 787 Object* element = string_table->KeyAt(entry); | 670 Object* element = string_table->KeyAt(entry); |
| 788 if (element == isolate()->heap()->undefined_value()) { | 671 if (element == isolate()->heap()->undefined_value()) { |
| 789 // Lookup failure. | 672 // Lookup failure. |
| 790 result = factory()->InternalizeOneByteString( | 673 result = |
| 791 seq_source_, position_, length); | 674 factory()->InternalizeOneByteString(seq_source_, position_, length); |
| 792 break; | 675 break; |
| 793 } | 676 } |
| 794 if (element != isolate()->heap()->the_hole_value() && | 677 if (element != isolate()->heap()->the_hole_value() && |
| 795 String::cast(element)->IsOneByteEqualTo(string_vector)) { | 678 String::cast(element)->IsOneByteEqualTo(string_vector)) { |
| 796 result = Handle<String>(String::cast(element), isolate()); | 679 result = Handle<String>(String::cast(element), isolate()); |
| 797 #ifdef DEBUG | 680 #ifdef DEBUG |
| 798 uint32_t hash_field = | 681 uint32_t hash_field = |
| 799 (hash << String::kHashShift) | String::kIsNotArrayIndexMask; | 682 (hash << String::kHashShift) | String::kIsNotArrayIndexMask; |
| 800 DCHECK_EQ(static_cast<int>(result->Hash()), | 683 DCHECK_EQ(static_cast<int>(result->Hash()), |
| 801 static_cast<int>(hash_field >> String::kHashShift)); | 684 static_cast<int>(hash_field >> String::kHashShift)); |
| (...skipping 10 matching lines...) Expand all Loading... |
| 812 | 695 |
| 813 int beg_pos = position_; | 696 int beg_pos = position_; |
| 814 // Fast case for Latin1 only without escape characters. | 697 // Fast case for Latin1 only without escape characters. |
| 815 do { | 698 do { |
| 816 // Check for control character (0x00-0x1f) or unterminated string (<0). | 699 // Check for control character (0x00-0x1f) or unterminated string (<0). |
| 817 if (c0_ < 0x20) return Handle<String>::null(); | 700 if (c0_ < 0x20) return Handle<String>::null(); |
| 818 if (c0_ != '\\') { | 701 if (c0_ != '\\') { |
| 819 if (seq_one_byte || c0_ <= String::kMaxOneByteCharCode) { | 702 if (seq_one_byte || c0_ <= String::kMaxOneByteCharCode) { |
| 820 Advance(); | 703 Advance(); |
| 821 } else { | 704 } else { |
| 822 return SlowScanJsonString<SeqTwoByteString, uc16>(source_, | 705 return SlowScanJsonString<SeqTwoByteString, uc16>(source_, beg_pos, |
| 823 beg_pos, | |
| 824 position_); | 706 position_); |
| 825 } | 707 } |
| 826 } else { | 708 } else { |
| 827 return SlowScanJsonString<SeqOneByteString, uint8_t>(source_, | 709 return SlowScanJsonString<SeqOneByteString, uint8_t>(source_, beg_pos, |
| 828 beg_pos, | |
| 829 position_); | 710 position_); |
| 830 } | 711 } |
| 831 } while (c0_ != '"'); | 712 } while (c0_ != '"'); |
| 832 int length = position_ - beg_pos; | 713 int length = position_ - beg_pos; |
| 833 Handle<String> result = | 714 Handle<String> result = |
| 834 factory()->NewRawOneByteString(length, pretenure_).ToHandleChecked(); | 715 factory()->NewRawOneByteString(length, pretenure_).ToHandleChecked(); |
| 835 uint8_t* dest = SeqOneByteString::cast(*result)->GetChars(); | 716 uint8_t* dest = SeqOneByteString::cast(*result)->GetChars(); |
| 836 String::WriteToFlat(*source_, dest, beg_pos, position_); | 717 String::WriteToFlat(*source_, dest, beg_pos, position_); |
| 837 | 718 |
| 838 DCHECK_EQ('"', c0_); | 719 DCHECK_EQ('"', c0_); |
| 839 // Advance past the last '"'. | 720 // Advance past the last '"'. |
| 840 AdvanceSkipWhitespace(); | 721 AdvanceSkipWhitespace(); |
| 841 return result; | 722 return result; |
| 842 } | 723 } |
| 843 | 724 |
| 725 // Explicit instantiation. |
| 726 template class JsonParser<true>; |
| 727 template class JsonParser<false>; |
| 728 |
| 844 } // namespace internal | 729 } // namespace internal |
| 845 } // namespace v8 | 730 } // namespace v8 |
| 846 | |
| 847 #endif // V8_JSON_PARSER_H_ | |
| OLD | NEW |