Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(239)

Side by Side Diff: src/json-parser.h

Issue 7020018: Remove scanner abstraction layer from JSON parsing. The change in api.cc is t... (Closed) Base URL: http://v8.googlecode.com/svn/branches/bleeding_edge/
Patch Set: '' Created 9 years, 6 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch | Annotate | Revision Log
« no previous file with comments | « no previous file | src/json-parser.cc » ('j') | src/json-parser.cc » ('J')
Toggle Intra-line Diffs ('i') | Expand Comments ('e') | Collapse Comments ('c') | Show Comments Hide Comments ('s')
OLDNEW
1 // Copyright 2011 the V8 project authors. All rights reserved. 1 // Copyright 2011 the V8 project authors. All rights reserved.
2 // Redistribution and use in source and binary forms, with or without 2 // Redistribution and use in source and binary forms, with or without
3 // modification, are permitted provided that the following conditions are 3 // modification, are permitted provided that the following conditions are
4 // met: 4 // met:
5 // 5 //
6 // * Redistributions of source code must retain the above copyright 6 // * Redistributions of source code must retain the above copyright
7 // notice, this list of conditions and the following disclaimer. 7 // notice, this list of conditions and the following disclaimer.
8 // * Redistributions in binary form must reproduce the above 8 // * Redistributions in binary form must reproduce the above
9 // copyright notice, this list of conditions and the following 9 // copyright notice, this list of conditions and the following
10 // disclaimer in the documentation and/or other materials provided 10 // disclaimer in the documentation and/or other materials provided
(...skipping 29 matching lines...) Expand all
40 return JsonParser().ParseJson(source); 40 return JsonParser().ParseJson(source);
41 } 41 }
42 42
43 static const int kEndOfString = -1; 43 static const int kEndOfString = -1;
44 44
45 private: 45 private:
46 // Parse a string containing a single JSON value. 46 // Parse a string containing a single JSON value.
47 Handle<Object> ParseJson(Handle<String> source); 47 Handle<Object> ParseJson(Handle<String> source);
48 48
49 inline void Advance() { 49 inline void Advance() {
50 if (position_ >= source_length_) { 50 position_++;
51 position_++; 51 if (position_ > source_length_) {
52 c0_ = kEndOfString; 52 c0_ = kEndOfString;
53 } else if (is_sequential_ascii_) { 53 } else if (is_sequential_ascii_) {
Lasse Reichstein 2011/06/01 11:03:58 This was changed?
sandholm 2011/06/01 13:45:20 r8142 ensures this was not changed.
54 position_++;
55 c0_ = seq_source_->SeqAsciiStringGet(position_); 54 c0_ = seq_source_->SeqAsciiStringGet(position_);
56 } else { 55 } else {
57 position_++;
58 c0_ = source_->Get(position_); 56 c0_ = source_->Get(position_);
59 } 57 }
60 } 58 }
61 59
62 inline Isolate* isolate() { return isolate_; } 60 // The JSON lexical grammar is specified in the ECMAScript 5 standard,
61 // section 15.12.1.1. The only allowed whitespace characters between tokens
62 // are tab, carriage-return, newline and space.
63 63
64 // Get the string for the current string token. 64 inline bool AdvanceWS() {
Lasse Reichstein 2011/06/01 11:03:58 Don't abbreviate unless necessary. Call this Advan
sandholm 2011/06/01 13:45:20 Done.
65 Handle<String> GetString(bool hint_symbol); 65 do {
66 Handle<String> GetString(); 66 Advance();
67 Handle<String> GetSymbol(); 67 } while (c0_ == '\t' || c0_ == '\r' || c0_ == '\n' || c0_ == ' ');
68 return true;
Lasse Reichstein 2011/06/01 11:03:58 Why the return true? If it always returns the same
sandholm 2011/06/01 13:45:20 Done.
69 }
68 70
69 // Scan a single JSON token. The JSON lexical grammar is specified in the 71 inline void SkipWS() {
Lasse Reichstein 2011/06/01 11:03:58 And just SkipWhitespace.
sandholm 2011/06/01 13:45:20 Done.
70 // ECMAScript 5 standard, section 15.12.1.1. 72 while (c0_ == '\t' || c0_ == '\r' || c0_ == '\n' || c0_ == ' ') {
71 // Recognizes all of the single-character tokens directly, or calls a function 73 Advance();
72 // to scan a number, string or identifier literal. 74 }
73 // The only allowed whitespace characters between tokens are tab, 75 }
74 // carriage-return, newline and space. 76
75 void ScanJson(); 77 inline uc32 AdvanceGetChar() {
78 Advance();
79 return c0_;
80 }
76 81
77 // A JSON string (production JSONString) is subset of valid JavaScript string 82 // A JSON string (production JSONString) is subset of valid JavaScript string
78 // literals. The string must only be double-quoted (not single-quoted), and 83 // literals. The string must only be double-quoted (not single-quoted), and
79 // the only allowed backslash-escapes are ", /, \, b, f, n, r, t and 84 // the only allowed backslash-escapes are ", /, \, b, f, n, r, t and
80 // four-digit hex escapes (uXXXX). Any other use of backslashes is invalid. 85 // four-digit hex escapes (uXXXX). Any other use of backslashes is invalid.
81 Token::Value ScanJsonString(); 86 Handle<Object> ParseJsonString() {
87 return ScanJsonString<false>();
88 }
89 Handle<Object> ParseJsonSymbol() {
90 return ScanJsonString<true>();
91 }
92 template <bool is_symbol>
93 Handle<Object> ScanJsonString();
82 // Slow version for unicode support, uses the first ascii_count characters, 94 // Slow version for unicode support, uses the first ascii_count characters,
83 // as first part of a ConsString 95 // as first part of a ConsString
84 Token::Value SlowScanJsonString(); 96 Handle<Object> SlowScanJsonString();
85 97
86 // A JSON number (production JSONNumber) is a subset of the valid JavaScript 98 // A JSON number (production JSONNumber) is a subset of the valid JavaScript
87 // decimal number literals. 99 // decimal number literals.
88 // It includes an optional minus sign, must have at least one 100 // It includes an optional minus sign, must have at least one
89 // digit before and after a decimal point, may not have prefixed zeros (unless 101 // digit before and after a decimal point, may not have prefixed zeros (unless
90 // the integer part is zero), and may include an exponent part (e.g., "e-10"). 102 // the integer part is zero), and may include an exponent part (e.g., "e-10").
91 // Hexadecimal and octal numbers are not allowed. 103 // Hexadecimal and octal numbers are not allowed.
92 Token::Value ScanJsonNumber(); 104 Handle<Object> ParseJsonNumber();
93
94 // Used to recognizes one of the literals "true", "false", or "null". These
95 // are the only valid JSON identifiers (productions JSONBooleanLiteral,
96 // JSONNullLiteral).
97 Token::Value ScanJsonIdentifier(const char* text, Token::Value token);
98 105
99 // Parse a single JSON value from input (grammar production JSONValue). 106 // Parse a single JSON value from input (grammar production JSONValue).
100 // A JSON value is either a (double-quoted) string literal, a number literal, 107 // A JSON value is either a (double-quoted) string literal, a number literal,
101 // one of "true", "false", or "null", or an object or array literal. 108 // one of "true", "false", or "null", or an object or array literal.
102 Handle<Object> ParseJsonValue(); 109 Handle<Object> ParseJsonValue();
103 110
104 // Parse a JSON object literal (grammar production JSONObject). 111 // Parse a JSON object literal (grammar production JSONObject).
105 // An object literal is a squiggly-braced and comma separated sequence 112 // An object literal is a squiggly-braced and comma separated sequence
106 // (possibly empty) of key/value pairs, where the key is a JSON string 113 // (possibly empty) of key/value pairs, where the key is a JSON string
107 // literal, the value is a JSON value, and the two are separated by a colon. 114 // literal, the value is a JSON value, and the two are separated by a colon.
108 // A JSON array dosn't allow numbers and identifiers as keys, like a 115 // A JSON array dosn't allow numbers and identifiers as keys, like a
109 // JavaScript array. 116 // JavaScript array.
110 Handle<Object> ParseJsonObject(); 117 Handle<Object> ParseJsonObject();
111 118
112 // Parses a JSON array literal (grammar production JSONArray). An array 119 // Parses a JSON array literal (grammar production JSONArray). An array
113 // literal is a square-bracketed and comma separated sequence (possibly empty) 120 // literal is a square-bracketed and comma separated sequence (possibly empty)
114 // of JSON values. 121 // of JSON values.
115 // A JSON array doesn't allow leaving out values from the sequence, nor does 122 // A JSON array doesn't allow leaving out values from the sequence, nor does
116 // it allow a terminal comma, like a JavaScript array does. 123 // it allow a terminal comma, like a JavaScript array does.
117 Handle<Object> ParseJsonArray(); 124 Handle<Object> ParseJsonArray();
118 125
119 126
120 // Mark that a parsing error has happened at the current token, and 127 // Mark that a parsing error has happened at the current token, and
121 // return a null handle. Primarily for readability. 128 // return a null handle. Primarily for readability.
122 Handle<Object> ReportUnexpectedToken() { return Handle<Object>::null(); } 129 inline Handle<Object> ReportUnexpectedToken() {
130 return Handle<Object>::null();
131 }
123 132
124 // Peek at the next token. 133 inline Isolate* isolate() { return isolate_; }
125 Token::Value Peek() { return next_.token; }
126 // Scan the next token and return the token scanned on the last call.
127 Token::Value Next();
128
129 struct TokenInfo {
130 TokenInfo() : token(Token::ILLEGAL),
131 beg_pos(0),
132 end_pos(0) { }
133 Token::Value token;
134 int beg_pos;
135 int end_pos;
136 };
137 134
138 static const int kInitialSpecialStringSize = 1024; 135 static const int kInitialSpecialStringSize = 1024;
139 136
140 137
141 private: 138 private:
142 Handle<String> source_; 139 Handle<String> source_;
143 int source_length_; 140 int source_length_;
144 Handle<SeqAsciiString> seq_source_; 141 Handle<SeqAsciiString> seq_source_;
145 142
146 bool is_sequential_ascii_; 143 bool is_sequential_ascii_;
147 // Current and next token 144 // begin and end position of scanned string or number
148 TokenInfo current_; 145 int beg_pos_;
149 TokenInfo next_; 146 int end_pos_;
147
150 Isolate* isolate_; 148 Isolate* isolate_;
151 uc32 c0_; 149 uc32 c0_;
152 int position_; 150 int position_;
153 151
154
155 Handle<String> string_val_;
156 double number_; 152 double number_;
157 }; 153 };
158 154
159 } } // namespace v8::internal 155 } } // namespace v8::internal
160 156
161 #endif // V8_JSON_PARSER_H_ 157 #endif // V8_JSON_PARSER_H_
OLDNEW
« no previous file with comments | « no previous file | src/json-parser.cc » ('j') | src/json-parser.cc » ('J')

Powered by Google App Engine
This is Rietveld 408576698