Chromium Code Reviews| Index: src/scanner.cc | 
| diff --git a/src/scanner.cc b/src/scanner.cc | 
| index ddcd937584d50fc45fa921a25e2a5d21fcf5697e..1b489fdbffffa18f3242287935e924a19dcba58e 100644 | 
| --- a/src/scanner.cc | 
| +++ b/src/scanner.cc | 
| @@ -54,7 +54,7 @@ void Scanner::Initialize(Utf16CharacterStream* source) { | 
| } | 
| -uc32 Scanner::ScanHexNumber(int expected_length) { | 
| +uc32 Scanner::ScanHexNumber(int expected_length, bool recordRaw) { | 
| DCHECK(expected_length <= 4); // prevent overflow | 
| uc32 x = 0; | 
| @@ -64,6 +64,9 @@ uc32 Scanner::ScanHexNumber(int expected_length) { | 
| return -1; | 
| } | 
| x = x * 16 + d; | 
| + if (recordRaw) { | 
| + AddRawLiteralChar(c0_); | 
| + } | 
| Advance(); | 
| } | 
| @@ -403,7 +406,9 @@ Token::Value Scanner::ScanHtmlComment() { | 
| void Scanner::Scan() { | 
| next_.literal_chars = NULL; | 
| + next_.raw_literal_chars = NULL; | 
| Token::Value token; | 
| + | 
| do { | 
| // Remember the position of the next token | 
| next_.location.beg_pos = source_pos(); | 
| @@ -626,6 +631,12 @@ void Scanner::Scan() { | 
| token = Select(Token::BIT_NOT); | 
| break; | 
| + case '`': | 
| + if (HarmonyTemplates()) { | 
| + token = ScanTemplateSpan(); | 
| + break; | 
| + } | 
| + | 
| default: | 
| if (c0_ < 0) { | 
| token = Token::EOS; | 
| @@ -671,8 +682,10 @@ void Scanner::SeekForward(int pos) { | 
| } | 
| -bool Scanner::ScanEscape() { | 
| +bool Scanner::ScanEscape(bool recordRaw) { | 
| uc32 c = c0_; | 
| + uc32 rc = c; | 
| + bool singleCharEscape = true; | 
| Advance(); | 
| // Skip escaped newlines. | 
| @@ -694,13 +707,17 @@ bool Scanner::ScanEscape() { | 
| case 'r' : c = '\r'; break; | 
| case 't' : c = '\t'; break; | 
| case 'u' : { | 
| - c = ScanHexNumber(4); | 
| + if (recordRaw) AddRawLiteralChar('u'); | 
| + singleCharEscape = false; | 
| + c = ScanHexNumber(4, recordRaw); | 
| if (c < 0) return false; | 
| break; | 
| } | 
| case 'v' : c = '\v'; break; | 
| case 'x' : { | 
| - c = ScanHexNumber(2); | 
| + if (recordRaw) AddRawLiteralChar('x'); | 
| + singleCharEscape = false; | 
| + c = ScanHexNumber(2, recordRaw); | 
| if (c < 0) return false; | 
| break; | 
| } | 
| @@ -711,12 +728,16 @@ bool Scanner::ScanEscape() { | 
| case '4' : // fall through | 
| case '5' : // fall through | 
| case '6' : // fall through | 
| - case '7' : c = ScanOctalEscape(c, 2); break; | 
| + case '7': | 
| + singleCharEscape = false; | 
| + c = ScanOctalEscape(c, 2, recordRaw); | 
| + break; | 
| } | 
| // According to ECMA-262, section 7.8.4, characters not covered by the | 
| // above cases should be illegal, but they are commonly handled as | 
| // non-escaped characters by JS VMs. | 
| + if (singleCharEscape && recordRaw) AddRawLiteralChar(rc); | 
| AddLiteralChar(c); | 
| return true; | 
| } | 
| @@ -724,7 +745,7 @@ bool Scanner::ScanEscape() { | 
| // Octal escapes of the forms '\0xx' and '\xxx' are not a part of | 
| // ECMA-262. Other JS VMs support them. | 
| -uc32 Scanner::ScanOctalEscape(uc32 c, int length) { | 
| +uc32 Scanner::ScanOctalEscape(uc32 c, int length, bool recordRaw) { | 
| uc32 x = c - '0'; | 
| int i = 0; | 
| for (; i < length; i++) { | 
| @@ -733,6 +754,9 @@ uc32 Scanner::ScanOctalEscape(uc32 c, int length) { | 
| int nx = x * 8 + d; | 
| if (nx >= 256) break; | 
| x = nx; | 
| + if (recordRaw) { | 
| + AddRawLiteralChar(c0_); | 
| + } | 
| Advance(); | 
| } | 
| // Anything except '\0' is an octal escape sequence, illegal in strict mode. | 
| @@ -770,6 +794,87 @@ Token::Value Scanner::ScanString() { | 
| } | 
| +Token::Value Scanner::ScanTemplateSpan() { | 
| + // When scanning a TemplateSpan, we are looking for the following construct: | 
| + // TEMPLATE_SPAN :: | 
| + // ` LiteralChars* ${ | 
| + // | } LiteralChars* ${ | 
| + // | 
| + // TEMPLATE_TAIL :: | 
| + // ` LiteralChars* ` | 
| + // | } LiteralChar* ` | 
| + // | 
| + // A TEMPLATE_SPAN should always be followed by an Expression, while a | 
| + // TEMPLATE_TAIL terminates a TemplateLiteral and does not need to be | 
| + // followed by an Expression. | 
| + // | 
| + // raw_literal_chars_ represents TRV or the raw value of the template span, | 
| + // per the spec, while literal_chars_ represents TV or the cooked value of | 
| + // the template span. | 
| + // | 
| + // TODO(caitp): Do not store a separate literal buffer for the span TRV. | 
| + // | 
| + | 
| + if (next_.token == Token::RBRACE) { | 
| + PushBack('}'); | 
| 
 
marja
2014/11/11 09:47:24
Hmm, when does this happen and why do we PushBack?
 
caitp (gmail)
2014/11/11 13:59:29
After parsing an expression, the scanner ends up w
 
marja
2014/11/11 15:01:56
But after this, we anyway do Advance() right away.
 
 | 
| + } | 
| + next_.location.beg_pos = source_pos(); | 
| + Token::Value result = Token::ILLEGAL; | 
| + DCHECK(c0_ == '`' || c0_ == '}'); | 
| + Advance(); // Consume ` or } | 
| + | 
| + LiteralScope literal(this); | 
| + while (true) { | 
| + uc32 c = c0_; | 
| + Advance(); | 
| + if (c == '`') { | 
| + result = Token::TEMPLATE_TAIL; | 
| + break; | 
| + } else if (c == '$' && c0_ == '{') { | 
| + Advance(); // Consume '{' | 
| + result = Token::TEMPLATE_SPAN; | 
| + break; | 
| + } else if (c == '\\') { | 
| + AddRawLiteralChar('\\'); | 
| + if (unicode_cache_->IsLineTerminator(c0_)) { | 
| + // The TV of LineContinuation :: \ LineTerminatorSequence is the empty | 
| + // code unit sequence. | 
| + do { | 
| + uc32 lastChar = c0_; | 
| + Advance(); | 
| + if (lastChar == '\r' && c0_ == '\n') Advance(); | 
| + AddRawLiteralChar('\n'); | 
| + } while (unicode_cache_->IsLineTerminator(c0_)); | 
| + } else if (c0_ == '0') { | 
| + Advance(); | 
| + AddRawLiteralChar('0'); | 
| + AddLiteralChar('0'); | 
| + } else { | 
| + ScanEscape(true); | 
| + } | 
| + } else if (c < 0) { | 
| + // Unterminated template literal | 
| + PushBack(c); | 
| + break; | 
| + } else { | 
| + // The TRV of LineTerminatorSequence :: <CR> is the CV 0x000A. | 
| + // The TRV of LineTerminatorSequence :: <CR><LF> is the sequence | 
| + // consisting of the CV 0x000A. | 
| + if (c == '\r') { | 
| + if (c0_ == '\n') Advance(); | 
| + c = '\n'; | 
| + } | 
| + AddLiteralChar(c); | 
| + AddRawLiteralChar(c); | 
| + } | 
| + } | 
| + literal.Complete(); | 
| + next_.location.end_pos = source_pos(); | 
| + next_.token = result; | 
| + return result; | 
| +} | 
| + | 
| + | 
| void Scanner::ScanDecimalDigits() { | 
| while (IsDecimalDigit(c0_)) | 
| AddLiteralCharAdvance(); | 
| @@ -1163,6 +1268,15 @@ const AstRawString* Scanner::CurrentSymbol(AstValueFactory* ast_value_factory) { | 
| } | 
| +const AstRawString* Scanner::CurrentRawSymbol( | 
| + AstValueFactory* ast_value_factory) { | 
| + if (is_raw_one_byte()) { | 
| + return ast_value_factory->GetOneByteString(raw_one_byte_string()); | 
| + } | 
| + return ast_value_factory->GetTwoByteString(raw_two_byte_string()); | 
| +} | 
| + | 
| + | 
| const AstRawString* Scanner::NextSymbol(AstValueFactory* ast_value_factory) { | 
| if (is_next_literal_one_byte()) { | 
| return ast_value_factory->GetOneByteString(next_literal_one_byte_string()); | 
| @@ -1171,6 +1285,14 @@ const AstRawString* Scanner::NextSymbol(AstValueFactory* ast_value_factory) { | 
| } | 
| +const AstRawString* Scanner::NextRawSymbol(AstValueFactory* ast_value_factory) { | 
| + if (is_next_raw_one_byte()) { | 
| + return ast_value_factory->GetOneByteString(next_raw_one_byte_string()); | 
| + } | 
| + return ast_value_factory->GetTwoByteString(next_raw_two_byte_string()); | 
| +} | 
| + | 
| + | 
| double Scanner::DoubleValue() { | 
| DCHECK(is_literal_one_byte()); | 
| return StringToDouble( |