| Index: src/scanner.cc
|
| diff --git a/src/scanner.cc b/src/scanner.cc
|
| index ddcd937584d50fc45fa921a25e2a5d21fcf5697e..1ea5e741f641798edcb4a628d37d9c28a525a98e 100644
|
| --- a/src/scanner.cc
|
| +++ b/src/scanner.cc
|
| @@ -54,7 +54,7 @@ void Scanner::Initialize(Utf16CharacterStream* source) {
|
| }
|
|
|
|
|
| -uc32 Scanner::ScanHexNumber(int expected_length) {
|
| +uc32 Scanner::ScanHexNumber(int expected_length, bool recordRaw) {
|
| DCHECK(expected_length <= 4); // prevent overflow
|
|
|
| uc32 x = 0;
|
| @@ -64,6 +64,9 @@ uc32 Scanner::ScanHexNumber(int expected_length) {
|
| return -1;
|
| }
|
| x = x * 16 + d;
|
| + if (recordRaw) {
|
| + AddRawLiteralChar(c0_);
|
| + }
|
| Advance();
|
| }
|
|
|
| @@ -403,7 +406,9 @@ Token::Value Scanner::ScanHtmlComment() {
|
|
|
| void Scanner::Scan() {
|
| next_.literal_chars = NULL;
|
| + next_.raw_literal_chars = NULL;
|
| Token::Value token;
|
| +
|
| do {
|
| // Remember the position of the next token
|
| next_.location.beg_pos = source_pos();
|
| @@ -626,6 +631,12 @@ void Scanner::Scan() {
|
| token = Select(Token::BIT_NOT);
|
| break;
|
|
|
| + case '`':
|
| + if (HarmonyTemplates()) {
|
| + token = ScanTemplateSpan();
|
| + break;
|
| + }
|
| +
|
| default:
|
| if (c0_ < 0) {
|
| token = Token::EOS;
|
| @@ -671,8 +682,10 @@ void Scanner::SeekForward(int pos) {
|
| }
|
|
|
|
|
| -bool Scanner::ScanEscape() {
|
| +bool Scanner::ScanEscape(bool recordRaw) {
|
| uc32 c = c0_;
|
| + uc32 rc = c;
|
| + bool singleCharEscape = true;
|
| Advance();
|
|
|
| // Skip escaped newlines.
|
| @@ -694,13 +707,17 @@ bool Scanner::ScanEscape() {
|
| case 'r' : c = '\r'; break;
|
| case 't' : c = '\t'; break;
|
| case 'u' : {
|
| - c = ScanHexNumber(4);
|
| + if (recordRaw) AddRawLiteralChar('u');
|
| + singleCharEscape = false;
|
| + c = ScanHexNumber(4, recordRaw);
|
| if (c < 0) return false;
|
| break;
|
| }
|
| case 'v' : c = '\v'; break;
|
| case 'x' : {
|
| - c = ScanHexNumber(2);
|
| + if (recordRaw) AddRawLiteralChar('x');
|
| + singleCharEscape = false;
|
| + c = ScanHexNumber(2, recordRaw);
|
| if (c < 0) return false;
|
| break;
|
| }
|
| @@ -711,12 +728,16 @@ bool Scanner::ScanEscape() {
|
| case '4' : // fall through
|
| case '5' : // fall through
|
| case '6' : // fall through
|
| - case '7' : c = ScanOctalEscape(c, 2); break;
|
| + case '7':
|
| + singleCharEscape = false;
|
| + c = ScanOctalEscape(c, 2, recordRaw);
|
| + break;
|
| }
|
|
|
| // According to ECMA-262, section 7.8.4, characters not covered by the
|
| // above cases should be illegal, but they are commonly handled as
|
| // non-escaped characters by JS VMs.
|
| + if (singleCharEscape && recordRaw) AddRawLiteralChar(rc);
|
| AddLiteralChar(c);
|
| return true;
|
| }
|
| @@ -724,7 +745,7 @@ bool Scanner::ScanEscape() {
|
|
|
| // Octal escapes of the forms '\0xx' and '\xxx' are not a part of
|
| // ECMA-262. Other JS VMs support them.
|
| -uc32 Scanner::ScanOctalEscape(uc32 c, int length) {
|
| +uc32 Scanner::ScanOctalEscape(uc32 c, int length, bool recordRaw) {
|
| uc32 x = c - '0';
|
| int i = 0;
|
| for (; i < length; i++) {
|
| @@ -733,6 +754,9 @@ uc32 Scanner::ScanOctalEscape(uc32 c, int length) {
|
| int nx = x * 8 + d;
|
| if (nx >= 256) break;
|
| x = nx;
|
| + if (recordRaw) {
|
| + AddRawLiteralChar(c0_);
|
| + }
|
| Advance();
|
| }
|
| // Anything except '\0' is an octal escape sequence, illegal in strict mode.
|
| @@ -770,6 +794,87 @@ Token::Value Scanner::ScanString() {
|
| }
|
|
|
|
|
| +Token::Value Scanner::ScanTemplateSpan() {
|
| +  // When scanning a TemplateSpan, we are looking for the following construct:
|
| +  // TEMPLATE_SPAN ::
|
| +  //     ` LiteralChars* ${
|
| +  //   | } LiteralChars* ${
|
| +  //
|
| +  // TEMPLATE_TAIL ::
|
| +  //     ` LiteralChars* `
|
| +  //   | } LiteralChars* `
|
| +  //
|
| +  // A TEMPLATE_SPAN should always be followed by an Expression, while a
|
| +  // TEMPLATE_TAIL terminates a TemplateLiteral and does not need to be
|
| +  // followed by an Expression.
|
| +  //
|
| +  // raw_literal_chars_ represents TRV or the raw value of the template span,
|
| +  // per the spec, while literal_chars_ represents TV or the cooked value of
|
| +  // the template span.
|
| +  //
|
| +  // Returns Token::ILLEGAL for an unterminated span or a malformed escape.
|
| +  // TODO(caitp): Do not store a separate literal buffer for the span TRV.
|
| +
|
| +  if (next_.token == Token::RBRACE) {
|
| +    PushBack('}');  // '}' was already scanned; re-read it as the span start.
|
| +  }
|
| +  next_.location.beg_pos = source_pos();
|
| +  Token::Value result = Token::ILLEGAL;
|
| +  DCHECK(c0_ == '`' || c0_ == '}');
|
| +  Advance();  // Consume ` or }
|
| +
|
| +  LiteralScope literal(this);
|
| +  while (true) {
|
| +    uc32 c = c0_;
|
| +    Advance();
|
| +    if (c == '`') {
|
| +      result = Token::TEMPLATE_TAIL;
|
| +      break;
|
| +    } else if (c == '$' && c0_ == '{') {
|
| +      Advance();  // Consume '{'
|
| +      result = Token::TEMPLATE_SPAN;
|
| +      break;
|
| +    } else if (c == '\\') {
|
| +      AddRawLiteralChar('\\');
|
| +      if (unicode_cache_->IsLineTerminator(c0_)) {
|
| +        // The TV of LineContinuation :: \ LineTerminatorSequence is the empty
|
| +        // code unit sequence. Only one sequence is consumed; its TRV is
|
| +        // 0x000A for <CR> and <CR><LF>, otherwise the terminator itself.
|
| +        uc32 lastChar = c0_;
|
| +        Advance();
|
| +        if (lastChar == '\r' && c0_ == '\n') Advance();
|
| +        AddRawLiteralChar(lastChar == '\r' ? '\n' : lastChar);
|
| +      } else if (c0_ == '0') {
|
| +        Advance();
|
| +        AddRawLiteralChar('0');
|
| +        AddLiteralChar('\0');  // The CV of EscapeSequence :: 0 is <NUL>.
|
| +      } else if (c0_ < 0 || !ScanEscape(true)) {
|
| +        // End of input after '\' or a malformed escape; result stays ILLEGAL.
|
| +        break;
|
| +      }
|
| +    } else if (c < 0) {
|
| +      // Unterminated template literal
|
| +      PushBack(c);
|
| +      break;
|
| +    } else {
|
| +      // The TRV of LineTerminatorSequence :: <CR> is the CV 0x000A.
|
| +      // The TRV of LineTerminatorSequence :: <CR><LF> is the sequence
|
| +      // consisting of the CV 0x000A.
|
| +      if (c == '\r') {
|
| +        if (c0_ == '\n') Advance();
|
| +        c = '\n';
|
| +      }
|
| +      AddLiteralChar(c);
|
| +      AddRawLiteralChar(c);
|
| +    }
|
| +  }
|
| +  literal.Complete();
|
| +  next_.location.end_pos = source_pos();
|
| +  next_.token = result;
|
| +  return result;
|
| +}
|
| +
|
| +
|
| void Scanner::ScanDecimalDigits() {
|
| while (IsDecimalDigit(c0_))
|
| AddLiteralCharAdvance();
|
| @@ -1163,6 +1268,15 @@ const AstRawString* Scanner::CurrentSymbol(AstValueFactory* ast_value_factory) {
|
| }
|
|
|
|
|
| +// Returns the raw literal as an AstRawString obtained from |ast_value_factory|.
|
| +const AstRawString* Scanner::CurrentRawSymbol(
|
| +    AstValueFactory* ast_value_factory) {
|
| +  if (!is_raw_one_byte())
|
| +    return ast_value_factory->GetTwoByteString(raw_two_byte_string());
|
| +  return ast_value_factory->GetOneByteString(raw_one_byte_string());
|
| +}
|
| +
|
| +
|
| const AstRawString* Scanner::NextSymbol(AstValueFactory* ast_value_factory) {
|
| if (is_next_literal_one_byte()) {
|
| return ast_value_factory->GetOneByteString(next_literal_one_byte_string());
|
| @@ -1171,6 +1285,14 @@ const AstRawString* Scanner::NextSymbol(AstValueFactory* ast_value_factory) {
|
| }
|
|
|
|
|
| +// Returns the next raw literal as an AstRawString from |ast_value_factory|.
|
| +const AstRawString* Scanner::NextRawSymbol(AstValueFactory* ast_value_factory) {
|
| +  if (!is_next_raw_one_byte())
|
| +    return ast_value_factory->GetTwoByteString(next_raw_two_byte_string());
|
| +  return ast_value_factory->GetOneByteString(next_raw_one_byte_string());
|
| +}
|
| +
|
| +
|
| double Scanner::DoubleValue() {
|
| DCHECK(is_literal_one_byte());
|
| return StringToDouble(
|
|
|