OLD | NEW |
1 // Copyright 2011 the V8 project authors. All rights reserved. | 1 // Copyright 2011 the V8 project authors. All rights reserved. |
2 // Redistribution and use in source and binary forms, with or without | 2 // Redistribution and use in source and binary forms, with or without |
3 // modification, are permitted provided that the following conditions are | 3 // modification, are permitted provided that the following conditions are |
4 // met: | 4 // met: |
5 // | 5 // |
6 // * Redistributions of source code must retain the above copyright | 6 // * Redistributions of source code must retain the above copyright |
7 // notice, this list of conditions and the following disclaimer. | 7 // notice, this list of conditions and the following disclaimer. |
8 // * Redistributions in binary form must reproduce the above | 8 // * Redistributions in binary form must reproduce the above |
9 // copyright notice, this list of conditions and the following | 9 // copyright notice, this list of conditions and the following |
10 // disclaimer in the documentation and/or other materials provided | 10 // disclaimer in the documentation and/or other materials provided |
(...skipping 20 matching lines...) Expand all Loading... |
31 #include "scanner-base.h" | 31 #include "scanner-base.h" |
32 #include "char-predicates-inl.h" | 32 #include "char-predicates-inl.h" |
33 | 33 |
34 namespace v8 { | 34 namespace v8 { |
35 namespace internal { | 35 namespace internal { |
36 | 36 |
37 // ---------------------------------------------------------------------------- | 37 // ---------------------------------------------------------------------------- |
38 // Scanner | 38 // Scanner |
39 | 39 |
40 Scanner::Scanner(UnicodeCache* unicode_cache) | 40 Scanner::Scanner(UnicodeCache* unicode_cache) |
41 : unicode_cache_(unicode_cache), | 41 : unicode_cache_(unicode_cache) { } |
42 octal_pos_(kNoOctalLocation) { } | |
43 | 42 |
44 | 43 |
45 uc32 Scanner::ScanHexEscape(uc32 c, int length) { | 44 uc32 Scanner::ScanHexEscape(uc32 c, int length) { |
46 ASSERT(length <= 4); // prevent overflow | 45 ASSERT(length <= 4); // prevent overflow |
47 | 46 |
48 uc32 digits[4]; | 47 uc32 digits[4]; |
49 uc32 x = 0; | 48 uc32 x = 0; |
50 for (int i = 0; i < length; i++) { | 49 for (int i = 0; i < length; i++) { |
51 digits[i] = c0_; | 50 digits[i] = c0_; |
52 int d = HexValue(c0_); | 51 int d = HexValue(c0_); |
(...skipping 10 matching lines...) Expand all Loading... |
63 return c; | 62 return c; |
64 } | 63 } |
65 x = x * 16 + d; | 64 x = x * 16 + d; |
66 Advance(); | 65 Advance(); |
67 } | 66 } |
68 | 67 |
69 return x; | 68 return x; |
70 } | 69 } |
71 | 70 |
72 | 71 |
73 // Octal escapes of the forms '\0xx' and '\xxx' are not a part of | |
74 // ECMA-262. Other JS VMs support them. | |
75 uc32 Scanner::ScanOctalEscape(uc32 c, int length) { | |
76 uc32 x = c - '0'; | |
77 int i = 0; | |
78 for (; i < length; i++) { | |
79 int d = c0_ - '0'; | |
80 if (d < 0 || d > 7) break; | |
81 int nx = x * 8 + d; | |
82 if (nx >= 256) break; | |
83 x = nx; | |
84 Advance(); | |
85 } | |
86 // Anything excelt '\0' is an octal escape sequence, illegal in strict mode. | |
87 // Remember the position of octal escape sequences so that better error | |
88 // can be reported later (in strict mode). | |
89 if (c != '0' || i > 0) { | |
90 octal_pos_ = source_pos() - i - 1; // Already advanced | |
91 } | |
92 return x; | |
93 } | |
94 | |
95 | 72 |
96 // ---------------------------------------------------------------------------- | 73 // ---------------------------------------------------------------------------- |
97 // JavaScriptScanner | 74 // JavaScriptScanner |
98 | 75 |
99 JavaScriptScanner::JavaScriptScanner(UnicodeCache* scanner_contants) | 76 JavaScriptScanner::JavaScriptScanner(UnicodeCache* scanner_contants) |
100 : Scanner(scanner_contants) { } | 77 : Scanner(scanner_contants), octal_pos_(Location::invalid()) { } |
101 | 78 |
102 | 79 |
103 Token::Value JavaScriptScanner::Next() { | 80 Token::Value JavaScriptScanner::Next() { |
104 current_ = next_; | 81 current_ = next_; |
105 has_line_terminator_before_next_ = false; | 82 has_line_terminator_before_next_ = false; |
106 Scan(); | 83 Scan(); |
107 return current_.token; | 84 return current_.token; |
108 } | 85 } |
109 | 86 |
110 | 87 |
(...skipping 400 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
511 case '7' : c = ScanOctalEscape(c, 2); break; | 488 case '7' : c = ScanOctalEscape(c, 2); break; |
512 } | 489 } |
513 | 490 |
514 // According to ECMA-262, 3rd, 7.8.4 (p 18ff) these | 491 // According to ECMA-262, 3rd, 7.8.4 (p 18ff) these |
515 // should be illegal, but they are commonly handled | 492 // should be illegal, but they are commonly handled |
516 // as non-escaped characters by JS VMs. | 493 // as non-escaped characters by JS VMs. |
517 AddLiteralChar(c); | 494 AddLiteralChar(c); |
518 } | 495 } |
519 | 496 |
520 | 497 |
| 498 // Octal escapes of the forms '\0xx' and '\xxx' are not a part of |
| 499 // ECMA-262. Other JS VMs support them. |
| 500 uc32 JavaScriptScanner::ScanOctalEscape(uc32 c, int length) { |
| 501 uc32 x = c - '0'; |
| 502 int i = 0; |
| 503 for (; i < length; i++) { |
| 504 int d = c0_ - '0'; |
| 505 if (d < 0 || d > 7) break; |
| 506 int nx = x * 8 + d; |
| 507 if (nx >= 256) break; |
| 508 x = nx; |
| 509 Advance(); |
| 510 } |
| 511 // Anything except '\0' is an octal escape sequence, illegal in strict mode. |
| 512 // Remember the position of octal escape sequences so that an error |
| 513 // can be reported later (in strict mode). |
| 514 // We don't report the error immediately, because the octal escape can |
| 515 // occur before the "use strict" directive. |
| 516 if (c != '0' || i > 0) { |
| 517 octal_pos_ = Location(source_pos() - i - 1, source_pos() - 1); |
| 518 } |
| 519 return x; |
| 520 } |
| 521 |
| 522 |
521 Token::Value JavaScriptScanner::ScanString() { | 523 Token::Value JavaScriptScanner::ScanString() { |
522 uc32 quote = c0_; | 524 uc32 quote = c0_; |
523 Advance(); // consume quote | 525 Advance(); // consume quote |
524 | 526 |
525 LiteralScope literal(this); | 527 LiteralScope literal(this); |
526 while (c0_ != quote && c0_ >= 0 | 528 while (c0_ != quote && c0_ >= 0 |
527 && !unicode_cache_->IsLineTerminator(c0_)) { | 529 && !unicode_cache_->IsLineTerminator(c0_)) { |
528 uc32 c = c0_; | 530 uc32 c = c0_; |
529 Advance(); | 531 Advance(); |
530 if (c == '\\') { | 532 if (c == '\\') { |
(...skipping 48 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
579 } else if ('0' <= c0_ && c0_ <= '7') { | 581 } else if ('0' <= c0_ && c0_ <= '7') { |
580 // (possible) octal number | 582 // (possible) octal number |
581 kind = OCTAL; | 583 kind = OCTAL; |
582 while (true) { | 584 while (true) { |
583 if (c0_ == '8' || c0_ == '9') { | 585 if (c0_ == '8' || c0_ == '9') { |
584 kind = DECIMAL; | 586 kind = DECIMAL; |
585 break; | 587 break; |
586 } | 588 } |
587 if (c0_ < '0' || '7' < c0_) { | 589 if (c0_ < '0' || '7' < c0_) { |
588 // Octal literal finished. | 590 // Octal literal finished. |
589 octal_pos_ = next_.location.beg_pos; | 591 octal_pos_ = next_.location; |
590 break; | 592 break; |
591 } | 593 } |
592 AddLiteralCharAdvance(); | 594 AddLiteralCharAdvance(); |
593 } | 595 } |
594 } | 596 } |
595 } | 597 } |
596 | 598 |
597 // Parse decimal digits and allow trailing fractional part. | 599 // Parse decimal digits and allow trailing fractional part. |
598 if (kind == DECIMAL) { | 600 if (kind == DECIMAL) { |
599 ScanDecimalDigits(); // optional | 601 ScanDecimalDigits(); // optional |
(...skipping 122 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
722 AddLiteralCharAdvance(); | 724 AddLiteralCharAdvance(); |
723 if (unicode_cache_->IsLineTerminator(c0_) || c0_ < 0) return false; | 725 if (unicode_cache_->IsLineTerminator(c0_) || c0_ < 0) return false; |
724 AddLiteralCharAdvance(); | 726 AddLiteralCharAdvance(); |
725 // If the escape allows more characters, i.e., \x??, \u????, or \c?, | 727 // If the escape allows more characters, i.e., \x??, \u????, or \c?, |
726 // only "safe" characters are allowed (letters, digits, underscore), | 728 // only "safe" characters are allowed (letters, digits, underscore), |
727 // otherwise the escape isn't valid and the invalid character has | 729 // otherwise the escape isn't valid and the invalid character has |
728 // its normal meaning. I.e., we can just continue scanning without | 730 // its normal meaning. I.e., we can just continue scanning without |
729 // worrying whether the following characters are part of the escape | 731 // worrying whether the following characters are part of the escape |
730 // or not, since any '/', '\\' or '[' is guaranteed to not be part | 732 // or not, since any '/', '\\' or '[' is guaranteed to not be part |
731 // of the escape sequence. | 733 // of the escape sequence. |
| 734 |
| 735 // TODO(896): At some point, parse RegExps more thoroughly to capture |
| 736 // octal escapes in strict mode. |
732 } else { // Unescaped character. | 737 } else { // Unescaped character. |
733 if (c0_ == '[') in_character_class = true; | 738 if (c0_ == '[') in_character_class = true; |
734 if (c0_ == ']') in_character_class = false; | 739 if (c0_ == ']') in_character_class = false; |
735 AddLiteralCharAdvance(); | 740 AddLiteralCharAdvance(); |
736 } | 741 } |
737 } | 742 } |
738 Advance(); // consume '/' | 743 Advance(); // consume '/' |
739 | 744 |
740 literal.Complete(); | 745 literal.Complete(); |
741 | 746 |
(...skipping 195 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
937 if (MatchKeywordStart(input, "with", 1, Token::WITH)) return; | 942 if (MatchKeywordStart(input, "with", 1, Token::WITH)) return; |
938 break; | 943 break; |
939 case UNMATCHABLE: | 944 case UNMATCHABLE: |
940 break; | 945 break; |
941 } | 946 } |
942 // On fallthrough, it's a failure. | 947 // On fallthrough, it's a failure. |
943 state_ = UNMATCHABLE; | 948 state_ = UNMATCHABLE; |
944 } | 949 } |
945 | 950 |
946 } } // namespace v8::internal | 951 } } // namespace v8::internal |
OLD | NEW |