| Index: src/scanner.cc
|
| diff --git a/src/scanner.cc b/src/scanner.cc
|
| index 8b7cb569bddeb63d940b2a32b1cd791c1be51411..26f840b23a5914e9e5d52c207d5f9ed904e15a9d 100644
|
| --- a/src/scanner.cc
|
| +++ b/src/scanner.cc
|
| @@ -27,10 +27,14 @@
|
|
|
| // Features shared by parsing and pre-parsing scanners.
|
|
|
| +#include <cmath>
|
| +
|
| #include "scanner.h"
|
|
|
| #include "../include/v8stdint.h"
|
| #include "char-predicates-inl.h"
|
| +#include "conversions-inl.h"
|
| +#include "list-inl.h"
|
|
|
| namespace v8 {
|
| namespace internal {
|
| @@ -1108,4 +1112,140 @@ bool Scanner::ScanRegExpFlags() {
|
| return true;
|
| }
|
|
|
| +
|
| +// Records an ASCII symbol: reinterprets the characters of |key| as raw bytes
|
| +// and forwards them to AddSymbol with the ASCII flag set. Returns whatever
|
| +// AddSymbol returns.
|
| +int DuplicateFinder::AddAsciiSymbol(Vector<const char> key, int value) {
|
| +  const bool is_ascii = true;
|
| +  Vector<const byte> raw_bytes = Vector<const byte>::cast(key);
|
| +  return AddSymbol(raw_bytes, is_ascii, value);
|
| +}
|
| +
|
| +
|
| +// Records a UTF-16 symbol: reinterprets the code units of |key| as raw bytes
|
| +// and forwards them to AddSymbol with the ASCII flag cleared. Returns
|
| +// whatever AddSymbol returns.
|
| +int DuplicateFinder::AddUtf16Symbol(Vector<const uint16_t> key, int value) {
|
| +  const bool is_ascii = false;
|
| +  Vector<const byte> raw_bytes = Vector<const byte>::cast(key);
|
| +  return AddSymbol(raw_bytes, is_ascii, value);
|
| +}
|
| +
|
| +
|
| +// Looks up |key| (tagged with |is_ascii|) in map_ and ORs |value| into the
|
| +// integer stored for it. Returns the integer that was stored before this
|
| +// call, so the caller can see which bits had already been recorded.
|
| +// NOTE(review): the `true` passed to Lookup presumably requests insertion of
|
| +// a missing entry with a null value (i.e. an old value of 0) - confirm
|
| +// against HashMap.
|
| +int DuplicateFinder::AddSymbol(Vector<const byte> key,
|
| +                               bool is_ascii,
|
| +                               int value) {
|
| +  const uint32_t hash = Hash(key, is_ascii);
|
| +  // The key is copied into the backing store before the lookup; the map is
|
| +  // handed the pointer to that copy.
|
| +  byte* const encoding = BackupKey(key, is_ascii);
|
| +  HashMap::Entry* const entry = map_.Lookup(encoding, hash, true);
|
| +  // The entry's void* slot is used to carry a plain integer.
|
| +  const intptr_t stored = reinterpret_cast<intptr_t>(entry->value);
|
| +  const int old_value = static_cast<int>(stored);
|
| +  const intptr_t merged = static_cast<intptr_t>(value | old_value);
|
| +  entry->value = reinterpret_cast<void*>(merged);
|
| +  return old_value;
|
| +}
|
| +
|
| +
|
| +// Records a numeric literal. A literal that IsNumberCanonical accepts is
|
| +// stored verbatim as an ASCII symbol; any other literal is parsed to a double
|
| +// and stored under the text produced for that double, so that different
|
| +// spellings of one number share a key. Returns the result of the underlying
|
| +// AddAsciiSymbol/AddSymbol call.
|
| +int DuplicateFinder::AddNumber(Vector<const char> key, int value) {
|
| +  ASSERT(key.length() > 0);
|
| +  // Fast path: the literal is already in canonical form.
|
| +  if (IsNumberCanonical(key)) {
|
| +    return AddAsciiSymbol(key, value);
|
| +  }
|
| +
|
| +  const int flags =
|
| +      ALLOW_HEX | ALLOW_OCTAL | ALLOW_IMPLICIT_OCTAL | ALLOW_BINARY;
|
| +  const double double_value =
|
| +      StringToDouble(unicode_constants_, key, flags, 0.0);
|
| +
|
| +  // Every non-finite result (this test also matches NaN) is keyed as
|
| +  // "Infinity".
|
| +  if (!std::isfinite(double_value)) {
|
| +    const char* infinity = "Infinity";
|
| +    const int infinity_length = 8;  // strlen("Infinity");
|
| +    return AddSymbol(
|
| +        Vector<const byte>(reinterpret_cast<const byte*>(infinity),
|
| +                           infinity_length),
|
| +        true, value);
|
| +  }
|
| +
|
| +  // Finite value: render it into number_buffer_ and key on that text.
|
| +  const char* rendered =
|
| +      DoubleToCString(double_value, Vector<char>(number_buffer_, kBufferSize));
|
| +  const int rendered_length = StrLength(rendered);
|
| +  return AddSymbol(
|
| +      Vector<const byte>(reinterpret_cast<const byte*>(rendered),
|
| +                         rendered_length),
|
| +      true, value);
|
| +}
|
| +
|
| +
|
| +// Returns true only if |number| is certainly already in canonical form, so
|
| +// that it can be used as a key without being parsed and re-printed.
|
| +// Returning false is always safe: the caller then normalizes the literal.
|
| +bool DuplicateFinder::IsNumberCanonical(Vector<const char> number) {
|
| +  // Test for a safe approximation of number literals that are already
|
| +  // in canonical form: max 15 digits, no leading zeroes, except an
|
| +  // integer part that is a single zero, and no trailing zeros below
|
| +  // the decimal point.
|
| +  int length = number.length();
|
| +  // An empty literal is never canonical; rejecting it here also keeps the
|
| +  // number[pos] reads below inside the vector.
|
| +  if (length == 0 || length > 15) return false;
|
| +  int pos = 0;
|
| +  if (number[pos] == '0') {
|
| +    // A leading zero must be the whole integer part.
|
| +    pos++;
|
| +  } else {
|
| +    while (pos < length &&
|
| +           static_cast<unsigned>(number[pos] - '0') <= ('9' - '0')) pos++;
|
| +    // No integer digits at all (e.g. ".5"). The canonical form described
|
| +    // above has an integer part, so such a literal must be normalized;
|
| +    // otherwise ".5" and "0.5" would be recorded under different keys.
|
| +    if (pos == 0) return false;
|
| +  }
|
| +  // Pure integer literal.
|
| +  if (length == pos) return true;
|
| +  // Anything other than a decimal point (exponent, hex prefix, ...) is left
|
| +  // to the slow path.
|
| +  if (number[pos] != '.') return false;
|
| +  pos++;
|
| +  // Starts out true so that a literal ending in '.' (no fraction digits) is
|
| +  // rejected as well.
|
| +  bool invalid_last_digit = true;
|
| +  while (pos < length) {
|
| +    // Non-digit characters wrap around to a value above 9 in the unsigned
|
| +    // byte and are rejected by the range test.
|
| +    byte digit = number[pos] - '0';
|
| +    if (digit > '9' - '0') return false;
|
| +    invalid_last_digit = (digit == 0);
|
| +    pos++;
|
| +  }
|
| +  return !invalid_last_digit;
|
| +}
|
| +
|
| +
|
| +// Computes a simple hash over the bytes of |key|. The seed combines the byte
|
| +// length (shifted left by one) with the ASCII flag in the low bit, so the
|
| +// length and ASCII-ness both influence the result.
|
| +uint32_t DuplicateFinder::Hash(Vector<const byte> key, bool is_ascii) {
|
| +  const int length = key.length();
|
| +  uint32_t hash = length << 1;
|
| +  if (is_ascii) hash |= 1;
|
| +  for (int index = 0; index < length; ++index) {
|
| +    // Mix in one byte: add, multiply by 1025, then fold the high bits down.
|
| +    hash += key[index];
|
| +    hash *= 1025;
|
| +    hash ^= hash >> 6;
|
| +  }
|
| +  return hash;
|
| +}
|
| +
|
| +
|
| +// Key-equality callback: |first| and |second| each point at an encoded key
|
| +// consisting of a length prefix followed by the key bytes.
|
| +//
|
| +// The prefix stores (byte length << 1 | ASCII bit) in base 128, most
|
| +// significant heptet first; the top bit (0x80) of a prefix byte is set while
|
| +// more prefix bytes follow. The prefixes are compared byte by byte, so keys
|
| +// differing in length or in ASCII-ness never match.
|
| +bool DuplicateFinder::Match(void* first, void* second) {
|
| +  byte* lhs = reinterpret_cast<byte*>(first);
|
| +  byte* rhs = reinterpret_cast<byte*>(second);
|
| +  uint32_t length_ascii_field = 0;
|
| +  for (;;) {
|
| +    const byte prefix_byte = *lhs++;
|
| +    if (prefix_byte != *rhs++) return false;
|
| +    length_ascii_field = (length_ascii_field << 7) | (prefix_byte & 0x7f);
|
| +    // A clear continuation bit marks the last prefix byte.
|
| +    if ((prefix_byte & 0x80) == 0) break;
|
| +  }
|
| +  // Drop the ASCII bit to recover the number of key bytes that follow.
|
| +  const int payload_length = static_cast<int>(length_ascii_field >> 1);
|
| +  return memcmp(lhs, rhs, payload_length) == 0;
|
| +}
|
| +
|
| +
|
| +// Appends an encoded copy of |bytes| to backing_store_ as one sequence and
|
| +// returns a pointer to the start of that sequence.
|
| +//
|
| +// Layout: a length prefix followed by the key bytes. The prefix holds
|
| +// (byte length << 1 | ASCII bit) in base 128, most significant heptet first,
|
| +// with bit 0x80 set on every prefix byte except the last one.
|
| +byte* DuplicateFinder::BackupKey(Vector<const byte> bytes,
|
| +                                 bool is_ascii) {
|
| +  uint32_t ascii_length = (bytes.length() << 1) | (is_ascii ? 1 : 0);
|
| +  backing_store_.StartSequence();
|
| +
|
| +  // Find the shift of the most significant non-zero heptet. A 32-bit value
|
| +  // needs at most five heptets, so the shift is capped at 28.
|
| +  int top_shift = 0;
|
| +  while (top_shift < 28 &&
|
| +         (ascii_length >> (top_shift + 7)) != 0) {
|
| +    top_shift += 7;
|
| +  }
|
| +  // Emit every heptet above the lowest one with the continuation bit set.
|
| +  for (int shift = top_shift; shift > 0; shift -= 7) {
|
| +    backing_store_.Add(static_cast<byte>((ascii_length >> shift) | 0x80u));
|
| +  }
|
| +  // The least significant heptet ends the prefix (continuation bit clear).
|
| +  backing_store_.Add(static_cast<byte>(ascii_length & 0x7f));
|
| +
|
| +  backing_store_.AddBlock(bytes);
|
| +  return backing_store_.EndSequence().start();
|
| +}
|
| +
|
| } } // namespace v8::internal
|
|
|