src/parsing/duplicate-finder.cc - Issue 2281443002: Separate DuplicateFinder from Scanner.

Side by Side Diff: src/parsing/duplicate-finder.cc

Issue 2281443002: Separate DuplicateFinder from Scanner. (Closed) Base URL: https://chromium.googlesource.com/v8/v8.git@master

Patch Set: Fix rebase. Created 4 years, 3 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View unified diff | Download patch

OLD	NEW
(Empty)
	1 // Copyright 2011 the V8 project authors. All rights reserved.

	2 // Use of this source code is governed by a BSD-style license that can be

	3 // found in the LICENSE file.

	4

	5 #include "src/parsing/duplicate-finder.h"

	6

	7 #include "src/conversions.h"

	8 #include "src/unicode-cache.h"

	9

	10 namespace v8 {

	11 namespace internal {

	12

	13 int DuplicateFinder::AddOneByteSymbol(Vector<const uint8_t> key, int value) {

	14 return AddSymbol(key, true, value);

	15 }

	16

	17 int DuplicateFinder::AddTwoByteSymbol(Vector<const uint16_t> key, int value) {

	18 return AddSymbol(Vector<const uint8_t>::cast(key), false, value);

	19 }

	20

	21 int DuplicateFinder::AddSymbol(Vector<const uint8_t> key, bool is_one_byte,

	22 int value) {

	23 uint32_t hash = Hash(key, is_one_byte);

	24 byte* encoding = BackupKey(key, is_one_byte);

	25 base::HashMap::Entry* entry = map_.LookupOrInsert(encoding, hash);

	26 int old_value = static_cast<int>(reinterpret_cast<intptr_t>(entry->value));

	27 entry->value =

	28 reinterpret_cast<void*>(static_cast<intptr_t>(value \| old_value));

	29 return old_value;

	30 }

	31

	32 int DuplicateFinder::AddNumber(Vector<const uint8_t> key, int value) {

	33 DCHECK(key.length() > 0);

	34 // Quick check for already being in canonical form.

	35 if (IsNumberCanonical(key)) {

	36 return AddOneByteSymbol(key, value);

	37 }

	38

	39 int flags = ALLOW_HEX \| ALLOW_OCTAL \| ALLOW_IMPLICIT_OCTAL \| ALLOW_BINARY;

	40 double double_value = StringToDouble(unicode_constants_, key, flags, 0.0);

	41 int length;

	42 const char* string;

	43 if (!std::isfinite(double_value)) {

	44 string = "Infinity";

	45 length = 8; // strlen("Infinity");

	46 } else {

	47 string = DoubleToCString(double_value,

	48 Vector<char>(number_buffer_, kBufferSize));

	49 length = StrLength(string);

	50 }

	51 return AddSymbol(

	52 Vector<const byte>(reinterpret_cast<const byte*>(string), length), true,

	53 value);

	54 }

	55

	56 bool DuplicateFinder::IsNumberCanonical(Vector<const uint8_t> number) {

	57 // Test for a safe approximation of number literals that are already

	58 // in canonical form: max 15 digits, no leading zeroes, except an

	59 // integer part that is a single zero, and no trailing zeros below

	60 // the decimal point.

	61 int pos = 0;

	62 int length = number.length();

	63 if (number.length() > 15) return false;

	64 if (number[pos] == '0') {

	65 pos++;

	66 } else {

	67 while (pos < length &&

	68 static_cast<unsigned>(number[pos] - '0') <= ('9' - '0'))

	69 pos++;

	70 }

	71 if (length == pos) return true;

	72 if (number[pos] != '.') return false;

	73 pos++;

	74 bool invalid_last_digit = true;

	75 while (pos < length) {

	76 uint8_t digit = number[pos] - '0';

	77 if (digit > '9' - '0') return false;

	78 invalid_last_digit = (digit == 0);

	79 pos++;

	80 }

	81 return !invalid_last_digit;

	82 }

	83

	84 uint32_t DuplicateFinder::Hash(Vector<const uint8_t> key, bool is_one_byte) {

	85 // Primitive hash function, almost identical to the one used

	86 // for strings (except that it's seeded by the length and representation).

	87 int length = key.length();

	88 uint32_t hash = (length << 1) \| (is_one_byte ? 1 : 0);

	89 for (int i = 0; i < length; i++) {

	90 uint32_t c = key[i];

	91 hash = (hash + c) * 1025;

	92 hash ^= (hash >> 6);

	93 }

	94 return hash;

	95 }

	96

	97 bool DuplicateFinder::Match(void* first, void* second) {

	98 // Decode lengths.

	99 // Length + representation is encoded as base 128, most significant heptet

	100 // first, with a 8th bit being non-zero while there are more heptets.

	101 // The value encodes the number of bytes following, and whether the original

	102 // was Latin1.

	103 byte* s1 = reinterpret_cast<byte*>(first);

	104 byte* s2 = reinterpret_cast<byte*>(second);

	105 uint32_t length_one_byte_field = 0;

	106 byte c1;

	107 do {

	108 c1 = *s1;

	109 if (c1 != *s2) return false;

	110 length_one_byte_field = (length_one_byte_field << 7) \| (c1 & 0x7f);

	111 s1++;

	112 s2++;

	113 } while ((c1 & 0x80) != 0);

	114 int length = static_cast<int>(length_one_byte_field >> 1);

	115 return memcmp(s1, s2, length) == 0;

	116 }

	117

	118 byte* DuplicateFinder::BackupKey(Vector<const uint8_t> bytes,

	119 bool is_one_byte) {

	120 uint32_t one_byte_length = (bytes.length() << 1) \| (is_one_byte ? 1 : 0);

	121 backing_store_.StartSequence();

	122 // Emit one_byte_length as base-128 encoded number, with the 7th bit set

	123 // on the byte of every heptet except the last, least significant, one.

	124 if (one_byte_length >= (1 << 7)) {

	125 if (one_byte_length >= (1 << 14)) {

	126 if (one_byte_length >= (1 << 21)) {

	127 if (one_byte_length >= (1 << 28)) {

	128 backing_store_.Add(

	129 static_cast<uint8_t>((one_byte_length >> 28) \| 0x80));

	130 }

	131 backing_store_.Add(

	132 static_cast<uint8_t>((one_byte_length >> 21) \| 0x80u));

	133 }

	134 backing_store_.Add(static_cast<uint8_t>((one_byte_length >> 14) \| 0x80u));

	135 }

	136 backing_store_.Add(static_cast<uint8_t>((one_byte_length >> 7) \| 0x80u));

	137 }

	138 backing_store_.Add(static_cast<uint8_t>(one_byte_length & 0x7f));

	139

	140 backing_store_.AddBlock(bytes);

	141 return backing_store_.EndSequence().start();

	142 }

	143

	144 } // namespace internal

	145 } // namespace v8

OLD	NEW

« no previous file with comments | « src/parsing/duplicate-finder.h ('k') | src/parsing/expression-classifier.h » ('j') | no next file with comments »