test/cctest/test-parsing.cc - Issue 1148653007: Update UTF-8 decoder to detect more special cases.

Keyboard Shortcuts

	File
u :	up to issue
j / k :	jump to file after / before current file
J / K :	jump to next file with a comment after / before current file
	Side-by-side diff
i :	toggle intra-line diffs
e :	expand all comments
c :	collapse all comments
s :	toggle showing all comments
n / p :	next / previous diff chunk or comment
N / P :	next / previous comment
<Up> / <Down> :	next / previous line

	Issue
u :	up to list of issues
j / k :	jump to patch after / before current patch
o / <Enter> :	open current patch in side-by-side view
i :	open current patch in unified diff view

	Issue List
j / k :	jump to issue after / before current issue
o / <Enter> :	open current issue

Unified Diff: test/cctest/test-parsing.cc

Issue 1148653007: Update UTF-8 decoder to detect more special cases. (Closed) Base URL: https://chromium.googlesource.com/v8/v8.git@master

Patch Set: updates Created 5 years, 7 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

Index: test/cctest/test-parsing.cc

diff --git a/test/cctest/test-parsing.cc b/test/cctest/test-parsing.cc

index 659680d8288989917b64a7a2cadd9510b7d2e1f4..d4f9f0b9d8a9ab7739d800f565baed5e15c3b659 100644

--- a/test/cctest/test-parsing.cc

+++ b/test/cctest/test-parsing.cc

@@ -699,18 +699,22 @@ TEST(Utf8CharacterStream) {

char buffer[kAllUtf8CharsSizeU];

unsigned cursor = 0;

for (int i = 0; i <= kMaxUC16Char; i++) {

- cursor += unibrow::Utf8::Encode(buffer + cursor,

- i,

- unibrow::Utf16::kNoPreviousCharacter);

+ cursor += unibrow::Utf8::Encode(buffer + cursor, i,

+ unibrow::Utf16::kNoPreviousCharacter, true);

}

DCHECK(cursor == kAllUtf8CharsSizeU);

i::Utf8ToUtf16CharacterStream stream(reinterpret_cast<const i::byte*>(buffer),

kAllUtf8CharsSizeU);

+ int32_t bad = unibrow::Utf8::kBadChar;

for (int i = 0; i <= kMaxUC16Char; i++) {

CHECK_EQU(i, stream.pos());

int32_t c = stream.Advance();

- CHECK_EQ(i, c);

+ if (i >= 0xd800 && i <= 0xdfff) {

+ CHECK_EQ(bad, c);

+ } else {

+ CHECK_EQ(i, c);

+ }

CHECK_EQU(i + 1, stream.pos());

}

for (int i = kMaxUC16Char; i >= 0; i--) {

@@ -724,7 +728,9 @@ TEST(Utf8CharacterStream) {

int progress = static_cast<int>(stream.SeekForward(12));

i += progress;

int32_t c = stream.Advance();

- if (i <= kMaxUC16Char) {

+ if (i >= 0xd800 && i <= 0xdfff) {

+ CHECK_EQ(bad, c);

+ } else if (i <= kMaxUC16Char) {

CHECK_EQ(i, c);

} else {

CHECK_EQ(-1, c);

@@ -913,6 +919,15 @@ static int Utf8LengthHelper(const char* s) {

// Record a single kBadChar for the first byte and continue.

continue;

}

+ if (c == 0xed) {

+ unsigned char d = s[i + 1];

+ if ((d < 0x80) || (d > 0x9f)) {

+ // This 3 byte sequence is part of a surrogate pair which is not

+ // supported by UTF-8. Record a single kBadChar for the first byte

+ // and continue.

+ continue;

+ }

input_offset = 2;

// 3 bytes of UTF-8 turn into 1 UTF-16 code unit.

output_adjust = 2;

« test/cctest/test-api.cc ('K') | « test/cctest/test-api.cc ('k') | no next file » | no next file with comments »