runtime/vm/unicode.cc - Issue 11365243: Revert OneByteString back to ISO Latin-1 instead of ASCII

Keyboard Shortcuts

	File
u :	up to issue
j / k :	jump to file after / before current file
J / K :	jump to next file with a comment after / before current file
	Side-by-side diff
i :	toggle intra-line diffs
e :	expand all comments
c :	collapse all comments
s :	toggle showing all comments
n / p :	next / previous diff chunk or comment
N / P :	next / previous comment
<Up> / <Down> :	next / previous line

	Issue
u :	up to list of issues
j / k :	jump to patch after / before current patch
o / <Enter> :	open current patch in side-by-side view
i :	open current patch in unified diff view

	Issue List
j / k :	jump to issue after / before current issue
o / <Enter> :	open current issue

Unified Diff: runtime/vm/unicode.cc

Issue 11365243: Revert OneByteString back to ISO Latin-1 instead of ASCII (Closed) Base URL: http://dart.googlecode.com/svn/branches/bleeding_edge/dart/

Patch Set: Created 8 years, 1 month ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

Index: runtime/vm/unicode.cc

===================================================================

--- runtime/vm/unicode.cc (revision 14982)

+++ runtime/vm/unicode.cc (working copy)

@@ -58,8 +58,8 @@

}

-static bool IsAsciiSequenceStart(uint8_t code_unit) {

- // Check is codepoint is <= U+007F

+static bool IsLatin1SequenceStart(uint8_t code_unit) {

+ // Check if codepoint is <= U+00FF

return (code_unit <= Utf8::kMaxOneByteChar);

}

@@ -101,17 +101,17 @@

intptr_t array_len,

Type* type) {

intptr_t len = 0;

- Type char_type = kAscii;

+ Type char_type = kLatin1;

for (intptr_t i = 0; i < array_len; i++) {

uint8_t code_unit = utf8_array[i];

if (!IsTrailByte(code_unit)) {

++len;

}

- if (!IsAsciiSequenceStart(code_unit)) { // > U+007F

+ if (!IsLatin1SequenceStart(code_unit)) { // > U+00FF

if (IsSmpSequenceStart(code_unit)) { // >= U+10000

char_type = kSMP;

++len;

- } else if (char_type == kAscii) {

+ } else if (char_type == kLatin1) {

char_type = kBMP;

}

@@ -251,19 +251,26 @@

}

-bool Utf8::DecodeToAscii(const uint8_t* utf8_array,

- intptr_t array_len,

- uint8_t* dst,

- intptr_t len) {

- if (len < array_len) {

+bool Utf8::DecodeToLatin1(const uint8_t* utf8_array,

+ intptr_t array_len,

+ uint8_t* dst,

+ intptr_t len) {

+ intptr_t i = 0;

+ intptr_t j = 0;

+ intptr_t num_bytes;

+ for (; (i < array_len) && (j < len); i += num_bytes, ++j) {

+ int32_t ch;

+ ASSERT(IsLatin1SequenceStart(utf8_array[i]));

+ num_bytes = Utf8::Decode(&utf8_array[i], (array_len - i), &ch);

+ if (ch == -1) {

+ return false; // invalid input

+ }

+ ASSERT(ch <= 0xff);

+ dst[j] = ch;

+ }

+ if ((i < array_len) && (j == len)) {

return false; // output overflow

}

-#ifdef DEBUG

- for (intptr_t i = 0; i < array_len; i++) {

- ASSERT(IsAsciiSequenceStart(utf8_array[i]));

- }

-#endif

- memmove(dst, utf8_array, array_len);

return true; // success

}

« no previous file with comments | « runtime/vm/unicode.h ('k') | no next file » | no next file with comments »