base/string_util.cc - Issue 4268: IsStringUTF8 unittest and enforcing UTF-8 in JSON deserialization

Keyboard Shortcuts

	File
u :	up to issue
j / k :	jump to file after / before current file
J / K :	jump to next file with a comment after / before current file
	Side-by-side diff
i :	toggle intra-line diffs
e :	expand all comments
c :	collapse all comments
s :	toggle showing all comments
n / p :	next / previous diff chunk or comment
N / P :	next / previous comment
<Up> / <Down> :	next / previous line

	Issue
u :	up to list of issues
j / k :	jump to patch after / before current patch
o / <Enter> :	open current patch in side-by-side view
i :	open current patch in unified diff view

	Issue List
j / k :	jump to issue after / before current issue
o / <Enter> :	open current issue

Unified Diff: base/string_util.cc

Issue 4268: IsStringUTF8 unittest and enforcing UTF-8 in JSON deserialization (Closed) Base URL: svn://chrome-svn/chrome/trunk/src/

Patch Set: '' Created 12 years, 3 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

Index: base/string_util.cc

===================================================================

--- base/string_util.cc (revision 2506)

+++ base/string_util.cc (working copy)

@@ -517,7 +517,7 @@

// originally been UTF-8, but has been converted to wide characters because

// that's what we (and Windows) use internally.

template<typename CHAR>

-static bool IsStringUTF8T(const CHAR* str) {

+static bool IsStringUTF8T(const CHAR* str, int length) {

bool overlong = false;

bool surrogate = false;

bool nonchar = false;

@@ -532,7 +532,7 @@

// are left in the sequence

int positions_left = 0;

- for (int i = 0; str[i] != 0; i++) {

+ for (int i = 0; i < length; i++) {

// This whole function assume an unsigned value so force its conversion to

// an unsigned value.

typename ToUnsigned<CHAR>::Unsigned c = str[i];

@@ -556,6 +556,7 @@

slower = 0xA0;

} else if (c == 0xEF) {

// EF BF [BE-BF] : non-character

+ // TODO(jungshik): EF B7 [90-AF] should be checked as well.

nonchar = true;

}

} else if (c <= 0xF4) {

@@ -599,12 +600,12 @@

return true;

}

-bool IsStringUTF8(const char* str) {

- return IsStringUTF8T(str);

+bool IsStringUTF8(const std::string& str) {

+ return IsStringUTF8T(str.data(), str.length());

}

-bool IsStringWideUTF8(const wchar_t* str) {

- return IsStringUTF8T(str);

+bool IsStringWideUTF8(const std::wstring& str) {

+ return IsStringUTF8T(str.data(), str.length());

}

template<typename Iter>

« no previous file with comments | « base/string_util.h ('k') | base/string_util_unittest.cc » ('j') | no next file with comments »