base/string_util.cc - Issue 27243: Revert "Revert "ASCII <-> UTF16 conversion functions. These are just copies of WideToASCII and""

Side by Side Diff: base/string_util.cc

Issue 27243: Revert "Revert "ASCII <-> UTF16 conversion functions. These are just copies of WideToASCII and"" (Closed)

Patch Set: Created 11 years, 10 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View unified diff | Download patch

OLD	NEW
1 // Copyright (c) 2006-2008 The Chromium Authors. All rights reserved.	1 // Copyright (c) 2006-2008 The Chromium Authors. All rights reserved.

2 // Use of this source code is governed by a BSD-style license that can be	2 // Use of this source code is governed by a BSD-style license that can be

3 // found in the LICENSE file.	3 // found in the LICENSE file.

4	4

5 #include "base/string_util.h"	5 #include "base/string_util.h"

6	6

7 #include "build/build_config.h"	7 #include "build/build_config.h"

8	8

9 #include <ctype.h>	9 #include <ctype.h>

10 #include <errno.h>	10 #include <errno.h>

(...skipping 432 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading...
443 std::string WideToASCII(const std::wstring& wide) {	443 std::string WideToASCII(const std::wstring& wide) {

444 DCHECK(IsStringASCII(wide));	444 DCHECK(IsStringASCII(wide));

445 return std::string(wide.begin(), wide.end());	445 return std::string(wide.begin(), wide.end());

446 }	446 }

447	447

448 std::wstring ASCIIToWide(const std::string& ascii) {	448 std::wstring ASCIIToWide(const std::string& ascii) {

449 DCHECK(IsStringASCII(ascii));	449 DCHECK(IsStringASCII(ascii));

450 return std::wstring(ascii.begin(), ascii.end());	450 return std::wstring(ascii.begin(), ascii.end());

451 }	451 }

452	452

	453 std::string UTF16ToASCII(const string16& utf16) {

	454 DCHECK(IsStringASCII(utf16));

	455 return std::string(utf16.begin(), utf16.end());

	456 }

	457

	458 string16 ASCIIToUTF16(const std::string& ascii) {

	459 DCHECK(IsStringASCII(ascii));

	460 return string16(ascii.begin(), ascii.end());

	461 }

	462

453 // Latin1 is just the low range of Unicode, so we can copy directly to convert.	463 // Latin1 is just the low range of Unicode, so we can copy directly to convert.

454 bool WideToLatin1(const std::wstring& wide, std::string* latin1) {	464 bool WideToLatin1(const std::wstring& wide, std::string* latin1) {

455 std::string output;	465 std::string output;

456 output.resize(wide.size());	466 output.resize(wide.size());

457 latin1->clear();	467 latin1->clear();

458 for (size_t i = 0; i < wide.size(); i++) {	468 for (size_t i = 0; i < wide.size(); i++) {

459 if (wide[i] > 255)	469 if (wide[i] > 255)

460 return false;	470 return false;

461 output[i] = static_cast<char>(wide[i]);	471 output[i] = static_cast<char>(wide[i]);

462 }	472 }

463 latin1->swap(output);	473 latin1->swap(output);

464 return true;	474 return true;

465 }	475 }

466	476

467 bool IsString8Bit(const std::wstring& str) {	477 bool IsString8Bit(const std::wstring& str) {

468 for (size_t i = 0; i < str.length(); i++) {	478 for (size_t i = 0; i < str.length(); i++) {

469 if (str[i] > 255)	479 if (str[i] > 255)

470 return false;	480 return false;

471 }	481 }

472 return true;	482 return true;

473 }	483 }

474	484

475 bool IsStringASCII(const std::wstring& str) {	485 template<class STR>

	486 static bool DoIsStringASCII(const STR& str) {

476 for (size_t i = 0; i < str.length(); i++) {	487 for (size_t i = 0; i < str.length(); i++) {

477 if (str[i] > 0x7F)	488 typename ToUnsigned<typename STR::value_type>::Unsigned c = str[i];

	489 if (c > 0x7F)

478 return false;	490 return false;

479 }	491 }

480 return true;	492 return true;

481 }	493 }

482	494

	495 bool IsStringASCII(const std::wstring& str) {

	496 return DoIsStringASCII(str);

	497 }

	498

	499 #if !defined(WCHAR_T_IS_UTF16)

	500 bool IsStringASCII(const string16& str) {

	501 return DoIsStringASCII(str);

	502 }

	503 #endif

	504

483 bool IsStringASCII(const std::string& str) {	505 bool IsStringASCII(const std::string& str) {

484 for (size_t i = 0; i < str.length(); i++) {	506 return DoIsStringASCII(str);

485 if (static_cast<unsigned char>(str[i]) > 0x7F)

486 return false;

487 }

488 return true;

489 }	507 }

490	508

491 // Helper functions that determine whether the given character begins a	509 // Helper functions that determine whether the given character begins a

492 // UTF-8 sequence of bytes with the given length. A character satisfies	510 // UTF-8 sequence of bytes with the given length. A character satisfies

493 // "IsInUTF8Sequence" if it is anything but the first byte in a multi-byte	511 // "IsInUTF8Sequence" if it is anything but the first byte in a multi-byte

494 // character.	512 // character.

495 static inline bool IsBegin2ByteUTF8(int c) {	513 static inline bool IsBegin2ByteUTF8(int c) {

496 return (c & 0xE0) == 0xC0;	514 return (c & 0xE0) == 0xC0;

497 }	515 }

498 static inline bool IsBegin3ByteUTF8(int c) {	516 static inline bool IsBegin3ByteUTF8(int c) {

(...skipping 1107 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading...
1606 // Each input byte creates two output hex characters.	1624 // Each input byte creates two output hex characters.

1607 std::string ret(size * 2, '\0');	1625 std::string ret(size * 2, '\0');

1608	1626

1609 for (size_t i = 0; i < size; ++i) {	1627 for (size_t i = 0; i < size; ++i) {

1610 char b = reinterpret_cast<const char*>(bytes)[i];	1628 char b = reinterpret_cast<const char*>(bytes)[i];

1611 ret[(i * 2)] = kHexChars[(b >> 4) & 0xf];	1629 ret[(i * 2)] = kHexChars[(b >> 4) & 0xf];

1612 ret[(i * 2) + 1] = kHexChars[b & 0xf];	1630 ret[(i * 2) + 1] = kHexChars[b & 0xf];

1613 }	1631 }

1614 return ret;	1632 return ret;

1615 }	1633 }

OLD	NEW

« no previous file with comments | « base/string_util.h ('k') | no next file » | no next file with comments »