OLD | NEW |
1 // Copyright (c) 2006-2008 The Chromium Authors. All rights reserved. | 1 // Copyright (c) 2006-2008 The Chromium Authors. All rights reserved. |
2 // Use of this source code is governed by a BSD-style license that can be | 2 // Use of this source code is governed by a BSD-style license that can be |
3 // found in the LICENSE file. | 3 // found in the LICENSE file. |
4 | 4 |
5 #include "base/string_util.h" | 5 #include "base/string_util.h" |
6 | 6 |
7 #include "build/build_config.h" | 7 #include "build/build_config.h" |
8 | 8 |
9 #include <ctype.h> | 9 #include <ctype.h> |
10 #include <errno.h> | 10 #include <errno.h> |
(...skipping 432 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
443 std::string WideToASCII(const std::wstring& wide) { | 443 std::string WideToASCII(const std::wstring& wide) { |
444 DCHECK(IsStringASCII(wide)); | 444 DCHECK(IsStringASCII(wide)); |
445 return std::string(wide.begin(), wide.end()); | 445 return std::string(wide.begin(), wide.end()); |
446 } | 446 } |
447 | 447 |
448 std::wstring ASCIIToWide(const std::string& ascii) { | 448 std::wstring ASCIIToWide(const std::string& ascii) { |
449 DCHECK(IsStringASCII(ascii)); | 449 DCHECK(IsStringASCII(ascii)); |
450 return std::wstring(ascii.begin(), ascii.end()); | 450 return std::wstring(ascii.begin(), ascii.end()); |
451 } | 451 } |
452 | 452 |
| 453 std::string UTF16ToASCII(const string16& utf16) { |
| 454 DCHECK(IsStringASCII(utf16)); |
| 455 return std::string(utf16.begin(), utf16.end()); |
| 456 } |
| 457 |
| 458 string16 ASCIIToUTF16(const std::string& ascii) { |
| 459 DCHECK(IsStringASCII(ascii)); |
| 460 return string16(ascii.begin(), ascii.end()); |
| 461 } |
| 462 |
453 // Latin1 is just the low range of Unicode, so we can copy directly to convert. | 463 // Latin1 is just the low range of Unicode, so we can copy directly to convert. |
454 bool WideToLatin1(const std::wstring& wide, std::string* latin1) { | 464 bool WideToLatin1(const std::wstring& wide, std::string* latin1) { |
455 std::string output; | 465 std::string output; |
456 output.resize(wide.size()); | 466 output.resize(wide.size()); |
457 latin1->clear(); | 467 latin1->clear(); |
458 for (size_t i = 0; i < wide.size(); i++) { | 468 for (size_t i = 0; i < wide.size(); i++) { |
459 if (wide[i] > 255) | 469 if (wide[i] > 255) |
460 return false; | 470 return false; |
461 output[i] = static_cast<char>(wide[i]); | 471 output[i] = static_cast<char>(wide[i]); |
462 } | 472 } |
463 latin1->swap(output); | 473 latin1->swap(output); |
464 return true; | 474 return true; |
465 } | 475 } |
466 | 476 |
467 bool IsString8Bit(const std::wstring& str) { | 477 bool IsString8Bit(const std::wstring& str) { |
468 for (size_t i = 0; i < str.length(); i++) { | 478 for (size_t i = 0; i < str.length(); i++) { |
469 if (str[i] > 255) | 479 if (str[i] > 255) |
470 return false; | 480 return false; |
471 } | 481 } |
472 return true; | 482 return true; |
473 } | 483 } |
474 | 484 |
475 bool IsStringASCII(const std::wstring& str) { | 485 template<class STR> |
| 486 static bool DoIsStringASCII(const STR& str) { |
476 for (size_t i = 0; i < str.length(); i++) { | 487 for (size_t i = 0; i < str.length(); i++) { |
477 if (str[i] > 0x7F) | 488 typename ToUnsigned<typename STR::value_type>::Unsigned c = str[i]; |
| 489 if (c > 0x7F) |
478 return false; | 490 return false; |
479 } | 491 } |
480 return true; | 492 return true; |
481 } | 493 } |
482 | 494 |
| 495 bool IsStringASCII(const std::wstring& str) { |
| 496 return DoIsStringASCII(str); |
| 497 } |
| 498 |
| 499 #if !defined(WCHAR_T_IS_UTF16) |
| 500 bool IsStringASCII(const string16& str) { |
| 501 return DoIsStringASCII(str); |
| 502 } |
| 503 #endif |
| 504 |
483 bool IsStringASCII(const std::string& str) { | 505 bool IsStringASCII(const std::string& str) { |
484 for (size_t i = 0; i < str.length(); i++) { | 506 return DoIsStringASCII(str); |
485 if (static_cast<unsigned char>(str[i]) > 0x7F) | |
486 return false; | |
487 } | |
488 return true; | |
489 } | 507 } |
490 | 508 |
491 // Helper functions that determine whether the given character begins a | 509 // Helper functions that determine whether the given character begins a |
492 // UTF-8 sequence of bytes with the given length. A character satisfies | 510 // UTF-8 sequence of bytes with the given length. A character satisfies |
493 // "IsInUTF8Sequence" if it is anything but the first byte in a multi-byte | 511 // "IsInUTF8Sequence" if it is anything but the first byte in a multi-byte |
494 // character. | 512 // character. |
495 static inline bool IsBegin2ByteUTF8(int c) { | 513 static inline bool IsBegin2ByteUTF8(int c) { |
496 return (c & 0xE0) == 0xC0; | 514 return (c & 0xE0) == 0xC0; |
497 } | 515 } |
498 static inline bool IsBegin3ByteUTF8(int c) { | 516 static inline bool IsBegin3ByteUTF8(int c) { |
(...skipping 1107 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
1606 // Each input byte creates two output hex characters. | 1624 // Each input byte creates two output hex characters. |
1607 std::string ret(size * 2, '\0'); | 1625 std::string ret(size * 2, '\0'); |
1608 | 1626 |
1609 for (size_t i = 0; i < size; ++i) { | 1627 for (size_t i = 0; i < size; ++i) { |
1610 char b = reinterpret_cast<const char*>(bytes)[i]; | 1628 char b = reinterpret_cast<const char*>(bytes)[i]; |
1611 ret[(i * 2)] = kHexChars[(b >> 4) & 0xf]; | 1629 ret[(i * 2)] = kHexChars[(b >> 4) & 0xf]; |
1612 ret[(i * 2) + 1] = kHexChars[b & 0xf]; | 1630 ret[(i * 2) + 1] = kHexChars[b & 0xf]; |
1613 } | 1631 } |
1614 return ret; | 1632 return ret; |
1615 } | 1633 } |
OLD | NEW |