Index: base/i18n/character_encoding.cc |
diff --git a/base/i18n/character_encoding.cc b/base/i18n/character_encoding.cc |
new file mode 100644 |
index 0000000000000000000000000000000000000000..fd0553a148eb707b25235015241640bfaa5b9440 |
--- /dev/null |
+++ b/base/i18n/character_encoding.cc |
@@ -0,0 +1,42 @@ |
+// Copyright 2016 The Chromium Authors. All rights reserved. |
+// Use of this source code is governed by a BSD-style license that can be |
+// found in the LICENSE file. |
+ |
+#include "base/i18n/character_encoding.h" |
+ |
+#include "base/macros.h" |
+#include "third_party/icu/source/common/unicode/ucnv.h" |
+ |
+namespace base { |
+namespace { |
+ |
+// An array of all supported canonical encoding names. |
+const char* const kCanonicalEncodingNames[] = { |
+ "Big5", "EUC-JP", "EUC-KR", "gb18030", |
+ "GBK", "IBM866", "ISO-2022-JP", "ISO-8859-10", |
+ "ISO-8859-13", "ISO-8859-14", "ISO-8859-15", "ISO-8859-16", |
+ "ISO-8859-2", "ISO-8859-3", "ISO-8859-4", "ISO-8859-5", |
+ "ISO-8859-6", "ISO-8859-7", "ISO-8859-8", "ISO-8859-8-I", |
+ "KOI8-R", "KOI8-U", "macintosh", "Shift_JIS", |
+ "UTF-16LE", "UTF-8", "windows-1250", "windows-1251", |
+ "windows-1252", "windows-1253", "windows-1254", "windows-1255", |
+ "windows-1256", "windows-1257", "windows-1258", "windows-874"}; |
+ |
+} // namespace |
+ |
+const char* GetCanonicalEncodingNameByAliasName(const std::string& alias_name) { |
+ for (auto& encoding_name : kCanonicalEncodingNames) { |
+ if (alias_name == encoding_name) |
+ return encoding_name; |
+ } |
+ static const char* kStandards[3] = {"HTML", "MIME", "IANA"}; |
+ for (auto& standard : kStandards) { |
+ UErrorCode error_code = U_ZERO_ERROR; |
+ const char* canonical_name = |
+ ucnv_getStandardName(alias_name.c_str(), standard, &error_code); |
+ if (U_SUCCESS(error_code) && canonical_name) |
+ return canonical_name; |
+ } |
+ return nullptr; |
+} |
+} // namespace base |