| Index: base/i18n/encoding_detection.cc
|
| diff --git a/base/i18n/encoding_detection.cc b/base/i18n/encoding_detection.cc
|
| new file mode 100644
|
| index 0000000000000000000000000000000000000000..56582511f306ed785496b582f8bd258e97a4d6ee
|
| --- /dev/null
|
| +++ b/base/i18n/encoding_detection.cc
|
| @@ -0,0 +1,41 @@
|
| +// Copyright 2016 The Chromium Authors. All rights reserved.
|
| +// Use of this source code is governed by a BSD-style license that can be
|
| +// found in the LICENSE file.
|
| +
|
| +#include "base/i18n/encoding_detection.h"
|
| +
|
| +#include "third_party/ced/src/compact_enc_det/compact_enc_det.h"
|
| +
|
| +namespace base {
|
| +
|
| +bool DetectEncoding(const std::string& text, std::string* encoding) {
|
| + int consumed_bytes;
|
| + bool is_reliable;
|
| + Encoding enc = CompactEncDet::DetectEncoding(
|
| + text.c_str(), text.length(), nullptr, nullptr, nullptr,
|
| + UNKNOWN_ENCODING,
|
| + UNKNOWN_LANGUAGE,
|
| + CompactEncDet::QUERY_CORPUS, // plain text
|
| + false, // Include 7-bit encodings
|
| + &consumed_bytes,
|
| + &is_reliable);
|
| +
|
| + if (enc == UNKNOWN_ENCODING)
|
| + return false;
|
| +
|
| + // 7-bit encodings (except ISO-2022-JP) are not supported in web standard.
|
| + // Mark them as ascii to keep the raw bytes intact.
|
| + switch (enc) {
|
| + case HZ_GB_2312:
|
| + case ISO_2022_KR:
|
| + case ISO_2022_CN:
|
| + case UTF7:
|
| + enc = ASCII_7BIT;
|
| + break;
|
| + default:
|
| + break;
|
| + }
|
| + *encoding = MimeEncodingName(enc);
|
| + return true;
|
| +}
|
| +} // namespace base
|
|
|