Index: chrome/common/translate/language_detection_util_unittest.cc |
diff --git a/chrome/common/translate/language_detection_util_unittest.cc b/chrome/common/translate/language_detection_util_unittest.cc |
deleted file mode 100644 |
index 36a4b8c3d2c00e7ddaedaabe27b70d1a4cccc9b7..0000000000000000000000000000000000000000 |
--- a/chrome/common/translate/language_detection_util_unittest.cc |
+++ /dev/null |
@@ -1,169 +0,0 @@ |
-// Copyright 2013 The Chromium Authors. All rights reserved. |
-// Use of this source code is governed by a BSD-style license that can be |
-// found in the LICENSE file. |
- |
-#include "chrome/common/translate/language_detection_util.h" |
- |
-#include "base/strings/string16.h" |
-#include "base/strings/utf_string_conversions.h" |
-#include "chrome/common/chrome_constants.h" |
-#include "testing/gtest/include/gtest/gtest.h" |
- |
-typedef testing::Test LanguageDetectionUtilTest; |
- |
-// Tests that well-known language code typos are fixed. |
-TEST_F(LanguageDetectionUtilTest, LanguageCodeTypoCorrection) { |
- std::string language; |
- |
- // Strip the second and later codes. |
- language = std::string("ja,en"); |
- LanguageDetectionUtil::CorrectLanguageCodeTypo(&language); |
- EXPECT_EQ("ja", language); |
- |
- // Replace dash with hyphen. |
- language = std::string("ja_JP"); |
- LanguageDetectionUtil::CorrectLanguageCodeTypo(&language); |
- EXPECT_EQ("ja-JP", language); |
- |
- // Correct wrong cases. |
- language = std::string("JA-jp"); |
- LanguageDetectionUtil::CorrectLanguageCodeTypo(&language); |
- EXPECT_EQ("ja-JP", language); |
-} |
- |
-// Tests if the language codes' format is invalid. |
-TEST_F(LanguageDetectionUtilTest, IsValidLanguageCode) { |
- std::string language; |
- |
- language = std::string("ja"); |
- EXPECT_TRUE(LanguageDetectionUtil::IsValidLanguageCode(language)); |
- |
- language = std::string("ja-JP"); |
- EXPECT_TRUE(LanguageDetectionUtil::IsValidLanguageCode(language)); |
- |
- language = std::string("ceb"); |
- EXPECT_TRUE(LanguageDetectionUtil::IsValidLanguageCode(language)); |
- |
- language = std::string("ceb-XX"); |
- EXPECT_TRUE(LanguageDetectionUtil::IsValidLanguageCode(language)); |
- |
- // Invalid because the sub code consists of a number. |
- language = std::string("utf-8"); |
- EXPECT_FALSE(LanguageDetectionUtil::IsValidLanguageCode(language)); |
- |
- // Invalid because of six characters after hyphen. |
- language = std::string("ja-YUKARI"); |
- EXPECT_FALSE(LanguageDetectionUtil::IsValidLanguageCode(language)); |
- |
- // Invalid because of four characters. |
- language = std::string("DHMO"); |
- EXPECT_FALSE(LanguageDetectionUtil::IsValidLanguageCode(language)); |
-} |
- |
-// Tests that similar language table works. |
-TEST_F(LanguageDetectionUtilTest, SimilarLanguageCode) { |
- EXPECT_TRUE(LanguageDetectionUtil::IsSameOrSimilarLanguages("en", "en")); |
- EXPECT_FALSE(LanguageDetectionUtil::IsSameOrSimilarLanguages("en", "ja")); |
- |
- // Language codes are same if the main parts are same. The synonyms should be |
- // took into account (ex: 'iw' and 'he'). |
- EXPECT_TRUE(LanguageDetectionUtil::IsSameOrSimilarLanguages("sr-ME", "sr")); |
- EXPECT_TRUE(LanguageDetectionUtil::IsSameOrSimilarLanguages("sr", "sr-ME")); |
- EXPECT_TRUE(LanguageDetectionUtil::IsSameOrSimilarLanguages("he", "he-IL")); |
- EXPECT_TRUE(LanguageDetectionUtil::IsSameOrSimilarLanguages("eng", "eng-US")); |
- EXPECT_TRUE(LanguageDetectionUtil::IsSameOrSimilarLanguages("eng-US", "eng")); |
- EXPECT_FALSE(LanguageDetectionUtil::IsSameOrSimilarLanguages("eng", "enm")); |
- |
- // Even though the main parts are different, some special language pairs are |
- // recognized as same languages. |
- EXPECT_TRUE(LanguageDetectionUtil::IsSameOrSimilarLanguages("bs", "hr")); |
- EXPECT_TRUE(LanguageDetectionUtil::IsSameOrSimilarLanguages("ne", "hi")); |
- EXPECT_FALSE(LanguageDetectionUtil::IsSameOrSimilarLanguages("bs", "hi")); |
-} |
- |
-// Tests that well-known languages which often have wrong server configuration |
-// are handles. |
-TEST_F(LanguageDetectionUtilTest, WellKnownWrongConfiguration) { |
- EXPECT_TRUE(LanguageDetectionUtil::MaybeServerWrongConfiguration("en", "ja")); |
- EXPECT_TRUE(LanguageDetectionUtil::MaybeServerWrongConfiguration("en-US", |
- "ja")); |
- EXPECT_TRUE(LanguageDetectionUtil::MaybeServerWrongConfiguration("en", |
- "zh-CN")); |
- EXPECT_FALSE(LanguageDetectionUtil::MaybeServerWrongConfiguration("ja", |
- "en")); |
- EXPECT_FALSE(LanguageDetectionUtil::MaybeServerWrongConfiguration("en", |
- "he")); |
-} |
- |
-// Tests that the language meta tag providing wrong information is ignored by |
-// LanguageDetectionUtil due to disagreement between meta tag and CLD. |
-TEST_F(LanguageDetectionUtilTest, CLDDisagreeWithWrongLanguageCode) { |
- base::string16 contents = ASCIIToUTF16( |
- "<html><head><meta http-equiv='Content-Language' content='ja'></head>" |
- "<body>This is a page apparently written in English. Even though " |
- "content-language is provided, the value will be ignored if the value " |
- "is suspicious.</body></html>"); |
- std::string cld_language; |
- bool is_cld_reliable; |
- std::string language = LanguageDetectionUtil::DeterminePageLanguage( |
- std::string("ja"), std::string(), contents, &cld_language, |
- &is_cld_reliable); |
- EXPECT_EQ(chrome::kUnknownLanguageCode, language); |
- EXPECT_EQ("en", cld_language); |
- EXPECT_TRUE(is_cld_reliable); |
-} |
- |
-// Tests that the language meta tag providing "en-US" style information is |
-// agreed by CLD. |
-TEST_F(LanguageDetectionUtilTest, CLDAgreeWithLanguageCodeHavingCountryCode) { |
- base::string16 contents = ASCIIToUTF16( |
- "<html><head><meta http-equiv='Content-Language' content='en-US'></head>" |
- "<body>This is a page apparently written in English. Even though " |
- "content-language is provided, the value will be ignored if the value " |
- "is suspicious.</body></html>"); |
- std::string cld_language; |
- bool is_cld_reliable; |
- std::string language = LanguageDetectionUtil::DeterminePageLanguage( |
- std::string("en-US"), std::string(), contents, &cld_language, |
- &is_cld_reliable); |
- EXPECT_EQ("en-US", language); |
- EXPECT_EQ("en", cld_language); |
- EXPECT_TRUE(is_cld_reliable); |
-} |
- |
-// Tests that the language meta tag providing wrong information is ignored and |
-// CLD's language will be adopted by LanguageDetectionUtil due to an invalid |
-// meta tag. |
-TEST_F(LanguageDetectionUtilTest, InvalidLanguageMetaTagProviding) { |
- base::string16 contents = ASCIIToUTF16( |
- "<html><head><meta http-equiv='Content-Language' content='utf-8'></head>" |
- "<body>This is a page apparently written in English. Even though " |
- "content-language is provided, the value will be ignored and CLD's" |
- " language will be adopted if the value is invalid.</body></html>"); |
- std::string cld_language; |
- bool is_cld_reliable; |
- std::string language = LanguageDetectionUtil::DeterminePageLanguage( |
- std::string("utf-8"), std::string(), contents, &cld_language, |
- &is_cld_reliable); |
- EXPECT_EQ("en", language); |
- EXPECT_EQ("en", cld_language); |
- EXPECT_TRUE(is_cld_reliable); |
-} |
- |
-// Tests that the language meta tag providing wrong information is ignored |
-// because of valid html lang attribute. |
-TEST_F(LanguageDetectionUtilTest, AdoptHtmlLang) { |
- base::string16 contents = ASCIIToUTF16( |
- "<html lang='en'><head><meta http-equiv='Content-Language' content='ja'>" |
- "</head><body>This is a page apparently written in English. Even though " |
- "content-language is provided, the value will be ignored if the value " |
- "is suspicious.</body></html>"); |
- std::string cld_language; |
- bool is_cld_reliable; |
- std::string language = LanguageDetectionUtil::DeterminePageLanguage( |
- std::string("ja"), std::string("en"), contents, &cld_language, |
- &is_cld_reliable); |
- EXPECT_EQ("en", language); |
- EXPECT_EQ("en", cld_language); |
- EXPECT_TRUE(is_cld_reliable); |
-} |