| OLD | NEW |
| (Empty) |
| 1 // Copyright (c) 2013 The Chromium Authors. All rights reserved. | |
| 2 // Use of this source code is governed by a BSD-style license that can be | |
| 3 // found in the LICENSE file. | |
| 4 | |
| 5 #include "chrome/renderer/translate/translate_helper.h" | |
| 6 | |
| 7 #include "base/strings/utf_string_conversions.h" | |
| 8 #include "chrome/common/chrome_constants.h" | |
| 9 #include "testing/gtest/include/gtest/gtest.h" | |
| 10 | |
| 11 typedef testing::Test TranslateHelperTest; | |
| 12 | |
| 13 // Tests that CorrectLanguageCodeTypo() fixes well-known typos in place. | |
| 14 TEST_F(TranslateHelperTest, LanguageCodeTypoCorrection) { | |
| 15 std::string language; | |
| 16 | |
| 17 // Keep only the first code of a comma-separated list. | |
| 18 language = std::string("ja,en"); | |
| 19 TranslateHelper::CorrectLanguageCodeTypo(&language); | |
| 20 EXPECT_EQ("ja", language); | |
| 21 | |
| 22 // Replace an underscore separator with a hyphen. | |
| 23 language = std::string("ja_JP"); | |
| 24 TranslateHelper::CorrectLanguageCodeTypo(&language); | |
| 25 EXPECT_EQ("ja-JP", language); | |
| 26 | |
| 27 // Fix letter case: lower-case main code, upper-case sub code. | |
| 28 language = std::string("JA-jp"); | |
| 29 TranslateHelper::CorrectLanguageCodeTypo(&language); | |
| 30 EXPECT_EQ("ja-JP", language); | |
| 31 } | |
| 32 | |
| 33 // Tests that IsValidLanguageCode() accepts well-formed codes and rejects malformed ones. | |
| 34 TEST_F(TranslateHelperTest, IsValidLanguageCode) { | |
| 35 std::string language; | |
| 36 | |
| 37 language = std::string("ja"); | |
| 38 EXPECT_TRUE(TranslateHelper::IsValidLanguageCode(language)); | |
| 39 | |
| 40 language = std::string("ja-JP"); | |
| 41 EXPECT_TRUE(TranslateHelper::IsValidLanguageCode(language)); | |
| 42 | |
| 43 language = std::string("ceb"); | |
| 44 EXPECT_TRUE(TranslateHelper::IsValidLanguageCode(language)); | |
| 45 | |
| 46 language = std::string("ceb-XX"); | |
| 47 EXPECT_TRUE(TranslateHelper::IsValidLanguageCode(language)); | |
| 48 | |
| 49 // Invalid because the sub code is a digit rather than letters. | |
| 50 language = std::string("utf-8"); | |
| 51 EXPECT_FALSE(TranslateHelper::IsValidLanguageCode(language)); | |
| 52 | |
| 53 // Invalid because the sub code after the hyphen is six characters long. | |
| 54 language = std::string("ja-YUKARI"); | |
| 55 EXPECT_FALSE(TranslateHelper::IsValidLanguageCode(language)); | |
| 56 | |
| 57 // Invalid because the main code is four characters long. | |
| 58 language = std::string("DHMO"); | |
| 59 EXPECT_FALSE(TranslateHelper::IsValidLanguageCode(language)); | |
| 60 } | |
| 61 | |
| 62 // Tests that IsSameOrSimilarLanguages() matches identical codes and similar pairs (bs/hr, sr-ME/sr, ne/hi) only. | |
| 63 TEST_F(TranslateHelperTest, SimilarLanguageCode) { | |
| 64 EXPECT_TRUE(TranslateHelper::IsSameOrSimilarLanguages("en", "en")); | |
| 65 EXPECT_FALSE(TranslateHelper::IsSameOrSimilarLanguages("en", "ja")); | |
| 66 EXPECT_TRUE(TranslateHelper::IsSameOrSimilarLanguages("bs", "hr")); | |
| 67 EXPECT_TRUE(TranslateHelper::IsSameOrSimilarLanguages("sr-ME", "sr")); | |
| 68 EXPECT_TRUE(TranslateHelper::IsSameOrSimilarLanguages("ne", "hi")); | |
| 69 EXPECT_FALSE(TranslateHelper::IsSameOrSimilarLanguages("bs", "hi")); | |
| 70 } | |
| 71 | |
| 72 // Tests that well-known language pairs which often result from a wrong server | |
| 73 // configuration are handled; the check is order-sensitive ("en","ja" vs. "ja","en"). | |
| 74 TEST_F(TranslateHelperTest, WellKnownWrongConfiguration) { | |
| 75 EXPECT_TRUE(TranslateHelper::MaybeServerWrongConfiguration("en", "ja")); | |
| 76 EXPECT_TRUE(TranslateHelper::MaybeServerWrongConfiguration("en-US", "ja")); | |
| 77 EXPECT_TRUE(TranslateHelper::MaybeServerWrongConfiguration("en", "zh-CN")); | |
| 78 EXPECT_FALSE(TranslateHelper::MaybeServerWrongConfiguration("ja", "en")); | |
| 79 EXPECT_FALSE(TranslateHelper::MaybeServerWrongConfiguration("en", "he")); | |
| 80 } | |
| 81 | |
| 82 // Tests that a meta tag language ("ja") contradicted by CLD ("en") is ignored: | |
| 83 // DeterminePageLanguage() returns kUnknownLanguageCode while still reporting CLD's result. | |
| 84 TEST_F(TranslateHelperTest, CLDDisagreeWithWrongLanguageCode) { | |
| 85 string16 contents = ASCIIToUTF16( | |
| 86 "<html><head><meta http-equiv='Content-Language' content='ja'></head>" | |
| 87 "<body>This is a page apparently written in English. Even though " | |
| 88 "content-language is provided, the value will be ignored if the value " | |
| 89 "is suspicious.</body></html>"); | |
| 90 std::string cld_language; | |
| 91 bool is_cld_reliable; | |
| 92 std::string language = | |
| 93 TranslateHelper::DeterminePageLanguage(std::string("ja"), std::string(), | |
| 94 contents, &cld_language, | |
| 95 &is_cld_reliable); | |
| 96 EXPECT_EQ(chrome::kUnknownLanguageCode, language); | |
| 97 EXPECT_EQ("en", cld_language); | |
| 98 EXPECT_TRUE(is_cld_reliable); | |
| 99 } | |
| 100 | |
| 101 // Tests that a meta tag language with a country code ("en-US") is kept as the | |
| 102 // page language when CLD detects the matching base language ("en"). | |
| 103 TEST_F(TranslateHelperTest, CLDAgreeWithLanguageCodeHavingCountryCode) { | |
| 104 string16 contents = ASCIIToUTF16( | |
| 105 "<html><head><meta http-equiv='Content-Language' content='en-US'></head>" | |
| 106 "<body>This is a page apparently written in English. Even though " | |
| 107 "content-language is provided, the value will be ignored if the value " | |
| 108 "is suspicious.</body></html>"); | |
| 109 std::string cld_language; | |
| 110 bool is_cld_reliable; | |
| 111 std::string language = | |
| 112 TranslateHelper::DeterminePageLanguage(std::string("en-US"), | |
| 113 std::string(), contents, | |
| 114 &cld_language, &is_cld_reliable); | |
| 115 EXPECT_EQ("en-US", language); | |
| 116 EXPECT_EQ("en", cld_language); | |
| 117 EXPECT_TRUE(is_cld_reliable); | |
| 118 } | |
| 119 | |
| 120 // Tests that an invalid meta tag language ("utf-8") is ignored and that the | |
| 121 // language detected by CLD ("en") is adopted as the page language instead. | |
| 122 TEST_F(TranslateHelperTest, InvalidLanguageMetaTagProviding) { | |
| 123 string16 contents = ASCIIToUTF16( | |
| 124 "<html><head><meta http-equiv='Content-Language' content='utf-8'></head>" | |
| 125 "<body>This is a page apparently written in English. Even though " | |
| 126 "content-language is provided, the value will be ignored and CLD's" | |
| 127 " language will be adopted if the value is invalid.</body></html>"); | |
| 128 std::string cld_language; | |
| 129 bool is_cld_reliable; | |
| 130 std::string language = | |
| 131 TranslateHelper::DeterminePageLanguage(std::string("utf-8"), | |
| 132 std::string(), contents, | |
| 133 &cld_language, &is_cld_reliable); | |
| 134 EXPECT_EQ("en", language); | |
| 135 EXPECT_EQ("en", cld_language); | |
| 136 EXPECT_TRUE(is_cld_reliable); | |
| 137 } | |
| 138 | |
| 139 // Tests that a conflicting meta tag language ("ja") is ignored when a valid | |
| 140 // html lang attribute ("en") is supplied; the html lang value is returned. | |
| 141 TEST_F(TranslateHelperTest, AdoptHtmlLang) { | |
| 142 string16 contents = ASCIIToUTF16( | |
| 143 "<html lang='en'><head><meta http-equiv='Content-Language' content='ja'>" | |
| 144 "</head><body>This is a page apparently written in English. Even though " | |
| 145 "content-language is provided, the value will be ignored if the value " | |
| 146 "is suspicious.</body></html>"); | |
| 147 std::string cld_language; | |
| 148 bool is_cld_reliable; | |
| 149 std::string language = | |
| 150 TranslateHelper::DeterminePageLanguage(std::string("ja"), | |
| 151 std::string("en"), | |
| 152 contents, &cld_language, | |
| 153 &is_cld_reliable); | |
| 154 EXPECT_EQ("en", language); | |
| 155 EXPECT_EQ("en", cld_language); | |
| 156 EXPECT_TRUE(is_cld_reliable); | |
| 157 } | |
| OLD | NEW |