OLD | NEW |
| (Empty) |
1 // Copyright (c) 2013 The Chromium Authors. All rights reserved. | |
2 // Use of this source code is governed by a BSD-style license that can be | |
3 // found in the LICENSE file. | |
4 | |
5 #include "chrome/renderer/translate/translate_helper.h" | |
6 | |
7 #include "base/strings/utf_string_conversions.h" | |
8 #include "chrome/common/chrome_constants.h" | |
9 #include "testing/gtest/include/gtest/gtest.h" | |
10 | |
11 typedef testing::Test TranslateHelperTest; | |
12 | |
13 // Tests that well-known language code typos are fixed. | |
14 TEST_F(TranslateHelperTest, LanguageCodeTypoCorrection) { | |
15 std::string language; | |
16 | |
17 // Strip the second and later codes. | |
18 language = std::string("ja,en"); | |
19 TranslateHelper::CorrectLanguageCodeTypo(&language); | |
20 EXPECT_EQ("ja", language); | |
21 | |
22 // Replace dash with hyphen. | |
23 language = std::string("ja_JP"); | |
24 TranslateHelper::CorrectLanguageCodeTypo(&language); | |
25 EXPECT_EQ("ja-JP", language); | |
26 | |
27 // Correct wrong cases. | |
28 language = std::string("JA-jp"); | |
29 TranslateHelper::CorrectLanguageCodeTypo(&language); | |
30 EXPECT_EQ("ja-JP", language); | |
31 } | |
32 | |
33 // Tests if the language codes' format is invalid. | |
34 TEST_F(TranslateHelperTest, IsValidLanguageCode) { | |
35 std::string language; | |
36 | |
37 language = std::string("ja"); | |
38 EXPECT_TRUE(TranslateHelper::IsValidLanguageCode(language)); | |
39 | |
40 language = std::string("ja-JP"); | |
41 EXPECT_TRUE(TranslateHelper::IsValidLanguageCode(language)); | |
42 | |
43 language = std::string("ceb"); | |
44 EXPECT_TRUE(TranslateHelper::IsValidLanguageCode(language)); | |
45 | |
46 language = std::string("ceb-XX"); | |
47 EXPECT_TRUE(TranslateHelper::IsValidLanguageCode(language)); | |
48 | |
49 // Invalid because the sub code consists of a number. | |
50 language = std::string("utf-8"); | |
51 EXPECT_FALSE(TranslateHelper::IsValidLanguageCode(language)); | |
52 | |
53 // Invalid because of six characters after hyphen. | |
54 language = std::string("ja-YUKARI"); | |
55 EXPECT_FALSE(TranslateHelper::IsValidLanguageCode(language)); | |
56 | |
57 // Invalid because of four characters. | |
58 language = std::string("DHMO"); | |
59 EXPECT_FALSE(TranslateHelper::IsValidLanguageCode(language)); | |
60 } | |
61 | |
62 // Tests that similar language table works. | |
63 TEST_F(TranslateHelperTest, SimilarLanguageCode) { | |
64 EXPECT_TRUE(TranslateHelper::IsSameOrSimilarLanguages("en", "en")); | |
65 EXPECT_FALSE(TranslateHelper::IsSameOrSimilarLanguages("en", "ja")); | |
66 EXPECT_TRUE(TranslateHelper::IsSameOrSimilarLanguages("bs", "hr")); | |
67 EXPECT_TRUE(TranslateHelper::IsSameOrSimilarLanguages("sr-ME", "sr")); | |
68 EXPECT_TRUE(TranslateHelper::IsSameOrSimilarLanguages("ne", "hi")); | |
69 EXPECT_FALSE(TranslateHelper::IsSameOrSimilarLanguages("bs", "hi")); | |
70 } | |
71 | |
72 // Tests that well-known languages which often have wrong server configuration | |
73 // are handles. | |
74 TEST_F(TranslateHelperTest, WellKnownWrongConfiguration) { | |
75 EXPECT_TRUE(TranslateHelper::MaybeServerWrongConfiguration("en", "ja")); | |
76 EXPECT_TRUE(TranslateHelper::MaybeServerWrongConfiguration("en-US", "ja")); | |
77 EXPECT_TRUE(TranslateHelper::MaybeServerWrongConfiguration("en", "zh-CN")); | |
78 EXPECT_FALSE(TranslateHelper::MaybeServerWrongConfiguration("ja", "en")); | |
79 EXPECT_FALSE(TranslateHelper::MaybeServerWrongConfiguration("en", "he")); | |
80 } | |
81 | |
82 // Tests that the language meta tag providing wrong information is ignored by | |
83 // TranslateHelper due to disagreement between meta tag and CLD. | |
84 TEST_F(TranslateHelperTest, CLDDisagreeWithWrongLanguageCode) { | |
85 string16 contents = ASCIIToUTF16( | |
86 "<html><head><meta http-equiv='Content-Language' content='ja'></head>" | |
87 "<body>This is a page apparently written in English. Even though " | |
88 "content-language is provided, the value will be ignored if the value " | |
89 "is suspicious.</body></html>"); | |
90 std::string cld_language; | |
91 bool is_cld_reliable; | |
92 std::string language = | |
93 TranslateHelper::DeterminePageLanguage(std::string("ja"), std::string(), | |
94 contents, &cld_language, | |
95 &is_cld_reliable); | |
96 EXPECT_EQ(chrome::kUnknownLanguageCode, language); | |
97 EXPECT_EQ("en", cld_language); | |
98 EXPECT_TRUE(is_cld_reliable); | |
99 } | |
100 | |
101 // Tests that the language meta tag providing "en-US" style information is | |
102 // agreed by CLD. | |
103 TEST_F(TranslateHelperTest, CLDAgreeWithLanguageCodeHavingCountryCode) { | |
104 string16 contents = ASCIIToUTF16( | |
105 "<html><head><meta http-equiv='Content-Language' content='en-US'></head>" | |
106 "<body>This is a page apparently written in English. Even though " | |
107 "content-language is provided, the value will be ignored if the value " | |
108 "is suspicious.</body></html>"); | |
109 std::string cld_language; | |
110 bool is_cld_reliable; | |
111 std::string language = | |
112 TranslateHelper::DeterminePageLanguage(std::string("en-US"), | |
113 std::string(), contents, | |
114 &cld_language, &is_cld_reliable); | |
115 EXPECT_EQ("en-US", language); | |
116 EXPECT_EQ("en", cld_language); | |
117 EXPECT_TRUE(is_cld_reliable); | |
118 } | |
119 | |
120 // Tests that the language meta tag providing wrong information is ignored and | |
121 // CLD's language will be adopted by TranslateHelper due to an invalid meta tag. | |
122 TEST_F(TranslateHelperTest, InvalidLanguageMetaTagProviding) { | |
123 string16 contents = ASCIIToUTF16( | |
124 "<html><head><meta http-equiv='Content-Language' content='utf-8'></head>" | |
125 "<body>This is a page apparently written in English. Even though " | |
126 "content-language is provided, the value will be ignored and CLD's" | |
127 " language will be adopted if the value is invalid.</body></html>"); | |
128 std::string cld_language; | |
129 bool is_cld_reliable; | |
130 std::string language = | |
131 TranslateHelper::DeterminePageLanguage(std::string("utf-8"), | |
132 std::string(), contents, | |
133 &cld_language, &is_cld_reliable); | |
134 EXPECT_EQ("en", language); | |
135 EXPECT_EQ("en", cld_language); | |
136 EXPECT_TRUE(is_cld_reliable); | |
137 } | |
138 | |
139 // Tests that the language meta tag providing wrong information is ignored | |
140 // because of valid html lang attribute. | |
141 TEST_F(TranslateHelperTest, AdoptHtmlLang) { | |
142 string16 contents = ASCIIToUTF16( | |
143 "<html lang='en'><head><meta http-equiv='Content-Language' content='ja'>" | |
144 "</head><body>This is a page apparently written in English. Even though " | |
145 "content-language is provided, the value will be ignored if the value " | |
146 "is suspicious.</body></html>"); | |
147 std::string cld_language; | |
148 bool is_cld_reliable; | |
149 std::string language = | |
150 TranslateHelper::DeterminePageLanguage(std::string("ja"), | |
151 std::string("en"), | |
152 contents, &cld_language, | |
153 &is_cld_reliable); | |
154 EXPECT_EQ("en", language); | |
155 EXPECT_EQ("en", cld_language); | |
156 EXPECT_TRUE(is_cld_reliable); | |
157 } | |
OLD | NEW |