OLD | NEW |
(Empty) | |
| 1 // Copyright (c) 2013 The Chromium Authors. All rights reserved. |
| 2 // Use of this source code is governed by a BSD-style license that can be |
| 3 // found in the LICENSE file. |
| 4 #include "chrome/browser/history/top_sites_cache.h" |
| 5 |
| 6 #include <set> |
| 7 |
| 8 #include "base/basictypes.h" |
| 9 #include "base/logging.h" |
| 10 #include "base/scoped_ptr.h" |
| 11 #include "base/strings/string16.h" |
| 12 #include "base/strings/string_number_conversions.h" |
| 13 #include "testing/gtest/include/gtest/gtest.h" |
| 14 |
| 15 namespace history { |
| 16 |
| 17 namespace { |
| 18 |
| 19 class TopSitesCacheTest : public testing::Test { |
| 20 protected: |
| 21 // Initializes |top_sites_| and |cache_| based on |spec|, which is a list of |
| 22 // URL strings with optional indents: indentated URLs redirect to the last |
| 23 // non-indented URL. Titles are assigned as "Title 1", "Title 2", etc., in the |
| 24 // order of appearance. See |kTopSitesSpecBasic| for an example. |
| 25 void InitTopSiteCache(char** spec, int size); |
| 26 |
| 27 MostVisitedURLList top_sites_; |
| 28 TopSitesCache cache_; |
| 29 }; |
| 30 |
| 31 void TopSitesCacheTest::InitTopSiteCache(char** spec, int size) { |
| 32 std::set<std::string> urls_seen; |
| 33 for (int i = 0; i < size; ++i) { |
| 34 char* spec_item = spec[i]; |
| 35 while (*spec_item && *spec_item == ' ') // Eat indent. |
| 36 ++spec_item; |
| 37 ASSERT_EQ(urls_seen.find(spec_item), urls_seen.end()) |
| 38 << "Duplicate URL found: " << spec_item; |
| 39 urls_seen.insert(spec_item); |
| 40 if (spec_item == spec[i]) { // No indent: add new MostVisitedURL. |
| 41 string16 title(L"Title " + base::Uint64ToString16(top_sites_.size() + 1)); |
| 42 top_sites_.push_back(MostVisitedURL(GURL(spec_item), title)); |
| 43 } |
| 44 ASSERT_TRUE(!top_sites_.empty()); |
| 45 // Set up redirect to canonical URL. Canonical URL redirects to itself, too. |
| 46 top_sites_.back().redirects.push_back(GURL(spec_item)); |
| 47 } |
| 48 cache_.SetTopSites(top_sites_); |
| 49 } |
| 50 |
| 51 TEST_F(TopSitesCacheTest, CanonicalURLComparator) { |
| 52 // Comprehensive test by comparing each pair in sorted list. O(n^2). |
| 53 const char* sorted_list[] = { |
| 54 "http://www.gogle.com/redirects_to_google", |
| 55 "http://www.google.com", |
| 56 "http://www.google.com/", |
| 57 "http://www.google.com/?q", |
| 58 "http://www.google.com/A", |
| 59 "http://www.google.com/index.html", |
| 60 "http://www.google.com/test", |
| 61 "http://www.google.com/test?q=3", |
| 62 "http://www.google.com/test?r=3", |
| 63 "http://www.google.com/test/zzzzz", |
| 64 "http://www.google.com/test-case", |
| 65 "http://www.google.com:80/", |
| 66 "https://www.google.com", |
| 67 }; |
| 68 for (int i = 0; i < arraysize(sorted_list); ++i) { |
| 69 EXPECT_FALSE( |
| 70 CanonicalURLComparator::CompareString(sorted_list[i], sorted_list[i])) |
| 71 << " for \"" << sorted_list[i] << "\" < \"" << sorted_list[i] << "\""; |
| 72 // Every disjoint pair-wise comparison. |
| 73 for (int j = i + 1; j < arraysize(sorted_list); ++j) { |
| 74 EXPECT_TRUE( |
| 75 CanonicalURLComparator::CompareString(sorted_list[i], sorted_list[j])) |
| 76 << " for \"" << sorted_list[i] << "\" < \"" << sorted_list[j] << "\""; |
| 77 EXPECT_FALSE( |
| 78 CanonicalURLComparator::CompareString(sorted_list[j], sorted_list[i])) |
| 79 << " for \"" << sorted_list[j] << "\" < \"" << sorted_list[i] << "\""; |
| 80 } |
| 81 } |
| 82 } |
| 83 |
| 84 char* kTopSitesSpecBasic[] = { |
| 85 "http://www.google.com", |
| 86 " http://www.gogle.com", |
| 87 " http://www.gooogle.com", |
| 88 "http://www.youtube.com/a/b", |
| 89 " http://www.youtube.com/a/b?test=1", |
| 90 "https://www.google.com", |
| 91 " https://www.gogle.com", |
| 92 "http://www.example.com:3141", |
| 93 }; |
| 94 |
| 95 TEST_F(TopSitesCacheTest, GetCanonicalURL) { |
| 96 InitTopSiteCache(kTopSitesSpecBasic, arraysize(kTopSitesSpecBasic)); |
| 97 // Already is canonical: redirects. |
| 98 EXPECT_EQ(GURL("http://www.google.com"), |
| 99 cache_.GetCanonicalURL(GURL("http://www.google.com"))); |
| 100 // Exact match with stored URL: redirects. |
| 101 EXPECT_EQ(GURL("http://www.google.com"), |
| 102 cache_.GetCanonicalURL(GURL("http://www.gooogle.com"))); |
| 103 // Recognizes despite trailing "/". |
| 104 EXPECT_EQ(GURL("http://www.google.com"), |
| 105 cache_.GetCanonicalURL(GURL("http://www.gooogle.com/"))); |
| 106 // Exact match with URL with query: redirects. |
| 107 EXPECT_EQ(GURL("http://www.youtube.com/a/b"), |
| 108 cache_.GetCanonicalURL(GURL("http://www.youtube.com/a/b?test=1"))); |
| 109 // No match with URL with query: as-is. |
| 110 EXPECT_EQ(GURL("http://www.youtube.com/a/b?test"), |
| 111 cache_.GetCanonicalURL(GURL("http://www.youtube.com/a/b?test"))); |
| 112 // Never-seen-before URL: as-is. |
| 113 EXPECT_EQ(GURL("http://maps.google.com/"), |
| 114 cache_.GetCanonicalURL(GURL("http://maps.google.com/"))); |
| 115 // Changing port number, does not match: as-is. |
| 116 EXPECT_EQ(GURL("http://www.example.com:80"), |
| 117 cache_.GetCanonicalURL(GURL("http://www.example.com:80"))); |
| 118 } |
| 119 |
| 120 TEST_F(TopSitesCacheTest, IsKnownUrl) { |
| 121 InitTopSiteCache(kTopSitesSpecBasic, arraysize(kTopSitesSpecBasic)); |
| 122 // Matches. |
| 123 EXPECT_TRUE(cache_.IsKnownURL(GURL("http://www.google.com"))); |
| 124 EXPECT_TRUE(cache_.IsKnownURL(GURL("http://www.gooogle.com"))); |
| 125 EXPECT_TRUE(cache_.IsKnownURL(GURL("http://www.google.com/"))); |
| 126 |
| 127 // Non-matches. |
| 128 EXPECT_FALSE(cache_.IsKnownURL(GURL("http://www.google.com?"))); |
| 129 EXPECT_FALSE(cache_.IsKnownURL(GURL("http://www.google.net"))); |
| 130 EXPECT_FALSE(cache_.IsKnownURL(GURL("http://www.google.com/stuff"))); |
| 131 EXPECT_FALSE(cache_.IsKnownURL(GURL("https://www.gooogle.com"))); |
| 132 } |
| 133 |
| 134 char* kTopSitesSpecPrefix[] = { |
| 135 "http://www.g.com", |
| 136 " http://www.g.com/test?q=3", |
| 137 " http://www.g.com/test/y?b", |
| 138 "http://www.g.com/2", |
| 139 " http://www.g.com/test/q", |
| 140 " http://www.g.com/test/y?a", |
| 141 "http://www.g.com/3", |
| 142 " http://www.g.com/testing", |
| 143 "http://www.g.com/test-hyphen", |
| 144 }; |
| 145 |
| 146 TEST_F(TopSitesCacheTest, GetCanonicalURLForPrefix) { |
| 147 InitTopSiteCache(kTopSitesSpecPrefix, arraysize(kTopSitesSpecPrefix)); |
| 148 // Already is canonical: redirects. |
| 149 EXPECT_EQ(GURL("http://www.g.com"), |
| 150 cache_.GetCanonicalURLForPrefix(GURL("http://www.g.com"))); |
| 151 // Exact match with stored URL: redirects. |
| 152 EXPECT_EQ(GURL("http://www.g.com"), |
| 153 cache_.GetCanonicalURLForPrefix(GURL("http://www.g.com/test?q=3"))); |
| 154 // Prefix match: redirects. |
| 155 EXPECT_EQ(GURL("http://www.g.com"), |
| 156 cache_.GetCanonicalURLForPrefix(GURL("http://www.g.com/test"))); |
| 157 // Competing prefix match: redirects to closest. |
| 158 EXPECT_EQ(GURL("http://www.g.com/2"), |
| 159 cache_.GetCanonicalURLForPrefix(GURL("http://www.g.com/test/q"))); |
| 160 // Multiple prefix matches: redirects to first. |
| 161 EXPECT_EQ(GURL("http://www.g.com/2"), |
| 162 cache_.GetCanonicalURLForPrefix(GURL("http://www.g.com/test/y"))); |
| 163 // No prefix match: as-is |
| 164 EXPECT_EQ(GURL("http://www.g.com/no-match"), |
| 165 cache_.GetCanonicalURLForPrefix(GURL("http://www.g.com/no-match"))); |
| 166 // String prefix match but not URL-prefix match: as-is. |
| 167 EXPECT_EQ(GURL("http://www.g.com/t"), |
| 168 cache_.GetCanonicalURLForPrefix(GURL("http://www.g.com/t"))); |
| 169 // Different protocol: as-is. |
| 170 EXPECT_EQ(GURL("https://www.g.com/test"), |
| 171 cache_.GetCanonicalURLForPrefix(GURL("https://www.g.com/test"))); |
| 172 } |
| 173 |
| 174 TEST_F(TopSitesCacheTest, UrlStringIsPrefix) { |
| 175 struct { |
| 176 const char* s1; |
| 177 const char* s2; |
| 178 } true_cases[] = { |
| 179 {"http://www.google.com", "http://www.google.com"}, |
| 180 {"http://www.google.com/a/b", "http://www.google.com/a/b"}, |
| 181 {"http://www.google.com?test=3", "http://www.google.com/"}, |
| 182 {"http://www.google.com/", "http://www.google.com/test/with/dir/"}, |
| 183 {"http://www.google.com:360", "http://www.google.com:360/?q=1234"}, |
| 184 {"http://www.google.com:80", "http://www.google.com/gurl/is/smart"}, |
| 185 {"http://www.google.com/test", "http://www.google.com/test/with/dir/"}, |
| 186 {"http://www.google.com/test/", "http://www.google.com/test/with/dir"}, |
| 187 {"http://www.google.com/test?", "http://www.google.com/test/with/dir/"}, |
| 188 }; |
| 189 for (int i = 0; i < arraysize(true_cases); ++i) { |
| 190 EXPECT_TRUE(TopSitesCache::UrlIsPrefix(GURL(true_cases[i].s1), |
| 191 GURL(true_cases[i].s2))) |
| 192 << " for true_cases[" << i << "]"; |
| 193 } |
| 194 struct { |
| 195 const char* s1; |
| 196 const char* s2; |
| 197 } false_cases[] = { |
| 198 {"http://www.google.com/test", "http://www.google.com"}, |
| 199 {"http://www.google.com/a/b/", "http://www.google.com/a/b"}, // Arguable. |
| 200 {"http://www.google.co", "http://www.google.com"}, |
| 201 {"http://google.com", "http://www.google.com"}, |
| 202 {"http://www.google.com", "https://www.google.com"}, |
| 203 {"http://www.google.com/path", "http://www.google.com:137/path"}, |
| 204 {"http://www.google.com/same/dir", "http://www.youtube.com/same/dir"}, |
| 205 {"http://www.google.com/te", "http://www.google.com/test"}, |
| 206 {"http://www.google.com/test", "http://www.google.com/test-bed"}, |
| 207 {"http://www.google.com/test-", "http://www.google.com/test?"}, |
| 208 }; |
| 209 for (int i = 0; i < arraysize(false_cases); ++i) { |
| 210 EXPECT_FALSE(TopSitesCache::UrlIsPrefix(GURL(false_cases[i].s1), |
| 211 GURL(false_cases[i].s2))) |
| 212 << " for false_cases[" << i << "]"; |
| 213 } |
| 214 } |
| 215 |
| 216 } // namespace |
| 217 |
| 218 } // namespace history |
OLD | NEW |