OLD | NEW |
1 // Copyright (c) 2012 The Chromium Authors. All rights reserved. | 1 // Copyright (c) 2012 The Chromium Authors. All rights reserved. |
2 // Use of this source code is governed by a BSD-style license that can be | 2 // Use of this source code is governed by a BSD-style license that can be |
3 // found in the LICENSE file. | 3 // found in the LICENSE file. |
4 | 4 |
5 #include "base/strings/utf_string_conversions.h" | |
6 #include "net/base/registry_controlled_domains/registry_controlled_domain.h" | 5 #include "net/base/registry_controlled_domains/registry_controlled_domain.h" |
7 #include "testing/gtest/include/gtest/gtest.h" | 6 #include "testing/gtest/include/gtest/gtest.h" |
8 #include "url/gurl.h" | 7 #include "url/gurl.h" |
9 #include "url/origin.h" | 8 #include "url/origin.h" |
10 #include "url/url_features.h" | |
11 | 9 |
12 namespace { | 10 namespace { |
13 | |
14 namespace test1 { | 11 namespace test1 { |
15 #include "net/base/registry_controlled_domains/effective_tld_names_unittest1-inc
.cc" | 12 #include "net/base/registry_controlled_domains/effective_tld_names_unittest1-inc
.cc" |
16 } | 13 } |
17 namespace test2 { | 14 namespace test2 { |
18 #include "net/base/registry_controlled_domains/effective_tld_names_unittest2-inc
.cc" | 15 #include "net/base/registry_controlled_domains/effective_tld_names_unittest2-inc
.cc" |
19 } | 16 } |
20 namespace test3 { | 17 namespace test3 { |
21 #include "net/base/registry_controlled_domains/effective_tld_names_unittest3-inc
.cc" | 18 #include "net/base/registry_controlled_domains/effective_tld_names_unittest3-inc
.cc" |
22 } | 19 } |
23 namespace test4 { | 20 namespace test4 { |
24 #include "net/base/registry_controlled_domains/effective_tld_names_unittest4-inc
.cc" | 21 #include "net/base/registry_controlled_domains/effective_tld_names_unittest4-inc
.cc" |
25 } | 22 } |
26 namespace test5 { | 23 namespace test5 { |
27 #include "net/base/registry_controlled_domains/effective_tld_names_unittest5-inc
.cc" | 24 #include "net/base/registry_controlled_domains/effective_tld_names_unittest5-inc
.cc" |
28 } | 25 } |
29 namespace test6 { | 26 namespace test6 { |
30 #include "net/base/registry_controlled_domains/effective_tld_names_unittest6-inc
.cc" | 27 #include "net/base/registry_controlled_domains/effective_tld_names_unittest6-inc
.cc" |
31 } | 28 } |
32 | |
33 } // namespace | 29 } // namespace |
34 | 30 |
35 namespace net { | 31 namespace net { |
36 namespace registry_controlled_domains { | 32 namespace registry_controlled_domains { |
37 | |
38 namespace { | 33 namespace { |
39 | 34 |
40 std::string GetDomainFromURL(const std::string& url) { | 35 std::string GetDomainFromURL(const std::string& url) { |
41 return GetDomainAndRegistry(GURL(url), EXCLUDE_PRIVATE_REGISTRIES); | 36 return GetDomainAndRegistry(GURL(url), EXCLUDE_PRIVATE_REGISTRIES); |
42 } | 37 } |
43 | 38 |
44 std::string GetDomainFromHost(const std::string& host) { | 39 std::string GetDomainFromHost(const std::string& host) { |
45 return GetDomainAndRegistry(host, EXCLUDE_PRIVATE_REGISTRIES); | 40 return GetDomainAndRegistry(host, EXCLUDE_PRIVATE_REGISTRIES); |
46 } | 41 } |
47 | 42 |
48 size_t GetRegistryLengthFromURL( | 43 size_t GetRegistryLengthFromURL( |
49 const std::string& url, | 44 const std::string& url, |
50 UnknownRegistryFilter unknown_filter) { | 45 UnknownRegistryFilter unknown_filter) { |
51 return GetRegistryLength(GURL(url), | 46 return GetRegistryLength(GURL(url), |
52 unknown_filter, | 47 unknown_filter, |
53 EXCLUDE_PRIVATE_REGISTRIES); | 48 EXCLUDE_PRIVATE_REGISTRIES); |
54 } | 49 } |
55 | 50 |
56 size_t GetRegistryLengthFromURLIncludingPrivate( | 51 size_t GetRegistryLengthFromURLIncludingPrivate( |
57 const std::string& url, | 52 const std::string& url, |
58 UnknownRegistryFilter unknown_filter) { | 53 UnknownRegistryFilter unknown_filter) { |
59 return GetRegistryLength(GURL(url), | 54 return GetRegistryLength(GURL(url), |
60 unknown_filter, | 55 unknown_filter, |
61 INCLUDE_PRIVATE_REGISTRIES); | 56 INCLUDE_PRIVATE_REGISTRIES); |
62 } | 57 } |
63 | 58 |
64 size_t PermissiveGetHostRegistryLength(base::StringPiece host) { | 59 size_t GetRegistryLengthFromHost( |
65 return PermissiveGetHostRegistryLength(host, EXCLUDE_UNKNOWN_REGISTRIES, | 60 const std::string& host, |
66 EXCLUDE_PRIVATE_REGISTRIES); | 61 UnknownRegistryFilter unknown_filter) { |
| 62 return GetRegistryLength(host, unknown_filter, EXCLUDE_PRIVATE_REGISTRIES); |
67 } | 63 } |
68 | 64 |
69 size_t PermissiveGetHostRegistryLength(base::StringPiece16 host) { | 65 size_t GetRegistryLengthFromHostIncludingPrivate( |
70 return PermissiveGetHostRegistryLength(host, EXCLUDE_UNKNOWN_REGISTRIES, | 66 const std::string& host, |
71 EXCLUDE_PRIVATE_REGISTRIES); | 67 UnknownRegistryFilter unknown_filter) { |
72 } | 68 return GetRegistryLength(host, unknown_filter, INCLUDE_PRIVATE_REGISTRIES); |
73 | |
74 size_t GetCanonicalHostRegistryLength(const std::string& host, | |
75 UnknownRegistryFilter unknown_filter) { | |
76 return GetCanonicalHostRegistryLength(host, unknown_filter, | |
77 EXCLUDE_PRIVATE_REGISTRIES); | |
78 } | |
79 | |
80 size_t GetCanonicalHostRegistryLengthIncludingPrivate(const std::string& host) { | |
81 return GetCanonicalHostRegistryLength(host, EXCLUDE_UNKNOWN_REGISTRIES, | |
82 INCLUDE_PRIVATE_REGISTRIES); | |
83 } | 69 } |
84 | 70 |
85 } // namespace | 71 } // namespace |
86 | 72 |
87 class RegistryControlledDomainTest : public testing::Test { | 73 class RegistryControlledDomainTest : public testing::Test { |
88 protected: | 74 protected: |
89 template <typename Graph> | 75 template <typename Graph> |
90 void UseDomainData(const Graph& graph) { | 76 void UseDomainData(const Graph& graph) { |
91 SetFindDomainGraph(graph, sizeof(Graph)); | 77 SetFindDomainGraph(graph, sizeof(Graph)); |
92 } | 78 } |
(...skipping 130 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
223 EXPECT_EQ(0U, GetRegistryLengthFromURL("http://localhost.", | 209 EXPECT_EQ(0U, GetRegistryLengthFromURL("http://localhost.", |
224 EXCLUDE_UNKNOWN_REGISTRIES)); | 210 EXCLUDE_UNKNOWN_REGISTRIES)); |
225 EXPECT_EQ(0U, GetRegistryLengthFromURL("http://localhost.", | 211 EXPECT_EQ(0U, GetRegistryLengthFromURL("http://localhost.", |
226 INCLUDE_UNKNOWN_REGISTRIES)); | 212 INCLUDE_UNKNOWN_REGISTRIES)); |
227 EXPECT_EQ(0U, GetRegistryLengthFromURL("http:////Comment", | 213 EXPECT_EQ(0U, GetRegistryLengthFromURL("http:////Comment", |
228 EXCLUDE_UNKNOWN_REGISTRIES)); | 214 EXCLUDE_UNKNOWN_REGISTRIES)); |
229 | 215 |
230 // Test std::string version of GetRegistryLength(). Uses the same | 216 // Test std::string version of GetRegistryLength(). Uses the same |
231 // underpinnings as the GURL version, so this is really more of a check of | 217 // underpinnings as the GURL version, so this is really more of a check of |
232 // CanonicalizeHost(). | 218 // CanonicalizeHost(). |
233 EXPECT_EQ(2U, GetCanonicalHostRegistryLength( | 219 EXPECT_EQ(2U, GetRegistryLengthFromHost("a.baz.jp", |
234 "a.baz.jp", EXCLUDE_UNKNOWN_REGISTRIES)); // 1 | 220 EXCLUDE_UNKNOWN_REGISTRIES)); // 1 |
235 EXPECT_EQ(3U, GetCanonicalHostRegistryLength( | 221 EXPECT_EQ(3U, GetRegistryLengthFromHost("a.baz.jp.", |
236 "a.baz.jp.", EXCLUDE_UNKNOWN_REGISTRIES)); // 1 | 222 EXCLUDE_UNKNOWN_REGISTRIES)); // 1 |
237 EXPECT_EQ(0U, GetCanonicalHostRegistryLength( | 223 EXPECT_EQ(0U, GetRegistryLengthFromHost("ac.jp", |
238 "ac.jp", EXCLUDE_UNKNOWN_REGISTRIES)); // 2 | 224 EXCLUDE_UNKNOWN_REGISTRIES)); // 2 |
239 EXPECT_EQ(0U, GetCanonicalHostRegistryLength( | 225 EXPECT_EQ(0U, GetRegistryLengthFromHost("a.bar.jp", |
240 "a.bar.jp", EXCLUDE_UNKNOWN_REGISTRIES)); // 3 | 226 EXCLUDE_UNKNOWN_REGISTRIES)); // 3 |
241 EXPECT_EQ(0U, GetCanonicalHostRegistryLength( | 227 EXPECT_EQ(0U, GetRegistryLengthFromHost("bar.jp", |
242 "bar.jp", EXCLUDE_UNKNOWN_REGISTRIES)); // 3 | 228 EXCLUDE_UNKNOWN_REGISTRIES)); // 3 |
243 EXPECT_EQ(0U, GetCanonicalHostRegistryLength( | 229 EXPECT_EQ(0U, GetRegistryLengthFromHost("baz.bar.jp", |
244 "baz.bar.jp", EXCLUDE_UNKNOWN_REGISTRIES)); // 3 4 | 230 EXCLUDE_UNKNOWN_REGISTRIES)); // 3 4 |
245 EXPECT_EQ(12U, GetCanonicalHostRegistryLength( | 231 EXPECT_EQ(12U, GetRegistryLengthFromHost("a.b.baz.bar.jp", |
246 "a.b.baz.bar.jp", EXCLUDE_UNKNOWN_REGISTRIES)); // 4 | 232 EXCLUDE_UNKNOWN_REGISTRIES)); // 4 |
247 EXPECT_EQ(6U, GetCanonicalHostRegistryLength( | 233 EXPECT_EQ(6U, GetRegistryLengthFromHost("baz.pref.bar.jp", |
248 "baz.pref.bar.jp", EXCLUDE_UNKNOWN_REGISTRIES)); // 5 | 234 EXCLUDE_UNKNOWN_REGISTRIES)); // 5 |
249 EXPECT_EQ(11U, GetCanonicalHostRegistryLength( | 235 EXPECT_EQ(11U, GetRegistryLengthFromHost("a.b.bar.baz.com", |
250 "a.b.bar.baz.com", EXCLUDE_UNKNOWN_REGISTRIES)); // 6 | 236 EXCLUDE_UNKNOWN_REGISTRIES)); // 6 |
251 EXPECT_EQ(3U, GetCanonicalHostRegistryLength( | 237 EXPECT_EQ(3U, GetRegistryLengthFromHost("a.d.c", |
252 "a.d.c", EXCLUDE_UNKNOWN_REGISTRIES)); // 7 | 238 EXCLUDE_UNKNOWN_REGISTRIES)); // 7 |
253 EXPECT_EQ(3U, GetCanonicalHostRegistryLength( | 239 EXPECT_EQ(3U, GetRegistryLengthFromHost(".a.d.c", |
254 ".a.d.c", EXCLUDE_UNKNOWN_REGISTRIES)); // 7 | 240 EXCLUDE_UNKNOWN_REGISTRIES)); // 7 |
255 EXPECT_EQ(3U, GetCanonicalHostRegistryLength( | 241 EXPECT_EQ(3U, GetRegistryLengthFromHost("..a.d.c", |
256 "..a.d.c", EXCLUDE_UNKNOWN_REGISTRIES)); // 7 | 242 EXCLUDE_UNKNOWN_REGISTRIES)); // 7 |
257 EXPECT_EQ(1U, GetCanonicalHostRegistryLength( | 243 EXPECT_EQ(1U, GetRegistryLengthFromHost("a.b.c", |
258 "a.b.c", EXCLUDE_UNKNOWN_REGISTRIES)); // 7 8 | 244 EXCLUDE_UNKNOWN_REGISTRIES)); // 7 8 |
259 EXPECT_EQ(0U, GetCanonicalHostRegistryLength( | 245 EXPECT_EQ(0U, GetRegistryLengthFromHost("baz.com", |
260 "baz.com", EXCLUDE_UNKNOWN_REGISTRIES)); // none | 246 EXCLUDE_UNKNOWN_REGISTRIES)); // none |
261 EXPECT_EQ(0U, GetCanonicalHostRegistryLength( | 247 EXPECT_EQ(0U, GetRegistryLengthFromHost("baz.com.", |
262 "baz.com.", EXCLUDE_UNKNOWN_REGISTRIES)); // none | 248 EXCLUDE_UNKNOWN_REGISTRIES)); // none |
263 EXPECT_EQ(3U, GetCanonicalHostRegistryLength( | 249 EXPECT_EQ(3U, GetRegistryLengthFromHost("baz.com", |
264 "baz.com", INCLUDE_UNKNOWN_REGISTRIES)); // none | 250 INCLUDE_UNKNOWN_REGISTRIES)); // none |
265 EXPECT_EQ(4U, GetCanonicalHostRegistryLength( | 251 EXPECT_EQ(4U, GetRegistryLengthFromHost("baz.com.", |
266 "baz.com.", INCLUDE_UNKNOWN_REGISTRIES)); // none | 252 INCLUDE_UNKNOWN_REGISTRIES)); // none |
267 | 253 |
268 EXPECT_EQ(std::string::npos, GetCanonicalHostRegistryLength( | 254 EXPECT_EQ(std::string::npos, |
269 std::string(), EXCLUDE_UNKNOWN_REGISTRIES)); | 255 GetRegistryLengthFromHost(std::string(), EXCLUDE_UNKNOWN_REGISTRIES)); |
270 EXPECT_EQ(0U, GetCanonicalHostRegistryLength("foo.com..", | 256 EXPECT_EQ(0U, GetRegistryLengthFromHost("foo.com..", |
271 EXCLUDE_UNKNOWN_REGISTRIES)); | 257 EXCLUDE_UNKNOWN_REGISTRIES)); |
272 EXPECT_EQ(0U, | 258 EXPECT_EQ(0U, GetRegistryLengthFromHost("..", |
273 GetCanonicalHostRegistryLength("..", EXCLUDE_UNKNOWN_REGISTRIES)); | 259 EXCLUDE_UNKNOWN_REGISTRIES)); |
274 EXPECT_EQ(0U, GetCanonicalHostRegistryLength("192.168.0.1", | 260 EXPECT_EQ(0U, GetRegistryLengthFromHost("192.168.0.1", |
275 EXCLUDE_UNKNOWN_REGISTRIES)); | 261 EXCLUDE_UNKNOWN_REGISTRIES)); |
276 EXPECT_EQ(0U, GetCanonicalHostRegistryLength("localhost", | 262 EXPECT_EQ(0U, GetRegistryLengthFromHost("localhost", |
277 EXCLUDE_UNKNOWN_REGISTRIES)); | 263 EXCLUDE_UNKNOWN_REGISTRIES)); |
278 EXPECT_EQ(0U, GetCanonicalHostRegistryLength("localhost", | 264 EXPECT_EQ(0U, GetRegistryLengthFromHost("localhost", |
279 INCLUDE_UNKNOWN_REGISTRIES)); | 265 INCLUDE_UNKNOWN_REGISTRIES)); |
280 EXPECT_EQ(0U, GetCanonicalHostRegistryLength("localhost.", | 266 EXPECT_EQ(0U, GetRegistryLengthFromHost("localhost.", |
281 EXCLUDE_UNKNOWN_REGISTRIES)); | 267 EXCLUDE_UNKNOWN_REGISTRIES)); |
282 EXPECT_EQ(0U, GetCanonicalHostRegistryLength("localhost.", | 268 EXPECT_EQ(0U, GetRegistryLengthFromHost("localhost.", |
283 INCLUDE_UNKNOWN_REGISTRIES)); | 269 INCLUDE_UNKNOWN_REGISTRIES)); |
284 | |
285 // IDN case. | |
286 EXPECT_EQ(10U, GetCanonicalHostRegistryLength("foo.xn--fiqs8s", | |
287 EXCLUDE_UNKNOWN_REGISTRIES)); | |
288 } | |
289 | |
290 TEST_F(RegistryControlledDomainTest, HostHasRegistryControlledDomain) { | |
291 UseDomainData(test1::kDafsa); | |
292 | |
293 // Invalid hosts. | |
294 EXPECT_FALSE(HostHasRegistryControlledDomain( | |
295 std::string(), EXCLUDE_UNKNOWN_REGISTRIES, EXCLUDE_PRIVATE_REGISTRIES)); | |
296 EXPECT_FALSE(HostHasRegistryControlledDomain( | |
297 "%00asdf", EXCLUDE_UNKNOWN_REGISTRIES, EXCLUDE_PRIVATE_REGISTRIES)); | |
298 | |
299 // Invalid host but valid R.C.D. | |
300 EXPECT_TRUE(HostHasRegistryControlledDomain( | |
301 "%00foo.jp", EXCLUDE_UNKNOWN_REGISTRIES, EXCLUDE_PRIVATE_REGISTRIES)); | |
302 | |
303 // Valid R.C.D. when canonicalized, even with an invalid prefix and an | |
304 // escaped dot. | |
305 EXPECT_TRUE(HostHasRegistryControlledDomain("%00foo.Google%2EjP", | |
306 EXCLUDE_UNKNOWN_REGISTRIES, | |
307 EXCLUDE_PRIVATE_REGISTRIES)); | |
308 | |
309 // Regular, no match. | |
310 EXPECT_FALSE(HostHasRegistryControlledDomain( | |
311 "bar.notatld", EXCLUDE_UNKNOWN_REGISTRIES, EXCLUDE_PRIVATE_REGISTRIES)); | |
312 | |
313 // Regular, match. | |
314 EXPECT_TRUE(HostHasRegistryControlledDomain( | |
315 "www.Google.Jp", EXCLUDE_UNKNOWN_REGISTRIES, EXCLUDE_PRIVATE_REGISTRIES)); | |
316 } | 270 } |
317 | 271 |
318 TEST_F(RegistryControlledDomainTest, TestSameDomainOrHost) { | 272 TEST_F(RegistryControlledDomainTest, TestSameDomainOrHost) { |
319 UseDomainData(test2::kDafsa); | 273 UseDomainData(test2::kDafsa); |
320 | 274 |
321 EXPECT_TRUE(CompareDomains("http://a.b.bar.jp/file.html", | 275 EXPECT_TRUE(CompareDomains("http://a.b.bar.jp/file.html", |
322 "http://a.b.bar.jp/file.html")); // b.bar.jp | 276 "http://a.b.bar.jp/file.html")); // b.bar.jp |
323 EXPECT_TRUE(CompareDomains("http://a.b.bar.jp/file.html", | 277 EXPECT_TRUE(CompareDomains("http://a.b.bar.jp/file.html", |
324 "http://b.b.bar.jp/file.html")); // b.bar.jp | 278 "http://b.b.bar.jp/file.html")); // b.bar.jp |
325 EXPECT_FALSE(CompareDomains("http://a.foo.jp/file.html", // foo.jp | 279 EXPECT_FALSE(CompareDomains("http://a.foo.jp/file.html", // foo.jp |
(...skipping 101 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
427 const char key0[] = | 381 const char key0[] = |
428 "a.b.6____________________________________________________" | 382 "a.b.6____________________________________________________" |
429 "________________________________________________6"; | 383 "________________________________________________6"; |
430 const char key1[] = | 384 const char key1[] = |
431 "a.b.7____________________________________________________" | 385 "a.b.7____________________________________________________" |
432 "________________________________________________7"; | 386 "________________________________________________7"; |
433 const char key2[] = | 387 const char key2[] = |
434 "a.b.a____________________________________________________" | 388 "a.b.a____________________________________________________" |
435 "________________________________________________8"; | 389 "________________________________________________8"; |
436 | 390 |
| 391 EXPECT_EQ(102U, GetRegistryLengthFromHost(key0, EXCLUDE_UNKNOWN_REGISTRIES)); |
| 392 EXPECT_EQ(0U, GetRegistryLengthFromHost(key1, EXCLUDE_UNKNOWN_REGISTRIES)); |
437 EXPECT_EQ(102U, | 393 EXPECT_EQ(102U, |
438 GetCanonicalHostRegistryLength(key0, EXCLUDE_UNKNOWN_REGISTRIES)); | 394 GetRegistryLengthFromHostIncludingPrivate( |
439 EXPECT_EQ(0U, | 395 key1, EXCLUDE_UNKNOWN_REGISTRIES)); |
440 GetCanonicalHostRegistryLength(key1, EXCLUDE_UNKNOWN_REGISTRIES)); | 396 EXPECT_EQ(0U, GetRegistryLengthFromHost(key2, EXCLUDE_UNKNOWN_REGISTRIES)); |
441 EXPECT_EQ(102U, GetCanonicalHostRegistryLengthIncludingPrivate(key1)); | |
442 EXPECT_EQ(0U, | |
443 GetCanonicalHostRegistryLength(key2, EXCLUDE_UNKNOWN_REGISTRIES)); | |
444 } | 397 } |
445 | 398 |
446 TEST_F(RegistryControlledDomainTest, TestDafsaThreeByteOffsets) { | 399 TEST_F(RegistryControlledDomainTest, TestDafsaThreeByteOffsets) { |
447 UseDomainData(test4::kDafsa); | 400 UseDomainData(test4::kDafsa); |
448 | 401 |
449 // Testing to lookup keys in a DAFSA with three byte offsets. | 402 // Testing to lookup keys in a DAFSA with three byte offsets. |
450 // This DAFSA is constructed so that labels begin and end with unique | 403 // This DAFSA is constructed so that labels begin and end with unique |
451 // characters, which makes it impossible to merge labels. The byte array | 404 // characters, which makes it impossible to merge labels. The byte array |
452 // has a size of ~54k. A two byte offset can add at most add 8k to the | 405 // has a size of ~54k. A two byte offset can add at most add 8k to the |
453 // previous offset. Since we can skip only forward in memory, the nodes | 406 // previous offset. Since we can skip only forward in memory, the nodes |
454 // representing the return values must be located near the end of the byte | 407 // representing the return values must be located near the end of the byte |
455 // array. The probability that we can reach from an arbitrary inner node to | 408 // array. The probability that we can reach from an arbitrary inner node to |
456 // a return value without using a three byte offset is small (but not zero). | 409 // a return value without using a three byte offset is small (but not zero). |
457 // The test is repeated with some different keys and with a reasonable | 410 // The test is repeated with some different keys and with a reasonable |
458 // probability at least one of the tested paths has go over a three byte | 411 // probability at least one of the tested paths has go over a three byte |
459 // offset. | 412 // offset. |
460 | 413 |
461 const char key0[] = | 414 const char key0[] = |
462 "a.b.z6___________________________________________________" | 415 "a.b.Z6___________________________________________________" |
463 "_________________________________________________z6"; | 416 "_________________________________________________Z6"; |
464 const char key1[] = | 417 const char key1[] = |
465 "a.b.z7___________________________________________________" | 418 "a.b.Z7___________________________________________________" |
466 "_________________________________________________z7"; | 419 "_________________________________________________Z7"; |
467 const char key2[] = | 420 const char key2[] = |
468 "a.b.za___________________________________________________" | 421 "a.b.Za___________________________________________________" |
469 "_________________________________________________z8"; | 422 "_________________________________________________Z8"; |
470 | 423 |
| 424 EXPECT_EQ(104U, GetRegistryLengthFromHost(key0, EXCLUDE_UNKNOWN_REGISTRIES)); |
| 425 EXPECT_EQ(0U, GetRegistryLengthFromHost(key1, EXCLUDE_UNKNOWN_REGISTRIES)); |
471 EXPECT_EQ(104U, | 426 EXPECT_EQ(104U, |
472 GetCanonicalHostRegistryLength(key0, EXCLUDE_UNKNOWN_REGISTRIES)); | 427 GetRegistryLengthFromHostIncludingPrivate( |
473 EXPECT_EQ(0U, | 428 key1, EXCLUDE_UNKNOWN_REGISTRIES)); |
474 GetCanonicalHostRegistryLength(key1, EXCLUDE_UNKNOWN_REGISTRIES)); | 429 EXPECT_EQ(0U, GetRegistryLengthFromHost(key2, EXCLUDE_UNKNOWN_REGISTRIES)); |
475 EXPECT_EQ(104U, GetCanonicalHostRegistryLengthIncludingPrivate(key1)); | |
476 EXPECT_EQ(0U, | |
477 GetCanonicalHostRegistryLength(key2, EXCLUDE_UNKNOWN_REGISTRIES)); | |
478 } | 430 } |
479 | 431 |
480 TEST_F(RegistryControlledDomainTest, TestDafsaJoinedPrefixes) { | 432 TEST_F(RegistryControlledDomainTest, TestDafsaJoinedPrefixes) { |
481 UseDomainData(test5::kDafsa); | 433 UseDomainData(test5::kDafsa); |
482 | 434 |
483 // Testing to lookup keys in a DAFSA with compressed prefixes. | 435 // Testing to lookup keys in a DAFSA with compressed prefixes. |
484 // This DAFSA is constructed from words with similar prefixes but distinct | 436 // This DAFSA is constructed from words with similar prefixes but distinct |
485 // suffixes. The DAFSA will then form a trie with the implicit source node | 437 // suffixes. The DAFSA will then form a trie with the implicit source node |
486 // as root. | 438 // as root. |
487 | 439 |
488 const char key0[] = "a.b.ai"; | 440 const char key0[] = "a.b.ai"; |
489 const char key1[] = "a.b.bj"; | 441 const char key1[] = "a.b.bj"; |
490 const char key2[] = "a.b.aak"; | 442 const char key2[] = "a.b.aak"; |
491 const char key3[] = "a.b.bbl"; | 443 const char key3[] = "a.b.bbl"; |
492 const char key4[] = "a.b.aaa"; | 444 const char key4[] = "a.b.aaa"; |
493 const char key5[] = "a.b.bbb"; | 445 const char key5[] = "a.b.bbb"; |
494 const char key6[] = "a.b.aaaam"; | 446 const char key6[] = "a.b.aaaam"; |
495 const char key7[] = "a.b.bbbbn"; | 447 const char key7[] = "a.b.bbbbn"; |
496 | 448 |
| 449 EXPECT_EQ(2U, GetRegistryLengthFromHost(key0, EXCLUDE_UNKNOWN_REGISTRIES)); |
| 450 EXPECT_EQ(0U, GetRegistryLengthFromHost(key1, EXCLUDE_UNKNOWN_REGISTRIES)); |
497 EXPECT_EQ(2U, | 451 EXPECT_EQ(2U, |
498 GetCanonicalHostRegistryLength(key0, EXCLUDE_UNKNOWN_REGISTRIES)); | 452 GetRegistryLengthFromHostIncludingPrivate( |
| 453 key1, EXCLUDE_UNKNOWN_REGISTRIES)); |
| 454 EXPECT_EQ(3U, GetRegistryLengthFromHost(key2, EXCLUDE_UNKNOWN_REGISTRIES)); |
| 455 EXPECT_EQ(0U, GetRegistryLengthFromHost(key3, EXCLUDE_UNKNOWN_REGISTRIES)); |
| 456 EXPECT_EQ(3U, |
| 457 GetRegistryLengthFromHostIncludingPrivate( |
| 458 key3, EXCLUDE_UNKNOWN_REGISTRIES)); |
499 EXPECT_EQ(0U, | 459 EXPECT_EQ(0U, |
500 GetCanonicalHostRegistryLength(key1, EXCLUDE_UNKNOWN_REGISTRIES)); | 460 GetRegistryLengthFromHostIncludingPrivate( |
501 EXPECT_EQ(2U, GetCanonicalHostRegistryLengthIncludingPrivate(key1)); | 461 key4, EXCLUDE_UNKNOWN_REGISTRIES)); |
502 EXPECT_EQ(3U, | |
503 GetCanonicalHostRegistryLength(key2, EXCLUDE_UNKNOWN_REGISTRIES)); | |
504 EXPECT_EQ(0U, | 462 EXPECT_EQ(0U, |
505 GetCanonicalHostRegistryLength(key3, EXCLUDE_UNKNOWN_REGISTRIES)); | 463 GetRegistryLengthFromHostIncludingPrivate( |
506 EXPECT_EQ(3U, GetCanonicalHostRegistryLengthIncludingPrivate(key3)); | 464 key5, EXCLUDE_UNKNOWN_REGISTRIES)); |
507 EXPECT_EQ(0U, GetCanonicalHostRegistryLengthIncludingPrivate(key4)); | 465 EXPECT_EQ(5U, GetRegistryLengthFromHost(key6, EXCLUDE_UNKNOWN_REGISTRIES)); |
508 EXPECT_EQ(0U, GetCanonicalHostRegistryLengthIncludingPrivate(key5)); | 466 EXPECT_EQ(5U, GetRegistryLengthFromHost(key7, EXCLUDE_UNKNOWN_REGISTRIES)); |
509 EXPECT_EQ(5U, | |
510 GetCanonicalHostRegistryLength(key6, EXCLUDE_UNKNOWN_REGISTRIES)); | |
511 EXPECT_EQ(5U, | |
512 GetCanonicalHostRegistryLength(key7, EXCLUDE_UNKNOWN_REGISTRIES)); | |
513 } | 467 } |
514 | 468 |
515 TEST_F(RegistryControlledDomainTest, TestDafsaJoinedSuffixes) { | 469 TEST_F(RegistryControlledDomainTest, TestDafsaJoinedSuffixes) { |
516 UseDomainData(test6::kDafsa); | 470 UseDomainData(test6::kDafsa); |
517 | 471 |
518 // Testing to lookup keys in a DAFSA with compressed suffixes. | 472 // Testing to lookup keys in a DAFSA with compressed suffixes. |
519 // This DAFSA is constructed from words with similar suffixes but distinct | 473 // This DAFSA is constructed from words with similar suffixes but distinct |
520 // prefixes. The DAFSA will then form a trie with the implicit sink node as | 474 // prefixes. The DAFSA will then form a trie with the implicit sink node as |
521 // root. | 475 // root. |
522 | 476 |
523 const char key0[] = "a.b.ia"; | 477 const char key0[] = "a.b.ia"; |
524 const char key1[] = "a.b.jb"; | 478 const char key1[] = "a.b.jb"; |
525 const char key2[] = "a.b.kaa"; | 479 const char key2[] = "a.b.kaa"; |
526 const char key3[] = "a.b.lbb"; | 480 const char key3[] = "a.b.lbb"; |
527 const char key4[] = "a.b.aaa"; | 481 const char key4[] = "a.b.aaa"; |
528 const char key5[] = "a.b.bbb"; | 482 const char key5[] = "a.b.bbb"; |
529 const char key6[] = "a.b.maaaa"; | 483 const char key6[] = "a.b.maaaa"; |
530 const char key7[] = "a.b.nbbbb"; | 484 const char key7[] = "a.b.nbbbb"; |
531 | 485 |
| 486 EXPECT_EQ(2U, GetRegistryLengthFromHost(key0, EXCLUDE_UNKNOWN_REGISTRIES)); |
| 487 EXPECT_EQ(0U, GetRegistryLengthFromHost(key1, EXCLUDE_UNKNOWN_REGISTRIES)); |
532 EXPECT_EQ(2U, | 488 EXPECT_EQ(2U, |
533 GetCanonicalHostRegistryLength(key0, EXCLUDE_UNKNOWN_REGISTRIES)); | 489 GetRegistryLengthFromHostIncludingPrivate( |
| 490 key1, EXCLUDE_UNKNOWN_REGISTRIES)); |
| 491 EXPECT_EQ(3U, GetRegistryLengthFromHost(key2, EXCLUDE_UNKNOWN_REGISTRIES)); |
| 492 EXPECT_EQ(0U, GetRegistryLengthFromHost(key3, EXCLUDE_UNKNOWN_REGISTRIES)); |
| 493 EXPECT_EQ(3U, |
| 494 GetRegistryLengthFromHostIncludingPrivate( |
| 495 key3, EXCLUDE_UNKNOWN_REGISTRIES)); |
534 EXPECT_EQ(0U, | 496 EXPECT_EQ(0U, |
535 GetCanonicalHostRegistryLength(key1, EXCLUDE_UNKNOWN_REGISTRIES)); | 497 GetRegistryLengthFromHostIncludingPrivate( |
536 EXPECT_EQ(2U, GetCanonicalHostRegistryLengthIncludingPrivate(key1)); | 498 key4, EXCLUDE_UNKNOWN_REGISTRIES)); |
537 EXPECT_EQ(3U, | |
538 GetCanonicalHostRegistryLength(key2, EXCLUDE_UNKNOWN_REGISTRIES)); | |
539 EXPECT_EQ(0U, | 499 EXPECT_EQ(0U, |
540 GetCanonicalHostRegistryLength(key3, EXCLUDE_UNKNOWN_REGISTRIES)); | 500 GetRegistryLengthFromHostIncludingPrivate( |
541 EXPECT_EQ(3U, GetCanonicalHostRegistryLengthIncludingPrivate(key3)); | 501 key5, EXCLUDE_UNKNOWN_REGISTRIES)); |
542 EXPECT_EQ(0U, GetCanonicalHostRegistryLengthIncludingPrivate(key4)); | 502 EXPECT_EQ(5U, GetRegistryLengthFromHost(key6, EXCLUDE_UNKNOWN_REGISTRIES)); |
543 EXPECT_EQ(0U, GetCanonicalHostRegistryLengthIncludingPrivate(key5)); | 503 EXPECT_EQ(5U, GetRegistryLengthFromHost(key7, EXCLUDE_UNKNOWN_REGISTRIES)); |
544 EXPECT_EQ(5U, | |
545 GetCanonicalHostRegistryLength(key6, EXCLUDE_UNKNOWN_REGISTRIES)); | |
546 EXPECT_EQ(5U, | |
547 GetCanonicalHostRegistryLength(key7, EXCLUDE_UNKNOWN_REGISTRIES)); | |
548 } | 504 } |
549 | |
550 TEST_F(RegistryControlledDomainTest, Permissive) { | |
551 UseDomainData(test1::kDafsa); | |
552 | |
553 EXPECT_EQ(std::string::npos, PermissiveGetHostRegistryLength("")); | |
554 | |
555 // Regular non-canonical host name. | |
556 EXPECT_EQ(2U, PermissiveGetHostRegistryLength("Www.Google.Jp")); | |
557 EXPECT_EQ(3U, PermissiveGetHostRegistryLength("Www.Google.Jp.")); | |
558 | |
559 // Empty returns npos. | |
560 EXPECT_EQ(std::string::npos, PermissiveGetHostRegistryLength("")); | |
561 | |
562 // Trailing spaces are counted as part of the hostname, meaning this will | |
563 // not match a known registry. | |
564 EXPECT_EQ(0U, PermissiveGetHostRegistryLength("Www.Google.Jp ")); | |
565 | |
566 // Invalid characters at the beginning are OK if the suffix still matches. | |
567 EXPECT_EQ(2U, PermissiveGetHostRegistryLength("*%00#?.Jp")); | |
568 | |
569 // Escaped period, this will add new components. | |
570 EXPECT_EQ(4U, PermissiveGetHostRegistryLength("Www.Googl%45%2e%4Ap")); | |
571 | |
572 // IDN cases (not supported when not linking ICU). | |
573 #if !BUILDFLAG(USE_PLATFORM_ICU_ALTERNATIVES) | |
574 EXPECT_EQ(10U, PermissiveGetHostRegistryLength("foo.xn--fiqs8s")); | |
575 EXPECT_EQ(11U, PermissiveGetHostRegistryLength("foo.xn--fiqs8s.")); | |
576 EXPECT_EQ(18U, PermissiveGetHostRegistryLength("foo.%E4%B8%AD%E5%9B%BD")); | |
577 EXPECT_EQ(19U, PermissiveGetHostRegistryLength("foo.%E4%B8%AD%E5%9B%BD.")); | |
578 EXPECT_EQ(6U, | |
579 PermissiveGetHostRegistryLength("foo.\xE4\xB8\xAD\xE5\x9B\xBD")); | |
580 EXPECT_EQ(7U, | |
581 PermissiveGetHostRegistryLength("foo.\xE4\xB8\xAD\xE5\x9B\xBD.")); | |
582 // UTF-16 IDN. | |
583 EXPECT_EQ(2U, PermissiveGetHostRegistryLength( | |
584 base::WideToUTF16(L"foo.\x4e2d\x56fd"))); | |
585 | |
586 // Fullwidth dot (u+FF0E) that will get canonicalized to a dot. | |
587 EXPECT_EQ(2U, PermissiveGetHostRegistryLength("Www.Google\xEF\xBC\x8Ejp")); | |
588 // Same but also ending in a fullwidth dot. | |
589 EXPECT_EQ(5U, PermissiveGetHostRegistryLength( | |
590 "Www.Google\xEF\xBC\x8Ejp\xEF\xBC\x8E")); | |
591 // Escaped UTF-8, also with an escaped fullwidth "Jp". | |
592 // "Jp" = U+FF2A, U+FF50, UTF-8 = EF BC AA EF BD 90 | |
593 EXPECT_EQ(27U, PermissiveGetHostRegistryLength( | |
594 "Www.Google%EF%BC%8E%EF%BC%AA%EF%BD%90%EF%BC%8E")); | |
595 // UTF-16 (ending in a dot). | |
596 EXPECT_EQ(3U, PermissiveGetHostRegistryLength( | |
597 base::WideToUTF16(L"Www.Google\xFF0E\xFF2A\xFF50\xFF0E"))); | |
598 #endif | |
599 } | |
600 | |
601 } // namespace registry_controlled_domains | 505 } // namespace registry_controlled_domains |
602 } // namespace net | 506 } // namespace net |
OLD | NEW |