| OLD | NEW |
| 1 // Copyright (c) 2012 The Chromium Authors. All rights reserved. | 1 // Copyright (c) 2012 The Chromium Authors. All rights reserved. |
| 2 // Use of this source code is governed by a BSD-style license that can be | 2 // Use of this source code is governed by a BSD-style license that can be |
| 3 // found in the LICENSE file. | 3 // found in the LICENSE file. |
| 4 | 4 |
| 5 #include "extensions/common/url_pattern.h" | 5 #include "extensions/common/url_pattern.h" |
| 6 | 6 |
| 7 #include <stddef.h> | 7 #include <stddef.h> |
| 8 | 8 |
| 9 #include <ostream> | 9 #include <ostream> |
| 10 | 10 |
| (...skipping 123 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 134 int result = 0; | 134 int result = 0; |
| 135 for (size_t i = 0; i < arraysize(kValidSchemeMasks); ++i) | 135 for (size_t i = 0; i < arraysize(kValidSchemeMasks); ++i) |
| 136 result |= kValidSchemeMasks[i]; | 136 result |= kValidSchemeMasks[i]; |
| 137 return result; | 137 return result; |
| 138 } | 138 } |
| 139 | 139 |
| 140 URLPattern::URLPattern() | 140 URLPattern::URLPattern() |
| 141 : valid_schemes_(SCHEME_NONE), | 141 : valid_schemes_(SCHEME_NONE), |
| 142 match_all_urls_(false), | 142 match_all_urls_(false), |
| 143 match_subdomains_(false), | 143 match_subdomains_(false), |
| 144 match_effective_tld_(true), |
| 144 port_("*") {} | 145 port_("*") {} |
| 145 | 146 |
| 146 URLPattern::URLPattern(int valid_schemes) | 147 URLPattern::URLPattern(int valid_schemes) |
| 147 : valid_schemes_(valid_schemes), | 148 : valid_schemes_(valid_schemes), |
| 148 match_all_urls_(false), | 149 match_all_urls_(false), |
| 149 match_subdomains_(false), | 150 match_subdomains_(false), |
| 151 match_effective_tld_(true), |
| 150 port_("*") {} | 152 port_("*") {} |
| 151 | 153 |
| 152 URLPattern::URLPattern(int valid_schemes, base::StringPiece pattern) | 154 URLPattern::URLPattern(int valid_schemes, base::StringPiece pattern) |
| 153 // Strict error checking is used, because this constructor is only | 155 // Strict error checking is used, because this constructor is only |
| 154 // appropriate when we know |pattern| is valid. | 156 // appropriate when we know |pattern| is valid. |
| 155 : valid_schemes_(valid_schemes), | 157 : valid_schemes_(valid_schemes), |
| 156 match_all_urls_(false), | 158 match_all_urls_(false), |
| 157 match_subdomains_(false), | 159 match_subdomains_(false), |
| 160 match_effective_tld_(true), |
| 158 port_("*") { | 161 port_("*") { |
| 159 ParseResult result = Parse(pattern); | 162 ParseResult result = Parse(pattern); |
| 160 if (PARSE_SUCCESS != result) | 163 if (PARSE_SUCCESS != result) |
| 161 NOTREACHED() << "URLPattern invalid: " << pattern << " result " << result; | 164 NOTREACHED() << "URLPattern invalid: " << pattern << " result " << result; |
| 162 } | 165 } |
| 163 | 166 |
| 164 URLPattern::URLPattern(const URLPattern& other) = default; | 167 URLPattern::URLPattern(const URLPattern& other) = default; |
| 165 | 168 |
| 166 URLPattern::~URLPattern() { | 169 URLPattern::~URLPattern() { |
| 167 } | 170 } |
| 168 | 171 |
| 169 bool URLPattern::operator<(const URLPattern& other) const { | 172 bool URLPattern::operator<(const URLPattern& other) const { |
| 170 return GetAsString() < other.GetAsString(); | 173 return GetAsString() < other.GetAsString(); |
| 171 } | 174 } |
| 172 | 175 |
| 173 bool URLPattern::operator>(const URLPattern& other) const { | 176 bool URLPattern::operator>(const URLPattern& other) const { |
| 174 return GetAsString() > other.GetAsString(); | 177 return GetAsString() > other.GetAsString(); |
| 175 } | 178 } |
| 176 | 179 |
| 177 bool URLPattern::operator==(const URLPattern& other) const { | 180 bool URLPattern::operator==(const URLPattern& other) const { |
| 178 return GetAsString() == other.GetAsString(); | 181 return GetAsString() == other.GetAsString(); |
| 179 } | 182 } |
| 180 | 183 |
| 181 std::ostream& operator<<(std::ostream& out, const URLPattern& url_pattern) { | 184 std::ostream& operator<<(std::ostream& out, const URLPattern& url_pattern) { |
| 182 return out << '"' << url_pattern.GetAsString() << '"'; | 185 return out << '"' << url_pattern.GetAsString() << '"'; |
| 183 } | 186 } |
| 184 | 187 |
| 185 URLPattern::ParseResult URLPattern::Parse(base::StringPiece pattern) { | 188 URLPattern::ParseResult URLPattern::Parse(base::StringPiece pattern) { |
| 189 return Parse(pattern, DENY_WILDCARD_FOR_EFFECTIVE_TLD); |
| 190 } |
| 191 |
| 192 URLPattern::ParseResult URLPattern::Parse(base::StringPiece pattern, |
| 193 ParseOptions parse_options) { |
| 186 spec_.clear(); | 194 spec_.clear(); |
| 187 SetMatchAllURLs(false); | 195 SetMatchAllURLs(false); |
| 188 SetMatchSubdomains(false); | 196 SetMatchSubdomains(false); |
| 197 SetMatchEffectiveTld(true); |
| 189 SetPort("*"); | 198 SetPort("*"); |
| 190 | 199 |
| 191 // Special case pattern to match every valid URL. | 200 // Special case pattern to match every valid URL. |
| 192 if (pattern == kAllUrlsPattern) { | 201 if (pattern == kAllUrlsPattern) { |
| 193 SetMatchAllURLs(true); | 202 SetMatchAllURLs(true); |
| 194 return PARSE_SUCCESS; | 203 return PARSE_SUCCESS; |
| 195 } | 204 } |
| 196 | 205 |
| 197 // Parse out the scheme. | 206 // Parse out the scheme. |
| 198 size_t scheme_end_pos = pattern.find(url::kStandardSchemeSeparator); | 207 size_t scheme_end_pos = pattern.find(url::kStandardSchemeSeparator); |
| (...skipping 61 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 260 // Could be empty if the host only consists of whitespace characters. | 269 // Could be empty if the host only consists of whitespace characters. |
| 261 if (host_components.empty() || | 270 if (host_components.empty() || |
| 262 (host_components.size() == 1 && host_components[0].empty())) | 271 (host_components.size() == 1 && host_components[0].empty())) |
| 263 return PARSE_ERROR_EMPTY_HOST; | 272 return PARSE_ERROR_EMPTY_HOST; |
| 264 | 273 |
| 265 if (host_components[0] == "*") { | 274 if (host_components[0] == "*") { |
| 266 match_subdomains_ = true; | 275 match_subdomains_ = true; |
| 267 host_components.erase(host_components.begin(), | 276 host_components.erase(host_components.begin(), |
| 268 host_components.begin() + 1); | 277 host_components.begin() + 1); |
| 269 } | 278 } |
| 279 |
| 280 // If explicitly allowed, the last component can optionally be '*' to |
| 281 // match all effective TLDs. |
| 282 if (parse_options == ALLOW_WILDCARD_FOR_EFFECTIVE_TLD && |
| 283 host_components.size() > 1 && host_components.back() == "*") { |
| 284 match_effective_tld_ = false; |
| 285 host_components.pop_back(); |
| 286 } |
| 270 host_ = base::JoinString(host_components, "."); | 287 host_ = base::JoinString(host_components, "."); |
| 271 | 288 |
| 272 path_start_pos = host_end_pos; | 289 path_start_pos = host_end_pos; |
| 273 } | 290 } |
| 274 | 291 |
| 275 SetPath(pattern.substr(path_start_pos)); | 292 SetPath(pattern.substr(path_start_pos)); |
| 276 | 293 |
| 277 size_t port_pos = host_.find(':'); | 294 size_t port_pos = host_.find(':'); |
| 278 if (port_pos != std::string::npos) { | 295 if (port_pos != std::string::npos) { |
| 279 if (!SetPort(host_.substr(port_pos + 1))) | 296 if (!SetPort(host_.substr(port_pos + 1))) |
| (...skipping 34 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 314 host_.clear(); | 331 host_.clear(); |
| 315 SetPath("/*"); | 332 SetPath("/*"); |
| 316 } | 333 } |
| 317 } | 334 } |
| 318 | 335 |
| 319 void URLPattern::SetMatchSubdomains(bool val) { | 336 void URLPattern::SetMatchSubdomains(bool val) { |
| 320 spec_.clear(); | 337 spec_.clear(); |
| 321 match_subdomains_ = val; | 338 match_subdomains_ = val; |
| 322 } | 339 } |
| 323 | 340 |
| 341 void URLPattern::SetMatchEffectiveTld(bool val) { |
| 342 spec_.clear(); |
| 343 match_effective_tld_ = val; |
| 344 } |
| 345 |
| 324 bool URLPattern::SetScheme(base::StringPiece scheme) { | 346 bool URLPattern::SetScheme(base::StringPiece scheme) { |
| 325 spec_.clear(); | 347 spec_.clear(); |
| 326 scheme.CopyToString(&scheme_); | 348 scheme.CopyToString(&scheme_); |
| 327 if (scheme_ == "*") { | 349 if (scheme_ == "*") { |
| 328 valid_schemes_ &= (SCHEME_HTTP | SCHEME_HTTPS); | 350 valid_schemes_ &= (SCHEME_HTTP | SCHEME_HTTPS); |
| 329 } else if (!IsValidScheme(scheme_)) { | 351 } else if (!IsValidScheme(scheme_)) { |
| 330 return false; | 352 return false; |
| 331 } | 353 } |
| 332 return true; | 354 return true; |
| 333 } | 355 } |
| (...skipping 80 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 414 } | 436 } |
| 415 | 437 |
| 416 bool URLPattern::MatchesHost(base::StringPiece host) const { | 438 bool URLPattern::MatchesHost(base::StringPiece host) const { |
| 417 // TODO(devlin): This is a bit sad. Parsing urls is expensive. | 439 // TODO(devlin): This is a bit sad. Parsing urls is expensive. |
| 418 return MatchesHost( | 440 return MatchesHost( |
| 419 GURL(base::StringPrintf("%s%s%s/", url::kHttpScheme, | 441 GURL(base::StringPrintf("%s%s%s/", url::kHttpScheme, |
| 420 url::kStandardSchemeSeparator, host.data()))); | 442 url::kStandardSchemeSeparator, host.data()))); |
| 421 } | 443 } |
| 422 | 444 |
| 423 bool URLPattern::MatchesHost(const GURL& test) const { | 445 bool URLPattern::MatchesHost(const GURL& test) const { |
| 424 const base::StringPiece test_host( | 446 base::StringPiece test_host(CanonicalizeHostForMatching(test.host_piece())); |
| 425 CanonicalizeHostForMatching(test.host_piece())); | |
| 426 const base::StringPiece pattern_host(CanonicalizeHostForMatching(host_)); | 447 const base::StringPiece pattern_host(CanonicalizeHostForMatching(host_)); |
| 427 | 448 |
| 449 // If we don't care about matching the effective TLD, remove it. |
| 450 if (!match_effective_tld_) { |
| 451 int reg_length = net::registry_controlled_domains::GetRegistryLength( |
| 452 test, net::registry_controlled_domains::EXCLUDE_UNKNOWN_REGISTRIES, |
| 453 net::registry_controlled_domains::EXCLUDE_PRIVATE_REGISTRIES); |
| 454 if (reg_length > 0) { |
| 455 test_host = test_host.substr(0, test_host.size() - reg_length - 1); |
| 456 } |
| 457 } |
| 458 |
| 428 // If the hosts are exactly equal, we have a match. | 459 // If the hosts are exactly equal, we have a match. |
| 429 if (test_host == pattern_host) | 460 if (test_host == pattern_host) |
| 430 return true; | 461 return true; |
| 431 | 462 |
| 432 // If we're matching subdomains, and we have no host in the match pattern, | 463 // If we're matching subdomains, and we have no host in the match pattern, |
| 433 // that means that we're matching all hosts, which means we have a match no | 464 // that means that we're matching all hosts, which means we have a match no |
| 434 // matter what the test host is. | 465 // matter what the test host is. |
| 435 if (match_subdomains_ && pattern_host.empty()) | 466 if (match_subdomains_ && pattern_host.empty()) |
| 436 return true; | 467 return true; |
| 437 | 468 |
| (...skipping 84 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 522 if (scheme_ != url::kFileScheme && standard_scheme) { | 553 if (scheme_ != url::kFileScheme && standard_scheme) { |
| 523 if (match_subdomains_) { | 554 if (match_subdomains_) { |
| 524 spec += "*"; | 555 spec += "*"; |
| 525 if (!host_.empty()) | 556 if (!host_.empty()) |
| 526 spec += "."; | 557 spec += "."; |
| 527 } | 558 } |
| 528 | 559 |
| 529 if (!host_.empty()) | 560 if (!host_.empty()) |
| 530 spec += host_; | 561 spec += host_; |
| 531 | 562 |
| 563 if (!match_effective_tld_) { |
| 564 if (!host_.empty()) |
| 565 spec += "."; |
| 566 spec += "*"; |
| 567 } |
| 568 |
| 532 if (port_ != "*") { | 569 if (port_ != "*") { |
| 533 spec += ":"; | 570 spec += ":"; |
| 534 spec += port_; | 571 spec += port_; |
| 535 } | 572 } |
| 536 } | 573 } |
| 537 | 574 |
| 538 if (!path_.empty()) | 575 if (!path_.empty()) |
| 539 spec += path_; | 576 spec += path_; |
| 540 | 577 |
| 541 spec_ = std::move(spec); | 578 spec_ = std::move(spec); |
| (...skipping 88 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 630 } | 667 } |
| 631 | 668 |
| 632 return result; | 669 return result; |
| 633 } | 670 } |
| 634 | 671 |
| 635 // static | 672 // static |
| 636 const char* URLPattern::GetParseResultString( | 673 const char* URLPattern::GetParseResultString( |
| 637 URLPattern::ParseResult parse_result) { | 674 URLPattern::ParseResult parse_result) { |
| 638 return kParseResultMessages[parse_result]; | 675 return kParseResultMessages[parse_result]; |
| 639 } | 676 } |
| OLD | NEW |