| OLD | NEW |
| 1 // Copyright (c) 2012 The Chromium Authors. All rights reserved. | 1 // Copyright (c) 2012 The Chromium Authors. All rights reserved. |
| 2 // Use of this source code is governed by a BSD-style license that can be | 2 // Use of this source code is governed by a BSD-style license that can be |
| 3 // found in the LICENSE file. | 3 // found in the LICENSE file. |
| 4 | 4 |
| 5 #include "chrome/browser/autocomplete/history_url_provider.h" | 5 #include "chrome/browser/autocomplete/history_url_provider.h" |
| 6 | 6 |
| 7 #include <algorithm> | 7 #include <algorithm> |
| 8 | 8 |
| 9 #include "base/basictypes.h" | 9 #include "base/basictypes.h" |
| 10 #include "base/bind.h" | 10 #include "base/bind.h" |
| (...skipping 16 matching lines...) Expand all Loading... |
| 27 #include "chrome/browser/history/scored_history_match.h" | 27 #include "chrome/browser/history/scored_history_match.h" |
| 28 #include "chrome/browser/omnibox/omnibox_field_trial.h" | 28 #include "chrome/browser/omnibox/omnibox_field_trial.h" |
| 29 #include "chrome/browser/profiles/profile.h" | 29 #include "chrome/browser/profiles/profile.h" |
| 30 #include "chrome/browser/search_engines/template_url_service.h" | 30 #include "chrome/browser/search_engines/template_url_service.h" |
| 31 #include "chrome/browser/search_engines/template_url_service_factory.h" | 31 #include "chrome/browser/search_engines/template_url_service_factory.h" |
| 32 #include "chrome/common/chrome_switches.h" | 32 #include "chrome/common/chrome_switches.h" |
| 33 #include "chrome/common/net/url_fixer_upper.h" | 33 #include "chrome/common/net/url_fixer_upper.h" |
| 34 #include "chrome/common/pref_names.h" | 34 #include "chrome/common/pref_names.h" |
| 35 #include "chrome/common/url_constants.h" | 35 #include "chrome/common/url_constants.h" |
| 36 #include "components/bookmarks/browser/bookmark_utils.h" | 36 #include "components/bookmarks/browser/bookmark_utils.h" |
| 37 #include "components/metrics/proto/omnibox_input_type.pb.h" |
| 37 #include "net/base/net_util.h" | 38 #include "net/base/net_util.h" |
| 38 #include "net/base/registry_controlled_domains/registry_controlled_domain.h" | 39 #include "net/base/registry_controlled_domains/registry_controlled_domain.h" |
| 39 #include "url/gurl.h" | 40 #include "url/gurl.h" |
| 40 #include "url/url_parse.h" | 41 #include "url/url_parse.h" |
| 41 #include "url/url_util.h" | 42 #include "url/url_util.h" |
| 42 | 43 |
| 43 namespace { | 44 namespace { |
| 44 | 45 |
| 45 // If |create_if_necessary| is true, ensures that |matches| contains an | 46 // If |create_if_necessary| is true, ensures that |matches| contains an |
| 46 // entry for |info|, creating a new such entry if necessary (using | 47 // entry for |info|, creating a new such entry if necessary (using |
| (...skipping 282 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 329 const AutocompleteInput& input, | 330 const AutocompleteInput& input, |
| 330 history::URLDatabase* db) | 331 history::URLDatabase* db) |
| 331 : provider_(provider), | 332 : provider_(provider), |
| 332 db_(db), | 333 db_(db), |
| 333 type_(INVALID) { | 334 type_(INVALID) { |
| 334 const GURL& url = input.canonicalized_url(); | 335 const GURL& url = input.canonicalized_url(); |
| 335 // Detect email addresses. These cases will look like "http://user@site/", | 336 // Detect email addresses. These cases will look like "http://user@site/", |
| 336 // and because the history backend strips auth creds, we'll get a bogus exact | 337 // and because the history backend strips auth creds, we'll get a bogus exact |
| 337 // match below if the user has visited "site". | 338 // match below if the user has visited "site". |
| 338 if (!url.is_valid() || | 339 if (!url.is_valid() || |
| 339 ((input.type() == AutocompleteInput::UNKNOWN) && | 340 ((input.type() == metrics::OmniboxInputType::UNKNOWN) && |
| 340 input.parts().username.is_nonempty() && | 341 input.parts().username.is_nonempty() && |
| 341 !input.parts().password.is_nonempty() && | 342 !input.parts().password.is_nonempty() && |
| 342 !input.parts().path.is_nonempty())) | 343 !input.parts().path.is_nonempty())) |
| 343 return; | 344 return; |
| 344 | 345 |
| 345 if (db_->GetRowForURL(url, &url_row_)) { | 346 if (db_->GetRowForURL(url, &url_row_)) { |
| 346 type_ = VISITED; | 347 type_ = VISITED; |
| 347 return; | 348 return; |
| 348 } | 349 } |
| 349 | 350 |
| (...skipping 53 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 403 // running, we'd need to wait for it to return to the main thread before | 404 // running, we'd need to wait for it to return to the main thread before |
| 404 // doing this (we can't just write new data for it to read due to thread | 405 // doing this (we can't just write new data for it to read due to thread |
| 405 // safety issues). At that point it's just as fast, and easier, to simply | 406 // safety issues). At that point it's just as fast, and easier, to simply |
| 406 // re-run the query from scratch and ignore |minimal_changes|. | 407 // re-run the query from scratch and ignore |minimal_changes|. |
| 407 | 408 |
| 408 // Cancel any in-progress query. | 409 // Cancel any in-progress query. |
| 409 Stop(false); | 410 Stop(false); |
| 410 | 411 |
| 411 matches_.clear(); | 412 matches_.clear(); |
| 412 | 413 |
| 413 if ((input.type() == AutocompleteInput::INVALID) || | 414 if ((input.type() == metrics::OmniboxInputType::INVALID) || |
| 414 (input.type() == AutocompleteInput::FORCED_QUERY)) | 415 (input.type() == metrics::OmniboxInputType::FORCED_QUERY)) |
| 415 return; | 416 return; |
| 416 | 417 |
| 417 // Create a match for exactly what the user typed. This will only be used as | 418 // Create a match for exactly what the user typed. This will only be used as |
| 418 // a fallback in case we can't get the history service or URL DB; otherwise, | 419 // a fallback in case we can't get the history service or URL DB; otherwise, |
| 419 // we'll run this again in DoAutocomplete() and use that result instead. | 420 // we'll run this again in DoAutocomplete() and use that result instead. |
| 420 const bool trim_http = !AutocompleteInput::HasHTTPScheme(input.text()); | 421 const bool trim_http = !AutocompleteInput::HasHTTPScheme(input.text()); |
| 421 // Don't do this for queries -- while we can sometimes mark up a match for | 422 // Don't do this for queries -- while we can sometimes mark up a match for |
| 422 // this, it's not what the user wants, and just adds noise. | 423 // this, it's not what the user wants, and just adds noise. |
| 423 if (input.type() != AutocompleteInput::QUERY) { | 424 if (input.type() != metrics::OmniboxInputType::QUERY) { |
| 424 AutocompleteMatch what_you_typed(SuggestExactInput( | 425 AutocompleteMatch what_you_typed(SuggestExactInput( |
| 425 input.text(), input.canonicalized_url(), trim_http)); | 426 input.text(), input.canonicalized_url(), trim_http)); |
| 426 what_you_typed.relevance = CalculateRelevance(WHAT_YOU_TYPED, 0); | 427 what_you_typed.relevance = CalculateRelevance(WHAT_YOU_TYPED, 0); |
| 427 matches_.push_back(what_you_typed); | 428 matches_.push_back(what_you_typed); |
| 428 } | 429 } |
| 429 | 430 |
| 430 // We'll need the history service to run both passes, so try to obtain it. | 431 // We'll need the history service to run both passes, so try to obtain it. |
| 431 if (!profile_) | 432 if (!profile_) |
| 432 return; | 433 return; |
| 433 HistoryService* const history_service = | 434 HistoryService* const history_service = |
| (...skipping 155 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 589 // | 590 // |
| 590 // We display this to the user when there's a reasonable chance they actually | 591 // We display this to the user when there's a reasonable chance they actually |
| 591 // care: | 592 // care: |
| 592 // * Their input can be opened as a URL, and | 593 // * Their input can be opened as a URL, and |
| 593 // * We parsed the input as a URL, or it starts with an explicit "http:" or | 594 // * We parsed the input as a URL, or it starts with an explicit "http:" or |
| 594 // "https:". | 595 // "https:". |
| 595 // | 596 // |
| 596 // Otherwise, this is just low-quality noise. In the cases where we've parsed | 597 // Otherwise, this is just low-quality noise. In the cases where we've parsed |
| 597 // as UNKNOWN, we'll still show an accidental search infobar if need be. | 598 // as UNKNOWN, we'll still show an accidental search infobar if need be. |
| 598 bool have_what_you_typed_match = | 599 bool have_what_you_typed_match = |
| 599 (params->input.type() != AutocompleteInput::QUERY) && | 600 (params->input.type() != metrics::OmniboxInputType::QUERY) && |
| 600 ((params->input.type() != AutocompleteInput::UNKNOWN) || | 601 ((params->input.type() != metrics::OmniboxInputType::UNKNOWN) || |
| 601 (classifier.type() == VisitClassifier::UNVISITED_INTRANET) || | 602 (classifier.type() == VisitClassifier::UNVISITED_INTRANET) || |
| 602 !params->trim_http || | 603 !params->trim_http || |
| 603 (AutocompleteInput::NumNonHostComponents(params->input.parts()) > 0)); | 604 (AutocompleteInput::NumNonHostComponents(params->input.parts()) > 0)); |
| 604 AutocompleteMatch what_you_typed_match(SuggestExactInput( | 605 AutocompleteMatch what_you_typed_match(SuggestExactInput( |
| 605 params->input.text(), params->input.canonicalized_url(), | 606 params->input.text(), params->input.canonicalized_url(), |
| 606 params->trim_http)); | 607 params->trim_http)); |
| 607 what_you_typed_match.relevance = CalculateRelevance(WHAT_YOU_TYPED, 0); | 608 what_you_typed_match.relevance = CalculateRelevance(WHAT_YOU_TYPED, 0); |
| 608 | 609 |
| 609 // Get the matching URLs from the DB | 610 // Get the matching URLs from the DB |
| 610 history::URLRows url_matches; | 611 history::URLRows url_matches; |
| (...skipping 209 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 820 // make sure that this code does not trigger if the user did anything to | 821 // make sure that this code does not trigger if the user did anything to |
| 821 // indicate the desired match is a URL. For instance, "c/# foo" will not | 822 // indicate the desired match is a URL. For instance, "c/# foo" will not |
| 822 // pass the test because that will be classified as input type URL. The | 823 // pass the test because that will be classified as input type URL. The |
| 823 // parsed.CountCharactersBefore() in the test looks for the presence of a | 824 // parsed.CountCharactersBefore() in the test looks for the presence of a |
| 824 // reference fragment in the URL by checking whether the position differs | 825 // reference fragment in the URL by checking whether the position differs |
| 825 // when the delimiter (pound sign) is included versus when it is excluded. | 826 // when the delimiter (pound sign) is included versus when it is excluded. |
| 826 // (One cannot simply check url.ref() because it will not distinguish | 827 // (One cannot simply check url.ref() because it will not distinguish |
| 827 // between the input "c" and the input "c#", both of which will have empty | 828 // between the input "c" and the input "c#", both of which will have empty |
| 828 // reference fragments.) | 829 // reference fragments.) |
| 829 if ((type == UNVISITED_INTRANET) && | 830 if ((type == UNVISITED_INTRANET) && |
| 830 (input.type() != AutocompleteInput::URL) && url.username().empty() && | 831 (input.type() != metrics::OmniboxInputType::URL) && |
| 831 url.password().empty() && url.port().empty() && (url.path() == "/") && | 832 url.username().empty() && url.password().empty() && url.port().empty() && |
| 832 url.query().empty() && | 833 (url.path() == "/") && url.query().empty() && |
| 833 (parsed.CountCharactersBefore(url::Parsed::REF, true) != | 834 (parsed.CountCharactersBefore(url::Parsed::REF, true) != |
| 834 parsed.CountCharactersBefore(url::Parsed::REF, false))) { | 835 parsed.CountCharactersBefore(url::Parsed::REF, false))) { |
| 835 return false; | 836 return false; |
| 836 } | 837 } |
| 837 | 838 |
| 838 match->relevance = CalculateRelevance(type, 0); | 839 match->relevance = CalculateRelevance(type, 0); |
| 839 | 840 |
| 840 // If there are any other matches, then don't promote this match here, in | 841 // If there are any other matches, then don't promote this match here, in |
| 841 // hopes the caller will be able to inline autocomplete a better suggestion. | 842 // hopes the caller will be able to inline autocomplete a better suggestion. |
| 842 // DoAutocomplete() will fall back on this match if inline autocompletion | 843 // DoAutocomplete() will fall back on this match if inline autocompletion |
| 843 // fails. This matches how we react to never-visited URL inputs in the non- | 844 // fails. This matches how we react to never-visited URL inputs in the non- |
| 844 // intranet case. | 845 // intranet case. |
| 845 if (type == UNVISITED_INTRANET && !matches->empty()) | 846 if (type == UNVISITED_INTRANET && !matches->empty()) |
| 846 return false; | 847 return false; |
| 847 | 848 |
| 848 // Put it on the front of the HistoryMatches for redirect culling. | 849 // Put it on the front of the HistoryMatches for redirect culling. |
| 849 CreateOrPromoteMatch(classifier.url_row(), base::string16::npos, false, | 850 CreateOrPromoteMatch(classifier.url_row(), base::string16::npos, false, |
| 850 matches, true, true); | 851 matches, true, true); |
| 851 return true; | 852 return true; |
| 852 } | 853 } |
| 853 | 854 |
| 854 bool HistoryURLProvider::CanFindIntranetURL( | 855 bool HistoryURLProvider::CanFindIntranetURL( |
| 855 history::URLDatabase* db, | 856 history::URLDatabase* db, |
| 856 const AutocompleteInput& input) const { | 857 const AutocompleteInput& input) const { |
| 857 // Normally passing the first two conditions below ought to guarantee the | 858 // Normally passing the first two conditions below ought to guarantee the |
| 858 // third condition, but because FixupUserInput() can run and modify the | 859 // third condition, but because FixupUserInput() can run and modify the |
| 859 // input's text and parts between Parse() and here, it seems better to be | 860 // input's text and parts between Parse() and here, it seems better to be |
| 860 // paranoid and check. | 861 // paranoid and check. |
| 861 if ((input.type() != AutocompleteInput::UNKNOWN) || | 862 if ((input.type() != metrics::OmniboxInputType::UNKNOWN) || |
| 862 !LowerCaseEqualsASCII(input.scheme(), url::kHttpScheme) || | 863 !LowerCaseEqualsASCII(input.scheme(), url::kHttpScheme) || |
| 863 !input.parts().host.is_nonempty()) | 864 !input.parts().host.is_nonempty()) |
| 864 return false; | 865 return false; |
| 865 const std::string host(base::UTF16ToUTF8( | 866 const std::string host(base::UTF16ToUTF8( |
| 866 input.text().substr(input.parts().host.begin, input.parts().host.len))); | 867 input.text().substr(input.parts().host.begin, input.parts().host.len))); |
| 867 const size_t registry_length = | 868 const size_t registry_length = |
| 868 net::registry_controlled_domains::GetRegistryLength( | 869 net::registry_controlled_domains::GetRegistryLength( |
| 869 host, | 870 host, |
| 870 net::registry_controlled_domains::EXCLUDE_UNKNOWN_REGISTRIES, | 871 net::registry_controlled_domains::EXCLUDE_UNKNOWN_REGISTRIES, |
| 871 net::registry_controlled_domains::EXCLUDE_PRIVATE_REGISTRIES); | 872 net::registry_controlled_domains::EXCLUDE_PRIVATE_REGISTRIES); |
| (...skipping 283 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 1155 // If HistoryURL retrieves any matches (and hence we reach this code), we | 1156 // If HistoryURL retrieves any matches (and hence we reach this code), we |
| 1156 // are guaranteed that the beginning of input_text must be a word break. | 1157 // are guaranteed that the beginning of input_text must be a word break. |
| 1157 history::WordStarts offsets(1, 0u); | 1158 history::WordStarts offsets(1, 0u); |
| 1158 description_matches = | 1159 description_matches = |
| 1159 history::ScoredHistoryMatch::FilterTermMatchesByWordStarts( | 1160 history::ScoredHistoryMatch::FilterTermMatchesByWordStarts( |
| 1160 description_matches, offsets, description_word_starts, 0, | 1161 description_matches, offsets, description_word_starts, 0, |
| 1161 std::string::npos); | 1162 std::string::npos); |
| 1162 return SpansFromTermMatch( | 1163 return SpansFromTermMatch( |
| 1163 description_matches, clean_description.length(), false); | 1164 description_matches, clean_description.length(), false); |
| 1164 } | 1165 } |
| OLD | NEW |