| Index: chrome/browser/autocomplete/scored_history_match_unittest.cc
|
| diff --git a/chrome/browser/autocomplete/scored_history_match_unittest.cc b/chrome/browser/autocomplete/scored_history_match_unittest.cc
|
| new file mode 100644
|
| index 0000000000000000000000000000000000000000..cb1e57811073edef56364eb59aec06b82c2db1fa
|
| --- /dev/null
|
| +++ b/chrome/browser/autocomplete/scored_history_match_unittest.cc
|
| @@ -0,0 +1,492 @@
|
| +// Copyright (c) 2012 The Chromium Authors. All rights reserved.
|
| +// Use of this source code is governed by a BSD-style license that can be
|
| +// found in the LICENSE file.
|
| +
|
| +#include "chrome/browser/autocomplete/scored_history_match.h"
|
| +
|
| +#include <algorithm>
|
| +
|
| +#include "base/auto_reset.h"
|
| +#include "base/bind.h"
|
| +#include "base/memory/scoped_ptr.h"
|
| +#include "base/strings/string16.h"
|
| +#include "base/strings/utf_string_conversions.h"
|
| +#include "testing/gmock/include/gmock/gmock.h"
|
| +#include "testing/gtest/include/gtest/gtest.h"
|
| +
|
| +using base::ASCIIToUTF16;
|
| +using testing::ElementsAre;
|
| +using testing::Pair;
|
| +
|
| +namespace {
|
| +
|
| +// Returns a VisitInfoVector of |num_visits| link-transition visits, the
|
| +// first at |now| and each later entry |frequency| days earlier. A frequency of
|
| +// one means one visit each day, two means every other day, etc.
|
| +VisitInfoVector CreateVisitInfoVector(int num_visits,
|
| + int frequency,
|
| + base::Time now) {
|
| + VisitInfoVector visits;
|
| + for (int i = 0; i < num_visits; ++i) {
|
| + visits.push_back(
|
| + std::make_pair(now - base::TimeDelta::FromDays(i * frequency),
|
| + ui::PAGE_TRANSITION_LINK));
|
| + }
|
| + return visits;
|
| +}
|
| +
|
| +} // namespace
|
| +
|
| +class ScoredHistoryMatchTest : public testing::Test {
|
| + protected:
|
| + // Builds a history::URLRow for |url| carrying |title|, |visit_count|, and
|
| + // |typed_count|. The row's last_visit is set |days_since_last_visit| days
|
| + // before the current system time.
|
| + history::URLRow MakeURLRow(const char* url,
|
| + const char* title,
|
| + int visit_count,
|
| + int days_since_last_visit,
|
| + int typed_count);
|
| +
|
| + // Populates |word_starts| with the word starts information derived from
|
| + // |url_row|'s URL and title.
|
| + void PopulateWordStarts(const history::URLRow& url_row,
|
| + RowWordStarts* word_starts);
|
| +
|
| + // Build one- and two-element vectors of UTF-16 search terms from ASCII.
|
| + String16Vector Make1Term(const char* term) const;
|
| + String16Vector Make2Terms(const char* term_1, const char* term_2) const;
|
| +
|
| + // Convenience wrapper around GetTopicalityScore() that automatically builds
|
| + // the term match and word break information that call requires from |term|,
|
| + // |url|, and |title|. It only works for scoring a single term, not
|
| + // multiple terms.
|
| + float GetTopicalityScoreOfTermAgainstURLAndTitle(const base::string16& term,
|
| + const base::string16& url,
|
| + const base::string16& title);
|
| +};
|
| +
|
| +history::URLRow ScoredHistoryMatchTest::MakeURLRow(const char* url,
|
| + const char* title,
|
| + int visit_count,
|
| + int days_since_last_visit,
|
| + int typed_count) {
|
| + history::URLRow row(GURL(url), 0);
|
| + row.set_title(ASCIIToUTF16(title));
|
| + row.set_visit_count(visit_count);
|
| + row.set_typed_count(typed_count);
|
| + row.set_last_visit(base::Time::NowFromSystemTime() -
|
| + base::TimeDelta::FromDays(days_since_last_visit));  // Days before now.
|
| + return row;
|
| +}
|
| +
|
| +void ScoredHistoryMatchTest::PopulateWordStarts(const history::URLRow& url_row,
|
| + RowWordStarts* word_starts) {
|
| + String16SetFromString16(ASCIIToUTF16(url_row.url().spec()),
|
| + &word_starts->url_word_starts_);  // From the URL spec.
|
| + String16SetFromString16(url_row.title(), &word_starts->title_word_starts_);
|
| +}
|
| +
|
| +String16Vector ScoredHistoryMatchTest::Make1Term(const char* term) const {
|
| + String16Vector original_terms;
|
| + original_terms.push_back(ASCIIToUTF16(term));  // The only element.
|
| + return original_terms;
|
| +}
|
| +
|
| +String16Vector ScoredHistoryMatchTest::Make2Terms(const char* term_1,
|
| + const char* term_2) const {
|
| + String16Vector original_terms;
|
| + original_terms.push_back(ASCIIToUTF16(term_1));
|
| + original_terms.push_back(ASCIIToUTF16(term_2));  // Argument order is kept.
|
| + return original_terms;
|
| +}
|
| +
|
| +float ScoredHistoryMatchTest::GetTopicalityScoreOfTermAgainstURLAndTitle(
|
| + const base::string16& term,
|
| + const base::string16& url,
|
| + const base::string16& title) {
|
| + // Start from a default-constructed match and fill in only the term matches
|
| + // and word starts that are passed along to GetTopicalityScore().
|
| + ScoredHistoryMatch scored_match;
|
| + scored_match.url_matches = MatchTermInString(term, url, 0);
|
| + scored_match.title_matches = MatchTermInString(term, title, 0);
|
| + RowWordStarts word_starts;
|
| + String16SetFromString16(url, &word_starts.url_word_starts_);
|
| + String16SetFromString16(title, &word_starts.title_word_starts_);
|
| + WordStarts one_word_no_offset(1, 0u);
|
| + return scored_match.GetTopicalityScore(1, url, one_word_no_offset,
|
| + word_starts);
|
| +}
|
| +
|
| +TEST_F(ScoredHistoryMatchTest, Scoring) {
|
| + // We use NowFromSystemTime() because MakeURLRow uses the same function
|
| + // to calculate last visit time when building a row.
|
| + base::Time now = base::Time::NowFromSystemTime();
|
| +
|
| + history::URLRow row_a(MakeURLRow("http://fedcba", "abcd bcd", 3, 30, 1));
|
| + RowWordStarts word_starts_a;
|
| + PopulateWordStarts(row_a, &word_starts_a);
|
| + WordStarts one_word_no_offset(1, 0u);
|
| + VisitInfoVector visits_a = CreateVisitInfoVector(3, 30, now);
|
| + // Mark the most recent visit as typed.
|
| + visits_a[0].second = ui::PAGE_TRANSITION_TYPED;
|
| + ScoredHistoryMatch scored_a(row_a, visits_a, std::string(),
|
| + ASCIIToUTF16("abc"), Make1Term("abc"),
|
| + one_word_no_offset, word_starts_a, false, now);
|
| +
|
| + // Test scores based on visit_count.
|
| + history::URLRow row_b(MakeURLRow("http://abcdef", "abcd bcd", 10, 30, 1));
|
| + RowWordStarts word_starts_b;
|
| + PopulateWordStarts(row_b, &word_starts_b);
|
| + VisitInfoVector visits_b = CreateVisitInfoVector(10, 30, now);
|
| + visits_b[0].second = ui::PAGE_TRANSITION_TYPED;
|
| + ScoredHistoryMatch scored_b(row_b, visits_b, std::string(),
|
| + ASCIIToUTF16("abc"), Make1Term("abc"),
|
| + one_word_no_offset, word_starts_b, false, now);
|
| + EXPECT_GT(scored_b.raw_score, scored_a.raw_score);
|
| +
|
| + // Test scores based on last_visit.
|
| + history::URLRow row_c(MakeURLRow("http://abcdef", "abcd bcd", 3, 10, 1));
|
| + RowWordStarts word_starts_c;
|
| + PopulateWordStarts(row_c, &word_starts_c);
|
| + VisitInfoVector visits_c = CreateVisitInfoVector(3, 10, now);
|
| + visits_c[0].second = ui::PAGE_TRANSITION_TYPED;
|
| + ScoredHistoryMatch scored_c(row_c, visits_c, std::string(),
|
| + ASCIIToUTF16("abc"), Make1Term("abc"),
|
| + one_word_no_offset, word_starts_c, false, now);
|
| + EXPECT_GT(scored_c.raw_score, scored_a.raw_score);
|
| +
|
| + // Test scores based on typed_count.
|
| + history::URLRow row_d(MakeURLRow("http://abcdef", "abcd bcd", 3, 30, 3));
|
| + RowWordStarts word_starts_d;
|
| + PopulateWordStarts(row_d, &word_starts_d);
|
| + VisitInfoVector visits_d = CreateVisitInfoVector(3, 30, now);
|
| + visits_d[0].second = ui::PAGE_TRANSITION_TYPED;
|
| + visits_d[1].second = ui::PAGE_TRANSITION_TYPED;
|
| + visits_d[2].second = ui::PAGE_TRANSITION_TYPED;
|
| + ScoredHistoryMatch scored_d(row_d, visits_d, std::string(),
|
| + ASCIIToUTF16("abc"), Make1Term("abc"),
|
| + one_word_no_offset, word_starts_d, false, now);
|
| + EXPECT_GT(scored_d.raw_score, scored_a.raw_score);
|
| +
|
| + // Test scores based on a term appearing multiple times.
|
| + history::URLRow row_e(MakeURLRow(
|
| + "http://csi.csi.csi/csi_csi",
|
| + "CSI Guide to CSI Las Vegas, CSI New York, CSI Provo", 3, 30, 3));
|
| + RowWordStarts word_starts_e;
|
| + PopulateWordStarts(row_e, &word_starts_e);
|
| + const VisitInfoVector visits_e = visits_d;
|
| + ScoredHistoryMatch scored_e(row_e, visits_e, std::string(),
|
| + ASCIIToUTF16("csi"), Make1Term("csi"),
|
| + one_word_no_offset, word_starts_e, false, now);
|
| + EXPECT_LT(scored_e.raw_score, 1400);
|
| +
|
| + // Test that a result with only a mid-term match (i.e., not at a word
|
| + // boundary) scores 0.
|
| + ScoredHistoryMatch scored_f(row_a, visits_a, std::string(),
|
| + ASCIIToUTF16("cd"), Make1Term("cd"),
|
| + one_word_no_offset, word_starts_a, false, now);
|
| + EXPECT_EQ(0, scored_f.raw_score);
|
| +}
|
| +
|
| +TEST_F(ScoredHistoryMatchTest, ScoringBookmarks) {
|
| + // We use NowFromSystemTime() because MakeURLRow uses the same function
|
| + // to calculate last visit time when building a row.
|
| + base::Time now = base::Time::NowFromSystemTime();
|
| +
|
| + std::string url_string("http://fedcba");
|
| + const GURL url(url_string);  // NOTE(review): appears unused below.
|
| + history::URLRow row(MakeURLRow(url_string.c_str(), "abcd bcd", 8, 3, 1));
|
| + RowWordStarts word_starts;
|
| + PopulateWordStarts(row, &word_starts);
|
| + WordStarts one_word_no_offset(1, 0u);
|
| + VisitInfoVector visits = CreateVisitInfoVector(8, 3, now);
|
| + ScoredHistoryMatch scored(row, visits, std::string(), ASCIIToUTF16("abc"),
|
| + Make1Term("abc"), one_word_no_offset, word_starts,
|
| + false, now);
|
| + // Now check that the score increases when the URL is bookmarked.
|
| + base::AutoReset<int> reset(&ScoredHistoryMatch::bookmark_value_, 5);
|
| + ScoredHistoryMatch scored_with_bookmark(
|
| + row, visits, std::string(), ASCIIToUTF16("abc"), Make1Term("abc"),
|
| + one_word_no_offset, word_starts, true, now);
|
| + EXPECT_GT(scored_with_bookmark.raw_score, scored.raw_score);
|
| +}
|
| +
|
| +TEST_F(ScoredHistoryMatchTest, ScoringTLD) {
|
| + // We use NowFromSystemTime() because MakeURLRow uses the same function
|
| + // to calculate last visit time when building a row.
|
| + base::Time now = base::Time::NowFromSystemTime();
|
| +
|
| + // By default a query that includes "com" should score 0 against this URL.
|
| + std::string url_string("http://fedcba.com/");
|
| + const GURL url(url_string);  // NOTE(review): appears unused below.
|
| + history::URLRow row(MakeURLRow(url_string.c_str(), "", 8, 3, 1));
|
| + RowWordStarts word_starts;
|
| + PopulateWordStarts(row, &word_starts);
|
| + WordStarts two_words_no_offsets(2, 0u);
|
| + VisitInfoVector visits = CreateVisitInfoVector(8, 3, now);
|
| + ScoredHistoryMatch scored(row, visits, std::string(), ASCIIToUTF16("fed com"),
|
| + Make2Terms("fed", "com"), two_words_no_offsets,
|
| + word_starts, false, now);
|
| + EXPECT_EQ(0, scored.raw_score);
|
| +
|
| + // Now allow credit for the match in the TLD.
|
| + base::AutoReset<bool> reset(&ScoredHistoryMatch::allow_tld_matches_, true);
|
| + ScoredHistoryMatch scored_with_tld(
|
| + row, visits, std::string(), ASCIIToUTF16("fed com"),
|
| + Make2Terms("fed", "com"), two_words_no_offsets, word_starts, false, now);
|
| + EXPECT_GT(scored_with_tld.raw_score, 0);
|
| +}
|
| +
|
| +TEST_F(ScoredHistoryMatchTest, ScoringScheme) {
|
| + // We use NowFromSystemTime() because MakeURLRow uses the same function
|
| + // to calculate last visit time when building a row.
|
| + base::Time now = base::Time::NowFromSystemTime();
|
| +
|
| + // By default a query that includes "http" should score 0 against this URL.
|
| + std::string url_string("http://fedcba/");
|
| + const GURL url(url_string);  // NOTE(review): appears unused below.
|
| + history::URLRow row(MakeURLRow(url_string.c_str(), "", 8, 3, 1));
|
| + RowWordStarts word_starts;
|
| + PopulateWordStarts(row, &word_starts);
|
| + WordStarts two_words_no_offsets(2, 0u);
|
| + VisitInfoVector visits = CreateVisitInfoVector(8, 3, now);
|
| + ScoredHistoryMatch scored(row, visits, std::string(),
|
| + ASCIIToUTF16("fed http"), Make2Terms("fed", "http"),
|
| + two_words_no_offsets, word_starts, false, now);
|
| + EXPECT_EQ(0, scored.raw_score);
|
| +
|
| + // Now allow credit for the match in the scheme.
|
| + base::AutoReset<bool> reset(&ScoredHistoryMatch::allow_scheme_matches_, true);
|
| + ScoredHistoryMatch scored_with_scheme(
|
| + row, visits, std::string(), ASCIIToUTF16("fed http"),
|
| + Make2Terms("fed", "http"), two_words_no_offsets, word_starts, false, now);
|
| + EXPECT_GT(scored_with_scheme.raw_score, 0);
|
| +}
|
| +
|
| +TEST_F(ScoredHistoryMatchTest, Inlining) {
|
| + // We use NowFromSystemTime() because MakeURLRow uses the same function
|
| + // to calculate last visit time when building a row.
|
| + base::Time now = base::Time::NowFromSystemTime();
|
| + RowWordStarts word_starts;
|
| + WordStarts one_word_no_offset(1, 0u);
|
| + VisitInfoVector visits;  // No visits are supplied in this test.
|
| +
|
| + {  // http URL whose host starts with www.
|
| + history::URLRow row(
|
| + MakeURLRow("http://www.google.com", "abcdef", 3, 30, 1));
|
| + PopulateWordStarts(row, &word_starts);
|
| + ScoredHistoryMatch scored_a(row, visits, std::string(), ASCIIToUTF16("g"),
|
| + Make1Term("g"), one_word_no_offset, word_starts,
|
| + false, now);
|
| + EXPECT_TRUE(scored_a.can_inline);
|
| + EXPECT_FALSE(scored_a.match_in_scheme);
|
| + ScoredHistoryMatch scored_b(row, visits, std::string(), ASCIIToUTF16("w"),
|
| + Make1Term("w"), one_word_no_offset, word_starts,
|
| + false, now);
|
| + EXPECT_TRUE(scored_b.can_inline);
|
| + EXPECT_FALSE(scored_b.match_in_scheme);
|
| + ScoredHistoryMatch scored_c(row, visits, std::string(), ASCIIToUTF16("h"),
|
| + Make1Term("h"), one_word_no_offset, word_starts,
|
| + false, now);
|
| + EXPECT_TRUE(scored_c.can_inline);
|
| + EXPECT_TRUE(scored_c.match_in_scheme);
|
| + ScoredHistoryMatch scored_d(row, visits, std::string(), ASCIIToUTF16("o"),
|
| + Make1Term("o"), one_word_no_offset, word_starts,
|
| + false, now);
|
| + EXPECT_FALSE(scored_d.can_inline);
|
| + EXPECT_FALSE(scored_d.match_in_scheme);
|
| + }
|
| +
|
| + {  // http URL whose host does not start with www.
|
| + history::URLRow row(MakeURLRow("http://teams.foo.com", "abcdef", 3, 30, 1));
|
| + PopulateWordStarts(row, &word_starts);
|
| + ScoredHistoryMatch scored_a(row, visits, std::string(), ASCIIToUTF16("t"),
|
| + Make1Term("t"), one_word_no_offset, word_starts,
|
| + false, now);
|
| + EXPECT_TRUE(scored_a.can_inline);
|
| + EXPECT_FALSE(scored_a.match_in_scheme);
|
| + ScoredHistoryMatch scored_b(row, visits, std::string(), ASCIIToUTF16("f"),
|
| + Make1Term("f"), one_word_no_offset, word_starts,
|
| + false, now);
|
| + EXPECT_FALSE(scored_b.can_inline);
|
| + EXPECT_FALSE(scored_b.match_in_scheme);
|
| + ScoredHistoryMatch scored_c(row, visits, std::string(), ASCIIToUTF16("o"),
|
| + Make1Term("o"), one_word_no_offset, word_starts,
|
| + false, now);
|
| + EXPECT_FALSE(scored_c.can_inline);
|
| + EXPECT_FALSE(scored_c.match_in_scheme);
|
| + }
|
| +
|
| + {  // https URL whose host starts with www.
|
| + history::URLRow row(
|
| + MakeURLRow("https://www.testing.com", "abcdef", 3, 30, 1));
|
| + PopulateWordStarts(row, &word_starts);
|
| + ScoredHistoryMatch scored_a(row, visits, std::string(), ASCIIToUTF16("t"),
|
| + Make1Term("t"), one_word_no_offset, word_starts,
|
| + false, now);
|
| + EXPECT_TRUE(scored_a.can_inline);
|
| + EXPECT_FALSE(scored_a.match_in_scheme);
|
| + ScoredHistoryMatch scored_b(row, visits, std::string(), ASCIIToUTF16("h"),
|
| + Make1Term("h"), one_word_no_offset, word_starts,
|
| + false, now);
|
| + EXPECT_TRUE(scored_b.can_inline);
|
| + EXPECT_TRUE(scored_b.match_in_scheme);
|
| + ScoredHistoryMatch scored_c(row, visits, std::string(), ASCIIToUTF16("w"),
|
| + Make1Term("w"), one_word_no_offset, word_starts,
|
| + false, now);
|
| + EXPECT_TRUE(scored_c.can_inline);
|
| + EXPECT_FALSE(scored_c.match_in_scheme);
|
| + }
|
| +
|
| + {  // Host with an xn-- label; "zh-CN" replaces the empty string argument.
|
| + history::URLRow row(
|
| + MakeURLRow("http://www.xn--1lq90ic7f1rc.cn/xnblah", "abcd", 3, 30, 1));
|
| + PopulateWordStarts(row, &word_starts);
|
| + ScoredHistoryMatch scored_a(row, visits, "zh-CN", ASCIIToUTF16("x"),
|
| + Make1Term("x"), one_word_no_offset, word_starts,
|
| + false, now);
|
| + EXPECT_FALSE(scored_a.can_inline);
|
| + EXPECT_FALSE(scored_a.match_in_scheme);
|
| + ScoredHistoryMatch scored_b(row, visits, "zh-CN", ASCIIToUTF16("xn"),
|
| + Make1Term("xn"), one_word_no_offset,
|
| + word_starts, false, now);
|
| + EXPECT_FALSE(scored_b.can_inline);
|
| + EXPECT_FALSE(scored_b.match_in_scheme);
|
| + ScoredHistoryMatch scored_c(row, visits, "zh-CN", ASCIIToUTF16("w"),
|
| + Make1Term("w"), one_word_no_offset,
|
| + word_starts, false, now);
|
| + EXPECT_TRUE(scored_c.can_inline);
|
| + EXPECT_FALSE(scored_c.match_in_scheme);
|
| + }
|
| +}
|
| +
|
| +TEST_F(ScoredHistoryMatchTest, GetTopicalityScoreTrailingSlash) {
|
| + const float hostname = GetTopicalityScoreOfTermAgainstURLAndTitle(
|
| + ASCIIToUTF16("def"), ASCIIToUTF16("http://abc.def.com/"),
|
| + ASCIIToUTF16("Non-Matching Title"));
|
| + const float hostname_no_slash = GetTopicalityScoreOfTermAgainstURLAndTitle(
|
| + ASCIIToUTF16("def"), ASCIIToUTF16("http://abc.def.com"),
|
| + ASCIIToUTF16("Non-Matching Title"));
|
| + EXPECT_EQ(hostname_no_slash, hostname);  // Trailing slash must not matter.
|
| +}
|
| +
|
| +// This test only scores single terms; most match exactly once in the URL or
|
| +// title (NOTE(review): "com"/"om" also occur in "hash_component" -- confirm).
|
| +TEST_F(ScoredHistoryMatchTest, GetTopicalityScore) {
|
| + base::string16 url = ASCIIToUTF16(
|
| + "http://abc.def.com/path1/path2?"
|
| + "arg1=val1&arg2=val2#hash_component");
|
| + base::string16 title = ASCIIToUTF16("here is a title");
|
| + const float hostname_score = GetTopicalityScoreOfTermAgainstURLAndTitle(
|
| + ASCIIToUTF16("abc"), url, title);
|
| + const float hostname_mid_word_score =
|
| + GetTopicalityScoreOfTermAgainstURLAndTitle(ASCIIToUTF16("bc"), url,
|
| + title);
|
| + const float domain_name_score = GetTopicalityScoreOfTermAgainstURLAndTitle(
|
| + ASCIIToUTF16("def"), url, title);
|
| + const float domain_name_mid_word_score =
|
| + GetTopicalityScoreOfTermAgainstURLAndTitle(ASCIIToUTF16("ef"), url,
|
| + title);
|
| + const float tld_score = GetTopicalityScoreOfTermAgainstURLAndTitle(
|
| + ASCIIToUTF16("com"), url, title);
|
| + const float tld_mid_word_score = GetTopicalityScoreOfTermAgainstURLAndTitle(
|
| + ASCIIToUTF16("om"), url, title);
|
| + const float path_score = GetTopicalityScoreOfTermAgainstURLAndTitle(
|
| + ASCIIToUTF16("path1"), url, title);
|
| + const float path_mid_word_score = GetTopicalityScoreOfTermAgainstURLAndTitle(
|
| + ASCIIToUTF16("ath1"), url, title);
|
| + const float arg_score = GetTopicalityScoreOfTermAgainstURLAndTitle(
|
| + ASCIIToUTF16("arg2"), url, title);
|
| + const float arg_mid_word_score = GetTopicalityScoreOfTermAgainstURLAndTitle(
|
| + ASCIIToUTF16("rg2"), url, title);
|
| + const float protocol_score = GetTopicalityScoreOfTermAgainstURLAndTitle(
|
| + ASCIIToUTF16("htt"), url, title);
|
| + const float protocol_mid_word_score =
|
| + GetTopicalityScoreOfTermAgainstURLAndTitle(ASCIIToUTF16("tt"), url,
|
| + title);
|
| + const float title_score = GetTopicalityScoreOfTermAgainstURLAndTitle(
|
| + ASCIIToUTF16("her"), url, title);
|
| + const float title_mid_word_score = GetTopicalityScoreOfTermAgainstURLAndTitle(
|
| + ASCIIToUTF16("er"), url, title);
|
| + // Verify hostname and domain name > path > arg.
|
| + EXPECT_GT(hostname_score, path_score);
|
| + EXPECT_GT(domain_name_score, path_score);
|
| + EXPECT_GT(path_score, arg_score);
|
| + // Verify that hostname and domain name > path and > arg at non-word
|
| + // boundaries.
|
| + EXPECT_GT(hostname_mid_word_score, path_mid_word_score);
|
| + EXPECT_GT(domain_name_mid_word_score, path_mid_word_score);
|
| + EXPECT_GT(domain_name_mid_word_score, arg_mid_word_score);
|
| + EXPECT_GT(hostname_mid_word_score, arg_mid_word_score);
|
| + // Also verify that the matches at non-word-boundaries all score
|
| + // worse than the matches at word boundaries. These three sets suffice.
|
| + EXPECT_GT(arg_score, hostname_mid_word_score);
|
| + EXPECT_GT(arg_score, domain_name_mid_word_score);
|
| + EXPECT_GT(title_score, title_mid_word_score);
|
| + // Check that title matches fit somewhere reasonable compared to the
|
| + // various types of URL matches.
|
| + EXPECT_GT(title_score, arg_score);
|
| + EXPECT_GT(arg_score, title_mid_word_score);
|
| + // Finally, verify that protocol matches and top level domain name
|
| + // matches (.com, .net, etc.) score worse than some of the mid-word
|
| + // matches that actually count.
|
| + EXPECT_GT(hostname_mid_word_score, protocol_score);
|
| + EXPECT_GT(hostname_mid_word_score, protocol_mid_word_score);
|
| + EXPECT_GT(hostname_mid_word_score, tld_score);
|
| + EXPECT_GT(hostname_mid_word_score, tld_mid_word_score);
|
| +}
|
| +
|
| +// Test the function GetFinalRelevancyScore().
|
| +TEST_F(ScoredHistoryMatchTest, GetFinalRelevancyScore) {
|
| + // hqp_relevance_buckets = "0.0:100,1.0:200,4.0:500,8.0:900,10.0:1000";
|
| + std::vector<ScoredHistoryMatch::ScoreMaxRelevance> hqp_buckets;
|
| + hqp_buckets.push_back(std::make_pair(0.0, 100));
|
| + hqp_buckets.push_back(std::make_pair(1.0, 200));
|
| + hqp_buckets.push_back(std::make_pair(4.0, 500));
|
| + hqp_buckets.push_back(std::make_pair(8.0, 900));
|
| + hqp_buckets.push_back(std::make_pair(10.0, 1000));
|
| + // Check when topicality score is zero.
|
| + float topicality_score = 0.0;
|
| + float frequency_score = 10.0;
|
| + // intermediate_score = 0.0 * 10.0 = 0.0.
|
| + EXPECT_EQ(0, ScoredHistoryMatch::GetFinalRelevancyScore(
|
| + topicality_score, frequency_score, hqp_buckets));
|
| +
|
| + // Check when the intermediate score falls exactly on a bucket boundary.
|
| + topicality_score = 0.4f;
|
| + frequency_score = 10.0f;
|
| + // intermediate_score = 0.4 * 10.0 = 4.0.
|
| + EXPECT_EQ(500, ScoredHistoryMatch::GetFinalRelevancyScore(
|
| + topicality_score, frequency_score, hqp_buckets));
|
| +
|
| + // Check a score that falls between two bucket boundaries.
|
| + topicality_score = 0.5f;
|
| + frequency_score = 10.0f;
|
| + // intermediate_score = 0.5 * 10.0 = 5.0.
|
| + EXPECT_EQ(600, // 500 + (((900 - 500)/(8 - 4)) * 1) = 600.
|
| + ScoredHistoryMatch::GetFinalRelevancyScore(
|
| + topicality_score, frequency_score, hqp_buckets));
|
| +
|
| + // Never give a score greater than the maximum specified.
|
| + topicality_score = 0.5f;
|
| + frequency_score = 22.0f;
|
| + // intermediate_score = 0.5 * 22.0 = 11.0.
|
| + EXPECT_EQ(1000, ScoredHistoryMatch::GetFinalRelevancyScore(
|
| + topicality_score, frequency_score, hqp_buckets));
|
| +}
|
| +
|
| +// Test the function GetHQPBucketsFromString().
|
| +TEST_F(ScoredHistoryMatchTest, GetHQPBucketsFromString) {
|
| + std::string buckets_str = "0.0:400,1.5:600,12.0:1300,20.0:1399";
|
| + std::vector<ScoredHistoryMatch::ScoreMaxRelevance> hqp_buckets;
|
| +
|
| + EXPECT_TRUE(
|
| + ScoredHistoryMatch::GetHQPBucketsFromString(buckets_str, &hqp_buckets));
|
| + EXPECT_THAT(hqp_buckets, ElementsAre(Pair(0.0, 400), Pair(1.5, 600),
|
| + Pair(12.0, 1300), Pair(20.0, 1399)));
|
| + // Invalid string (uses ',' where the valid form above uses ':').
|
| + buckets_str = "0.0,400,1.5,600";
|
| + EXPECT_FALSE(
|
| + ScoredHistoryMatch::GetHQPBucketsFromString(buckets_str, &hqp_buckets));
|
| +}
|
|
|