Index: chrome/browser/predictors/resource_prefetch_predictor_tables.cc |
diff --git a/chrome/browser/predictors/resource_prefetch_predictor_tables.cc b/chrome/browser/predictors/resource_prefetch_predictor_tables.cc |
new file mode 100644 |
index 0000000000000000000000000000000000000000..f434b1af503a15a1a74fb2ae5ef4b3cf1b95075f |
--- /dev/null |
+++ b/chrome/browser/predictors/resource_prefetch_predictor_tables.cc |
@@ -0,0 +1,515 @@ |
+// Copyright (c) 2014 The Chromium Authors. All rights reserved. |
+// Use of this source code is governed by a BSD-style license that can be |
+// found in the LICENSE file. |
+ |
+#include "chrome/browser/predictors/resource_prefetch_predictor_tables.h" |
+ |
+#include <algorithm> |
+#include <utility> |
Lei Zhang
2014/09/09 03:32:19
nit: blank line after
Zhen Wang
2014/09/13 00:36:32
Done.
|
+#include "base/logging.h" |
+#include "base/metrics/histogram.h" |
+#include "base/strings/stringprintf.h" |
+#include "content/public/browser/browser_thread.h" |
+#include "sql/statement.h" |
+ |
+using content::BrowserThread; |
+using sql::Statement; |
+ |
+namespace { |
+ |
+// Names of the four SQL tables used in this file: one resource table and one |
+// metadata table for URL-keyed data, and the same pair for host-keyed data. |
+const char kUrlResourceTableName[] = "resource_prefetch_predictor_url"; |
+const char kUrlMetadataTableName[] = "resource_prefetch_predictor_url_metadata"; |
+const char kHostResourceTableName[] = "resource_prefetch_predictor_host"; |
+const char kHostMetadataTableName[] = |
+ "resource_prefetch_predictor_host_metadata"; |
+ |
+// Binds primary_key and then the persisted fields of row to the positional |
+// parameters 0 through 6 of statement, in the column order used by the |
+// resource tables. The row's score is not bound. |
+void BindResourceRowToStatement( |
+    const predictors::ResourcePrefetchPredictorTables::ResourceRow& row, |
+    const std::string& primary_key, |
+    Statement* statement) { |
+  int column = 0; |
+  statement->BindString(column++, primary_key); |
+  statement->BindString(column++, row.resource_url.spec()); |
+  statement->BindInt(column++, static_cast<int>(row.resource_type)); |
+  statement->BindInt(column++, row.number_of_hits); |
+  statement->BindInt(column++, row.number_of_misses); |
+  statement->BindInt(column++, row.consecutive_misses); |
+  statement->BindDouble(column++, row.average_position); |
+} |
+ |
+// Advances statement by one step. When the step succeeds, copies columns 0 |
+// through 6 of the current result row into row and returns true; otherwise |
+// leaves row untouched and returns false. The row's score is not set here. |
+bool StepAndInitializeResourceRow( |
+    Statement* statement, |
+    predictors::ResourcePrefetchPredictorTables::ResourceRow* row) { |
+  const bool has_row = statement->Step(); |
+  if (has_row) { |
+    row->primary_key = statement->ColumnString(0); |
+    row->resource_url = GURL(statement->ColumnString(1)); |
+    const int raw_type = statement->ColumnInt(2); |
+    row->resource_type = static_cast<content::ResourceType>(raw_type); |
+    row->number_of_hits = statement->ColumnInt(3); |
+    row->number_of_misses = statement->ColumnInt(4); |
+    row->consecutive_misses = statement->ColumnInt(5); |
+    row->average_position = statement->ColumnDouble(6); |
+  } |
+  return has_row; |
+} |
+ |
+} // namespace |
+ |
+namespace predictors { |
+ |
+// static |
+// Upper bound on the length of a primary key or resource URL spec; |
+// StringsAreSmallerThanDBLimit() rejects data containing longer strings. |
+const size_t ResourcePrefetchPredictorTables::kMaxStringLength = 1024; |
+ |
+// Builds an empty row: the resource type is RESOURCE_TYPE_LAST_TYPE and every |
+// counter, the average position and the score are zero. |
+ResourcePrefetchPredictorTables::ResourceRow::ResourceRow() |
+    : resource_type(content::RESOURCE_TYPE_LAST_TYPE), |
+      number_of_hits(0), |
+      number_of_misses(0), |
+      consecutive_misses(0), |
+      average_position(0.0), |
+      score(0.0) {} |
+ |
+// Copy constructor: duplicates every field of other, including the score, |
+// which is copied as-is rather than recomputed. |
+ResourcePrefetchPredictorTables::ResourceRow::ResourceRow( |
+    const ResourceRow& other) |
+    : primary_key(other.primary_key), |
+      resource_url(other.resource_url), |
+      resource_type(other.resource_type), |
+      number_of_hits(other.number_of_hits), |
+      number_of_misses(other.number_of_misses), |
+      consecutive_misses(other.consecutive_misses), |
+      average_position(other.average_position), |
+      score(other.score) {} |
+ |
+// Builds a row from explicit field values. The score is not passed in; it is |
+// derived from the resource type and average position by UpdateScore(). |
+ResourcePrefetchPredictorTables::ResourceRow::ResourceRow( |
+    const std::string& i_primary_key, |
+    const std::string& i_resource_url, |
+    content::ResourceType i_resource_type, |
+    int i_number_of_hits, |
+    int i_number_of_misses, |
+    int i_consecutive_misses, |
+    double i_average_position) |
+    : primary_key(i_primary_key), |
+      resource_url(i_resource_url), |
+      resource_type(i_resource_type), |
+      number_of_hits(i_number_of_hits), |
+      number_of_misses(i_number_of_misses), |
+      consecutive_misses(i_consecutive_misses), |
+      average_position(i_average_position) { |
+  // Must run after the initializers above: it reads resource_type and |
+  // average_position and assigns score. |
+  UpdateScore(); |
+} |
+ |
+// Recomputes score from resource_type and average_position. Stylesheets and |
+// scripts are placed in a higher band than every other resource type, so that |
+// sorting by descending score lists them first; within a band, a smaller |
+// average position yields a larger score. |
+void ResourcePrefetchPredictorTables::ResourceRow::UpdateScore() { |
+  static const int kMaxResourcesPerType = 100; |
+  const bool is_stylesheet_or_script = |
+      resource_type == content::RESOURCE_TYPE_STYLESHEET || |
+      resource_type == content::RESOURCE_TYPE_SCRIPT; |
+  // Images and all remaining types share the lower band. |
+  const int band = is_stylesheet_or_script ? 2 : 1; |
+  score = (band * kMaxResourcesPerType) - average_position; |
Lei Zhang
2014/09/09 03:32:20
nit: combine with default? i.e.
case content::RES
Zhen Wang
2014/09/13 00:36:32
Done.
 |
+} |
+ |
+// Two rows are equal only when every field matches, including the derived |
+// score. The floating point fields are compared exactly. |
+bool ResourcePrefetchPredictorTables::ResourceRow::operator==( |
+    const ResourceRow& rhs) const { |
+  const bool same_identity = primary_key == rhs.primary_key && |
+                             resource_url == rhs.resource_url && |
+                             resource_type == rhs.resource_type; |
+  if (!same_identity) |
+    return false; |
+ |
+  const bool same_counters = number_of_hits == rhs.number_of_hits && |
+                             number_of_misses == rhs.number_of_misses && |
+                             consecutive_misses == rhs.consecutive_misses; |
+  if (!same_counters) |
+    return false; |
+ |
+  return average_position == rhs.average_position && score == rhs.score; |
+} |
+ |
+// Ordering predicate for sorting rows by descending score: x goes before y |
+// exactly when x has the strictly larger score. |
+bool ResourcePrefetchPredictorTables::ResourceRowSorter::operator()( |
+    const ResourceRow& x, const ResourceRow& y) const { |
+  return y.score < x.score; |
+} |
+ |
+// Builds an entry for the given key type and primary key. last_visit and |
+// resources are left default-constructed. |
+ResourcePrefetchPredictorTables::PrefetchData::PrefetchData( |
+    PrefetchKeyType i_key_type, |
+    const std::string& i_primary_key) |
+    : key_type(i_key_type), |
+      primary_key(i_primary_key) {} |
+ |
+// Copy constructor: duplicates the key type, primary key, last visit time and |
+// the resource rows of other. |
+ResourcePrefetchPredictorTables::PrefetchData::PrefetchData( |
+    const PrefetchData& other) |
+    : key_type(other.key_type), |
+      primary_key(other.primary_key), |
+      last_visit(other.last_visit), |
+      resources(other.resources) {} |
+ |
+// Nothing to release explicitly; the members clean up after themselves. |
+ResourcePrefetchPredictorTables::PrefetchData::~PrefetchData() {} |
+ |
+// Compares the key type, the primary key and the resource rows. Note that |
+// last_visit does not take part in the comparison. |
+bool ResourcePrefetchPredictorTables::PrefetchData::operator==( |
+    const PrefetchData& rhs) const { |
+  const bool same_key = |
+      key_type == rhs.key_type && primary_key == rhs.primary_key; |
+  if (!same_key) |
+    return false; |
+  return resources == rhs.resources; |
+} |
+ |
+// Clears both output maps and refills them from the URL and host tables. |
+// Metadata entries that have no matching resource rows are collected while |
+// reading and deleted from the database before returning. Must be called on |
+// the DB thread; does nothing when the database cannot be accessed. |
+void ResourcePrefetchPredictorTables::GetAllData( |
+    PrefetchDataMap* url_data_map, |
+    PrefetchDataMap* host_data_map) { |
+  CHECK(BrowserThread::CurrentlyOn(BrowserThread::DB)); |
Lei Zhang
2014/09/09 03:32:19
Generally we DCHECK we are on the correct thread,
Zhen Wang
2014/09/13 00:36:32
Done.
 |
+  if (CantAccessDatabase()) |
+    return; |
+ |
+  DCHECK(url_data_map); |
+  DCHECK(host_data_map); |
+  url_data_map->clear(); |
+  host_data_map->clear(); |
+ |
+  std::vector<std::string> stale_urls; |
+  std::vector<std::string> stale_hosts; |
+  GetAllDataHelper(PREFETCH_KEY_TYPE_URL, url_data_map, &stale_urls); |
+  GetAllDataHelper(PREFETCH_KEY_TYPE_HOST, host_data_map, &stale_hosts); |
+ |
+  // DeleteData() expects at least one non-empty list, so skip it when there |
+  // is nothing stale. |
+  if (stale_urls.empty() && stale_hosts.empty()) |
+    return; |
+  DeleteData(stale_urls, stale_hosts); |
+} |
+ |
+// Replaces the stored rows for url_data and/or host_data inside a single |
+// transaction. A data set whose primary key is empty is skipped; at least one |
+// of the two keys is expected to be non-empty. If any update fails, the whole |
+// transaction is rolled back so that no partial update is left behind. |
+// Must be called on the DB thread; does nothing when the database cannot be |
+// accessed. |
+void ResourcePrefetchPredictorTables::UpdateData( |
+    const PrefetchData& url_data, |
+    const PrefetchData& host_data) { |
+  CHECK(BrowserThread::CurrentlyOn(BrowserThread::DB)); |
+  if (CantAccessDatabase()) |
+    return; |
+ |
+  DCHECK(!url_data.is_host() && host_data.is_host()); |
+  DCHECK(!url_data.primary_key.empty() || !host_data.primary_key.empty()); |
+ |
+  // If the transaction could not be opened there is nothing to commit or roll |
+  // back later, and the writes below would no longer be atomic. |
+  if (!DB()->BeginTransaction()) |
+    return; |
+ |
+  const bool success = |
+      (url_data.primary_key.empty() || UpdateDataHelper(url_data)) && |
+      (host_data.primary_key.empty() || UpdateDataHelper(host_data)); |
+ |
+  // Exactly one of commit/rollback must end the transaction. Committing after |
+  // a rollback would act on a transaction that is already closed. |
+  if (success) |
+    DB()->CommitTransaction(); |
+  else |
+    DB()->RollbackTransaction(); |
+} |
+ |
+// Deletes the resource and metadata rows for every key in urls and hosts. |
+// At least one of the two lists is expected to be non-empty. Must be called |
+// on the DB thread; does nothing when the database cannot be accessed. |
+void ResourcePrefetchPredictorTables::DeleteData( |
+    const std::vector<std::string>& urls, |
+    const std::vector<std::string>& hosts) { |
+  CHECK(BrowserThread::CurrentlyOn(BrowserThread::DB)); |
+  if (CantAccessDatabase()) |
+    return; |
+ |
+  const bool has_urls = !urls.empty(); |
+  const bool has_hosts = !hosts.empty(); |
+  DCHECK(has_urls || has_hosts); |
+ |
+  if (has_urls) |
+    DeleteDataHelper(PREFETCH_KEY_TYPE_URL, urls); |
+  if (has_hosts) |
+    DeleteDataHelper(PREFETCH_KEY_TYPE_HOST, hosts); |
+} |
+ |
+// Deletes the resource and metadata rows stored under a single key of the |
+// given key type. Must be called on the DB thread; does nothing when the |
+// database cannot be accessed. |
+void ResourcePrefetchPredictorTables::DeleteSingleDataPoint( |
+    const std::string& key, |
+    PrefetchKeyType key_type) { |
+  CHECK(BrowserThread::CurrentlyOn(BrowserThread::DB)); |
+  if (CantAccessDatabase()) |
+    return; |
+ |
+  // DeleteDataHelper() works on a list of keys, so wrap the single key. |
+  std::vector<std::string> single_key; |
+  single_key.push_back(key); |
+  DeleteDataHelper(key_type, single_key); |
+} |
+ |
+// Removes every row from all four tables (URL/host resources and metadata). |
+// Each delete is best-effort: a failure on one table does not stop the |
+// remaining tables from being cleared. Does nothing when the database cannot |
+// be accessed. |
+void ResourcePrefetchPredictorTables::DeleteAllData() { |
+  // Every other public database entry point in this file asserts the DB |
+  // thread; this one was missing the assertion. A DCHECK keeps release |
+  // behavior exactly as before. |
+  DCHECK(BrowserThread::CurrentlyOn(BrowserThread::DB)); |
+  if (CantAccessDatabase()) |
+    return; |
+ |
+  // Same order as the original hand-written sequence of deletes. |
+  const char* const kTableNames[] = { |
+    kUrlResourceTableName, |
+    kUrlMetadataTableName, |
+    kHostResourceTableName, |
+    kHostMetadataTableName, |
+  }; |
+  const size_t kTableCount = sizeof(kTableNames) / sizeof(kTableNames[0]); |
+ |
+  for (size_t i = 0; i < kTableCount; ++i) { |
+    Statement deleter(DB()->GetUniqueStatement( |
+        base::StringPrintf("DELETE FROM %s", kTableNames[i]).c_str())); |
+    deleter.Run(); |
+  } |
+} |
+ |
+// Default-constructs the PredictorTableBase part; no other setup happens |
+// here. |
+ResourcePrefetchPredictorTables::ResourcePrefetchPredictorTables() |
+    : PredictorTableBase() {} |
+ |
+// No explicit cleanup is performed here. |
+ResourcePrefetchPredictorTables::~ResourcePrefetchPredictorTables() {} |
+ |
+// Loads one data set (URL-keyed or host-keyed, selected by key_type) into |
+// data_map: |
+//   1. Reads every resource row, recomputes its score and groups the rows by |
+//      primary key. |
+//   2. Sorts the rows of each entry with ResourceRowSorter. |
+//   3. Reads the metadata table, storing the last visit time on entries that |
+//      have resources and appending every other key to to_delete. |
+void ResourcePrefetchPredictorTables::GetAllDataHelper( |
+    PrefetchKeyType key_type, |
+    PrefetchDataMap* data_map, |
+    std::vector<std::string>* to_delete) { |
+  const char* resource_table_name = kUrlResourceTableName; |
+  const char* metadata_table_name = kUrlMetadataTableName; |
+  if (key_type == PREFETCH_KEY_TYPE_HOST) { |
+    resource_table_name = kHostResourceTableName; |
+    metadata_table_name = kHostMetadataTableName; |
+  } |
+ |
+  // Step 1: resource rows, grouped per primary key. |
+  const std::string resource_query = |
+      base::StringPrintf("SELECT * FROM %s", resource_table_name); |
+  Statement resource_reader(DB()->GetUniqueStatement(resource_query.c_str())); |
+ |
+  ResourceRow row; |
+  while (StepAndInitializeResourceRow(&resource_reader, &row)) { |
+    row.UpdateScore(); |
+ |
+    // The key is kept on the owning PrefetchData, so the stored row gives it |
+    // up: after the swap row.primary_key is empty. |
+    std::string key; |
+    key.swap(row.primary_key); |
+ |
+    PrefetchDataMap::iterator entry = data_map->find(key); |
+    if (entry == data_map->end()) { |
+      entry = data_map->insert( |
+          std::make_pair(key, PrefetchData(key_type, key))).first; |
+    } |
+    entry->second.resources.push_back(row); |
+  } |
+ |
+  // Step 2: order each entry's rows by score. |
+  for (PrefetchDataMap::iterator entry = data_map->begin(); |
+       entry != data_map->end(); ++entry) { |
+    ResourceRows& rows = entry->second.resources; |
+    std::sort(rows.begin(), rows.end(), ResourceRowSorter()); |
+  } |
+ |
+  // Step 3: metadata. Keys without any resource rows are reported back to |
+  // the caller for deletion. |
+  const std::string metadata_query = |
+      base::StringPrintf("SELECT * FROM %s", metadata_table_name); |
+  Statement metadata_reader(DB()->GetUniqueStatement(metadata_query.c_str())); |
+ |
+  while (metadata_reader.Step()) { |
+    const std::string key = metadata_reader.ColumnString(0); |
+ |
+    PrefetchDataMap::iterator entry = data_map->find(key); |
+    if (entry == data_map->end()) { |
+      to_delete->push_back(key); |
+      continue; |
+    } |
+ |
+    const int64 last_visit = metadata_reader.ColumnInt64(1); |
+    entry->second.last_visit = base::Time::FromInternalValue(last_visit); |
+  } |
+} |
+ |
+// Rewrites everything stored under data.primary_key: deletes the existing |
+// resource and metadata rows, then inserts one row per resource followed by |
+// the metadata row. Returns false as soon as any statement fails, or when a |
+// string in data exceeds the length limit (in which case a histogram sample |
+// is recorded and nothing is written). Returns true when every step succeeds. |
+bool ResourcePrefetchPredictorTables::UpdateDataHelper( |
+    const PrefetchData& data) { |
+  DCHECK(!data.primary_key.empty()); |
+ |
+  if (!StringsAreSmallerThanDBLimit(data)) { |
+    UMA_HISTOGRAM_BOOLEAN("ResourcePrefetchPredictor.DbStringTooLong", true); |
+    return false; |
+  } |
+ |
+  const bool is_host = data.is_host(); |
+ |
+  // Remove the previous rows for this key: resource table first, then the |
+  // metadata table. |
+  scoped_ptr<Statement> deleter( |
+      is_host ? GetHostResourceDeleteStatement() |
+              : GetUrlResourceDeleteStatement()); |
+  deleter->BindString(0, data.primary_key); |
+  if (!deleter->Run()) |
+    return false; |
+ |
+  deleter.reset(is_host ? GetHostMetadataDeleteStatement() |
+                        : GetUrlMetadataDeleteStatement()); |
+  deleter->BindString(0, data.primary_key); |
+  if (!deleter->Run()) |
+    return false; |
+ |
+  // Write the new resource rows. |
+  for (ResourceRows::const_iterator row = data.resources.begin(); |
+       row != data.resources.end(); ++row) { |
+    scoped_ptr<Statement> resource_inserter( |
+        is_host ? GetHostResourceUpdateStatement() |
+                : GetUrlResourceUpdateStatement()); |
+    BindResourceRowToStatement(*row, data.primary_key, |
+                               resource_inserter.get()); |
+    if (!resource_inserter->Run()) |
+      return false; |
+  } |
+ |
+  // Write the metadata row last; its result is the overall result. |
+  scoped_ptr<Statement> metadata_inserter( |
+      is_host ? GetHostMetadataUpdateStatement() |
+              : GetUrlMetadataUpdateStatement()); |
+  metadata_inserter->BindString(0, data.primary_key); |
+  metadata_inserter->BindInt64(1, data.last_visit.ToInternalValue()); |
+  return metadata_inserter->Run(); |
+} |
+ |
+// For each key, deletes its rows from the resource table and then from the |
+// metadata table of the data set selected by key_type. Failures of individual |
+// deletes are ignored. |
+void ResourcePrefetchPredictorTables::DeleteDataHelper( |
+    PrefetchKeyType key_type, |
+    const std::vector<std::string>& keys) { |
+  const bool is_host = (key_type == PREFETCH_KEY_TYPE_HOST); |
+ |
+  for (size_t i = 0; i < keys.size(); ++i) { |
+    const std::string& key = keys[i]; |
+ |
+    scoped_ptr<Statement> deleter( |
+        is_host ? GetHostResourceDeleteStatement() |
+                : GetUrlResourceDeleteStatement()); |
+    deleter->BindString(0, key); |
+    deleter->Run(); |
+ |
+    deleter.reset(is_host ? GetHostMetadataDeleteStatement() |
+                          : GetUrlMetadataDeleteStatement()); |
+    deleter->BindString(0, key); |
+    deleter->Run(); |
+  } |
+} |
+ |
+// Returns true when neither the primary key nor any resource URL spec in |
+// data is longer than kMaxStringLength. A string of exactly kMaxStringLength |
+// characters is accepted. |
+bool ResourcePrefetchPredictorTables::StringsAreSmallerThanDBLimit( |
+    const PrefetchData& data) const { |
+  bool within_limit = data.primary_key.length() <= kMaxStringLength; |
+ |
+  ResourceRows::const_iterator row = data.resources.begin(); |
+  while (within_limit && row != data.resources.end()) { |
+    within_limit = row->resource_url.spec().length() <= kMaxStringLength; |
+    ++row; |
+  } |
+  return within_limit; |
+} |
+ |
+// Makes sure all four tables exist, creating whichever ones are missing. The |
+// tables are handled in a fixed order and processing stops at the first |
+// creation failure, in which case ResetDB() is called. Must be called on the |
+// DB thread; does nothing when the database cannot be accessed. |
+void ResourcePrefetchPredictorTables::CreateTableIfNonExistent() { |
+  CHECK(BrowserThread::CurrentlyOn(BrowserThread::DB)); |
+  if (CantAccessDatabase()) |
+    return; |
+ |
+  // Schema templates; %s is replaced by the table name. |
+  const char resource_table_creator[] = |
Lei Zhang
2014/09/09 03:32:20
nit: const char resource_table_creator[]
Zhen Wang
2014/09/13 00:36:32
Done.
 |
+      "CREATE TABLE %s ( " |
+      "main_page_url TEXT, " |
+      "resource_url TEXT, " |
+      "resource_type INTEGER, " |
+      "number_of_hits INTEGER, " |
+      "number_of_misses INTEGER, " |
+      "consecutive_misses INTEGER, " |
+      "average_position DOUBLE, " |
+      "PRIMARY KEY(main_page_url, resource_url))"; |
+  const char metadata_table_creator[] = |
+      "CREATE TABLE %s ( " |
+      "main_page_url TEXT, " |
+      "last_visit_time INTEGER, " |
+      "PRIMARY KEY(main_page_url))"; |
+ |
+  sql::Connection* db = DB(); |
+ |
+  // Each step only runs while everything before it has succeeded, and only |
+  // issues CREATE TABLE when the table is not there yet. |
+  bool success = |
+      db->DoesTableExist(kUrlResourceTableName) || |
+      db->Execute(base::StringPrintf(resource_table_creator, |
+                                     kUrlResourceTableName).c_str()); |
+  success = success && |
+      (db->DoesTableExist(kUrlMetadataTableName) || |
+       db->Execute(base::StringPrintf(metadata_table_creator, |
+                                      kUrlMetadataTableName).c_str())); |
+  success = success && |
+      (db->DoesTableExist(kHostResourceTableName) || |
+       db->Execute(base::StringPrintf(resource_table_creator, |
+                                      kHostResourceTableName).c_str())); |
+  success = success && |
+      (db->DoesTableExist(kHostMetadataTableName) || |
+       db->Execute(base::StringPrintf(metadata_table_creator, |
+                                      kHostMetadataTableName).c_str())); |
+ |
+  if (!success) |
+    ResetDB(); |
+} |
+ |
+// Records the number of rows in the URL and host resource tables to the |
+// UrlTableRowCount and HostTableRowCount histograms. A count is only recorded |
+// when its query yields a row. Must be called on the DB thread; does nothing |
+// when the database cannot be accessed. |
+void ResourcePrefetchPredictorTables::LogDatabaseStats() { |
+  CHECK(BrowserThread::CurrentlyOn(BrowserThread::DB)); |
+  if (CantAccessDatabase()) |
+    return; |
+ |
+  const std::string url_query = |
+      base::StringPrintf("SELECT count(*) FROM %s", kUrlResourceTableName); |
+  Statement counter(DB()->GetUniqueStatement(url_query.c_str())); |
+  if (counter.Step()) { |
+    UMA_HISTOGRAM_COUNTS("ResourcePrefetchPredictor.UrlTableRowCount", |
+                         counter.ColumnInt(0)); |
+  } |
+ |
+  const std::string host_query = |
+      base::StringPrintf("SELECT count(*) FROM %s", kHostResourceTableName); |
+  counter.Assign(DB()->GetUniqueStatement(host_query.c_str())); |
+  if (counter.Step()) { |
+    UMA_HISTOGRAM_COUNTS("ResourcePrefetchPredictor.HostTableRowCount", |
+                         counter.ColumnInt(0)); |
+  } |
+} |
+ |
+// Returns a newly allocated Statement wrapping the cached query that deletes |
+// all URL resource rows for one main_page_url (parameter 0). Callers in this |
+// file hold the result in a scoped_ptr. |
+Statement* ResourcePrefetchPredictorTables::GetUrlResourceDeleteStatement() { |
+  const std::string sql = base::StringPrintf( |
+      "DELETE FROM %s WHERE main_page_url=?", kUrlResourceTableName); |
+  return new Statement(DB()->GetCachedStatement(SQL_FROM_HERE, sql.c_str())); |
+} |
+ |
+// Returns a newly allocated Statement wrapping the cached query that inserts |
+// one row into the URL resource table. The seven parameters follow the column |
+// order listed in the query. Callers in this file hold the result in a |
+// scoped_ptr. |
+Statement* ResourcePrefetchPredictorTables::GetUrlResourceUpdateStatement() { |
+  const std::string sql = base::StringPrintf( |
+      "INSERT INTO %s " |
+      "(main_page_url, resource_url, resource_type, number_of_hits, " |
+      "number_of_misses, consecutive_misses, average_position) " |
+      "VALUES (?,?,?,?,?,?,?)", |
+      kUrlResourceTableName); |
+  return new Statement(DB()->GetCachedStatement(SQL_FROM_HERE, sql.c_str())); |
+} |
+ |
+// Returns a newly allocated Statement wrapping the cached query that deletes |
+// the URL metadata row for one main_page_url (parameter 0). Callers in this |
+// file hold the result in a scoped_ptr. |
+Statement* ResourcePrefetchPredictorTables::GetUrlMetadataDeleteStatement() { |
+  const std::string sql = base::StringPrintf( |
+      "DELETE FROM %s WHERE main_page_url=?", kUrlMetadataTableName); |
+  return new Statement(DB()->GetCachedStatement(SQL_FROM_HERE, sql.c_str())); |
+} |
+ |
+// Returns a newly allocated Statement wrapping the cached query that inserts |
+// one (main_page_url, last_visit_time) row into the URL metadata table. |
+// Callers in this file hold the result in a scoped_ptr. |
+Statement* ResourcePrefetchPredictorTables::GetUrlMetadataUpdateStatement() { |
+  const std::string sql = base::StringPrintf( |
+      "INSERT INTO %s (main_page_url, last_visit_time) VALUES (?,?)", |
+      kUrlMetadataTableName); |
+  return new Statement(DB()->GetCachedStatement(SQL_FROM_HERE, sql.c_str())); |
+} |
+ |
+// Returns a newly allocated Statement wrapping the cached query that deletes |
+// all host resource rows for one main_page_url (parameter 0). Callers in this |
+// file hold the result in a scoped_ptr. |
+Statement* ResourcePrefetchPredictorTables::GetHostResourceDeleteStatement() { |
+  const std::string sql = base::StringPrintf( |
+      "DELETE FROM %s WHERE main_page_url=?", kHostResourceTableName); |
+  return new Statement(DB()->GetCachedStatement(SQL_FROM_HERE, sql.c_str())); |
+} |
+ |
+// Returns a newly allocated Statement wrapping the cached query that inserts |
+// one row into the host resource table. The seven parameters follow the |
+// column order listed in the query. Callers in this file hold the result in |
+// a scoped_ptr. |
+Statement* ResourcePrefetchPredictorTables::GetHostResourceUpdateStatement() { |
+  const std::string sql = base::StringPrintf( |
+      "INSERT INTO %s " |
+      "(main_page_url, resource_url, resource_type, number_of_hits, " |
+      "number_of_misses, consecutive_misses, average_position) " |
+      "VALUES (?,?,?,?,?,?,?)", |
+      kHostResourceTableName); |
+  return new Statement(DB()->GetCachedStatement(SQL_FROM_HERE, sql.c_str())); |
+} |
+ |
+// Returns a newly allocated Statement wrapping the cached query that deletes |
+// the host metadata row for one main_page_url (parameter 0). Callers in this |
+// file hold the result in a scoped_ptr. |
+Statement* ResourcePrefetchPredictorTables::GetHostMetadataDeleteStatement() { |
+  const std::string sql = base::StringPrintf( |
+      "DELETE FROM %s WHERE main_page_url=?", kHostMetadataTableName); |
+  return new Statement(DB()->GetCachedStatement(SQL_FROM_HERE, sql.c_str())); |
+} |
+ |
+// Returns a newly allocated Statement wrapping the cached query that inserts |
+// one (main_page_url, last_visit_time) row into the host metadata table. |
+// Callers in this file hold the result in a scoped_ptr. |
+Statement* ResourcePrefetchPredictorTables::GetHostMetadataUpdateStatement() { |
+  const std::string sql = base::StringPrintf( |
+      "INSERT INTO %s (main_page_url, last_visit_time) VALUES (?,?)", |
+      kHostMetadataTableName); |
+  return new Statement(DB()->GetCachedStatement(SQL_FROM_HERE, sql.c_str())); |
+} |
+ |
+} // namespace predictors |