OLD | NEW |
(Empty) | |
| 1 // Copyright 2014 The Chromium Authors. All rights reserved. |
| 2 // Use of this source code is governed by a BSD-style license that can be |
| 3 // found in the LICENSE file. |
| 4 |
| 5 #ifndef CHROME_BROWSER_PREDICTORS_RESOURCE_PREFETCH_PREDICTOR_H_ |
| 6 #define CHROME_BROWSER_PREDICTORS_RESOURCE_PREFETCH_PREDICTOR_H_ |
| 7 |
| 8 #include <map> |
| 9 #include <string> |
| 10 #include <vector> |
| 11 |
| 12 #include "base/gtest_prod_util.h" |
| 13 #include "base/memory/linked_ptr.h" |
| 14 #include "base/memory/scoped_ptr.h" |
| 15 #include "base/memory/weak_ptr.h" |
| 16 #include "base/task/cancelable_task_tracker.h" |
| 17 #include "base/time/time.h" |
| 18 #include "chrome/browser/history/history_types.h" |
| 19 #include "chrome/browser/predictors/resource_prefetch_common.h" |
| 20 #include "chrome/browser/predictors/resource_prefetch_predictor_tables.h" |
| 21 #include "chrome/browser/predictors/resource_prefetcher.h" |
| 22 #include "components/keyed_service/core/keyed_service.h" |
| 23 #include "content/public/browser/notification_observer.h" |
| 24 #include "content/public/browser/notification_registrar.h" |
| 25 #include "content/public/common/resource_type.h" |
| 26 #include "url/gurl.h" |
| 27 |
| 28 class PredictorsHandler; |
| 29 class Profile; |
| 30 |
| 31 namespace content { |
| 32 class WebContents; |
| 33 } |
| 34 |
| 35 namespace net { |
| 36 class URLRequest; |
| 37 } |
| 38 |
| 39 namespace predictors { |
| 40 |
| 41 class ResourcePrefetcherManager; |
| 42 |
| 43 // Contains logic for learning what can be prefetched and for kicking off |
| 44 // speculative prefetching. |
| 45 // - The class is a profile keyed service owned by the profile. |
| 46 // - All the non-static methods of this class need to be called on the UI |
| 47 // thread. |
| 48 // |
| 49 // The overall flow of the resource prefetching algorithm is as follows: |
| 50 // |
| 51 // * ResourcePrefetchPredictorObserver - Listens for URL requests, responses and |
| 52 // redirects on the IO thread (via ResourceDispatcherHostDelegate) and posts |
| 53 // tasks to the ResourcePrefetchPredictor on the UI thread. This is owned by |
| 54 // the ProfileIOData for the profile. |
| 55 // * ResourcePrefetchPredictorTables - Persists ResourcePrefetchPredictor data |
| 56 // to a sql database. Runs entirely on the DB thread. Owned by the |
| 57 // PredictorDatabase. |
| 58 // * ResourcePrefetchPredictor - Learns about resource requirements per URL in |
| 59 // the UI thread through the ResourcePrefetchPredictorObserver and persists |
| 60 // it to disk in the DB thread through the ResourcePrefetchPredictorTables. It |
| 61 // initiates resource prefetching using the ResourcePrefetcherManager. Owned |
| 62 // by profile. |
| 63 // * ResourcePrefetcherManager - Manages the ResourcePrefetchers that do the |
| 64 // prefetching on the IO thread. The manager is owned by the |
| 65 // ResourcePrefetchPredictor and interfaces between the predictor on the UI |
| 66 // thread and the prefetchers on the IO thread. |
| 67 // * ResourcePrefetcher - Lives entirely on the IO thread, owned by the |
| 68 // ResourcePrefetcherManager, and issues net::URLRequest to fetch resources. |
| 69 // |
| 70 // TODO(shishir): Do speculative prefetching for https resources and/or https |
| 71 // main frame urls. |
| 72 // TODO(zhenw): Currently only main frame requests/redirects/responses are |
| 73 // recorded. Consider recording sub-frame responses independently or together |
| 74 // with main frame. |
| 75 class ResourcePrefetchPredictor |
| 76 : public KeyedService, |
| 77 public content::NotificationObserver, |
| 78 public base::SupportsWeakPtr<ResourcePrefetchPredictor> { |
| 79 public: |
| 80 // Stores the data that the predictor needs to get from the URLRequest. |
| 81 struct URLRequestSummary { |
| 82 URLRequestSummary(); |
| 83 URLRequestSummary(const URLRequestSummary& other); |
| 84 ~URLRequestSummary(); |
| 85 |
| 86 NavigationID navigation_id; |
| 87 GURL resource_url; |
| 88 content::ResourceType resource_type; |
| 89 |
| 90 // Only for responses. |
| 91 std::string mime_type; |
| 92 bool was_cached; |
| 93 GURL redirect_url; // Empty unless request was redirected to a valid url. |
| 94 }; |
| 95 |
| 96 ResourcePrefetchPredictor(const ResourcePrefetchPredictorConfig& config, |
| 97 Profile* profile); |
| 98 virtual ~ResourcePrefetchPredictor(); |
| 99 |
| 100 // Thread safe. Return whether the corresponding event should be recorded. |
| 101 static bool ShouldRecordRequest(net::URLRequest* request, |
| 102 content::ResourceType resource_type); |
| 103 static bool ShouldRecordResponse(net::URLRequest* response); |
| 104 static bool ShouldRecordRedirect(net::URLRequest* response); |
| 105 |
| 106 // Determines the ResourceType from the mime type, defaulting to the |
| 107 // |fallback| if the ResourceType could not be determined. |
| 108 static content::ResourceType GetResourceTypeFromMimeType( |
| 109 const std::string& mime_type, |
| 110 content::ResourceType fallback); |
| 111 |
| 112 // ResourcePrefetchPredictorObserver calls the functions below to inform the |
| 113 // predictor of main frame and resource requests. Should only be called if the |
| 114 // corresponding Should* functions return true. |
| 115 void RecordURLRequest(const URLRequestSummary& request); |
| 116 void RecordURLResponse(const URLRequestSummary& response); |
| 117 void RecordURLRedirect(const URLRequestSummary& response); |
| 118 |
| 119 // Called when the main frame of a page completes loading. |
| 120 void RecordMainFrameLoadComplete(const NavigationID& navigation_id); |
| 121 |
| 122 // Called by ResourcePrefetcherManager to notify that prefetching has finished |
| 123 // for a navigation. Should take ownership of |requests|. |
| 124 virtual void FinishedPrefetchForNavigation( |
| 125 const NavigationID& navigation_id, |
| 126 PrefetchKeyType key_type, |
| 127 ResourcePrefetcher::RequestVector* requests); |
| 128 |
| 129 private: |
| 130 friend class ::PredictorsHandler; |
| 131 friend class ResourcePrefetchPredictorTest; |
| 132 |
| 133 FRIEND_TEST_ALL_PREFIXES(ResourcePrefetchPredictorTest, DeleteUrls); |
| 134 FRIEND_TEST_ALL_PREFIXES(ResourcePrefetchPredictorTest, |
| 135 LazilyInitializeEmpty); |
| 136 FRIEND_TEST_ALL_PREFIXES(ResourcePrefetchPredictorTest, |
| 137 LazilyInitializeWithData); |
| 138 FRIEND_TEST_ALL_PREFIXES(ResourcePrefetchPredictorTest, |
| 139 NavigationNotRecorded); |
| 140 FRIEND_TEST_ALL_PREFIXES(ResourcePrefetchPredictorTest, NavigationUrlInDB); |
| 141 FRIEND_TEST_ALL_PREFIXES(ResourcePrefetchPredictorTest, NavigationUrlNotInDB); |
| 142 FRIEND_TEST_ALL_PREFIXES(ResourcePrefetchPredictorTest, |
| 143 NavigationUrlNotInDBAndDBFull); |
| 144 FRIEND_TEST_ALL_PREFIXES(ResourcePrefetchPredictorTest, OnMainFrameRequest); |
| 145 FRIEND_TEST_ALL_PREFIXES(ResourcePrefetchPredictorTest, OnMainFrameRedirect); |
| 146 FRIEND_TEST_ALL_PREFIXES(ResourcePrefetchPredictorTest, |
| 147 OnSubresourceResponse); |
| 148 |
| 149 enum InitializationState { |
| 150 NOT_INITIALIZED = 0, |
| 151 INITIALIZING = 1, |
| 152 INITIALIZED = 2 |
| 153 }; |
| 154 |
| 155 // Stores prefetching results. |
| 156 struct Result { |
| 157 // Takes ownership of |requests|. |
| 158 Result(PrefetchKeyType key_type, |
| 159 ResourcePrefetcher::RequestVector* requests); |
| 160 ~Result(); |
| 161 |
| 162 PrefetchKeyType key_type; |
| 163 scoped_ptr<ResourcePrefetcher::RequestVector> requests; |
| 164 |
| 165 private: |
| 166 DISALLOW_COPY_AND_ASSIGN(Result); |
| 167 }; |
| 168 |
| 169 typedef ResourcePrefetchPredictorTables::ResourceRow ResourceRow; |
| 170 typedef ResourcePrefetchPredictorTables::ResourceRows ResourceRows; |
| 171 typedef ResourcePrefetchPredictorTables::PrefetchData PrefetchData; |
| 172 typedef ResourcePrefetchPredictorTables::PrefetchDataMap PrefetchDataMap; |
| 173 typedef std::map<NavigationID, linked_ptr<std::vector<URLRequestSummary> > > |
| 174 NavigationMap; |
| 175 typedef std::map<NavigationID, Result*> ResultsMap; |
| 176 |
| 177 // Returns true if the main page request is supported for prediction. |
| 178 static bool IsHandledMainPage(net::URLRequest* request); |
| 179 |
| 180 // Returns true if the subresource request is supported for prediction. |
| 181 static bool IsHandledSubresource(net::URLRequest* request); |
| 182 |
| 183 // Returns true if the request (should have a response in it) is cacheable. |
| 184 static bool IsCacheable(const net::URLRequest* request); |
| 185 |
| 186 // content::NotificationObserver implementation. |
| 187 virtual void Observe(int type, |
| 188 const content::NotificationSource& source, |
| 189 const content::NotificationDetails& details) OVERRIDE; |
| 190 |
| 191 // KeyedService implementation. |
| 192 virtual void Shutdown() OVERRIDE; |
| 193 |
| 194 // Functions called on different network events pertaining to the loading of |
| 195 // main frame resources or subresources. |
| 196 void OnMainFrameRequest(const URLRequestSummary& request); |
| 197 void OnMainFrameResponse(const URLRequestSummary& response); |
| 198 void OnMainFrameRedirect(const URLRequestSummary& response); |
| 199 void OnSubresourceResponse(const URLRequestSummary& response); |
| 200 |
| 201 // Called when onload completes for a navigation. We treat this point as the |
| 202 // "completion" of the navigation. The resources requested by the page up to |
| 203 // this point are the only ones considered for prefetching. |
| 204 void OnNavigationComplete(const NavigationID& navigation_id); |
| 205 |
| 206 // Returns true if there is PrefetchData that can be used for the |
| 207 // navigation and fills in |prefetch_requests| with the resources that need |
| 208 // to be prefetched. |
| 209 bool GetPrefetchData(const NavigationID& navigation_id, |
| 210 ResourcePrefetcher::RequestVector* prefetch_requests, |
| 211 PrefetchKeyType* key_type); |
| 212 |
| 213 // Converts a PrefetchData into a ResourcePrefetcher::RequestVector. |
| 214 void PopulatePrefetcherRequest(const PrefetchData& data, |
| 215 ResourcePrefetcher::RequestVector* requests); |
| 216 |
| 217 // Starts prefetching if it is enabled and prefetching data exists for the |
| 218 // NavigationID either at the URL or at the host level. |
| 219 void StartPrefetching(const NavigationID& navigation_id); |
| 220 |
| 221 // Stops prefetching that may be in progress corresponding to |navigation_id|. |
| 222 void StopPrefetching(const NavigationID& navigation_id); |
| 223 |
| 224 // Starts initialization by posting a task to the DB thread to read the |
| 225 // predictor database. |
| 226 void StartInitialization(); |
| 227 |
| 228 // Callback for task to read predictor database. Takes ownership of |
| 229 // |url_data_map| and |host_data_map|. |
| 230 void CreateCaches(scoped_ptr<PrefetchDataMap> url_data_map, |
| 231 scoped_ptr<PrefetchDataMap> host_data_map); |
| 232 |
| 233 // Called during initialization once history has been loaded and the predictor |
| 234 // database has been read. |
| 235 void OnHistoryAndCacheLoaded(); |
| 236 |
| 237 // Removes data for navigations where the onload never fired. Cleans up |
| 238 // inflight_navigations_ and results_map_. |
| 239 void CleanupAbandonedNavigations(const NavigationID& navigation_id); |
| 240 |
| 241 // Deletes all URLs from the predictor database, the caches and removes all |
| 242 // inflight navigations. |
| 243 void DeleteAllUrls(); |
| 244 |
| 245 // Deletes data for the input |urls| and their corresponding hosts from the |
| 246 // predictor database and caches. |
| 247 void DeleteUrls(const history::URLRows& urls); |
| 248 |
| 249 // Callback for GetUrlVisitCountTask. |
| 250 void OnVisitCountLookup(size_t visit_count, |
| 251 const NavigationID& navigation_id, |
| 252 const std::vector<URLRequestSummary>& requests); |
| 253 |
| 254 // Removes the oldest entry in the input |data_map|, also deleting it from the |
| 255 // predictor database. |
| 256 void RemoveOldestEntryInPrefetchDataMap(PrefetchKeyType key_type, |
| 257 PrefetchDataMap* data_map); |
| 258 |
| 259 // Merges resources in |new_resources| into the |data_map| and correspondingly |
| 260 // updates the predictor database. |
| 261 void LearnNavigation(const std::string& key, |
| 262 PrefetchKeyType key_type, |
| 263 const std::vector<URLRequestSummary>& new_resources, |
| 264 size_t max_data_map_size, |
| 265 PrefetchDataMap* data_map); |
| 266 |
| 267 // Reports accuracy by comparing prefetched resources with resources that are |
| 268 // actually used by the page. |
| 269 void ReportAccuracyStats(PrefetchKeyType key_type, |
| 270 const std::vector<URLRequestSummary>& actual, |
| 271 ResourcePrefetcher::RequestVector* prefetched) const; |
| 272 |
| 273 // Reports predicted accuracy, i.e. by comparing resources that are actually |
| 274 // used by the page with those that may have been prefetched. |
| 275 void ReportPredictedAccuracyStats( |
| 276 PrefetchKeyType key_type, |
| 277 const std::vector<URLRequestSummary>& actual, |
| 278 const ResourcePrefetcher::RequestVector& predicted) const; |
| 279 void ReportPredictedAccuracyStatsHelper( |
| 280 PrefetchKeyType key_type, |
| 281 const ResourcePrefetcher::RequestVector& predicted, |
| 282 const std::map<GURL, bool>& actual, |
| 283 size_t total_resources_fetched_from_network, |
| 284 size_t max_assumed_prefetched) const; |
| 285 |
| 286 // Used for testing to inject mock tables. |
| 287 void set_mock_tables(scoped_refptr<ResourcePrefetchPredictorTables> tables) { |
| 288 tables_ = tables; |
| 289 } |
| 290 |
| 291 Profile* const profile_; |
| 292 ResourcePrefetchPredictorConfig const config_; |
| 293 InitializationState initialization_state_; |
| 294 scoped_refptr<ResourcePrefetchPredictorTables> tables_; |
| 295 scoped_refptr<ResourcePrefetcherManager> prefetch_manager_; |
| 296 content::NotificationRegistrar notification_registrar_; |
| 297 base::CancelableTaskTracker history_lookup_consumer_; |
| 298 |
| 299 // Map of all the navigations in flight to their resource requests. |
| 300 NavigationMap inflight_navigations_; |
| 301 |
| 302 // Copy of the data in the predictor tables. |
| 303 scoped_ptr<PrefetchDataMap> url_table_cache_; |
| 304 scoped_ptr<PrefetchDataMap> host_table_cache_; |
| 305 |
| 306 ResultsMap results_map_; |
| 307 STLValueDeleter<ResultsMap> results_map_deleter_; |
| 308 |
| 309 DISALLOW_COPY_AND_ASSIGN(ResourcePrefetchPredictor); |
| 310 }; |
| 311 |
| 312 } // namespace predictors |
| 313 |
| 314 #endif // CHROME_BROWSER_PREDICTORS_RESOURCE_PREFETCH_PREDICTOR_H_ |
OLD | NEW |