1 // Copyright 2014 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
5 #ifndef CHROME_BROWSER_PREDICTORS_RESOURCE_PREFETCH_PREDICTOR_H_
6 #define CHROME_BROWSER_PREDICTORS_RESOURCE_PREFETCH_PREDICTOR_H_
12 #include "base/gtest_prod_util.h"
13 #include "base/memory/linked_ptr.h"
14 #include "base/memory/scoped_ptr.h"
15 #include "base/memory/weak_ptr.h"
16 #include "base/task/cancelable_task_tracker.h"
17 #include "base/time/time.h"
18 #include "chrome/browser/history/history_types.h"
19 #include "chrome/browser/predictors/resource_prefetch_common.h"
20 #include "chrome/browser/predictors/resource_prefetch_predictor_tables.h"
21 #include "chrome/browser/predictors/resource_prefetcher.h"
22 #include "components/keyed_service/core/keyed_service.h"
23 #include "content/public/browser/notification_observer.h"
24 #include "content/public/browser/notification_registrar.h"
25 #include "content/public/common/resource_type.h"
// Forward declaration in the global namespace. The class is befriended by
// predictors::ResourcePrefetchPredictor (`friend class ::PredictorsHandler`).
28 class PredictorsHandler
;
39 namespace predictors
{
// Forward declaration. ResourcePrefetchPredictor keeps a
// scoped_refptr<ResourcePrefetcherManager> member (prefetch_manager_).
41 class ResourcePrefetcherManager
;
43 // Contains logic for learning what can be prefetched and for kicking off
44 // speculative prefetching.
45 // - The class is a profile keyed service owned by the profile.
46 // - All the non-static methods of this class need to be called on the UI thread.
49 // The overall flow of the resource prefetching algorithm is as follows:
51 // * ResourcePrefetchPredictorObserver - Listens for URL requests, responses and
52 // redirects on the IO thread (via ResourceDispatcherHostDelegate) and posts
53 // tasks to the ResourcePrefetchPredictor on the UI thread. This is owned by
54 // the ProfileIOData for the profile.
55 // * ResourcePrefetchPredictorTables - Persists ResourcePrefetchPredictor data
56 // to a sql database. Runs entirely on the DB thread. Owned by the PredictorDatabase.
58 // * ResourcePrefetchPredictor - Learns about resource requirements per URL in
59 // the UI thread through the ResourcePrefetchPredictorObserver and persists
60 // it to disk in the DB thread through the ResourcePrefetchPredictorTables. It
61 // initiates resource prefetching using the ResourcePrefetcherManager. Owned by the profile.
63 // * ResourcePrefetcherManager - Manages the ResourcePrefetchers that do the
64 // prefetching on the IO thread. The manager is owned by the
65 // ResourcePrefetchPredictor and interfaces between the predictor on the UI
66 // thread and the prefetchers on the IO thread.
67 // * ResourcePrefetcher - Lives entirely on the IO thread, owned by the
68 // ResourcePrefetcherManager, and issues net::URLRequest to fetch resources.
70 // TODO(shishir): Do speculative prefetching for https resources and/or https main frame urls.
72 // TODO(zhenw): Currently only main frame requests/redirects/responses are
73 // recorded. Consider recording sub-frame responses independently or together with main frame.
75 class ResourcePrefetchPredictor
// KeyedService: source of the Shutdown() method overridden further down.
76 : public KeyedService
,
// content::NotificationObserver: source of the Observe() callback overridden
// further down.
77 public content::NotificationObserver
,
// base::SupportsWeakPtr: presumably lets other code obtain weak pointers to
// this object -- TODO confirm where they are handed out.
78 public base::SupportsWeakPtr
<ResourcePrefetchPredictor
> {
80 // Stores the data that we need to get from the URLRequest.
// NOTE(review): only part of this struct is visible here; the comments below
// cover the members that are shown.
81 struct URLRequestSummary
{
// Copy constructor.
83 URLRequestSummary(const URLRequestSummary
& other
);
// Navigation this request belongs to. NavigationID is also the key type of the
// predictor's per-navigation maps.
86 NavigationID navigation_id
;
// Resource type of the request.
88 content::ResourceType resource_type
;
90 // Only for responses.
91 std::string mime_type
;
93 GURL redirect_url
; // Empty unless request was redirected to a valid url.
// Constructs the predictor from |config|.
// NOTE(review): the rest of this parameter list is not visible here; the
// class also has a `Profile* const profile_` member, so a profile argument is
// presumably expected -- confirm against the full header.
96 ResourcePrefetchPredictor(const ResourcePrefetchPredictorConfig
& config
,
// Virtual destructor; the class derives from KeyedService and
// content::NotificationObserver and overrides their virtual methods.
98 virtual ~ResourcePrefetchPredictor();
// Static predicates that decide whether a net::URLRequest should be reported
// to the predictor. The matching Record* method (RecordURLRequest,
// RecordURLResponse, RecordURLRedirect) should only be called when the
// corresponding Should* function returned true.
// NOTE(review): these are static and therefore independent of instance state;
// whether they may be called off the UI thread is not stated here -- confirm
// against the implementation.
//
// |request| is the request being considered and |resource_type| its type.
101 static bool ShouldRecordRequest(net::URLRequest
* request
,
102 content::ResourceType resource_type
);
// |response| is the URLRequest whose response is being considered.
103 static bool ShouldRecordResponse(net::URLRequest
* response
);
// |response| is the URLRequest being considered for redirect recording.
104 static bool ShouldRecordRedirect(net::URLRequest
* response
);
106 // Determines the ResourceType from the mime type, defaulting to the
107 // |fallback| if the ResourceType could not be determined.
//   |mime_type| - mime type string to classify.
//   |fallback|  - value returned when |mime_type| maps to no ResourceType.
108 static content::ResourceType
GetResourceTypeFromMimeType(
109 const std::string
& mime_type
,
110 content::ResourceType fallback
);
112 // 'ResourcePrefetchPredictorObserver' calls the below functions to inform the
113 // predictor of main frame and resource requests. Should only be called if the
114 // corresponding Should* functions return true.
// Each call takes a URLRequestSummary describing the event. Per the class
// comment, the observer posts these calls to the UI thread.
115 void RecordURLRequest(const URLRequestSummary
& request
);
116 void RecordURLResponse(const URLRequestSummary
& response
);
// NOTE(review): the parameter is named |response| although it describes a
// redirect; the summary's redirect_url field carries the redirect target.
117 void RecordURLRedirect(const URLRequestSummary
& response
);
119 // Called when the main frame of a page completes loading.
// |navigation_id| identifies the navigation whose main frame finished loading.
120 void RecordMainFrameLoadComplete(const NavigationID
& navigation_id
);
122 // Called by ResourcePrefetcherManager to notify that prefetching has finished
123 // for a navigation. Should take ownership of |requests|.
//   |navigation_id| - navigation the prefetch was issued for.
//   |key_type|      - PrefetchKeyType of the prefetch.
//   |requests|      - raw pointer; the callee is expected to take ownership, so
//                     the caller must not delete it afterwards.
// Declared virtual, presumably so tests can override it -- TODO confirm.
124 virtual void FinishedPrefetchForNavigation(
125 const NavigationID
& navigation_id
,
126 PrefetchKeyType key_type
,
127 ResourcePrefetcher::RequestVector
* requests
);
// Classes granted access to this class's non-public members:
// ::PredictorsHandler (global namespace) and the unit-test fixture.
130 friend class ::PredictorsHandler
;
131 friend class ResourcePrefetchPredictorTest
;
// Individual ResourcePrefetchPredictorTest cases that are also befriended
// (one FRIEND_TEST_ALL_PREFIXES entry per test name).
133 FRIEND_TEST_ALL_PREFIXES(ResourcePrefetchPredictorTest
, DeleteUrls
);
134 FRIEND_TEST_ALL_PREFIXES(ResourcePrefetchPredictorTest
,
135 LazilyInitializeEmpty
);
136 FRIEND_TEST_ALL_PREFIXES(ResourcePrefetchPredictorTest
,
137 LazilyInitializeWithData
);
138 FRIEND_TEST_ALL_PREFIXES(ResourcePrefetchPredictorTest
,
139 NavigationNotRecorded
);
140 FRIEND_TEST_ALL_PREFIXES(ResourcePrefetchPredictorTest
, NavigationUrlInDB
);
141 FRIEND_TEST_ALL_PREFIXES(ResourcePrefetchPredictorTest
, NavigationUrlNotInDB
);
142 FRIEND_TEST_ALL_PREFIXES(ResourcePrefetchPredictorTest
,
143 NavigationUrlNotInDBAndDBFull
);
144 FRIEND_TEST_ALL_PREFIXES(ResourcePrefetchPredictorTest
, OnMainFrameRequest
);
145 FRIEND_TEST_ALL_PREFIXES(ResourcePrefetchPredictorTest
, OnMainFrameRedirect
);
146 FRIEND_TEST_ALL_PREFIXES(ResourcePrefetchPredictorTest
,
147 OnSubresourceResponse
);
// Type of the initialization_state_ member.
// NOTE(review): the enumerators are not visible here.
149 enum InitializationState
{
155 // Stores prefetching results.
// NOTE(review): the line that opens this type is not visible here; the
// members below belong to `Result`.
157 // Takes ownership of requests.
//   |key_type| - PrefetchKeyType of the prefetch.
//   |requests| - raw pointer whose ownership passes to this object.
158 Result(PrefetchKeyType key_type
,
159 ResourcePrefetcher::RequestVector
* requests
);
// Presumably the key type passed to the constructor -- TODO confirm.
162 PrefetchKeyType key_type
;
// Owning pointer to the request vector.
163 scoped_ptr
<ResourcePrefetcher::RequestVector
> requests
;
// Copy construction and assignment are disallowed.
166 DISALLOW_COPY_AND_ASSIGN(Result
);
// Short aliases for types nested in ResourcePrefetchPredictorTables.
169 typedef ResourcePrefetchPredictorTables::ResourceRow ResourceRow
;
170 typedef ResourcePrefetchPredictorTables::ResourceRows ResourceRows
;
171 typedef ResourcePrefetchPredictorTables::PrefetchData PrefetchData
;
172 typedef ResourcePrefetchPredictorTables::PrefetchDataMap PrefetchDataMap
;
// Maps a NavigationID to a linked_ptr-held vector of URLRequestSummary.
// NOTE(review): the alias name of this typedef is not visible here;
// presumably NavigationMap, the type of inflight_navigations_ -- TODO confirm.
173 typedef std::map
<NavigationID
, linked_ptr
<std::vector
<URLRequestSummary
> > >
// Maps a NavigationID to a raw Result pointer. The map does not delete its
// values itself; see results_map_deleter_ (STLValueDeleter<ResultsMap>).
175 typedef std::map
<NavigationID
, Result
*> ResultsMap
;
// Static helper predicates over a net::URLRequest.
177 // Returns true if the main page request is supported for prediction.
178 static bool IsHandledMainPage(net::URLRequest
* request
);
180 // Returns true if the subresource request is supported for prediction.
181 static bool IsHandledSubresource(net::URLRequest
* request
);
183 // Returns true if the request (should have a response in it) is cacheable.
// Takes a pointer to const, unlike the two predicates above.
184 static bool IsCacheable(const net::URLRequest
* request
);
186 // content::NotificationObserver methods OVERRIDE.
// Receives a notification identified by |type|, together with its |source|
// and |details|. Which notification types are registered (through
// notification_registrar_) is not visible in this header.
187 virtual void Observe(int type
,
188 const content::NotificationSource
& source
,
189 const content::NotificationDetails
& details
) OVERRIDE
;
191 // KeyedService methods OVERRIDE.
// Shutdown hook inherited from KeyedService.
192 virtual void Shutdown() OVERRIDE
;
194 // Functions called on different network events pertaining to the loading of
195 // main frame resource or sub resources.
// Each handler receives the URLRequestSummary describing the event.
// Presumably dispatched from the public Record* methods -- TODO confirm in
// the implementation.
196 void OnMainFrameRequest(const URLRequestSummary
& request
);
197 void OnMainFrameResponse(const URLRequestSummary
& response
);
198 void OnMainFrameRedirect(const URLRequestSummary
& response
);
199 void OnSubresourceResponse(const URLRequestSummary
& response
);
201 // Called when onload completes for a navigation. We treat this point as the
202 // "completion" of the navigation. The resources requested by the page up to
203 // this point are the only ones considered for prefetching.
// |navigation_id| identifies the navigation that completed.
204 void OnNavigationComplete(const NavigationID
& navigation_id
);
206 // Returns true if there is PrefetchData that can be used for the
207 // navigation and fills in |prefetch_requests| with the resources that need to be
// prefetched.
//   |navigation_id|     - navigation to look up.
//   |prefetch_requests| - output vector of requests to prefetch.
//   |key_type|          - pointer parameter; presumably an output reporting
//                         which key type matched -- TODO confirm.
209 bool GetPrefetchData(const NavigationID
& navigation_id
,
210 ResourcePrefetcher::RequestVector
* prefetch_requests
,
211 PrefetchKeyType
* key_type
);
213 // Converts a PrefetchData into a ResourcePrefetcher::RequestVector.
//   |data|     - source PrefetchData (read-only).
//   |requests| - output vector that receives the converted requests.
214 void PopulatePrefetcherRequest(const PrefetchData
& data
,
215 ResourcePrefetcher::RequestVector
* requests
);
217 // Starts prefetching if it is enabled and prefetching data exists for the
218 // NavigationID either at the URL or at the host level.
// |navigation_id| identifies the navigation to prefetch for.
219 void StartPrefetching(const NavigationID
& navigation_id
);
221 // Stops prefetching that may be in progress corresponding to |navigation_id|.
222 void StopPrefetching(const NavigationID
& navigation_id
);
// Initialization: StartInitialization() requests a database read,
// CreateCaches() receives the data that was read, and
// OnHistoryAndCacheLoaded() runs once both history and the database are
// available.
224 // Starts initialization by posting a task to the DB thread to read the
225 // predictor database.
226 void StartInitialization();
228 // Callback for task to read predictor database. Takes ownership of
229 // |url_data_map| and |host_data_map|.
// Both maps arrive as scoped_ptr by value, which transfers ownership to this
// method.
230 void CreateCaches(scoped_ptr
<PrefetchDataMap
> url_data_map
,
231 scoped_ptr
<PrefetchDataMap
> host_data_map
);
233 // Called during initialization when history is read and the predictor
234 // database has been read.
235 void OnHistoryAndCacheLoaded();
237 // Removes data for navigations where the onload never fired. Will cleanup
238 // inflight_navigations_ and results_map_.
// NOTE(review): how |navigation_id| is used when deciding which entries are
// abandoned is not visible in this header -- see the implementation.
239 void CleanupAbandonedNavigations(const NavigationID
& navigation_id
);
241 // Deletes all URLs from the predictor database, the caches and removes all
242 // inflight navigations.
243 void DeleteAllUrls();
245 // Deletes data for the input |urls| and their corresponding hosts from the
246 // predictor database and caches.
// |urls| is a history::URLRows collection.
247 void DeleteUrls(const history::URLRows
& urls
);
249 // Callback for GetUrlVisitCountTask.
//   |visit_count|   - visit count reported by the lookup task.
//   |navigation_id| - navigation the lookup was issued for.
//   |requests|      - request summaries associated with that navigation.
// NOTE(review): parameter meanings are inferred from their names and types;
// confirm against the implementation.
250 void OnVisitCountLookup(size_t visit_count
,
251 const NavigationID
& navigation_id
,
252 const std::vector
<URLRequestSummary
>& requests
);
254 // Removes the oldest entry in the input |data_map|, also deleting it from the
255 // predictor database.
//   |key_type| - PrefetchKeyType of the entries held in |data_map|.
//   |data_map| - map to remove from; modified in place.
256 void RemoveOldestEntryInPrefetchDataMap(PrefetchKeyType key_type
,
257 PrefetchDataMap
* data_map
);
259 // Merges resources in |new_resources| into the |data_map| and correspondingly
260 // updates the predictor database.
//   |key|               - string key of the entry to update in |data_map|.
//   |key_type|          - PrefetchKeyType of |key|.
//   |new_resources|     - request summaries to merge in.
//   |max_data_map_size| - size limit for |data_map|; presumably triggers
//                         eviction of old entries when reached -- TODO confirm.
//   |data_map|          - map to update; modified in place.
261 void LearnNavigation(const std::string
& key
,
262 PrefetchKeyType key_type
,
263 const std::vector
<URLRequestSummary
>& new_resources
,
264 size_t max_data_map_size
,
265 PrefetchDataMap
* data_map
);
// Accuracy reporting. All three methods are const.
267 // Reports accuracy by comparing prefetched resources with resources that are
268 // actually used by the page.
//   |key_type|   - PrefetchKeyType of the prefetch being evaluated.
//   |actual|     - request summaries of resources the page actually used.
//   |prefetched| - requests that were prefetched; passed as a non-const
//                  pointer, so the callee may modify it.
269 void ReportAccuracyStats(PrefetchKeyType key_type
,
270 const std::vector
<URLRequestSummary
>& actual
,
271 ResourcePrefetcher::RequestVector
* prefetched
) const;
273 // Reports predicted accuracy i.e. by comparing resources that are actually
274 // used by the page with those that may have been prefetched.
//   |predicted| - requests that may have been prefetched (read-only).
275 void ReportPredictedAccuracyStats(
276 PrefetchKeyType key_type
,
277 const std::vector
<URLRequestSummary
>& actual
,
278 const ResourcePrefetcher::RequestVector
& predicted
) const;
// Helper for ReportPredictedAccuracyStats (by name).
//   |actual| - map from resource URL to a bool flag; the flag's meaning is not
//              visible here -- TODO confirm in the implementation.
//   |total_resources_fetched_from_network|, |max_assumed_prefetched| -
//              counts used in the computation; exact use not visible here.
279 void ReportPredictedAccuracyStatsHelper(
280 PrefetchKeyType key_type
,
281 const ResourcePrefetcher::RequestVector
& predicted
,
282 const std::map
<GURL
, bool>& actual
,
283 size_t total_resources_fetched_from_network
,
284 size_t max_assumed_prefetched
) const;
286 // Used for testing to inject mock tables.
// NOTE(review): the body is not visible here; presumably it stores |tables|
// in the tables_ member -- TODO confirm.
287 void set_mock_tables(scoped_refptr
<ResourcePrefetchPredictorTables
> tables
) {
// Const pointer to the profile: the pointer cannot be reseated after
// construction.
291 Profile
* const profile_
;
// Immutable predictor configuration.
292 ResourcePrefetchPredictorConfig
const config_
;
// Current initialization state (see InitializationState).
293 InitializationState initialization_state_
;
// Ref-counted handle to the predictor database tables.
294 scoped_refptr
<ResourcePrefetchPredictorTables
> tables_
;
// Ref-counted handle to the ResourcePrefetcherManager.
295 scoped_refptr
<ResourcePrefetcherManager
> prefetch_manager_
;
// Registrar for the notifications delivered to Observe().
296 content::NotificationRegistrar notification_registrar_
;
// Task tracker; by its name, used for history lookups -- TODO confirm.
297 base::CancelableTaskTracker history_lookup_consumer_
;
299 // Map of all the navigations in flight to their resource requests.
300 NavigationMap inflight_navigations_
;
302 // Copy of the data in the predictor tables.
// One cache per table; by their names, one is keyed by URL and the other by
// host.
303 scoped_ptr
<PrefetchDataMap
> url_table_cache_
;
304 scoped_ptr
<PrefetchDataMap
> host_table_cache_
;
// Prefetch results per navigation, stored as raw Result pointers.
306 ResultsMap results_map_
;
// Presumably deletes the Result objects held in results_map_ when this object
// is destroyed -- TODO confirm it is constructed with &results_map_.
307 STLValueDeleter
<ResultsMap
> results_map_deleter_
;
// The predictor cannot be copied or assigned.
309 DISALLOW_COPY_AND_ASSIGN(ResourcePrefetchPredictor
);
312 } // namespace predictors
314 #endif // CHROME_BROWSER_PREDICTORS_RESOURCE_PREFETCH_PREDICTOR_H_