Removing uses of X11 native key events.
[chromium-blink-merge.git] / net / base / sdch_manager.h
blobf78f1dd43b51ece681e559c7f6cc8efca55191f6
1 // Copyright (c) 2011 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
5 // Provides global database of differential decompression dictionaries for the
6 // SDCH filter (processes sdch enconded content).
8 // Exactly one instance of SdchManager is built, and all references are made
9 // into that collection.
11 // The SdchManager maintains a collection of memory resident dictionaries. It
12 // can find a dictionary (based on a server specification of a hash), store a
13 // dictionary, and make judgements about what URLs can use, set, etc. a
14 // dictionary.
16 // These dictionaries are acquired over the net, and include a header
17 // (containing metadata) as well as a VCDIFF dictionary (for use by a VCDIFF
18 // module) to decompress data.
20 #ifndef NET_BASE_SDCH_MANAGER_H_
21 #define NET_BASE_SDCH_MANAGER_H_
23 #include <map>
24 #include <set>
25 #include <string>
27 #include "base/gtest_prod_util.h"
28 #include "base/memory/ref_counted.h"
29 #include "base/memory/scoped_ptr.h"
30 #include "base/threading/non_thread_safe.h"
31 #include "base/time/time.h"
32 #include "net/base/net_export.h"
33 #include "url/gurl.h"
35 namespace net {
37 //------------------------------------------------------------------------------
38 // Create a public interface to help us load SDCH dictionaries.
39 // The SdchManager class allows registration to support this interface.
40 // A browser may register a fetcher that is used by the dictionary managers to
41 // get data from a specified URL. This allows us to use very high level browser
42 // functionality in this base (when the functionality can be provided).
43 class NET_EXPORT SdchFetcher {
44 public:
45 class NET_EXPORT Delegate {
46 public:
47 virtual ~Delegate() {}
49 // Called whenever the SdchFetcher has successfully retrieved a
50 // dictionary. |dictionary_text| contains the body of the dictionary
51 // retrieved from |dictionary_url|.
52 virtual void AddSdchDictionary(const std::string& dictionary_text,
53 const GURL& dictionary_url) = 0;
56 SdchFetcher() {}
57 virtual ~SdchFetcher() {}
59 // The Schedule() method is called when there is a need to get a dictionary
60 // from a server. The callee is responsible for getting that dictionary_text,
61 // and then calling back to AddSdchDictionary() in the Delegate instance.
62 virtual void Schedule(const GURL& dictionary_url) = 0;
64 // The Cancel() method is called to cancel all pending dictionary fetches.
65 // This is used for implementation of ClearData() below.
66 virtual void Cancel() = 0;
68 private:
69 DISALLOW_COPY_AND_ASSIGN(SdchFetcher);
72 //------------------------------------------------------------------------------
74 class NET_EXPORT SdchManager
75 : public SdchFetcher::Delegate,
76 public NON_EXPORTED_BASE(base::NonThreadSafe) {
77 public:
78 // A list of errors that appeared and were either resolved, or used to turn
79 // off sdch encoding.
80 enum ProblemCodes {
81 MIN_PROBLEM_CODE,
83 // Content-encoding correction problems.
84 ADDED_CONTENT_ENCODING = 1,
85 FIXED_CONTENT_ENCODING = 2,
86 FIXED_CONTENT_ENCODINGS = 3,
88 // Content decoding errors.
89 DECODE_HEADER_ERROR = 4,
90 DECODE_BODY_ERROR = 5,
92 // More content-encoding correction problems.
93 OPTIONAL_GUNZIP_ENCODING_ADDED = 6,
95 // Content encoding correction when we're not even tagged as HTML!?!
96 BINARY_ADDED_CONTENT_ENCODING = 7,
97 BINARY_FIXED_CONTENT_ENCODING = 8,
98 BINARY_FIXED_CONTENT_ENCODINGS = 9,
100 // Dictionary selection for use problems.
101 DICTIONARY_FOUND_HAS_WRONG_DOMAIN = 10,
102 DICTIONARY_FOUND_HAS_WRONG_PORT_LIST = 11,
103 DICTIONARY_FOUND_HAS_WRONG_PATH = 12,
104 DICTIONARY_FOUND_HAS_WRONG_SCHEME = 13,
105 DICTIONARY_HASH_NOT_FOUND = 14,
106 DICTIONARY_HASH_MALFORMED = 15,
108 // Dictionary saving problems.
109 DICTIONARY_HAS_NO_HEADER = 20,
110 DICTIONARY_HEADER_LINE_MISSING_COLON = 21,
111 DICTIONARY_MISSING_DOMAIN_SPECIFIER = 22,
112 DICTIONARY_SPECIFIES_TOP_LEVEL_DOMAIN = 23,
113 DICTIONARY_DOMAIN_NOT_MATCHING_SOURCE_URL = 24,
114 DICTIONARY_PORT_NOT_MATCHING_SOURCE_URL = 25,
115 DICTIONARY_HAS_NO_TEXT = 26,
116 DICTIONARY_REFERER_URL_HAS_DOT_IN_PREFIX = 27,
118 // Dictionary loading problems.
119 DICTIONARY_LOAD_ATTEMPT_FROM_DIFFERENT_HOST = 30,
120 DICTIONARY_SELECTED_FOR_SSL = 31,
121 DICTIONARY_ALREADY_LOADED = 32,
122 DICTIONARY_SELECTED_FROM_NON_HTTP = 33,
123 DICTIONARY_IS_TOO_LARGE= 34,
124 DICTIONARY_COUNT_EXCEEDED = 35,
125 DICTIONARY_ALREADY_SCHEDULED_TO_DOWNLOAD = 36,
126 DICTIONARY_ALREADY_TRIED_TO_DOWNLOAD = 37,
128 // Failsafe hack.
129 ATTEMPT_TO_DECODE_NON_HTTP_DATA = 40,
132 // Content-Encoding problems detected, with no action taken.
133 MULTIENCODING_FOR_NON_SDCH_REQUEST = 50,
134 SDCH_CONTENT_ENCODE_FOR_NON_SDCH_REQUEST = 51,
136 // Dictionary manager issues.
137 DOMAIN_BLACKLIST_INCLUDES_TARGET = 61,
139 // Problematic decode recovery methods.
140 META_REFRESH_RECOVERY = 70, // Dictionary not found.
141 // defunct = 71, // Almost the same as META_REFRESH_UNSUPPORTED.
142 // defunct = 72, // Almost the same as CACHED_META_REFRESH_UNSUPPORTED.
143 // defunct = 73, // PASSING_THROUGH_NON_SDCH plus
144 // RESPONSE_TENTATIVE_SDCH in ../filter/sdch_filter.cc.
145 META_REFRESH_UNSUPPORTED = 74, // Unrecoverable error.
146 CACHED_META_REFRESH_UNSUPPORTED = 75, // As above, but pulled from cache.
147 PASSING_THROUGH_NON_SDCH = 76, // Tagged sdch but missing dictionary-hash.
148 INCOMPLETE_SDCH_CONTENT = 77, // Last window was not completely decoded.
149 PASS_THROUGH_404_CODE = 78, // URL not found message passing through.
151 // This next report is very common, and not really an error scenario, but
152 // it exercises the error recovery logic.
153 PASS_THROUGH_OLD_CACHED = 79, // Back button got pre-SDCH cached content.
155 // Common decoded recovery methods.
156 META_REFRESH_CACHED_RECOVERY = 80, // Probably startup tab loading.
157 // defunct = 81, // Now tracked by ResponseCorruptionDetectionCause histo.
159 // Non SDCH problems, only accounted for to make stat counting complete
160 // (i.e., be able to be sure all dictionary advertisements are accounted
161 // for).
163 UNFLUSHED_CONTENT = 90, // Possible error in filter chaining.
164 // defunct = 91, // MISSING_TIME_STATS (Should never happen.)
165 CACHE_DECODED = 92, // No timing stats recorded.
166 // defunct = 93, // OVER_10_MINUTES (No timing stats recorded.)
167 UNINITIALIZED = 94, // Filter never even got initialized.
168 PRIOR_TO_DICTIONARY = 95, // We hadn't even parsed a dictionary selector.
169 DECODE_ERROR = 96, // Something went wrong during decode.
171 // Problem during the latency test.
172 LATENCY_TEST_DISALLOWED = 100, // SDCH now failing, but it worked before!
174 MAX_PROBLEM_CODE // Used to bound histogram.
177 // Use the following static limits to block DOS attacks until we implement
178 // a cached dictionary evicition strategy.
179 static const size_t kMaxDictionarySize;
180 static const size_t kMaxDictionaryCount;
182 // There is one instance of |Dictionary| for each memory-cached SDCH
183 // dictionary.
184 class NET_EXPORT_PRIVATE Dictionary : public base::RefCounted<Dictionary> {
185 public:
186 // Sdch filters can get our text to use in decoding compressed data.
187 const std::string& text() const { return text_; }
189 private:
190 friend class base::RefCounted<Dictionary>;
191 friend class SdchManager; // Only manager can construct an instance.
192 FRIEND_TEST_ALL_PREFIXES(SdchManagerTest, PathMatch);
194 // Construct a vc-diff usable dictionary from the dictionary_text starting
195 // at the given offset. The supplied client_hash should be used to
196 // advertise the dictionary's availability relative to the suppplied URL.
197 Dictionary(const std::string& dictionary_text,
198 size_t offset,
199 const std::string& client_hash,
200 const GURL& url,
201 const std::string& domain,
202 const std::string& path,
203 const base::Time& expiration,
204 const std::set<int>& ports);
205 virtual ~Dictionary();
207 const GURL& url() const { return url_; }
208 const std::string& client_hash() const { return client_hash_; }
210 // Security method to check if we can advertise this dictionary for use
211 // if the |target_url| returns SDCH compressed data.
212 bool CanAdvertise(const GURL& target_url);
214 // Security methods to check if we can establish a new dictionary with the
215 // given data, that arrived in response to get of dictionary_url.
216 static bool CanSet(const std::string& domain, const std::string& path,
217 const std::set<int>& ports, const GURL& dictionary_url);
219 // Security method to check if we can use a dictionary to decompress a
220 // target that arrived with a reference to this dictionary.
221 bool CanUse(const GURL& referring_url);
223 // Compare paths to see if they "match" for dictionary use.
224 static bool PathMatch(const std::string& path,
225 const std::string& restriction);
227 // Compare domains to see if the "match" for dictionary use.
228 static bool DomainMatch(const GURL& url, const std::string& restriction);
231 // The actual text of the dictionary.
232 std::string text_;
234 // Part of the hash of text_ that the client uses to advertise the fact that
235 // it has a specific dictionary pre-cached.
236 std::string client_hash_;
238 // The GURL that arrived with the text_ in a URL request to specify where
239 // this dictionary may be used.
240 const GURL url_;
242 // Metadate "headers" in before dictionary text contained the following:
243 // Each dictionary payload consists of several headers, followed by the text
244 // of the dictionary. The following are the known headers.
245 const std::string domain_;
246 const std::string path_;
247 const base::Time expiration_; // Implied by max-age.
248 const std::set<int> ports_;
250 DISALLOW_COPY_AND_ASSIGN(Dictionary);
253 SdchManager();
254 virtual ~SdchManager();
256 // Clear data (for browser data removal).
257 void ClearData();
259 // Record stats on various errors.
260 static void SdchErrorRecovery(ProblemCodes problem);
262 // Register a fetcher that this class can use to obtain dictionaries.
263 void set_sdch_fetcher(scoped_ptr<SdchFetcher> fetcher);
265 // Enables or disables SDCH compression.
266 static void EnableSdchSupport(bool enabled);
268 static bool sdch_enabled() { return g_sdch_enabled_; }
270 // Enables or disables SDCH compression over secure connection.
271 static void EnableSecureSchemeSupport(bool enabled);
273 static bool secure_scheme_supported() { return g_secure_scheme_supported_; }
275 // Briefly prevent further advertising of SDCH on this domain (if SDCH is
276 // enabled). After enough calls to IsInSupportedDomain() the blacklisting
277 // will be removed. Additional blacklists take exponentially more calls
278 // to IsInSupportedDomain() before the blacklisting is undone.
279 // Used when filter errors are found from a given domain, but it is plausible
280 // that the cause is temporary (such as application startup, where cached
281 // entries are used, but a dictionary is not yet loaded).
282 void BlacklistDomain(const GURL& url, ProblemCodes blacklist_reason);
284 // Used when SEVERE filter errors are found from a given domain, to prevent
285 // further use of SDCH on that domain.
286 void BlacklistDomainForever(const GURL& url, ProblemCodes blacklist_reason);
288 // Unit test only, this function resets enabling of sdch, and clears the
289 // blacklist.
290 void ClearBlacklistings();
292 // Unit test only, this function resets the blacklisting count for a domain.
293 void ClearDomainBlacklisting(const std::string& domain);
295 // Unit test only: indicate how many more times a domain will be blacklisted.
296 int BlackListDomainCount(const std::string& domain);
298 // Unit test only: Indicate what current blacklist increment is for a domain.
299 int BlacklistDomainExponential(const std::string& domain);
301 // Check to see if SDCH is enabled (globally), and the given URL is in a
302 // supported domain (i.e., not blacklisted, and either the specific supported
303 // domain, or all domains were assumed supported). If it is blacklist, reduce
304 // by 1 the number of times it will be reported as blacklisted.
305 bool IsInSupportedDomain(const GURL& url);
307 // Schedule the URL fetching to load a dictionary. This will always return
308 // before the dictionary is actually loaded and added.
309 // After the implied task does completes, the dictionary will have been
310 // cached in memory.
311 void FetchDictionary(const GURL& request_url, const GURL& dictionary_url);
313 // Security test function used before initiating a FetchDictionary.
314 // Return true if fetch is legal.
315 bool CanFetchDictionary(const GURL& referring_url,
316 const GURL& dictionary_url) const;
318 // Find the vcdiff dictionary (the body of the sdch dictionary that appears
319 // after the meta-data headers like Domain:...) with the given |server_hash|
320 // to use to decompreses data that arrived as SDCH encoded content. Check to
321 // be sure the returned |dictionary| can be used for decoding content supplied
322 // in response to a request for |referring_url|.
323 // Return null in |dictionary| if there is no matching legal dictionary.
324 void GetVcdiffDictionary(const std::string& server_hash,
325 const GURL& referring_url,
326 scoped_refptr<Dictionary>* dictionary);
328 // Get list of available (pre-cached) dictionaries that we have already loaded
329 // into memory. The list is a comma separated list of (client) hashes per
330 // the SDCH spec.
331 void GetAvailDictionaryList(const GURL& target_url, std::string* list);
333 // Construct the pair of hashes for client and server to identify an SDCH
334 // dictionary. This is only made public to facilitate unit testing, but is
335 // otherwise private
336 static void GenerateHash(const std::string& dictionary_text,
337 std::string* client_hash, std::string* server_hash);
339 // For Latency testing only, we need to know if we've succeeded in doing a
340 // round trip before starting our comparative tests. If ever we encounter
341 // problems with SDCH, we opt-out of the test unless/until we perform a
342 // complete SDCH decoding.
343 bool AllowLatencyExperiment(const GURL& url) const;
345 void SetAllowLatencyExperiment(const GURL& url, bool enable);
347 int GetFetchesCountForTesting() const {
348 return fetches_count_for_testing_;
351 // Implementation of SdchFetcher::Delegate.
353 // Add an SDCH dictionary to our list of availible
354 // dictionaries. This addition will fail if addition is illegal
355 // (data in the dictionary is not acceptable from the
356 // dictionary_url; dictionary already added, etc.).
357 virtual void AddSdchDictionary(const std::string& dictionary_text,
358 const GURL& dictionary_url) OVERRIDE;
360 private:
361 struct BlacklistInfo {
362 BlacklistInfo()
363 : count(0),
364 exponential_count(0),
365 reason(MIN_PROBLEM_CODE) {}
367 int count; // # of times to refuse SDCH advertisement.
368 int exponential_count; // Current exponential backoff ratchet.
369 ProblemCodes reason; // Why domain was blacklisted.
372 typedef std::map<std::string, BlacklistInfo> DomainBlacklistInfo;
373 typedef std::set<std::string> ExperimentSet;
375 // A map of dictionaries info indexed by the hash that the server provides.
376 typedef std::map<std::string, scoped_refptr<Dictionary> > DictionaryMap;
378 // Support SDCH compression, by advertising in headers.
379 static bool g_sdch_enabled_;
381 // Support SDCH compression for HTTPS requests and responses. When supported,
382 // HTTPS applicable dictionaries MUST have been acquired securely via HTTPS.
383 static bool g_secure_scheme_supported_;
385 // A simple implementation of a RFC 3548 "URL safe" base64 encoder.
386 static void UrlSafeBase64Encode(const std::string& input,
387 std::string* output);
388 DictionaryMap dictionaries_;
390 // An instance that can fetch a dictionary given a URL.
391 scoped_ptr<SdchFetcher> fetcher_;
393 // List domains where decode failures have required disabling sdch.
394 DomainBlacklistInfo blacklisted_domains_;
396 // List of hostnames for which a latency experiment is allowed (because a
397 // round trip test has recently passed).
398 ExperimentSet allow_latency_experiment_;
400 int fetches_count_for_testing_;
402 DISALLOW_COPY_AND_ASSIGN(SdchManager);
405 } // namespace net
407 #endif // NET_BASE_SDCH_MANAGER_H_