1 // Copyright (c) 2011 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
5 // Filter performs filtering on data streams. Sample usage:
7 // IStream* pre_filter_source;
9 // Filter* filter = Filter::Factory(filter_types, filter_context);
10 // int pre_filter_data_len = filter->stream_buffer_size();
11 // pre_filter_source->read(filter->stream_buffer(), pre_filter_data_len);
13 // filter->FlushStreamBuffer(pre_filter_data_len);
15 // char post_filter_buf[kBufferSize];
16 // int post_filter_data_len = kBufferSize;
17 // filter->ReadFilteredData(post_filter_buf, &post_filter_data_len);
19 // To filter a data stream, the caller first gets filter's stream_buffer_
20 // through its accessor and fills in stream_buffer_ with pre-filter data, next
21 // calls FlushStreamBuffer to notify Filter, then calls ReadFilteredData
22 // repeatedly to get all the filtered data. After all data have been filtered
23 // and read out, the caller may fill in stream_buffer_ again. This
24 // WriteBuffer-Flush-Read cycle is repeated until reaching the end of data
27 // The lifetime of a Filter instance is completely controlled by its caller.
29 #ifndef NET_BASE_FILTER_H__
30 #define NET_BASE_FILTER_H__
36 #include "base/basictypes.h"
37 #include "base/gtest_prod_util.h"
38 #include "base/memory/ref_counted.h"
39 #include "base/memory/scoped_ptr.h"
40 #include "base/time.h"
41 #include "net/base/net_export.h"
49 //------------------------------------------------------------------------------
50 // Define an interface class that allows access to contextual information
51 // supplied by the owner of this filter. In the case where there is a chain of
52 // filters, there is only one owner of all the chained filters, and that context
53 // is passed to the constructor of all those filters. To be clear, the context
54 // does NOT reflect the position in a chain, or the fact that there are prior
55 // or later filters in a chain.
56 class NET_EXPORT_PRIVATE FilterContext
{
58 // Enum to control what histograms are emitted near end-of-life of this
// context. A value of this type is passed to RecordPacketStats() to select
// the set of statistics to emit.
60 enum StatisticSelector
{
63 SDCH_EXPERIMENT_DECODE
,
64 SDCH_EXPERIMENT_HOLDBACK
,
// Virtual so that implementations of this interface can be destroyed through
// a FilterContext pointer.
67 virtual ~FilterContext();
69 // What mime type was specified in the header for this data?
70 // Only makes sense for some types of contexts, and returns false
71 // when not applicable.
// NOTE(review): presumably the mime type is stored in |mime_type| when the
// call returns true -- confirm against an implementation.
72 virtual bool GetMimeType(std::string
* mime_type
) const = 0;
74 // What URL was used to access this data?
75 // Returns false if no URL is present.
76 virtual bool GetURL(GURL
* gurl
) const = 0;
78 // When was this data requested from a server?
79 virtual base::Time
GetRequestTime() const = 0;
81 // Is data supplied from cache, or fresh across the net?
82 virtual bool IsCachedContent() const = 0;
84 // Is this a download?
85 virtual bool IsDownload() const = 0;
87 // Was this data flagged as a response to a request with an SDCH dictionary?
88 virtual bool IsSdchResponse() const = 0;
90 // How many bytes were read from the net or cache so far (and potentially
91 // pushed into a filter for processing)?
92 virtual int64
GetByteReadCount() const = 0;
94 // What response code was received with the associated network transaction?
95 // For example, 200 is OK and 4xx values are error codes.
96 virtual int GetResponseCode() const = 0;
98 // Forces the context to emit the specific set of statistics selected by
99 // |statistic|.
100 virtual void RecordPacketStats(StatisticSelector statistic
) const = 0;
103 //------------------------------------------------------------------------------
// Filter processes ("filters") pre-filter data staged in stream_buffer_ and
// hands the result to the caller. Filters may be chained through next_filter_,
// in which case one filter's output is pushed into the next filter's input.
104 class NET_EXPORT_PRIVATE Filter
{
106 // Return values of function ReadFilteredData.
108 // Read filtered data successfully.
110 // Read filtered data successfully, and the data in the buffer has been
111 // consumed by the filter, but more data is needed in order to continue
112 // filtering. At this point, the caller is free to reuse the filter
113 // buffer to provide more data.
114 FILTER_NEED_MORE_DATA
,
115 // Read filtered data successfully, and filter reaches the end of the data
118 // There is an error during filtering.
122 // Specifies the types of filters that can be created.
126 FILTER_TYPE_GZIP_HELPING_SDCH
, // Gzip possible, but pass through allowed.
128 FILTER_TYPE_SDCH_POSSIBLE
, // Sdch possible, but pass through allowed.
129 FILTER_TYPE_UNSUPPORTED
,
134 // Creates a Filter object.
135 // Parameters: filter_types specifies the types of filters to create;
136 // filter_context allows filters to acquire additional details needed for
137 // construction and operation, such as a specification of requisite input
139 // On success, the function returns a pointer to the Filter object created.
140 // On failure, or if a filter is not needed, the function returns NULL.
142 // Note: filter_types is an array of filter types (content encoding types as
143 // provided in an HTTP header), which will be chained together serially to do
144 // successive filtering of data. The types in the vector are ordered based on
145 // encoding order, and the filters are chained to operate in the reverse
146 // (decoding) order. For example, types[0] = FILTER_TYPE_SDCH,
147 // types[1] = FILTER_TYPE_GZIP will cause data to first be gunzip filtered,
148 // and the resulting output from that filter will be sdch decoded.
149 static Filter
* Factory(const std::vector
<FilterType
>& filter_types
,
150 const FilterContext
& filter_context
);
152 // A simpler version of Factory() which creates a single, unchained
153 // Filter of type FILTER_TYPE_GZIP, or NULL if the filter could not be
155 static Filter
* GZipFactory();
157 // External call to obtain data from this filter chain. If there is no
158 // next_filter_, then it obtains data from this specific filter.
159 FilterStatus
ReadData(char* dest_buffer
, int* dest_len
);
161 // Returns a pointer to the stream_buffer_.
162 IOBuffer
* stream_buffer() const { return stream_buffer_
.get(); }
164 // Returns the maximum size of stream_buffer_ in number of chars.
165 int stream_buffer_size() const { return stream_buffer_size_
; }
167 // Returns the total number of chars remaining in stream_buffer_ to be
// filtered.
170 // If the function returns 0 then all data has been filtered, and the caller
171 // is safe to copy new data into stream_buffer_.
172 int stream_data_len() const { return stream_data_len_
; }
174 // Flushes stream_buffer_ for next round of filtering. After copying data to
175 // stream_buffer_, the caller should call this function to notify Filter to
176 // start filtering. Then after this function is called, the caller can get
177 // post-filtered data using ReadFilteredData. The caller must not write to
178 // stream_buffer_ and call this function again before stream_buffer_ is
179 // emptied out by ReadFilteredData.
181 // The input stream_data_len is the length (in number of chars) of valid
182 // data in stream_buffer_. It cannot be greater than stream_buffer_size_.
183 // The function returns true on success, and false otherwise.
184 bool FlushStreamBuffer(int stream_data_len
);
186 // Translates the text of a filter name (from Content-Encoding header) into a
// FilterType.
188 static FilterType
ConvertEncodingToType(const std::string
& filter_type
);
190 // Given an array of encoding_types, try to do some error recovery adjustment
191 // to the list. This includes handling known bugs in the Apache server (where
192 // redundant gzip encoding is specified), as well as issues regarding SDCH
193 // encoding, where various proxies and anti-virus products modify or strip the
194 // encodings. These fixups require context, which includes whether this
195 // response was made to an SDCH request (i.e., an available dictionary was
196 // advertised in the GET), as well as the mime type of the content.
197 static void FixupEncodingTypes(const FilterContext
& filter_context
,
198 std::vector
<FilterType
>* encoding_types
);
// Friend declarations (judging by their names, test classes) that are granted
// access to the non-public members of Filter.
201 friend class GZipUnitTest
;
202 friend class SdchFilterChainingTest
;
206 // Filters the data stored in stream_buffer_ and writes the output into the
207 // dest_buffer passed in.
209 // Upon entry, *dest_len is the total size (in number of chars) of the
210 // destination buffer. Upon exit, *dest_len is the actual number of chars
211 // written into the destination buffer.
213 // This function will fail if there is no pre-filter data in the
214 // stream_buffer_. On the other hand, *dest_len can be 0 upon successful
215 // return. For example, a decoding filter may process some pre-filter data
216 // but not produce output yet.
217 virtual FilterStatus
ReadFilteredData(char* dest_buffer
, int* dest_len
) = 0;
219 // Copies pre-filter data directly to destination buffer without decoding.
220 FilterStatus
CopyOut(char* dest_buffer
, int* dest_len
);
// Returns the status stored in last_status_.
222 FilterStatus
last_status() const { return last_status_
; }
224 // Buffer to hold the data to be filtered (the input queue).
225 scoped_refptr
<IOBuffer
> stream_buffer_
;
227 // Maximum size of stream_buffer_ in number of chars.
228 int stream_buffer_size_
;
230 // Pointer to the next data in stream_buffer_ to be filtered.
231 char* next_stream_data_
;
233 // Total number of remaining chars in stream_buffer_ to be filtered.
234 int stream_data_len_
;
237 // Allocates and initializes stream_buffer_ and stream_buffer_size_.
238 void InitBuffer(int size
);
240 // A factory helper for creating filters for use within a chain of potentially
241 // multiple encodings. If a chain of filters is created, then this may be
242 // called multiple times during the filter creation process. In most simple
243 // cases, this is only called once. Returns NULL and cleans up (deleting
244 // filter_list) if a new filter can't be constructed.
245 static Filter
* PrependNewFilter(FilterType type_id
,
246 const FilterContext
& filter_context
,
248 Filter
* filter_list
);
250 // Helper methods for PrependNewFilter. If initialization is successful,
251 // they return a fully initialized Filter. Otherwise, they return NULL.
252 static Filter
* InitGZipFilter(FilterType type_id
, int buffer_size
);
253 static Filter
* InitSdchFilter(FilterType type_id
,
254 const FilterContext
& filter_context
,
257 // Helper function to empty our output into the next filter's input.
258 void PushDataIntoNextFilter();
260 // Constructs a filter with an internal buffer of the given size.
261 // Only meant to be called by unit tests that need to control the buffer size.
262 static Filter
* FactoryForTests(const std::vector
<FilterType
>& filter_types
,
263 const FilterContext
& filter_context
,
266 // An optional filter to process output from this filter.
267 scoped_ptr
<Filter
> next_filter_
;
268 // Remember what status or local filter last returned so we can better handle
270 FilterStatus last_status_
;
// Filter instances are not meant to be copied or assigned.
272 DISALLOW_COPY_AND_ASSIGN(Filter
);
277 #endif // NET_BASE_FILTER_H__