1 ///////////////////////////////////////////////////////////////////////////////
2 // p_square_quantile.hpp
4 // Copyright 2005 Daniel Egloff. Distributed under the Boost
5 // Software License, Version 1.0. (See accompanying file
6 // LICENSE_1_0.txt or copy at http://www.boost.org/LICENSE_1_0.txt)
8 #ifndef BOOST_ACCUMULATORS_STATISTICS_P_SQUARE_QUANTILE_HPP_DE_01_01_2006
9 #define BOOST_ACCUMULATORS_STATISTICS_P_SQUARE_QUANTILE_HPP_DE_01_01_2006
13 #include <boost/array.hpp>
14 #include <boost/mpl/placeholders.hpp>
15 #include <boost/type_traits/is_same.hpp>
16 #include <boost/parameter/keyword.hpp>
17 #include <boost/accumulators/framework/accumulator_base.hpp>
18 #include <boost/accumulators/framework/extractor.hpp>
19 #include <boost/accumulators/numeric/functional.hpp>
20 #include <boost/accumulators/framework/parameters/sample.hpp>
21 #include <boost/accumulators/framework/depends_on.hpp>
22 #include <boost/accumulators/statistics_fwd.hpp>
23 #include <boost/accumulators/statistics/count.hpp>
24 #include <boost/accumulators/statistics/parameters/quantile_probability.hpp>
26 namespace boost
{ namespace accumulators
31 ///////////////////////////////////////////////////////////////////////////////
32 // p_square_quantile_impl
33 // single quantile estimation
35 @brief Single quantile estimation with the \f$P^2\f$ algorithm
37 The \f$P^2\f$ algorithm estimates a quantile dynamically without storing samples. Instead of
38 storing the whole sample cumulative distribution, only five points (markers) are stored. The heights
39 of these markers are the minimum and the maximum of the samples and the current estimates of the
40 \f$(p/2)\f$-, \f$p\f$- and \f$(1+p)/2\f$-quantiles. Their positions are equal to the number
41 of samples that are smaller or equal to the markers. Each time a new sample is recorded, the
42 positions of the markers are updated and if necessary their heights are adjusted using a piecewise-parabolic formula.
45 For further details, see
47 R. Jain and I. Chlamtac, The P^2 algorithm for dynamic calculation of quantiles and
48 histograms without storing observations, Communications of the ACM,
49 Volume 28 (October), Number 10, 1985, p. 1076-1085.
51 @param quantile_probability
// Implementation of the P^2 single-quantile accumulator.
// Sample is the type of the observations; Impl selects how the quantile
// probability is chosen (see the constructor's test against for_median).
53 template<typename Sample
, typename Impl
>
54 struct p_square_quantile_impl
// float_type is the result type of averaging a Sample over a std::size_t
// count; the marker arrays and the probability p are stored in this type.
57 typedef typename
numeric::functional::average
<Sample
, std::size_t>::result_type float_type
;
// fixed-size storage holding one value per marker (five markers)
58 typedef array
<float_type
, 5> array_type
;
59 // for boost::result_of
60 typedef float_type result_type
;
// Constructor. Selects the quantile probability p and seeds the marker
// bookkeeping: p is 0.5 when Impl is for_median, otherwise it is read from
// args[quantile_probability] with 0.5 as the fallback value.
62 template<typename Args
>
63 p_square_quantile_impl(Args
const &args
)
64 : p(is_same
<Impl
, for_median
>::value
? 0.5 : args
[quantile_probability
| 0.5])
68 , positions_increments()
// actual marker positions n_i start at 1, 2, 3, 4, 5
70 for(std::size_t i
= 0; i
< 5; ++i
)
72 this->actual_positions
[i
] = i
+ 1;
// initial desired marker positions n'_i, expressed in terms of p:
// 1, 1 + 2p, 1 + 4p, 3 + 2p, 5
75 this->desired_positions
[0] = 1.;
76 this->desired_positions
[1] = 1. + 2. * this->p
;
77 this->desired_positions
[2] = 1. + 4. * this->p
;
78 this->desired_positions
[3] = 3. + 2. * this->p
;
79 this->desired_positions
[4] = 5.;
// increments dn'_i that operator() adds to the desired positions:
// 0, p/2, p, (1 + p)/2, 1
81 this->positions_increments
[0] = 0.;
82 this->positions_increments
[1] = this->p
/ 2.;
83 this->positions_increments
[2] = this->p
;
84 this->positions_increments
[3] = (1. + this->p
) / 2.;
85 this->positions_increments
[4] = 1.;
// Feeds one observation into the estimator. args[sample] is the new value;
// count(args) supplies cnt, which is used as the 1-based index (cnt - 1)
// when the first samples are stored directly into heights.
88 template<typename Args
>
89 void operator ()(Args
const &args
)
91 std::size_t cnt
= count(args
);
93 // accumulate 5 first samples
96 this->heights
[cnt
- 1] = args
[sample
];
98 // complete the initialization of heights by sorting
101 std::sort(this->heights
.begin(), this->heights
.end());
106 std::size_t sample_cell
= 1; // k
108 // find cell k such that heights[k-1] <= args[sample] < heights[k] and adjust extreme values
// new minimum: the lowest marker takes the sample's value
109 if (args
[sample
] < this->heights
[0])
111 this->heights
[0] = args
[sample
];
// new maximum (or tie with it): the highest marker takes the sample's value
114 else if (this->heights
[4] <= args
[sample
])
116 this->heights
[4] = args
[sample
];
// interior sample: search the marker heights with std::upper_bound and
// turn the resulting iterator into the cell index k
121 typedef typename
array_type::iterator iterator
;
122 iterator it
= std::upper_bound(
123 this->heights
.begin()
124 , this->heights
.end()
128 sample_cell
= std::distance(this->heights
.begin(), it
);
131 // update positions of markers above sample_cell
132 for(std::size_t i
= sample_cell
; i
< 5; ++i
)
134 ++this->actual_positions
[i
];
137 // update desired positions of all markers
138 for(std::size_t i
= 0; i
< 5; ++i
)
140 this->desired_positions
[i
] += this->positions_increments
[i
];
143 // adjust heights and actual positions of markers 1 to 3 if necessary
144 for(std::size_t i
= 1; i
<= 3; ++i
)
146 // offset to desired positions
147 float_type d
= this->desired_positions
[i
] - this->actual_positions
[i
];
149 // offset to next position
150 float_type dp
= this->actual_positions
[i
+ 1] - this->actual_positions
[i
];
152 // offset to previous position
153 float_type dm
= this->actual_positions
[i
- 1] - this->actual_positions
[i
];
// slopes of the straight segments from marker i towards the next marker (hp)
// and towards the previous marker (hm)
156 float_type hp
= (this->heights
[i
+ 1] - this->heights
[i
]) / dp
;
157 float_type hm
= (this->heights
[i
- 1] - this->heights
[i
]) / dm
;
// move marker i only when it is at least one position away from its desired
// position and the neighbour on that side is more than one position away
159 if((d
>= 1. && dp
> 1.) || (d
<= -1. && dm
< -1.))
// under the condition above |d| >= 1, so d / |d| is +1 or -1: the direction
// in which the marker is moved
161 short sign_d
= static_cast<short>(d
/ std::abs(d
));
163 // try adjusting heights[i] using p-squared formula
164 float_type h
= this->heights
[i
] + sign_d
/ (dp
- dm
) * ((sign_d
- dm
) * hp
165 + (dp
- sign_d
) * hm
);
// keep the candidate h only if it lies strictly between the neighbouring heights
167 if(this->heights
[i
- 1] < h
&& h
< this->heights
[i
+ 1])
169 this->heights
[i
] = h
;
173 // use linear formula
176 this->heights
[i
] += hp
;
180 this->heights
[i
] -= hm
;
// shift the marker's actual position by one step in the direction of d
183 this->actual_positions
[i
] += sign_d
;
// Returns the height of the middle marker (index 2 of the five markers).
// The dont_care argument is unnamed and unused.
189 result_type
result(dont_care
) const
191 return this->heights
[2];
// Estimator state: the probability plus four parallel five-element arrays,
// one entry per marker.
195 float_type p
; // the quantile probability p
196 array_type heights
; // q_i: marker heights
197 array_type actual_positions
; // n_i: actual marker positions
198 array_type desired_positions
; // n'_i: desired marker positions
199 array_type positions_increments
; // dn'_i: per-update increments of the desired positions
202 } // namespace impl
204 ///////////////////////////////////////////////////////////////////////////////
205 // tag::p_square_quantile
// Feature tag for the general P^2 quantile estimator.
209 struct p_square_quantile
// impl instantiates p_square_quantile_impl with the `regular` policy, i.e.
// the variant whose probability comes from the quantile_probability argument
214 typedef accumulators::impl::p_square_quantile_impl
<mpl::_1
, regular
> impl
;
// Feature tag for the P^2 estimator specialised to the median.
216 struct p_square_quantile_for_median
// impl instantiates p_square_quantile_impl with the `for_median` policy,
// which fixes the quantile probability at 0.5
221 typedef accumulators::impl::p_square_quantile_impl
<mpl::_1
, for_median
> impl
;
225 ///////////////////////////////////////////////////////////////////////////////
226 // extract::p_square_quantile
227 // extract::p_square_quantile_for_median
// Constant extractor objects, one per feature tag defined above.
231 extractor
<tag::p_square_quantile
> const p_square_quantile
= {};
232 extractor
<tag::p_square_quantile_for_median
> const p_square_quantile_for_median
= {};
// Make both extractors from namespace extract visible in the enclosing namespace.
235 using extract::p_square_quantile
;
236 using extract::p_square_quantile_for_median
;
238 // So that p_square_quantile can be automatically substituted with
239 // weighted_p_square_quantile when the weight parameter is non-void
// Specialization mapping tag::p_square_quantile to its weighted counterpart.
241 struct as_weighted_feature
<tag::p_square_quantile
>
243 typedef tag::weighted_p_square_quantile type
;
// tag::weighted_p_square_quantile inherits the feature_of specialization of
// tag::p_square_quantile, so both tags report the same feature.
247 struct feature_of
<tag::weighted_p_square_quantile
>
248 : feature_of
<tag::p_square_quantile
>
252 }} // namespace boost::accumulators