1 // Copyright (c) 2008, Google Inc.
2 // All rights reserved.
4 // Redistribution and use in source and binary forms, with or without
5 // modification, are permitted provided that the following conditions are
8 // * Redistributions of source code must retain the above copyright
9 // notice, this list of conditions and the following disclaimer.
10 // * Redistributions in binary form must reproduce the above
11 // copyright notice, this list of conditions and the following disclaimer
12 // in the documentation and/or other materials provided with the
14 // * Neither the name of Google Inc. nor the names of its
15 // contributors may be used to endorse or promote products derived from
16 // this software without specific prior written permission.
18 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
19 // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
20 // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
21 // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
22 // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
23 // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
24 // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
25 // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
26 // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
27 // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
28 // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
31 // All Rights Reserved.
33 // Author: Daniel Ford
37 #include <algorithm> // For min()
39 #include "base/commandlineflags.h"
43 // The approximate gap in bytes between sampling actions.
44 // I.e., we take one sample approximately once every
45 // tcmalloc_sample_parameter bytes of allocation
46 // i.e. about once every 512KB if value is 1<<19.
47 #ifdef NO_TCMALLOC_SAMPLES
48 DEFINE_int64(tcmalloc_sample_parameter
, 0,
49 "Unused: code is compiled with NO_TCMALLOC_SAMPLES");
51 DEFINE_int64(tcmalloc_sample_parameter
,
52 EnvToInt64("TCMALLOC_SAMPLE_PARAMETER", 0),
53 "The approximate gap in bytes between sampling actions. "
54 "This must be between 1 and 2^58.");
59 // Statics for Sampler
60 double Sampler::log_table_
[1<<kFastlogNumBits
];
62 // Populate the lookup table for FastLog2.
63 // This approximates the log2 curve with a step function.
64 // Steps have height equal to log2 of the mid-point of the step.
65 void Sampler::PopulateFastLog2Table() {
66 for (int i
= 0; i
< (1<<kFastlogNumBits
); i
++) {
67 log_table_
[i
] = (log(1.0 + static_cast<double>(i
+0.5)/(1<<kFastlogNumBits
))
72 int Sampler::GetSamplePeriod() {
73 return FLAGS_tcmalloc_sample_parameter
;
76 // Run this before using your sampler
77 void Sampler::Init(uint32_t seed
) {
82 rnd_
= static_cast<uint32_t>(reinterpret_cast<uintptr_t>(this));
87 // Step it forward 20 times for good measure
88 for (int i
= 0; i
< 20; i
++) {
89 rnd_
= NextRandom(rnd_
);
92 bytes_until_sample_
= PickNextSamplingPoint();
95 // Initialize the Statics for the Sampler class
96 void Sampler::InitStatics() {
97 PopulateFastLog2Table();
100 // Generates a geometric variable with the specified mean (512K by default).
101 // This is done by generating a random number between 0 and 1 and applying
102 // the inverse cumulative distribution function for an exponential.
103 // Specifically: Let m be the inverse of the sample period, then
104 // the probability distribution function is m*exp(-mx) so the CDF is
105 // p = 1 - exp(-mx), so
106 // q = 1 - p = exp(-mx)
109 // log_2(q) * (-log_e(2) * 1/m) = x
110 // In the code, q is actually in the range 1 to 2**26, hence the -26 below
111 size_t Sampler::PickNextSamplingPoint() {
112 rnd_
= NextRandom(rnd_
);
113 // Take the top 26 bits as the random number
114 // (This plus the 1<<58 sampling bound give a max possible step of
115 // 5194297183973780480 bytes.)
116 const uint64_t prng_mod_power
= 48; // Number of bits in prng
117 // The uint32_t cast is to prevent a (hard-to-reproduce) NAN
118 // under piii debug for some binaries.
119 double q
= static_cast<uint32_t>(rnd_
>> (prng_mod_power
- 26)) + 1.0;
120 // Put the computed p-value through the CDF of a geometric.
121 // For faster performance (save ~1/20th exec time), replace
122 // min(0.0, FastLog2(q) - 26) by (Fastlog2(q) - 26.000705)
123 // The value 26.000705 is used rather than 26 to compensate
124 // for inaccuracies in FastLog2 which otherwise result in a
126 return static_cast<size_t>(min(0.0, (FastLog2(q
) - 26)) * (-log(2.0)
127 * FLAGS_tcmalloc_sample_parameter
) + 1);
130 } // namespace tcmalloc