<?php
/**
 * Arbitrary section name based PHP profiling.
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
 * http://www.gnu.org/copyleft/gpl.html
 *
 * @author Aaron Schulz
 */
/**
 * Custom PHP profiler for parser/DB type section names that xhprof/xdebug can't handle
 */
class SectionProfiler {
	// Two modes, selected by the 'trace' constructor parameter:
	//  - aggregate-only (default): every section is folded into $collated as soon as it closes;
	//  - trace: every closed section is appended to $stack and aggregated lazily by collateData().

	/** @var array|null Map of (cpu,real,memory) taken when the first section was opened */
	protected $start;
	/** @var array|null Map of (cpu,real,memory) taken when the most recent section was closed */
	protected $end;
	/** @var array List of resolved profile calls with start/end data */
	protected $stack = [];
	/** @var array Queue of open profile calls with start data */
	protected $workStack = [];

	/** @var array Map of (function name => aggregate data array) */
	protected $collated = [];
	/** @var bool Whether $collated already reflects every recorded call */
	protected $collateDone = false;

	/** @var bool True to keep only aggregates, false to also keep the full call trace */
	protected $collateOnly = true;
	/** @var array Cache of a standard broken collation entry */
	protected $errorEntry;
	/** @var callable Cache of a profile out callback */
	protected $profileOutCallback;

	/**
	 * @param array $params Options; a non-empty 'trace' key enables trace mode
	 */
	public function __construct( array $params = [] ) {
		$this->errorEntry = $this->getErrorEntry();
		$this->collateOnly = empty( $params['trace'] );
		$this->profileOutCallback = function ( $profiler, $section ) {
			$profiler->profileOutInternal( $section );
		};
	}

	/**
	 * Open a profiling section that stays open for as long as the returned object lives
	 *
	 * @param string $section
	 * @return ScopedCallback
	 */
	public function scopedProfileIn( $section ) {
		$this->profileInInternal( $section );

		return new SectionProfileCallback( $this, $section );
	}

	/**
	 * Close a section opened with scopedProfileIn()
	 *
	 * The caller's variable is cleared; once no other reference is left the
	 * callback object is destroyed and its destructor closes the section.
	 *
	 * @param ScopedCallback &$section
	 */
	public function scopedProfileOut( ScopedCallback &$section ) {
		$section = null;
	}

	/**
	 * Get the aggregated inclusive profiling data for each method
	 *
	 * The percentages are relative to the span between the first section
	 * opening and the latest section closing, so this method can be called
	 * several times in between profiling calls. A "-total" entry is always
	 * included in the results.
	 *
	 * @return array List of method entries arrays, each having:
	 *   - name     : method name
	 *   - calls    : the number of invoking calls
	 *   - real     : real time elapsed (ms)
	 *   - %real    : percent real time
	 *   - cpu      : CPU time elapsed (ms)
	 *   - %cpu     : percent CPU time
	 *   - memory   : memory used (bytes)
	 *   - %memory  : percent memory used
	 *   - min_real : min real time in a call (ms)
	 *   - max_real : max real time in a call (ms)
	 */
	public function getFunctionStats() {
		$this->collateData();

		// Before any section has been closed (or right after reset()) there is no
		// measured span; report zero totals instead of reading offsets of null.
		$haveSpan = is_array( $this->start ) && is_array( $this->end );
		$totalCpu = $haveSpan ? max( $this->end['cpu'] - $this->start['cpu'], 0 ) : 0;
		$totalReal = $haveSpan ? max( $this->end['real'] - $this->start['real'], 0 ) : 0;
		$totalMem = $haveSpan ? max( $this->end['memory'] - $this->start['memory'], 0 ) : 0;

		$profile = [];
		foreach ( $this->collated as $fname => $data ) {
			$profile[] = [
				'name' => $fname,
				'calls' => $data['count'],
				// Times are collected in seconds and reported in milliseconds
				'real' => $data['real'] * 1000,
				'%real' => $totalReal ? 100 * $data['real'] / $totalReal : 0,
				'cpu' => $data['cpu'] * 1000,
				'%cpu' => $totalCpu ? 100 * $data['cpu'] / $totalCpu : 0,
				'memory' => $data['memory'],
				'%memory' => $totalMem ? 100 * $data['memory'] / $totalMem : 0,
				'min_real' => 1000 * $data['min_real'],
				'max_real' => 1000 * $data['max_real']
			];
		}

		$profile[] = [
			'name' => '-total',
			'calls' => 1,
			'real' => 1000 * $totalReal,
			'%real' => 100,
			'cpu' => 1000 * $totalCpu,
			'%cpu' => 100,
			'memory' => $totalMem,
			'%memory' => 100,
			'min_real' => 1000 * $totalReal,
			'max_real' => 1000 * $totalReal
		];

		return $profile;
	}

	/**
	 * Clear all of the profiling data for another run
	 */
	public function reset() {
		$this->start = null;
		$this->end = null;
		$this->stack = [];
		$this->workStack = [];
		$this->collated = [];
		$this->collateDone = false;
	}

	/**
	 * @return array Initial collation entry
	 */
	protected function getZeroEntry() {
		return [
			'cpu' => 0.0,
			'real' => 0.0,
			'memory' => 0,
			'count' => 0,
			'min_real' => 0.0,
			'max_real' => 0.0
		];
	}

	/**
	 * @return array Initial collation entry for errors
	 */
	protected function getErrorEntry() {
		$entry = $this->getZeroEntry();
		$entry['count'] = 1;

		return $entry;
	}

	/**
	 * Update the collation entry for a given method name
	 *
	 * @param string $name
	 * @param float $elapsedCpu
	 * @param float $elapsedReal
	 * @param int $memChange Only increases are accumulated
	 */
	protected function updateEntry( $name, $elapsedCpu, $elapsedReal, $memChange ) {
		if ( !isset( $this->collated[$name] ) || !is_array( $this->collated[$name] ) ) {
			$this->collated[$name] = $this->getZeroEntry();
		}
		$entry =& $this->collated[$name];

		// A fresh entry carries placeholder 0.0 extremes; taking min() against that
		// placeholder would pin min_real at zero forever, so seed from the first call.
		$firstCall = ( $entry['count'] === 0 );

		$entry['cpu'] += $elapsedCpu;
		$entry['real'] += $elapsedReal;
		$entry['memory'] += $memChange > 0 ? $memChange : 0;
		$entry['count']++;
		$entry['min_real'] = $firstCall ? $elapsedReal : min( $entry['min_real'], $elapsedReal );
		$entry['max_real'] = $firstCall ? $elapsedReal : max( $entry['max_real'], $elapsedReal );
	}

	/**
	 * This method should not be called outside SectionProfiler
	 *
	 * @param string $functionname
	 */
	public function profileInInternal( $functionname ) {
		// Once the data is collated for reports, any future calls
		// should clear the collation cache so the next report will
		// reflect them. This matters when trace mode is used.
		$this->collateDone = false;

		$cpu = $this->getTime( 'cpu' );
		$real = $this->getTime( 'wall' );
		$memory = memory_get_usage();

		if ( $this->start === null ) {
			$this->start = [ 'cpu' => $cpu, 'real' => $real, 'memory' => $memory ];
		}

		// (name, nesting level, start real time, start CPU time, start memory)
		$this->workStack[] = [
			$functionname,
			count( $this->workStack ),
			$real,
			$cpu,
			$memory
		];
	}

	/**
	 * This method should not be called outside SectionProfiler
	 *
	 * @param string $functionname Section being closed, or 'close' to force-close
	 *  whatever section is currently innermost
	 */
	public function profileOutInternal( $functionname ) {
		$item = array_pop( $this->workStack );
		if ( $item === null ) {
			$this->debugGroup( 'profileerror', "Profiling error: $functionname" );

			return;
		}
		list( $ofname, /* $ocount */, $ortime, $octime, $omem ) = $item;

		if ( $functionname === 'close' ) {
			$this->recordProfileError( "Profile section ended by close(): {$ofname}" );
			// Account the time to the section that was actually open
			$functionname = $ofname;
		} elseif ( $ofname !== $functionname ) {
			$this->recordProfileError( "Profiling error: in({$ofname}), out($functionname)" );
		}

		$realTime = $this->getTime( 'wall' );
		$cpuTime = $this->getTime( 'cpu' );
		$memUsage = memory_get_usage();

		if ( $this->collateOnly ) {
			$this->updateEntry(
				$functionname,
				$cpuTime - $octime,
				$realTime - $ortime,
				$memUsage - $omem
			);
		} else {
			$this->stack[] = array_merge( $item, [ $realTime, $cpuTime, $memUsage ] );
		}

		$this->end = [
			'cpu' => $cpuTime,
			'real' => $realTime,
			'memory' => $memUsage
		];
	}

	/**
	 * Log a section mismatch and leave a zero-duration marker for it in the results
	 *
	 * @param string $message
	 */
	protected function recordProfileError( $message ) {
		$this->debugGroup( 'profileerror', $message );
		if ( $this->collateOnly ) {
			$this->collated[$message] = $this->errorEntry;
		} else {
			$this->stack[] = [ $message, 0, 0.0, 0.0, 0, 0.0, 0.0, 0 ];
		}
	}

	/**
	 * Returns a tree of function calls with their real times
	 *
	 * @return string One line per recorded call
	 * @throws Exception When the profiler is not in trace mode
	 */
	public function getCallTreeReport() {
		if ( $this->collateOnly ) {
			throw new Exception( "Tree is only available for trace profiling." );
		}

		return implode( '', array_map(
			[ $this, 'getCallTreeLine' ], $this->remapCallTree( $this->stack )
		) );
	}

	/**
	 * Recursive function to format the current profiling array into a tree
	 *
	 * Entries arrive in completion order (sub-sections before the section that
	 * contains them) and are returned with every section ahead of its sub-sections.
	 *
	 * @param array $stack Profiling array
	 * @return array
	 */
	protected function remapCallTree( array $stack ) {
		if ( count( $stack ) < 2 ) {
			return $stack;
		}
		$outputs = [];
		// Walk backwards, one subtree per iteration. The bound is ">= 0" so that an
		// entry at index 0 which is a sibling (not a descendant) of the entry handled
		// last still gets emitted instead of being silently dropped.
		for ( $max = count( $stack ) - 1; $max >= 0; ) {
			/* Find all items under this entry */
			$level = $stack[$max][1];
			$working = [];
			for ( $i = $max - 1; $i >= 0; $i-- ) {
				if ( $stack[$i][1] > $level ) {
					$working[] = $stack[$i];
				} else {
					break;
				}
			}
			$working = $this->remapCallTree( array_reverse( $working ) );
			$output = [];
			foreach ( $working as $item ) {
				array_push( $output, $item );
			}
			array_unshift( $output, $stack[$max] );
			// Continue with the first entry that was not part of this subtree
			$max = $i;

			array_unshift( $outputs, $output );
		}
		$final = [];
		foreach ( $outputs as $output ) {
			foreach ( $output as $item ) {
				$final[] = $item;
			}
		}

		return $final;
	}

	/**
	 * Callback to get a formatted line for the call tree
	 *
	 * @param array $entry
	 * @return string
	 */
	protected function getCallTreeLine( $entry ) {
		// $entry has (name, level, stime, scpu, smem, etime, ecpu, emem)
		list( $fname, $level, $startreal, , , $endreal ) = $entry;
		$delta = $endreal - $startreal;
		$space = str_repeat( ' ', $level );
		# The ugly double sprintf is to work around a PHP bug,
		# which has been fixed in recent releases.
		return sprintf( "%10s %s %s\n",
			trim( sprintf( "%7.3f", $delta * 1000.0 ) ), $space, $fname );
	}

	/**
	 * Populate collated data
	 */
	protected function collateData() {
		if ( $this->collateDone ) {
			return;
		}
		$this->collateDone = true;
		// Close opened profiling sections
		while ( count( $this->workStack ) ) {
			$this->profileOutInternal( 'close' );
		}

		if ( $this->collateOnly ) {
			return; // already collated as methods exited
		}

		$this->collated = [];

		# Estimate profiling overhead
		$oldEnd = $this->end;
		$profileCount = count( $this->stack );
		$this->calculateOverhead( $profileCount );

		# First, subtract the overhead!
		$overheadTotal = $overheadMemory = $overheadInternal = [];
		foreach ( $this->stack as $entry ) {
			// $entry is (name,pos,rtime0,cputime0,mem0,rtime1,cputime1,mem1)
			$fname = $entry[0];
			$elapsed = $entry[5] - $entry[2];
			$memchange = $entry[7] - $entry[4];

			if ( $fname === '-overhead-total' ) {
				$overheadTotal[] = $elapsed;
				$overheadMemory[] = max( 0, $memchange );
			} elseif ( $fname === '-overhead-internal' ) {
				$overheadInternal[] = $elapsed;
			}
		}
		// All three figures are per-probe averages. With an empty trace no probe was
		// run, so guard the divisor rather than dividing by zero.
		$probeCount = count( $overheadInternal );
		$overheadTotal = $probeCount ? array_sum( $overheadTotal ) / $probeCount : 0;
		$overheadMemory = $probeCount ? array_sum( $overheadMemory ) / $probeCount : 0;
		$overheadInternal = $probeCount ? array_sum( $overheadInternal ) / $probeCount : 0;

		# Collate
		foreach ( $this->stack as $index => $entry ) {
			// $entry is (name,pos,rtime0,cputime0,mem0,rtime1,cputime1,mem1)
			$fname = $entry[0];
			$elapsedCpu = $entry[6] - $entry[3];
			$elapsedReal = $entry[5] - $entry[2];
			$memchange = $entry[7] - $entry[4];
			$subcalls = $this->calltreeCount( $this->stack, $index );

			# Adjust for profiling overhead (except special values with elapsed=0).
			# The overhead was measured in real time, so it is taken off the real
			# time that is actually handed to updateEntry(), never below zero.
			if ( substr( $fname, 0, 9 ) !== '-overhead' && $elapsedReal ) {
				$elapsedReal -= $overheadInternal;
				$elapsedReal -= ( $subcalls * $overheadTotal );
				$elapsedReal = max( $elapsedReal, 0.0 );
				$memchange -= ( $subcalls * $overheadMemory );
			}

			$this->updateEntry( $fname, $elapsedCpu, $elapsedReal, $memchange );
		}

		$this->collated['-overhead-total']['count'] = $profileCount;
		arsort( $this->collated, SORT_NUMERIC );

		// Unclobber the end info map (the overhead checking alters it)
		$this->end = $oldEnd;
		// The overhead probes go through profileInInternal(), which clears the flag;
		// restore it so an unchanged trace is not re-collated (and re-probed) on
		// every report.
		$this->collateDone = true;
	}

	/**
	 * Dummy calls to calculate profiling overhead
	 *
	 * @param int $profileCount Number of empty probe sections to run
	 */
	protected function calculateOverhead( $profileCount ) {
		$this->profileInInternal( '-overhead-total' );
		for ( $i = 0; $i < $profileCount; $i++ ) {
			$this->profileInInternal( '-overhead-internal' );
			$this->profileOutInternal( '-overhead-internal' );
		}
		$this->profileOutInternal( '-overhead-total' );
	}

	/**
	 * Counts the number of profiled function calls sitting under
	 * the given point in the call graph. Not the most efficient algo.
	 *
	 * @param array $stack
	 * @param int $start Index into $stack
	 * @return int
	 */
	protected function calltreeCount( $stack, $start ) {
		$level = $stack[$start][1];
		$count = 0;
		// Sub-sections are the contiguous run of deeper entries right before $start
		for ( $i = $start - 1; $i >= 0 && $stack[$i][1] > $level; $i-- ) {
			$count++;
		}

		return $count;
	}

	/**
	 * Get the current value of a clock
	 *
	 * @param string $metric Metric to use, with the following possibilities:
	 *   - user: User CPU time (without system calls)
	 *   - cpu: Total CPU time (user and system calls)
	 *   - wall (or any other value): elapsed time
	 * @return float|int Seconds; 0 when resource usage data is unavailable
	 */
	protected function getTime( $metric = 'wall' ) {
		if ( $metric !== 'cpu' && $metric !== 'user' ) {
			return microtime( true );
		}

		// Like the debug helpers, do not hard-depend on the host application:
		// use its wrapper when present, else PHP's own getrusage().
		// NOTE(review): wfGetRusage() is assumed to return a getrusage()-shaped
		// array or false - confirm against the host application.
		if ( function_exists( 'wfGetRusage' ) ) {
			$ru = wfGetRusage();
		} elseif ( function_exists( 'getrusage' ) ) {
			$ru = getrusage();
		} else {
			$ru = false;
		}
		if ( !$ru ) {
			return 0;
		}

		$time = $ru['ru_utime.tv_sec'] + $ru['ru_utime.tv_usec'] / 1e6;
		if ( $metric === 'cpu' ) {
			# This is the time of system calls, added to the user time
			# it gives the total CPU time
			$time += $ru['ru_stime.tv_sec'] + $ru['ru_stime.tv_usec'] / 1e6;
		}

		return $time;
	}

	/**
	 * Add an entry in the debug log file
	 *
	 * @param string $s String to output
	 */
	protected function debug( $s ) {
		if ( function_exists( 'wfDebug' ) ) {
			wfDebug( $s );
		}
	}

	/**
	 * Add an entry in the debug log group
	 *
	 * @param string $group Group to send the message to
	 * @param string $s String to output
	 */
	protected function debugGroup( $group, $s ) {
		if ( function_exists( 'wfDebugLog' ) ) {
			wfDebugLog( $group, $s );
		}
	}
}
/**
 * Subclass ScopedCallback to avoid call_user_func_array(), which is slow
 *
 * This class should not be used outside of SectionProfiler
 */
class SectionProfileCallback extends ScopedCallback {
	/** @var SectionProfiler Profiler that opened the section */
	protected $profiler;
	/** @var string Name of the section to close on destruction */
	protected $section;

	/**
	 * @param SectionProfiler $profiler
	 * @param string $section
	 */
	public function __construct( SectionProfiler $profiler, $section ) {
		// No callback is handed to the parent: the section is closed by the
		// destructor below through a direct method call instead.
		parent::__construct( null );
		$this->profiler = $profiler;
		$this->section = $section;
	}

	/**
	 * Close the section when the last reference to this object goes away
	 */
	public function __destruct() {
		$this->profiler->profileOutInternal( $this->section );
	}
}