Revert r362472 as it is breaking PPC build bots
[llvm-core.git] / lib / Support / TimeProfiler.cpp
blobbc23408156452fd86e6608127144dec8c8795504
1 //===-- TimeProfiler.cpp - Hierarchical Time Profiler ---------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file implements hierarchical time profiler.
11 //===----------------------------------------------------------------------===//
13 #include "llvm/Support/TimeProfiler.h"
14 #include "llvm/ADT/StringMap.h"
15 #include "llvm/Support/CommandLine.h"
16 #include "llvm/Support/FileSystem.h"
17 #include "llvm/Support/JSON.h"
18 #include <cassert>
19 #include <chrono>
20 #include <string>
21 #include <vector>
23 using namespace std::chrono;
25 namespace llvm {
27 static cl::opt<unsigned> TimeTraceGranularity(
28 "time-trace-granularity",
29 cl::desc(
30 "Minimum time granularity (in microseconds) traced by time profiler"),
31 cl::init(500));
33 TimeTraceProfiler *TimeTraceProfilerInstance = nullptr;
35 typedef duration<steady_clock::rep, steady_clock::period> DurationType;
36 typedef std::pair<size_t, DurationType> CountAndDurationType;
37 typedef std::pair<std::string, CountAndDurationType>
38 NameAndCountAndDurationType;
40 struct Entry {
41 time_point<steady_clock> Start;
42 DurationType Duration;
43 std::string Name;
44 std::string Detail;
46 Entry(time_point<steady_clock> &&S, DurationType &&D, std::string &&N,
47 std::string &&Dt)
48 : Start(std::move(S)), Duration(std::move(D)), Name(std::move(N)),
49 Detail(std::move(Dt)){};
52 struct TimeTraceProfiler {
53 TimeTraceProfiler() {
54 StartTime = steady_clock::now();
57 void begin(std::string Name, llvm::function_ref<std::string()> Detail) {
58 Stack.emplace_back(steady_clock::now(), DurationType{}, std::move(Name),
59 Detail());
62 void end() {
63 assert(!Stack.empty() && "Must call begin() first");
64 auto &E = Stack.back();
65 E.Duration = steady_clock::now() - E.Start;
67 // Only include sections longer than TimeTraceGranularity msec.
68 if (duration_cast<microseconds>(E.Duration).count() > TimeTraceGranularity)
69 Entries.emplace_back(E);
71 // Track total time taken by each "name", but only the topmost levels of
72 // them; e.g. if there's a template instantiation that instantiates other
73 // templates from within, we only want to add the topmost one. "topmost"
74 // happens to be the ones that don't have any currently open entries above
75 // itself.
76 if (std::find_if(++Stack.rbegin(), Stack.rend(), [&](const Entry &Val) {
77 return Val.Name == E.Name;
78 }) == Stack.rend()) {
79 auto &CountAndTotal = CountAndTotalPerName[E.Name];
80 CountAndTotal.first++;
81 CountAndTotal.second += E.Duration;
84 Stack.pop_back();
87 void Write(raw_pwrite_stream &OS) {
88 assert(Stack.empty() &&
89 "All profiler sections should be ended when calling Write");
90 json::OStream J(OS);
91 J.objectBegin();
92 J.attributeBegin("traceEvents");
93 J.arrayBegin();
95 // Emit all events for the main flame graph.
96 for (const auto &E : Entries) {
97 auto StartUs = duration_cast<microseconds>(E.Start - StartTime).count();
98 auto DurUs = duration_cast<microseconds>(E.Duration).count();
100 J.object([&]{
101 J.attribute("pid", 1);
102 J.attribute("tid", 0);
103 J.attribute("ph", "X");
104 J.attribute("ts", StartUs);
105 J.attribute("dur", DurUs);
106 J.attribute("name", E.Name);
107 J.attributeObject("args", [&] { J.attribute("detail", E.Detail); });
111 // Emit totals by section name as additional "thread" events, sorted from
112 // longest one.
113 int Tid = 1;
114 std::vector<NameAndCountAndDurationType> SortedTotals;
115 SortedTotals.reserve(CountAndTotalPerName.size());
116 for (const auto &E : CountAndTotalPerName)
117 SortedTotals.emplace_back(E.getKey(), E.getValue());
119 llvm::sort(SortedTotals.begin(), SortedTotals.end(),
120 [](const NameAndCountAndDurationType &A,
121 const NameAndCountAndDurationType &B) {
122 return A.second.second > B.second.second;
124 for (const auto &E : SortedTotals) {
125 auto DurUs = duration_cast<microseconds>(E.second.second).count();
126 auto Count = CountAndTotalPerName[E.first].first;
128 J.object([&]{
129 J.attribute("pid", 1);
130 J.attribute("tid", Tid);
131 J.attribute("ph", "X");
132 J.attribute("ts", 0);
133 J.attribute("dur", DurUs);
134 J.attribute("name", "Total " + E.first);
135 J.attributeObject("args", [&] {
136 J.attribute("count", int64_t(Count));
137 J.attribute("avg ms", int64_t(DurUs / Count / 1000));
141 ++Tid;
144 // Emit metadata event with process name.
145 J.object([&] {
146 J.attribute("cat", "");
147 J.attribute("pid", 1);
148 J.attribute("tid", 0);
149 J.attribute("ts", 0);
150 J.attribute("ph", "M");
151 J.attribute("name", "process_name");
152 J.attributeObject("args", [&] { J.attribute("name", "clang"); });
155 J.arrayEnd();
156 J.attributeEnd();
157 J.objectEnd();
160 SmallVector<Entry, 16> Stack;
161 SmallVector<Entry, 128> Entries;
162 StringMap<CountAndDurationType> CountAndTotalPerName;
163 time_point<steady_clock> StartTime;
166 void timeTraceProfilerInitialize() {
167 assert(TimeTraceProfilerInstance == nullptr &&
168 "Profiler should not be initialized");
169 TimeTraceProfilerInstance = new TimeTraceProfiler();
172 void timeTraceProfilerCleanup() {
173 delete TimeTraceProfilerInstance;
174 TimeTraceProfilerInstance = nullptr;
177 void timeTraceProfilerWrite(raw_pwrite_stream &OS) {
178 assert(TimeTraceProfilerInstance != nullptr &&
179 "Profiler object can't be null");
180 TimeTraceProfilerInstance->Write(OS);
183 void timeTraceProfilerBegin(StringRef Name, StringRef Detail) {
184 if (TimeTraceProfilerInstance != nullptr)
185 TimeTraceProfilerInstance->begin(Name, [&]() { return Detail; });
188 void timeTraceProfilerBegin(StringRef Name,
189 llvm::function_ref<std::string()> Detail) {
190 if (TimeTraceProfilerInstance != nullptr)
191 TimeTraceProfilerInstance->begin(Name, Detail);
194 void timeTraceProfilerEnd() {
195 if (TimeTraceProfilerInstance != nullptr)
196 TimeTraceProfilerInstance->end();
199 } // namespace llvm