1 //===--- SyntheticCountsUtils.cpp - synthetic counts propagation utils ---===//
3 // The LLVM Compiler Infrastructure
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
8 //===----------------------------------------------------------------------===//
10 // This file defines utilities for propagating synthetic counts.
12 //===----------------------------------------------------------------------===//
14 #include "llvm/Analysis/SyntheticCountsUtils.h"
15 #include "llvm/ADT/DenseSet.h"
16 #include "llvm/ADT/SCCIterator.h"
17 #include "llvm/ADT/SmallPtrSet.h"
18 #include "llvm/Analysis/CallGraph.h"
19 #include "llvm/IR/CallSite.h"
20 #include "llvm/IR/Function.h"
21 #include "llvm/IR/InstIterator.h"
22 #include "llvm/IR/Instructions.h"
26 // Given an SCC, propagate entry counts along the edge of the SCC nodes.
27 template <typename CallGraphType
>
28 void SyntheticCountsUtils
<CallGraphType
>::propagateFromSCC(
29 const SccTy
&SCC
, GetRelBBFreqTy GetRelBBFreq
, GetCountTy GetCount
,
30 AddCountTy AddCount
) {
32 SmallPtrSet
<NodeRef
, 8> SCCNodes
;
33 SmallVector
<std::pair
<NodeRef
, EdgeRef
>, 8> SCCEdges
, NonSCCEdges
;
35 for (auto &Node
: SCC
)
36 SCCNodes
.insert(Node
);
38 // Partition the edges coming out of the SCC into those whose destination is
39 // in the SCC and the rest.
40 for (const auto &Node
: SCCNodes
) {
41 for (auto &E
: children_edges
<CallGraphType
>(Node
)) {
42 if (SCCNodes
.count(CGT::edge_dest(E
)))
43 SCCEdges
.emplace_back(Node
, E
);
45 NonSCCEdges
.emplace_back(Node
, E
);
49 // For nodes in the same SCC, update the counts in two steps:
50 // 1. Compute the additional count for each node by propagating the counts
51 // along all incoming edges to the node that originate from within the same
52 // SCC and summing them up.
53 // 2. Add the additional counts to the nodes in the SCC.
54 // This ensures that the order of
55 // traversal of nodes within the SCC doesn't affect the final result.
57 DenseMap
<NodeRef
, uint64_t> AdditionalCounts
;
58 for (auto &E
: SCCEdges
) {
59 auto OptRelFreq
= GetRelBBFreq(E
.second
);
62 Scaled64 RelFreq
= OptRelFreq
.getValue();
63 auto Caller
= E
.first
;
64 auto Callee
= CGT::edge_dest(E
.second
);
65 RelFreq
*= Scaled64(GetCount(Caller
), 0);
66 uint64_t AdditionalCount
= RelFreq
.toInt
<uint64_t>();
67 AdditionalCounts
[Callee
] += AdditionalCount
;
70 // Update the counts for the nodes in the SCC.
71 for (auto &Entry
: AdditionalCounts
)
72 AddCount(Entry
.first
, Entry
.second
);
74 // Now update the counts for nodes outside the SCC.
75 for (auto &E
: NonSCCEdges
) {
76 auto OptRelFreq
= GetRelBBFreq(E
.second
);
79 Scaled64 RelFreq
= OptRelFreq
.getValue();
80 auto Caller
= E
.first
;
81 auto Callee
= CGT::edge_dest(E
.second
);
82 RelFreq
*= Scaled64(GetCount(Caller
), 0);
83 AddCount(Callee
, RelFreq
.toInt
<uint64_t>());
87 /// Propgate synthetic entry counts on a callgraph \p CG.
89 /// This performs a reverse post-order traversal of the callgraph SCC. For each
90 /// SCC, it first propagates the entry counts to the nodes within the SCC
91 /// through call edges and updates them in one shot. Then the entry counts are
92 /// propagated to nodes outside the SCC. This requires \p GraphTraits
93 /// to have a specialization for \p CallGraphType.
95 template <typename CallGraphType
>
96 void SyntheticCountsUtils
<CallGraphType
>::propagate(const CallGraphType
&CG
,
97 GetRelBBFreqTy GetRelBBFreq
,
99 AddCountTy AddCount
) {
100 std::vector
<SccTy
> SCCs
;
102 // Collect all the SCCs.
103 for (auto I
= scc_begin(CG
); !I
.isAtEnd(); ++I
)
106 // The callgraph-scc needs to be visited in top-down order for propagation.
107 // The scc iterator returns the scc in bottom-up order, so reverse the SCCs
108 // and call propagateFromSCC.
109 for (auto &SCC
: reverse(SCCs
))
110 propagateFromSCC(SCC
, GetRelBBFreq
, GetCount
, AddCount
);
113 template class llvm::SyntheticCountsUtils
<const CallGraph
*>;