Run DCE after a LoopFlatten test to reduce spurious output [nfc]
[llvm-project.git] / llvm / lib / Analysis / SyntheticCountsUtils.cpp
blob29c41fda5e28f853b7d2c525675e4a04b0d5dd38
1 //===--- SyntheticCountsUtils.cpp - synthetic counts propagation utils ---===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file defines utilities for propagating synthetic counts.
11 //===----------------------------------------------------------------------===//
13 #include "llvm/Analysis/SyntheticCountsUtils.h"
14 #include "llvm/ADT/DenseSet.h"
15 #include "llvm/ADT/SCCIterator.h"
16 #include "llvm/Analysis/CallGraph.h"
17 #include "llvm/IR/ModuleSummaryIndex.h"
19 using namespace llvm;
21 // Given an SCC, propagate entry counts along the edge of the SCC nodes.
22 template <typename CallGraphType>
23 void SyntheticCountsUtils<CallGraphType>::propagateFromSCC(
24 const SccTy &SCC, GetProfCountTy GetProfCount, AddCountTy AddCount) {
26 DenseSet<NodeRef> SCCNodes;
27 SmallVector<std::pair<NodeRef, EdgeRef>, 8> SCCEdges, NonSCCEdges;
29 for (auto &Node : SCC)
30 SCCNodes.insert(Node);
32 // Partition the edges coming out of the SCC into those whose destination is
33 // in the SCC and the rest.
34 for (const auto &Node : SCCNodes) {
35 for (auto &E : children_edges<CallGraphType>(Node)) {
36 if (SCCNodes.count(CGT::edge_dest(E)))
37 SCCEdges.emplace_back(Node, E);
38 else
39 NonSCCEdges.emplace_back(Node, E);
43 // For nodes in the same SCC, update the counts in two steps:
44 // 1. Compute the additional count for each node by propagating the counts
45 // along all incoming edges to the node that originate from within the same
46 // SCC and summing them up.
47 // 2. Add the additional counts to the nodes in the SCC.
48 // This ensures that the order of
49 // traversal of nodes within the SCC doesn't affect the final result.
51 DenseMap<NodeRef, Scaled64> AdditionalCounts;
52 for (auto &E : SCCEdges) {
53 auto OptProfCount = GetProfCount(E.first, E.second);
54 if (!OptProfCount)
55 continue;
56 auto Callee = CGT::edge_dest(E.second);
57 AdditionalCounts[Callee] += *OptProfCount;
60 // Update the counts for the nodes in the SCC.
61 for (auto &Entry : AdditionalCounts)
62 AddCount(Entry.first, Entry.second);
64 // Now update the counts for nodes outside the SCC.
65 for (auto &E : NonSCCEdges) {
66 auto OptProfCount = GetProfCount(E.first, E.second);
67 if (!OptProfCount)
68 continue;
69 auto Callee = CGT::edge_dest(E.second);
70 AddCount(Callee, *OptProfCount);
74 /// Propagate synthetic entry counts on a callgraph \p CG.
75 ///
76 /// This performs a reverse post-order traversal of the callgraph SCC. For each
77 /// SCC, it first propagates the entry counts to the nodes within the SCC
78 /// through call edges and updates them in one shot. Then the entry counts are
79 /// propagated to nodes outside the SCC. This requires \p GraphTraits
80 /// to have a specialization for \p CallGraphType.
82 template <typename CallGraphType>
83 void SyntheticCountsUtils<CallGraphType>::propagate(const CallGraphType &CG,
84 GetProfCountTy GetProfCount,
85 AddCountTy AddCount) {
86 std::vector<SccTy> SCCs;
88 // Collect all the SCCs.
89 for (auto I = scc_begin(CG); !I.isAtEnd(); ++I)
90 SCCs.push_back(*I);
92 // The callgraph-scc needs to be visited in top-down order for propagation.
93 // The scc iterator returns the scc in bottom-up order, so reverse the SCCs
94 // and call propagateFromSCC.
95 for (auto &SCC : reverse(SCCs))
96 propagateFromSCC(SCC, GetProfCount, AddCount);
// Explicitly instantiate SyntheticCountsUtils for the two graph types below;
// the member templates are defined in this file, so the instantiations are
// emitted here.
99 template class llvm::SyntheticCountsUtils<const CallGraph *>;
100 template class llvm::SyntheticCountsUtils<ModuleSummaryIndex *>;