SyntheticCountsUtils.cpp revision 336809
1//===--- SyntheticCountsUtils.cpp - synthetic counts propagation utils ---===//
2//
3//                     The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This file defines utilities for propagating synthetic counts.
11//
12//===----------------------------------------------------------------------===//
13
14#include "llvm/Analysis/SyntheticCountsUtils.h"
15#include "llvm/ADT/DenseSet.h"
16#include "llvm/ADT/SCCIterator.h"
17#include "llvm/ADT/SmallPtrSet.h"
18#include "llvm/Analysis/CallGraph.h"
19#include "llvm/IR/CallSite.h"
20#include "llvm/IR/Function.h"
21#include "llvm/IR/InstIterator.h"
22#include "llvm/IR/Instructions.h"
23
24using namespace llvm;
25
26// Given an SCC, propagate entry counts along the edge of the SCC nodes.
27template <typename CallGraphType>
28void SyntheticCountsUtils<CallGraphType>::propagateFromSCC(
29    const SccTy &SCC, GetRelBBFreqTy GetRelBBFreq, GetCountTy GetCount,
30    AddCountTy AddCount) {
31
32  SmallPtrSet<NodeRef, 8> SCCNodes;
33  SmallVector<std::pair<NodeRef, EdgeRef>, 8> SCCEdges, NonSCCEdges;
34
35  for (auto &Node : SCC)
36    SCCNodes.insert(Node);
37
38  // Partition the edges coming out of the SCC into those whose destination is
39  // in the SCC and the rest.
40  for (const auto &Node : SCCNodes) {
41    for (auto &E : children_edges<CallGraphType>(Node)) {
42      if (SCCNodes.count(CGT::edge_dest(E)))
43        SCCEdges.emplace_back(Node, E);
44      else
45        NonSCCEdges.emplace_back(Node, E);
46    }
47  }
48
49  // For nodes in the same SCC, update the counts in two steps:
50  // 1. Compute the additional count for each node by propagating the counts
51  // along all incoming edges to the node that originate from within the same
52  // SCC and summing them up.
53  // 2. Add the additional counts to the nodes in the SCC.
54  // This ensures that the order of
55  // traversal of nodes within the SCC doesn't affect the final result.
56
57  DenseMap<NodeRef, uint64_t> AdditionalCounts;
58  for (auto &E : SCCEdges) {
59    auto OptRelFreq = GetRelBBFreq(E.second);
60    if (!OptRelFreq)
61      continue;
62    Scaled64 RelFreq = OptRelFreq.getValue();
63    auto Caller = E.first;
64    auto Callee = CGT::edge_dest(E.second);
65    RelFreq *= Scaled64(GetCount(Caller), 0);
66    uint64_t AdditionalCount = RelFreq.toInt<uint64_t>();
67    AdditionalCounts[Callee] += AdditionalCount;
68  }
69
70  // Update the counts for the nodes in the SCC.
71  for (auto &Entry : AdditionalCounts)
72    AddCount(Entry.first, Entry.second);
73
74  // Now update the counts for nodes outside the SCC.
75  for (auto &E : NonSCCEdges) {
76    auto OptRelFreq = GetRelBBFreq(E.second);
77    if (!OptRelFreq)
78      continue;
79    Scaled64 RelFreq = OptRelFreq.getValue();
80    auto Caller = E.first;
81    auto Callee = CGT::edge_dest(E.second);
82    RelFreq *= Scaled64(GetCount(Caller), 0);
83    AddCount(Callee, RelFreq.toInt<uint64_t>());
84  }
85}
86
87/// Propgate synthetic entry counts on a callgraph \p CG.
88///
89/// This performs a reverse post-order traversal of the callgraph SCC. For each
90/// SCC, it first propagates the entry counts to the nodes within the SCC
91/// through call edges and updates them in one shot. Then the entry counts are
92/// propagated to nodes outside the SCC. This requires \p GraphTraits
93/// to have a specialization for \p CallGraphType.
94
95template <typename CallGraphType>
96void SyntheticCountsUtils<CallGraphType>::propagate(const CallGraphType &CG,
97                                                    GetRelBBFreqTy GetRelBBFreq,
98                                                    GetCountTy GetCount,
99                                                    AddCountTy AddCount) {
100  std::vector<SccTy> SCCs;
101
102  // Collect all the SCCs.
103  for (auto I = scc_begin(CG); !I.isAtEnd(); ++I)
104    SCCs.push_back(*I);
105
106  // The callgraph-scc needs to be visited in top-down order for propagation.
107  // The scc iterator returns the scc in bottom-up order, so reverse the SCCs
108  // and call propagateFromSCC.
109  for (auto &SCC : reverse(SCCs))
110    propagateFromSCC(SCC, GetRelBBFreq, GetCount, AddCount);
111}
112
// Explicitly instantiate the utilities for `const CallGraph *`. The member
// functions above are defined in this source file, so this is where their
// code for that graph type gets emitted.
template class llvm::SyntheticCountsUtils<const CallGraph *>;
114