blob: bcdd984daa58422fc485585a20d6ae7dbe4ee83b [file] [log] [blame]
//==-SummaryBasedOptimizations.cpp - Optimizations based on ThinLTO summary-==//
//
// The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This file implements optimizations that are based on the module summaries.
// These optimizations are performed during the thinlink phase of the
// compilation.
//
//===----------------------------------------------------------------------===//
15
16#include "llvm/LTO/SummaryBasedOptimizations.h"
17#include "llvm/Analysis/SyntheticCountsUtils.h"
18#include "llvm/IR/ModuleSummaryIndex.h"
19
20using namespace llvm;
21
22cl::opt<bool> ThinLTOSynthesizeEntryCounts(
23 "thinlto-synthesize-entry-counts", cl::init(false), cl::Hidden,
24 cl::desc("Synthesize entry counts based on the summary"));
25
26extern cl::opt<int> InitialSyntheticCount;
27
28static void initializeCounts(ModuleSummaryIndex &Index) {
29 auto Root = Index.calculateCallGraphRoot();
30 // Root is a fake node. All its successors are the actual roots of the
31 // callgraph.
32 // FIXME: This initializes the entry counts of only the root nodes. This makes
33 // sense when compiling a binary with ThinLTO, but for libraries any of the
34 // non-root nodes could be called from outside.
35 for (auto &C : Root.calls()) {
36 auto &V = C.first;
37 for (auto &GVS : V.getSummaryList()) {
38 auto S = GVS.get()->getBaseObject();
39 auto *F = cast<FunctionSummary>(S);
40 F->setEntryCount(InitialSyntheticCount);
41 }
42 }
43}
44
45void llvm::computeSyntheticCounts(ModuleSummaryIndex &Index) {
46 if (!ThinLTOSynthesizeEntryCounts)
47 return;
48
49 using Scaled64 = ScaledNumber<uint64_t>;
50 initializeCounts(Index);
51 auto GetCallSiteRelFreq = [](FunctionSummary::EdgeTy &Edge) {
52 return Scaled64(Edge.second.RelBlockFreq, -CalleeInfo::ScaleShift);
53 };
54 auto GetEntryCount = [](ValueInfo V) {
55 if (V.getSummaryList().size()) {
56 auto S = V.getSummaryList().front().get()->getBaseObject();
57 auto *F = cast<FunctionSummary>(S);
58 return F->entryCount();
59 } else {
60 return UINT64_C(0);
61 }
62 };
Easwaran Raman116e0802019-01-09 20:10:27 +000063 auto AddToEntryCount = [](ValueInfo V, Scaled64 New) {
Easwaran Ramanf1f1adc2018-12-13 19:54:27 +000064 if (!V.getSummaryList().size())
65 return;
66 for (auto &GVS : V.getSummaryList()) {
67 auto S = GVS.get()->getBaseObject();
68 auto *F = cast<FunctionSummary>(S);
Easwaran Raman116e0802019-01-09 20:10:27 +000069 F->setEntryCount(
70 SaturatingAdd(F->entryCount(), New.template toInt<uint64_t>()));
Easwaran Ramanf1f1adc2018-12-13 19:54:27 +000071 }
72 };
73
Easwaran Raman116e0802019-01-09 20:10:27 +000074 auto GetProfileCount = [&](ValueInfo V, FunctionSummary::EdgeTy &Edge) {
75 auto RelFreq = GetCallSiteRelFreq(Edge);
76 Scaled64 EC(GetEntryCount(V), 0);
77 return RelFreq * EC;
78 };
Easwaran Ramanf1f1adc2018-12-13 19:54:27 +000079 // After initializing the counts in initializeCounts above, the counts have to
80 // be propagated across the combined callgraph.
81 // SyntheticCountsUtils::propagate takes care of this propagation on any
82 // callgraph that specialized GraphTraits.
Easwaran Raman116e0802019-01-09 20:10:27 +000083 SyntheticCountsUtils<ModuleSummaryIndex *>::propagate(&Index, GetProfileCount,
84 AddToEntryCount);
Easwaran Ramanf1f1adc2018-12-13 19:54:27 +000085 Index.setHasSyntheticEntryCounts();
86}