1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
|
//==-SummaryBasedOptimizations.cpp - Optimizations based on ThinLTO summary-==//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// This file implements optimizations that are based on the module summaries.
// These optimizations are performed during the thinlink phase of the
// compilation.
//
//===----------------------------------------------------------------------===//
#include "llvm/LTO/SummaryBasedOptimizations.h"
#include "llvm/Analysis/SyntheticCountsUtils.h"
#include "llvm/IR/ModuleSummaryIndex.h"
#include "llvm/Support/CommandLine.h"
using namespace llvm;
static cl::opt<bool> ThinLTOSynthesizeEntryCounts(
"thinlto-synthesize-entry-counts", cl::init(false), cl::Hidden,
cl::desc("Synthesize entry counts based on the summary"));
namespace llvm {
extern cl::opt<int> InitialSyntheticCount;
}
static void initializeCounts(ModuleSummaryIndex &Index) {
auto Root = Index.calculateCallGraphRoot();
// Root is a fake node. All its successors are the actual roots of the
// callgraph.
// FIXME: This initializes the entry counts of only the root nodes. This makes
// sense when compiling a binary with ThinLTO, but for libraries any of the
// non-root nodes could be called from outside.
for (auto &C : Root.calls()) {
auto &V = C.first;
for (auto &GVS : V.getSummaryList()) {
auto S = GVS.get()->getBaseObject();
auto *F = cast<FunctionSummary>(S);
F->setEntryCount(InitialSyntheticCount);
}
}
}
void llvm::computeSyntheticCounts(ModuleSummaryIndex &Index) {
if (!ThinLTOSynthesizeEntryCounts)
return;
using Scaled64 = ScaledNumber<uint64_t>;
initializeCounts(Index);
auto GetCallSiteRelFreq = [](FunctionSummary::EdgeTy &Edge) {
return Scaled64(Edge.second.RelBlockFreq, -CalleeInfo::ScaleShift);
};
auto GetEntryCount = [](ValueInfo V) {
if (V.getSummaryList().size()) {
auto S = V.getSummaryList().front()->getBaseObject();
auto *F = cast<FunctionSummary>(S);
return F->entryCount();
} else {
return UINT64_C(0);
}
};
auto AddToEntryCount = [](ValueInfo V, Scaled64 New) {
if (!V.getSummaryList().size())
return;
for (auto &GVS : V.getSummaryList()) {
auto S = GVS.get()->getBaseObject();
auto *F = cast<FunctionSummary>(S);
F->setEntryCount(
SaturatingAdd(F->entryCount(), New.template toInt<uint64_t>()));
}
};
auto GetProfileCount = [&](ValueInfo V, FunctionSummary::EdgeTy &Edge) {
auto RelFreq = GetCallSiteRelFreq(Edge);
Scaled64 EC(GetEntryCount(V), 0);
return RelFreq * EC;
};
// After initializing the counts in initializeCounts above, the counts have to
// be propagated across the combined callgraph.
// SyntheticCountsUtils::propagate takes care of this propagation on any
// callgraph that specialized GraphTraits.
SyntheticCountsUtils<ModuleSummaryIndex *>::propagate(&Index, GetProfileCount,
AddToEntryCount);
Index.setHasSyntheticEntryCounts();
}
|