blob: b1c669ec31c467b1ced467dc745e291c34b6b452 [file] [log] [blame]
Diego Novilloe75c2b32014-10-30 18:00:06 +00001//===- SampleProfWriter.cpp - Write LLVM sample profile data --------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This file implements the class that writes LLVM sample profiles. It
11// supports two file formats: text and binary. The textual representation
12// is useful for debugging and testing purposes. The binary representation
13// is more compact, resulting in smaller file sizes. However, they can
14// both be used interchangeably.
15//
16// See lib/ProfileData/SampleProfReader.cpp for documentation on each of the
17// supported formats.
18//
19//===----------------------------------------------------------------------===//
20
Chandler Carruthe3e43d92017-06-06 11:49:48 +000021#include "llvm/ProfileData/SampleProfWriter.h"
Eugene Zelenkof4f67a02017-03-03 01:07:34 +000022#include "llvm/ADT/StringRef.h"
23#include "llvm/ProfileData/ProfileCommon.h"
24#include "llvm/ProfileData/SampleProf.h"
Wei Miec13dea2018-09-14 20:52:59 +000025#include "llvm/Support/Endian.h"
26#include "llvm/Support/EndianStream.h"
Diego Novilloe75c2b32014-10-30 18:00:06 +000027#include "llvm/Support/ErrorOr.h"
Eugene Zelenkof4f67a02017-03-03 01:07:34 +000028#include "llvm/Support/FileSystem.h"
Diego Novilloe75c2b32014-10-30 18:00:06 +000029#include "llvm/Support/LEB128.h"
Wei Mi93bc7462018-06-11 22:40:43 +000030#include "llvm/Support/MD5.h"
Eugene Zelenkof4f67a02017-03-03 01:07:34 +000031#include "llvm/Support/raw_ostream.h"
32#include <algorithm>
33#include <cstdint>
34#include <memory>
Dehao Chene26e9402017-05-11 23:43:44 +000035#include <set>
Eugene Zelenkof4f67a02017-03-03 01:07:34 +000036#include <system_error>
37#include <utility>
38#include <vector>
Diego Novilloe75c2b32014-10-30 18:00:06 +000039
Diego Novilloe75c2b32014-10-30 18:00:06 +000040using namespace llvm;
Eugene Zelenkof4f67a02017-03-03 01:07:34 +000041using namespace sampleprof;
Diego Novilloe75c2b32014-10-30 18:00:06 +000042
Dehao Chene26e9402017-05-11 23:43:44 +000043std::error_code
44SampleProfileWriter::write(const StringMap<FunctionSamples> &ProfileMap) {
45 if (std::error_code EC = writeHeader(ProfileMap))
46 return EC;
47
48 // Sort the ProfileMap by total samples.
49 typedef std::pair<StringRef, const FunctionSamples *> NameFunctionSamples;
50 std::vector<NameFunctionSamples> V;
51 for (const auto &I : ProfileMap)
52 V.push_back(std::make_pair(I.getKey(), &I.second));
53
54 std::stable_sort(
55 V.begin(), V.end(),
56 [](const NameFunctionSamples &A, const NameFunctionSamples &B) {
57 if (A.second->getTotalSamples() == B.second->getTotalSamples())
58 return A.first > B.first;
59 return A.second->getTotalSamples() > B.second->getTotalSamples();
60 });
61
62 for (const auto &I : V) {
63 if (std::error_code EC = write(*I.second))
64 return EC;
65 }
66 return sampleprof_error::success;
67}
68
Wei Miec13dea2018-09-14 20:52:59 +000069std::error_code SampleProfileWriterCompactBinary::write(
70 const StringMap<FunctionSamples> &ProfileMap) {
71 if (std::error_code EC = SampleProfileWriter::write(ProfileMap))
72 return EC;
73 if (std::error_code EC = writeFuncOffsetTable())
74 return EC;
75 return sampleprof_error::success;
76}
77
Adrian Prantl26b584c2018-05-01 15:54:18 +000078/// Write samples to a text file.
Diego Novillodbe26eb2015-11-13 20:24:28 +000079///
80/// Note: it may be tempting to implement this in terms of
Diego Novillo5d8ee1b2015-11-19 15:33:08 +000081/// FunctionSamples::print(). Please don't. The dump functionality is intended
Diego Novillodbe26eb2015-11-13 20:24:28 +000082/// for debugging and has no specified form.
83///
84/// The format used here is more structured and deliberate because
85/// it needs to be parsed by the SampleProfileReaderText class.
Dehao Chen5c299ca2016-03-03 18:09:32 +000086std::error_code SampleProfileWriterText::write(const FunctionSamples &S) {
Nathan Slingerland46cf0f02015-12-10 17:21:42 +000087 auto &OS = *OutputStream;
Dehao Chen5c299ca2016-03-03 18:09:32 +000088 OS << S.getName() << ":" << S.getTotalSamples();
Diego Novillo3bc8dc32015-10-08 19:40:37 +000089 if (Indent == 0)
90 OS << ":" << S.getHeadSamples();
91 OS << "\n";
Diego Novilloe75c2b32014-10-30 18:00:06 +000092
Diego Novillo5d8ee1b2015-11-19 15:33:08 +000093 SampleSorter<LineLocation, SampleRecord> SortedSamples(S.getBodySamples());
94 for (const auto &I : SortedSamples.get()) {
95 LineLocation Loc = I->first;
96 const SampleRecord &Sample = I->second;
Diego Novillo3bc8dc32015-10-08 19:40:37 +000097 OS.indent(Indent + 1);
Diego Novilloe75c2b32014-10-30 18:00:06 +000098 if (Loc.Discriminator == 0)
99 OS << Loc.LineOffset << ": ";
100 else
101 OS << Loc.LineOffset << "." << Loc.Discriminator << ": ";
102
103 OS << Sample.getSamples();
104
Diego Novillo9657de5f2014-11-01 00:56:55 +0000105 for (const auto &J : Sample.getCallTargets())
106 OS << " " << J.first() << ":" << J.second;
Diego Novilloe75c2b32014-10-30 18:00:06 +0000107 OS << "\n";
108 }
109
Dehao Chen14eaa3c2017-04-13 19:52:10 +0000110 SampleSorter<LineLocation, FunctionSamplesMap> SortedCallsiteSamples(
Diego Novillo5d8ee1b2015-11-19 15:33:08 +0000111 S.getCallsiteSamples());
Diego Novillo3bc8dc32015-10-08 19:40:37 +0000112 Indent += 1;
Dehao Chen14eaa3c2017-04-13 19:52:10 +0000113 for (const auto &I : SortedCallsiteSamples.get())
114 for (const auto &FS : I->second) {
115 LineLocation Loc = I->first;
116 const FunctionSamples &CalleeSamples = FS.second;
117 OS.indent(Indent);
118 if (Loc.Discriminator == 0)
119 OS << Loc.LineOffset << ": ";
120 else
121 OS << Loc.LineOffset << "." << Loc.Discriminator << ": ";
122 if (std::error_code EC = write(CalleeSamples))
123 return EC;
124 }
Diego Novillo3bc8dc32015-10-08 19:40:37 +0000125 Indent -= 1;
126
Diego Novillodb271652015-10-13 22:48:46 +0000127 return sampleprof_error::success;
Diego Novilloe75c2b32014-10-30 18:00:06 +0000128}
129
Diego Novillodb271652015-10-13 22:48:46 +0000130std::error_code SampleProfileWriterBinary::writeNameIdx(StringRef FName) {
131 const auto &ret = NameTable.find(FName);
132 if (ret == NameTable.end())
133 return sampleprof_error::truncated_name_table;
Nathan Slingerland46cf0f02015-12-10 17:21:42 +0000134 encodeULEB128(ret->second, *OutputStream);
Diego Novillodb271652015-10-13 22:48:46 +0000135 return sampleprof_error::success;
136}
Diego Novilloe75c2b32014-10-30 18:00:06 +0000137
Diego Novillodb271652015-10-13 22:48:46 +0000138void SampleProfileWriterBinary::addName(StringRef FName) {
Dehao Chene26e9402017-05-11 23:43:44 +0000139 NameTable.insert(std::make_pair(FName, 0));
Diego Novillodb271652015-10-13 22:48:46 +0000140}
141
142void SampleProfileWriterBinary::addNames(const FunctionSamples &S) {
143 // Add all the names in indirect call targets.
144 for (const auto &I : S.getBodySamples()) {
145 const SampleRecord &Sample = I.second;
146 for (const auto &J : Sample.getCallTargets())
147 addName(J.first());
148 }
149
150 // Recursively add all the names for inlined callsites.
Dehao Chen14eaa3c2017-04-13 19:52:10 +0000151 for (const auto &J : S.getCallsiteSamples())
152 for (const auto &FS : J.second) {
153 const FunctionSamples &CalleeSamples = FS.second;
154 addName(CalleeSamples.getName());
155 addNames(CalleeSamples);
156 }
Diego Novillodb271652015-10-13 22:48:46 +0000157}
158
Wei Mi93bc7462018-06-11 22:40:43 +0000159void SampleProfileWriterBinary::stablizeNameTable(std::set<StringRef> &V) {
160 // Sort the names to make NameTable deterministic.
161 for (const auto &I : NameTable)
162 V.insert(I.first);
163 int i = 0;
164 for (const StringRef &N : V)
165 NameTable[N] = i++;
166}
Nathan Slingerland46cf0f02015-12-10 17:21:42 +0000167
Wei Mi93bc7462018-06-11 22:40:43 +0000168std::error_code SampleProfileWriterRawBinary::writeNameTable() {
169 auto &OS = *OutputStream;
170 std::set<StringRef> V;
171 stablizeNameTable(V);
172
173 // Write out the name table.
174 encodeULEB128(NameTable.size(), OS);
175 for (auto N : V) {
176 OS << N;
177 encodeULEB128(0, OS);
178 }
179 return sampleprof_error::success;
180}
181
Wei Miec13dea2018-09-14 20:52:59 +0000182std::error_code SampleProfileWriterCompactBinary::writeFuncOffsetTable() {
183 auto &OS = *OutputStream;
184
185 // Fill the slot remembered by TableOffset with the offset of FuncOffsetTable.
186 auto &OFS = static_cast<raw_fd_ostream &>(OS);
187 uint64_t FuncOffsetTableStart = OS.tell();
188 if (OFS.seek(TableOffset) == (uint64_t)-1)
189 return sampleprof_error::ostream_seek_unsupported;
190 support::endian::Writer Writer(*OutputStream, support::little);
191 Writer.write(FuncOffsetTableStart);
192 if (OFS.seek(FuncOffsetTableStart) == (uint64_t)-1)
193 return sampleprof_error::ostream_seek_unsupported;
194
195 // Write out the table size.
196 encodeULEB128(FuncOffsetTable.size(), OS);
197
198 // Write out FuncOffsetTable.
199 for (auto entry : FuncOffsetTable) {
200 writeNameIdx(entry.first);
201 encodeULEB128(entry.second, OS);
202 }
203 return sampleprof_error::success;
204}
205
Wei Mi93bc7462018-06-11 22:40:43 +0000206std::error_code SampleProfileWriterCompactBinary::writeNameTable() {
207 auto &OS = *OutputStream;
208 std::set<StringRef> V;
209 stablizeNameTable(V);
210
211 // Write out the name table.
212 encodeULEB128(NameTable.size(), OS);
213 for (auto N : V) {
214 encodeULEB128(MD5Hash(N), OS);
215 }
216 return sampleprof_error::success;
217}
218
219std::error_code SampleProfileWriterRawBinary::writeMagicIdent() {
220 auto &OS = *OutputStream;
Diego Novillodb271652015-10-13 22:48:46 +0000221 // Write file magic identifier.
Diego Novilloe75c2b32014-10-30 18:00:06 +0000222 encodeULEB128(SPMagic(), OS);
223 encodeULEB128(SPVersion(), OS);
Wei Mi93bc7462018-06-11 22:40:43 +0000224 return sampleprof_error::success;
225}
226
227std::error_code SampleProfileWriterCompactBinary::writeMagicIdent() {
228 auto &OS = *OutputStream;
229 // Write file magic identifier.
230 encodeULEB128(SPMagic(SPF_Compact_Binary), OS);
231 encodeULEB128(SPVersion(), OS);
232 return sampleprof_error::success;
233}
234
235std::error_code SampleProfileWriterBinary::writeHeader(
236 const StringMap<FunctionSamples> &ProfileMap) {
237 writeMagicIdent();
Diego Novillodb271652015-10-13 22:48:46 +0000238
Easwaran Raman44878402016-02-19 03:15:33 +0000239 computeSummary(ProfileMap);
240 if (auto EC = writeSummary())
241 return EC;
242
Diego Novillodb271652015-10-13 22:48:46 +0000243 // Generate the name table for all the functions referenced in the profile.
244 for (const auto &I : ProfileMap) {
245 addName(I.first());
246 addNames(I.second);
247 }
248
Wei Mi93bc7462018-06-11 22:40:43 +0000249 writeNameTable();
Diego Novillodb271652015-10-13 22:48:46 +0000250 return sampleprof_error::success;
Diego Novilloe75c2b32014-10-30 18:00:06 +0000251}
252
Wei Miec13dea2018-09-14 20:52:59 +0000253std::error_code SampleProfileWriterCompactBinary::writeHeader(
254 const StringMap<FunctionSamples> &ProfileMap) {
255 support::endian::Writer Writer(*OutputStream, support::little);
256 if (auto EC = SampleProfileWriterBinary::writeHeader(ProfileMap))
257 return EC;
258
259 // Reserve a slot for the offset of function offset table. The slot will
260 // be populated with the offset of FuncOffsetTable later.
261 TableOffset = OutputStream->tell();
262 Writer.write(static_cast<uint64_t>(-2));
263 return sampleprof_error::success;
264}
265
Easwaran Raman44878402016-02-19 03:15:33 +0000266std::error_code SampleProfileWriterBinary::writeSummary() {
267 auto &OS = *OutputStream;
Easwaran Raman30c760d2016-05-19 21:53:28 +0000268 encodeULEB128(Summary->getTotalCount(), OS);
269 encodeULEB128(Summary->getMaxCount(), OS);
Easwaran Raman418032a2016-03-28 23:14:29 +0000270 encodeULEB128(Summary->getMaxFunctionCount(), OS);
Easwaran Raman30c760d2016-05-19 21:53:28 +0000271 encodeULEB128(Summary->getNumCounts(), OS);
Easwaran Raman44878402016-02-19 03:15:33 +0000272 encodeULEB128(Summary->getNumFunctions(), OS);
273 std::vector<ProfileSummaryEntry> &Entries = Summary->getDetailedSummary();
274 encodeULEB128(Entries.size(), OS);
275 for (auto Entry : Entries) {
276 encodeULEB128(Entry.Cutoff, OS);
277 encodeULEB128(Entry.MinCount, OS);
278 encodeULEB128(Entry.NumCounts, OS);
279 }
280 return sampleprof_error::success;
281}
Dehao Chen5c299ca2016-03-03 18:09:32 +0000282std::error_code SampleProfileWriterBinary::writeBody(const FunctionSamples &S) {
Nathan Slingerland46cf0f02015-12-10 17:21:42 +0000283 auto &OS = *OutputStream;
284
Dehao Chen5c299ca2016-03-03 18:09:32 +0000285 if (std::error_code EC = writeNameIdx(S.getName()))
Diego Novillodb271652015-10-13 22:48:46 +0000286 return EC;
287
Diego Novilloe75c2b32014-10-30 18:00:06 +0000288 encodeULEB128(S.getTotalSamples(), OS);
Diego Novillo50072bf2015-10-09 17:54:24 +0000289
290 // Emit all the body samples.
Diego Novillo9dc572f2015-10-16 18:54:35 +0000291 encodeULEB128(S.getBodySamples().size(), OS);
Diego Novillo9657de5f2014-11-01 00:56:55 +0000292 for (const auto &I : S.getBodySamples()) {
293 LineLocation Loc = I.first;
294 const SampleRecord &Sample = I.second;
Diego Novilloe75c2b32014-10-30 18:00:06 +0000295 encodeULEB128(Loc.LineOffset, OS);
296 encodeULEB128(Loc.Discriminator, OS);
297 encodeULEB128(Sample.getSamples(), OS);
298 encodeULEB128(Sample.getCallTargets().size(), OS);
Diego Novillo9657de5f2014-11-01 00:56:55 +0000299 for (const auto &J : Sample.getCallTargets()) {
Diego Novillodb271652015-10-13 22:48:46 +0000300 StringRef Callee = J.first();
Diego Novillo634f5c12015-10-15 16:36:21 +0000301 uint64_t CalleeSamples = J.second;
Diego Novillodb271652015-10-13 22:48:46 +0000302 if (std::error_code EC = writeNameIdx(Callee))
303 return EC;
Diego Novilloe75c2b32014-10-30 18:00:06 +0000304 encodeULEB128(CalleeSamples, OS);
305 }
306 }
307
Diego Novillo50072bf2015-10-09 17:54:24 +0000308 // Recursively emit all the callsite samples.
Dehao Chenca9f2fd2017-08-03 00:09:18 +0000309 uint64_t NumCallsites = 0;
310 for (const auto &J : S.getCallsiteSamples())
311 NumCallsites += J.second.size();
312 encodeULEB128(NumCallsites, OS);
Dehao Chen14eaa3c2017-04-13 19:52:10 +0000313 for (const auto &J : S.getCallsiteSamples())
314 for (const auto &FS : J.second) {
315 LineLocation Loc = J.first;
316 const FunctionSamples &CalleeSamples = FS.second;
317 encodeULEB128(Loc.LineOffset, OS);
318 encodeULEB128(Loc.Discriminator, OS);
319 if (std::error_code EC = writeBody(CalleeSamples))
320 return EC;
321 }
Diego Novillo50072bf2015-10-09 17:54:24 +0000322
Diego Novillodb271652015-10-13 22:48:46 +0000323 return sampleprof_error::success;
Diego Novilloe75c2b32014-10-30 18:00:06 +0000324}
Diego Novillo9657de5f2014-11-01 00:56:55 +0000325
Adrian Prantl26b584c2018-05-01 15:54:18 +0000326/// Write samples of a top-level function to a binary file.
Diego Novillo9dc572f2015-10-16 18:54:35 +0000327///
328/// \returns true if the samples were written successfully, false otherwise.
Dehao Chen5c299ca2016-03-03 18:09:32 +0000329std::error_code SampleProfileWriterBinary::write(const FunctionSamples &S) {
Nathan Slingerland46cf0f02015-12-10 17:21:42 +0000330 encodeULEB128(S.getHeadSamples(), *OutputStream);
Dehao Chen5c299ca2016-03-03 18:09:32 +0000331 return writeBody(S);
Diego Novillo9dc572f2015-10-16 18:54:35 +0000332}
333
Wei Miec13dea2018-09-14 20:52:59 +0000334std::error_code
335SampleProfileWriterCompactBinary::write(const FunctionSamples &S) {
336 uint64_t Offset = OutputStream->tell();
337 StringRef Name = S.getName();
338 FuncOffsetTable[Name] = Offset;
339 encodeULEB128(S.getHeadSamples(), *OutputStream);
340 return writeBody(S);
341}
342
Adrian Prantl26b584c2018-05-01 15:54:18 +0000343/// Create a sample profile file writer based on the specified format.
Diego Novillo9657de5f2014-11-01 00:56:55 +0000344///
345/// \param Filename The file to create.
346///
Diego Novillo9657de5f2014-11-01 00:56:55 +0000347/// \param Format Encoding format for the profile file.
348///
349/// \returns an error code indicating the status of the created writer.
Diego Novillo2b6bd7a2014-11-03 00:51:45 +0000350ErrorOr<std::unique_ptr<SampleProfileWriter>>
351SampleProfileWriter::create(StringRef Filename, SampleProfileFormat Format) {
Diego Novillo9657de5f2014-11-01 00:56:55 +0000352 std::error_code EC;
Nathan Slingerland46cf0f02015-12-10 17:21:42 +0000353 std::unique_ptr<raw_ostream> OS;
Wei Mi7253cd82018-06-12 05:53:49 +0000354 if (Format == SPF_Binary || Format == SPF_Compact_Binary)
Nathan Slingerland46cf0f02015-12-10 17:21:42 +0000355 OS.reset(new raw_fd_ostream(Filename, EC, sys::fs::F_None));
356 else
357 OS.reset(new raw_fd_ostream(Filename, EC, sys::fs::F_Text));
358 if (EC)
359 return EC;
360
361 return create(OS, Format);
362}
363
Adrian Prantl26b584c2018-05-01 15:54:18 +0000364/// Create a sample profile stream writer based on the specified format.
Nathan Slingerland46cf0f02015-12-10 17:21:42 +0000365///
366/// \param OS The output stream to store the profile data to.
367///
Nathan Slingerland46cf0f02015-12-10 17:21:42 +0000368/// \param Format Encoding format for the profile file.
369///
370/// \returns an error code indicating the status of the created writer.
371ErrorOr<std::unique_ptr<SampleProfileWriter>>
372SampleProfileWriter::create(std::unique_ptr<raw_ostream> &OS,
373 SampleProfileFormat Format) {
374 std::error_code EC;
Diego Novillo2b6bd7a2014-11-03 00:51:45 +0000375 std::unique_ptr<SampleProfileWriter> Writer;
Diego Novillo9657de5f2014-11-01 00:56:55 +0000376
Wei Mi7253cd82018-06-12 05:53:49 +0000377 if (Format == SPF_Binary)
Wei Mi93bc7462018-06-11 22:40:43 +0000378 Writer.reset(new SampleProfileWriterRawBinary(OS));
379 else if (Format == SPF_Compact_Binary)
380 Writer.reset(new SampleProfileWriterCompactBinary(OS));
Diego Novillo9657de5f2014-11-01 00:56:55 +0000381 else if (Format == SPF_Text)
Nathan Slingerland46cf0f02015-12-10 17:21:42 +0000382 Writer.reset(new SampleProfileWriterText(OS));
Diego Novillodb271652015-10-13 22:48:46 +0000383 else if (Format == SPF_GCC)
384 EC = sampleprof_error::unsupported_writing_format;
Diego Novillo9657de5f2014-11-01 00:56:55 +0000385 else
386 EC = sampleprof_error::unrecognized_format;
387
Diego Novillo2b6bd7a2014-11-03 00:51:45 +0000388 if (EC)
389 return EC;
390
391 return std::move(Writer);
Diego Novillo9657de5f2014-11-01 00:56:55 +0000392}
Easwaran Raman44878402016-02-19 03:15:33 +0000393
394void SampleProfileWriter::computeSummary(
395 const StringMap<FunctionSamples> &ProfileMap) {
Easwaran Raman17e7f1192016-05-19 21:07:12 +0000396 SampleProfileSummaryBuilder Builder(ProfileSummaryBuilder::DefaultCutoffs);
Easwaran Raman44878402016-02-19 03:15:33 +0000397 for (const auto &I : ProfileMap) {
398 const FunctionSamples &Profile = I.second;
Easwaran Raman17e7f1192016-05-19 21:07:12 +0000399 Builder.addRecord(Profile);
Easwaran Raman44878402016-02-19 03:15:33 +0000400 }
Benjamin Kramere3bf6642016-05-20 09:18:37 +0000401 Summary = Builder.getSummary();
Easwaran Raman44878402016-02-19 03:15:33 +0000402}