1 //===- llvm-profdata.cpp - LLVM profile data tool -------------------------===//
2 //
3 // The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // llvm-profdata merges .profdata files.
11 //
12 //===----------------------------------------------------------------------===//
13
14 #include "llvm/ADT/SmallSet.h"
15 #include "llvm/ADT/SmallVector.h"
16 #include "llvm/ADT/StringRef.h"
17 #include "llvm/IR/LLVMContext.h"
18 #include "llvm/ProfileData/InstrProfReader.h"
19 #include "llvm/ProfileData/InstrProfWriter.h"
20 #include "llvm/ProfileData/ProfileCommon.h"
21 #include "llvm/ProfileData/SampleProfReader.h"
22 #include "llvm/ProfileData/SampleProfWriter.h"
23 #include "llvm/Support/CommandLine.h"
24 #include "llvm/Support/Errc.h"
25 #include "llvm/Support/FileSystem.h"
26 #include "llvm/Support/Format.h"
27 #include "llvm/Support/InitLLVM.h"
28 #include "llvm/Support/MemoryBuffer.h"
29 #include "llvm/Support/Path.h"
30 #include "llvm/Support/WithColor.h"
31 #include "llvm/Support/ThreadPool.h"
32 #include "llvm/Support/raw_ostream.h"
33 #include <algorithm>
34
35 using namespace llvm;
36
37 enum ProfileFormat {
38 PF_None = 0,
39 PF_Text,
40 PF_Compact_Binary,
41 PF_GCC,
42 PF_Binary
43 };
44
warn(Twine Message,std::string Whence="",std::string Hint="")45 static void warn(Twine Message, std::string Whence = "",
46 std::string Hint = "") {
47 WithColor::warning();
48 if (!Whence.empty())
49 errs() << Whence << ": ";
50 errs() << Message << "\n";
51 if (!Hint.empty())
52 WithColor::note() << Hint << "\n";
53 }
54
exitWithError(Twine Message,std::string Whence="",std::string Hint="")55 static void exitWithError(Twine Message, std::string Whence = "",
56 std::string Hint = "") {
57 WithColor::error();
58 if (!Whence.empty())
59 errs() << Whence << ": ";
60 errs() << Message << "\n";
61 if (!Hint.empty())
62 WithColor::note() << Hint << "\n";
63 ::exit(1);
64 }
65
exitWithError(Error E,StringRef Whence="")66 static void exitWithError(Error E, StringRef Whence = "") {
67 if (E.isA<InstrProfError>()) {
68 handleAllErrors(std::move(E), [&](const InstrProfError &IPE) {
69 instrprof_error instrError = IPE.get();
70 StringRef Hint = "";
71 if (instrError == instrprof_error::unrecognized_format) {
72 // Hint for common error of forgetting -sample for sample profiles.
73 Hint = "Perhaps you forgot to use the -sample option?";
74 }
75 exitWithError(IPE.message(), Whence, Hint);
76 });
77 }
78
79 exitWithError(toString(std::move(E)), Whence);
80 }
81
exitWithErrorCode(std::error_code EC,StringRef Whence="")82 static void exitWithErrorCode(std::error_code EC, StringRef Whence = "") {
83 exitWithError(EC.message(), Whence);
84 }
85
86 namespace {
87 enum ProfileKinds { instr, sample };
88 }
89
handleMergeWriterError(Error E,StringRef WhenceFile="",StringRef WhenceFunction="",bool ShowHint=true)90 static void handleMergeWriterError(Error E, StringRef WhenceFile = "",
91 StringRef WhenceFunction = "",
92 bool ShowHint = true) {
93 if (!WhenceFile.empty())
94 errs() << WhenceFile << ": ";
95 if (!WhenceFunction.empty())
96 errs() << WhenceFunction << ": ";
97
98 auto IPE = instrprof_error::success;
99 E = handleErrors(std::move(E),
100 [&IPE](std::unique_ptr<InstrProfError> E) -> Error {
101 IPE = E->get();
102 return Error(std::move(E));
103 });
104 errs() << toString(std::move(E)) << "\n";
105
106 if (ShowHint) {
107 StringRef Hint = "";
108 if (IPE != instrprof_error::success) {
109 switch (IPE) {
110 case instrprof_error::hash_mismatch:
111 case instrprof_error::count_mismatch:
112 case instrprof_error::value_site_count_mismatch:
113 Hint = "Make sure that all profile data to be merged is generated "
114 "from the same binary.";
115 break;
116 default:
117 break;
118 }
119 }
120
121 if (!Hint.empty())
122 errs() << Hint << "\n";
123 }
124 }
125
126 struct WeightedFile {
127 std::string Filename;
128 uint64_t Weight;
129 };
130 typedef SmallVector<WeightedFile, 5> WeightedFileVector;
131
132 /// Keep track of merged data and reported errors.
133 struct WriterContext {
134 std::mutex Lock;
135 InstrProfWriter Writer;
136 Error Err;
137 std::string ErrWhence;
138 std::mutex &ErrLock;
139 SmallSet<instrprof_error, 4> &WriterErrorCodes;
140
WriterContextWriterContext141 WriterContext(bool IsSparse, std::mutex &ErrLock,
142 SmallSet<instrprof_error, 4> &WriterErrorCodes)
143 : Lock(), Writer(IsSparse), Err(Error::success()), ErrWhence(""),
144 ErrLock(ErrLock), WriterErrorCodes(WriterErrorCodes) {}
145 };
146
147 /// Determine whether an error is fatal for profile merging.
isFatalError(instrprof_error IPE)148 static bool isFatalError(instrprof_error IPE) {
149 switch (IPE) {
150 default:
151 return true;
152 case instrprof_error::success:
153 case instrprof_error::eof:
154 case instrprof_error::unknown_function:
155 case instrprof_error::hash_mismatch:
156 case instrprof_error::count_mismatch:
157 case instrprof_error::counter_overflow:
158 case instrprof_error::value_site_count_mismatch:
159 return false;
160 }
161 }
162
163 /// Load an input into a writer context.
loadInput(const WeightedFile & Input,WriterContext * WC)164 static void loadInput(const WeightedFile &Input, WriterContext *WC) {
165 std::unique_lock<std::mutex> CtxGuard{WC->Lock};
166
167 // If there's a pending hard error, don't do more work.
168 if (WC->Err)
169 return;
170
171 // Copy the filename, because llvm::ThreadPool copied the input "const
172 // WeightedFile &" by value, making a reference to the filename within it
173 // invalid outside of this packaged task.
174 WC->ErrWhence = Input.Filename;
175
176 auto ReaderOrErr = InstrProfReader::create(Input.Filename);
177 if (Error E = ReaderOrErr.takeError()) {
178 // Skip the empty profiles by returning sliently.
179 instrprof_error IPE = InstrProfError::take(std::move(E));
180 if (IPE != instrprof_error::empty_raw_profile)
181 WC->Err = make_error<InstrProfError>(IPE);
182 return;
183 }
184
185 auto Reader = std::move(ReaderOrErr.get());
186 bool IsIRProfile = Reader->isIRLevelProfile();
187 if (WC->Writer.setIsIRLevelProfile(IsIRProfile)) {
188 WC->Err = make_error<StringError>(
189 "Merge IR generated profile with Clang generated profile.",
190 std::error_code());
191 return;
192 }
193
194 for (auto &I : *Reader) {
195 const StringRef FuncName = I.Name;
196 bool Reported = false;
197 WC->Writer.addRecord(std::move(I), Input.Weight, [&](Error E) {
198 if (Reported) {
199 consumeError(std::move(E));
200 return;
201 }
202 Reported = true;
203 // Only show hint the first time an error occurs.
204 instrprof_error IPE = InstrProfError::take(std::move(E));
205 std::unique_lock<std::mutex> ErrGuard{WC->ErrLock};
206 bool firstTime = WC->WriterErrorCodes.insert(IPE).second;
207 handleMergeWriterError(make_error<InstrProfError>(IPE), Input.Filename,
208 FuncName, firstTime);
209 });
210 }
211 if (Reader->hasError()) {
212 if (Error E = Reader->getError()) {
213 instrprof_error IPE = InstrProfError::take(std::move(E));
214 if (isFatalError(IPE))
215 WC->Err = make_error<InstrProfError>(IPE);
216 }
217 }
218 }
219
220 /// Merge the \p Src writer context into \p Dst.
mergeWriterContexts(WriterContext * Dst,WriterContext * Src)221 static void mergeWriterContexts(WriterContext *Dst, WriterContext *Src) {
222 // If we've already seen a hard error, continuing with the merge would
223 // clobber it.
224 if (Dst->Err || Src->Err)
225 return;
226
227 bool Reported = false;
228 Dst->Writer.mergeRecordsFromWriter(std::move(Src->Writer), [&](Error E) {
229 if (Reported) {
230 consumeError(std::move(E));
231 return;
232 }
233 Reported = true;
234 Dst->Err = std::move(E);
235 });
236 }
237
mergeInstrProfile(const WeightedFileVector & Inputs,StringRef OutputFilename,ProfileFormat OutputFormat,bool OutputSparse,unsigned NumThreads)238 static void mergeInstrProfile(const WeightedFileVector &Inputs,
239 StringRef OutputFilename,
240 ProfileFormat OutputFormat, bool OutputSparse,
241 unsigned NumThreads) {
242 if (OutputFilename.compare("-") == 0)
243 exitWithError("Cannot write indexed profdata format to stdout.");
244
245 if (OutputFormat != PF_Binary && OutputFormat != PF_Compact_Binary &&
246 OutputFormat != PF_Text)
247 exitWithError("Unknown format is specified.");
248
249 std::error_code EC;
250 raw_fd_ostream Output(OutputFilename.data(), EC, sys::fs::F_None);
251 if (EC)
252 exitWithErrorCode(EC, OutputFilename);
253
254 std::mutex ErrorLock;
255 SmallSet<instrprof_error, 4> WriterErrorCodes;
256
257 // If NumThreads is not specified, auto-detect a good default.
258 if (NumThreads == 0)
259 NumThreads =
260 std::min(hardware_concurrency(), unsigned((Inputs.size() + 1) / 2));
261
262 // Initialize the writer contexts.
263 SmallVector<std::unique_ptr<WriterContext>, 4> Contexts;
264 for (unsigned I = 0; I < NumThreads; ++I)
265 Contexts.emplace_back(llvm::make_unique<WriterContext>(
266 OutputSparse, ErrorLock, WriterErrorCodes));
267
268 if (NumThreads == 1) {
269 for (const auto &Input : Inputs)
270 loadInput(Input, Contexts[0].get());
271 } else {
272 ThreadPool Pool(NumThreads);
273
274 // Load the inputs in parallel (N/NumThreads serial steps).
275 unsigned Ctx = 0;
276 for (const auto &Input : Inputs) {
277 Pool.async(loadInput, Input, Contexts[Ctx].get());
278 Ctx = (Ctx + 1) % NumThreads;
279 }
280 Pool.wait();
281
282 // Merge the writer contexts together (~ lg(NumThreads) serial steps).
283 unsigned Mid = Contexts.size() / 2;
284 unsigned End = Contexts.size();
285 assert(Mid > 0 && "Expected more than one context");
286 do {
287 for (unsigned I = 0; I < Mid; ++I)
288 Pool.async(mergeWriterContexts, Contexts[I].get(),
289 Contexts[I + Mid].get());
290 Pool.wait();
291 if (End & 1) {
292 Pool.async(mergeWriterContexts, Contexts[0].get(),
293 Contexts[End - 1].get());
294 Pool.wait();
295 }
296 End = Mid;
297 Mid /= 2;
298 } while (Mid > 0);
299 }
300
301 // Handle deferred hard errors encountered during merging.
302 for (std::unique_ptr<WriterContext> &WC : Contexts) {
303 if (!WC->Err)
304 continue;
305 if (!WC->Err.isA<InstrProfError>())
306 exitWithError(std::move(WC->Err), WC->ErrWhence);
307
308 instrprof_error IPE = InstrProfError::take(std::move(WC->Err));
309 if (isFatalError(IPE))
310 exitWithError(make_error<InstrProfError>(IPE), WC->ErrWhence);
311 else
312 warn(toString(make_error<InstrProfError>(IPE)),
313 WC->ErrWhence);
314 }
315
316 InstrProfWriter &Writer = Contexts[0]->Writer;
317 if (OutputFormat == PF_Text) {
318 if (Error E = Writer.writeText(Output))
319 exitWithError(std::move(E));
320 } else {
321 Writer.write(Output);
322 }
323 }
324
325 static sampleprof::SampleProfileFormat FormatMap[] = {
326 sampleprof::SPF_None, sampleprof::SPF_Text, sampleprof::SPF_Compact_Binary,
327 sampleprof::SPF_GCC, sampleprof::SPF_Binary};
328
mergeSampleProfile(const WeightedFileVector & Inputs,StringRef OutputFilename,ProfileFormat OutputFormat)329 static void mergeSampleProfile(const WeightedFileVector &Inputs,
330 StringRef OutputFilename,
331 ProfileFormat OutputFormat) {
332 using namespace sampleprof;
333 auto WriterOrErr =
334 SampleProfileWriter::create(OutputFilename, FormatMap[OutputFormat]);
335 if (std::error_code EC = WriterOrErr.getError())
336 exitWithErrorCode(EC, OutputFilename);
337
338 auto Writer = std::move(WriterOrErr.get());
339 StringMap<FunctionSamples> ProfileMap;
340 SmallVector<std::unique_ptr<sampleprof::SampleProfileReader>, 5> Readers;
341 LLVMContext Context;
342 for (const auto &Input : Inputs) {
343 auto ReaderOrErr = SampleProfileReader::create(Input.Filename, Context);
344 if (std::error_code EC = ReaderOrErr.getError())
345 exitWithErrorCode(EC, Input.Filename);
346
347 // We need to keep the readers around until after all the files are
348 // read so that we do not lose the function names stored in each
349 // reader's memory. The function names are needed to write out the
350 // merged profile map.
351 Readers.push_back(std::move(ReaderOrErr.get()));
352 const auto Reader = Readers.back().get();
353 if (std::error_code EC = Reader->read())
354 exitWithErrorCode(EC, Input.Filename);
355
356 StringMap<FunctionSamples> &Profiles = Reader->getProfiles();
357 for (StringMap<FunctionSamples>::iterator I = Profiles.begin(),
358 E = Profiles.end();
359 I != E; ++I) {
360 StringRef FName = I->first();
361 FunctionSamples &Samples = I->second;
362 sampleprof_error Result = ProfileMap[FName].merge(Samples, Input.Weight);
363 if (Result != sampleprof_error::success) {
364 std::error_code EC = make_error_code(Result);
365 handleMergeWriterError(errorCodeToError(EC), Input.Filename, FName);
366 }
367 }
368 }
369 Writer->write(ProfileMap);
370 }
371
parseWeightedFile(const StringRef & WeightedFilename)372 static WeightedFile parseWeightedFile(const StringRef &WeightedFilename) {
373 StringRef WeightStr, FileName;
374 std::tie(WeightStr, FileName) = WeightedFilename.split(',');
375
376 uint64_t Weight;
377 if (WeightStr.getAsInteger(10, Weight) || Weight < 1)
378 exitWithError("Input weight must be a positive integer.");
379
380 return {FileName, Weight};
381 }
382
383 static std::unique_ptr<MemoryBuffer>
getInputFilenamesFileBuf(const StringRef & InputFilenamesFile)384 getInputFilenamesFileBuf(const StringRef &InputFilenamesFile) {
385 if (InputFilenamesFile == "")
386 return {};
387
388 auto BufOrError = MemoryBuffer::getFileOrSTDIN(InputFilenamesFile);
389 if (!BufOrError)
390 exitWithErrorCode(BufOrError.getError(), InputFilenamesFile);
391
392 return std::move(*BufOrError);
393 }
394
addWeightedInput(WeightedFileVector & WNI,const WeightedFile & WF)395 static void addWeightedInput(WeightedFileVector &WNI, const WeightedFile &WF) {
396 StringRef Filename = WF.Filename;
397 uint64_t Weight = WF.Weight;
398
399 // If it's STDIN just pass it on.
400 if (Filename == "-") {
401 WNI.push_back({Filename, Weight});
402 return;
403 }
404
405 llvm::sys::fs::file_status Status;
406 llvm::sys::fs::status(Filename, Status);
407 if (!llvm::sys::fs::exists(Status))
408 exitWithErrorCode(make_error_code(errc::no_such_file_or_directory),
409 Filename);
410 // If it's a source file, collect it.
411 if (llvm::sys::fs::is_regular_file(Status)) {
412 WNI.push_back({Filename, Weight});
413 return;
414 }
415
416 if (llvm::sys::fs::is_directory(Status)) {
417 std::error_code EC;
418 for (llvm::sys::fs::recursive_directory_iterator F(Filename, EC), E;
419 F != E && !EC; F.increment(EC)) {
420 if (llvm::sys::fs::is_regular_file(F->path())) {
421 addWeightedInput(WNI, {F->path(), Weight});
422 }
423 }
424 if (EC)
425 exitWithErrorCode(EC, Filename);
426 }
427 }
428
parseInputFilenamesFile(MemoryBuffer * Buffer,WeightedFileVector & WFV)429 static void parseInputFilenamesFile(MemoryBuffer *Buffer,
430 WeightedFileVector &WFV) {
431 if (!Buffer)
432 return;
433
434 SmallVector<StringRef, 8> Entries;
435 StringRef Data = Buffer->getBuffer();
436 Data.split(Entries, '\n', /*MaxSplit=*/-1, /*KeepEmpty=*/false);
437 for (const StringRef &FileWeightEntry : Entries) {
438 StringRef SanitizedEntry = FileWeightEntry.trim(" \t\v\f\r");
439 // Skip comments.
440 if (SanitizedEntry.startswith("#"))
441 continue;
442 // If there's no comma, it's an unweighted profile.
443 else if (SanitizedEntry.find(',') == StringRef::npos)
444 addWeightedInput(WFV, {SanitizedEntry, 1});
445 else
446 addWeightedInput(WFV, parseWeightedFile(SanitizedEntry));
447 }
448 }
449
merge_main(int argc,const char * argv[])450 static int merge_main(int argc, const char *argv[]) {
451 cl::list<std::string> InputFilenames(cl::Positional,
452 cl::desc("<filename...>"));
453 cl::list<std::string> WeightedInputFilenames("weighted-input",
454 cl::desc("<weight>,<filename>"));
455 cl::opt<std::string> InputFilenamesFile(
456 "input-files", cl::init(""),
457 cl::desc("Path to file containing newline-separated "
458 "[<weight>,]<filename> entries"));
459 cl::alias InputFilenamesFileA("f", cl::desc("Alias for --input-files"),
460 cl::aliasopt(InputFilenamesFile));
461 cl::opt<bool> DumpInputFileList(
462 "dump-input-file-list", cl::init(false), cl::Hidden,
463 cl::desc("Dump the list of input files and their weights, then exit"));
464 cl::opt<std::string> OutputFilename("output", cl::value_desc("output"),
465 cl::init("-"), cl::Required,
466 cl::desc("Output file"));
467 cl::alias OutputFilenameA("o", cl::desc("Alias for --output"),
468 cl::aliasopt(OutputFilename));
469 cl::opt<ProfileKinds> ProfileKind(
470 cl::desc("Profile kind:"), cl::init(instr),
471 cl::values(clEnumVal(instr, "Instrumentation profile (default)"),
472 clEnumVal(sample, "Sample profile")));
473 cl::opt<ProfileFormat> OutputFormat(
474 cl::desc("Format of output profile"), cl::init(PF_Binary),
475 cl::values(clEnumValN(PF_Binary, "binary", "Binary encoding (default)"),
476 clEnumValN(PF_Compact_Binary, "compbinary",
477 "Compact binary encoding"),
478 clEnumValN(PF_Text, "text", "Text encoding"),
479 clEnumValN(PF_GCC, "gcc",
480 "GCC encoding (only meaningful for -sample)")));
481 cl::opt<bool> OutputSparse("sparse", cl::init(false),
482 cl::desc("Generate a sparse profile (only meaningful for -instr)"));
483 cl::opt<unsigned> NumThreads(
484 "num-threads", cl::init(0),
485 cl::desc("Number of merge threads to use (default: autodetect)"));
486 cl::alias NumThreadsA("j", cl::desc("Alias for --num-threads"),
487 cl::aliasopt(NumThreads));
488
489 cl::ParseCommandLineOptions(argc, argv, "LLVM profile data merger\n");
490
491 WeightedFileVector WeightedInputs;
492 for (StringRef Filename : InputFilenames)
493 addWeightedInput(WeightedInputs, {Filename, 1});
494 for (StringRef WeightedFilename : WeightedInputFilenames)
495 addWeightedInput(WeightedInputs, parseWeightedFile(WeightedFilename));
496
497 // Make sure that the file buffer stays alive for the duration of the
498 // weighted input vector's lifetime.
499 auto Buffer = getInputFilenamesFileBuf(InputFilenamesFile);
500 parseInputFilenamesFile(Buffer.get(), WeightedInputs);
501
502 if (WeightedInputs.empty())
503 exitWithError("No input files specified. See " +
504 sys::path::filename(argv[0]) + " -help");
505
506 if (DumpInputFileList) {
507 for (auto &WF : WeightedInputs)
508 outs() << WF.Weight << "," << WF.Filename << "\n";
509 return 0;
510 }
511
512 if (ProfileKind == instr)
513 mergeInstrProfile(WeightedInputs, OutputFilename, OutputFormat,
514 OutputSparse, NumThreads);
515 else
516 mergeSampleProfile(WeightedInputs, OutputFilename, OutputFormat);
517
518 return 0;
519 }
520
521 typedef struct ValueSitesStats {
ValueSitesStatsValueSitesStats522 ValueSitesStats()
523 : TotalNumValueSites(0), TotalNumValueSitesWithValueProfile(0),
524 TotalNumValues(0) {}
525 uint64_t TotalNumValueSites;
526 uint64_t TotalNumValueSitesWithValueProfile;
527 uint64_t TotalNumValues;
528 std::vector<unsigned> ValueSitesHistogram;
529 } ValueSitesStats;
530
traverseAllValueSites(const InstrProfRecord & Func,uint32_t VK,ValueSitesStats & Stats,raw_fd_ostream & OS,InstrProfSymtab * Symtab)531 static void traverseAllValueSites(const InstrProfRecord &Func, uint32_t VK,
532 ValueSitesStats &Stats, raw_fd_ostream &OS,
533 InstrProfSymtab *Symtab) {
534 uint32_t NS = Func.getNumValueSites(VK);
535 Stats.TotalNumValueSites += NS;
536 for (size_t I = 0; I < NS; ++I) {
537 uint32_t NV = Func.getNumValueDataForSite(VK, I);
538 std::unique_ptr<InstrProfValueData[]> VD = Func.getValueForSite(VK, I);
539 Stats.TotalNumValues += NV;
540 if (NV) {
541 Stats.TotalNumValueSitesWithValueProfile++;
542 if (NV > Stats.ValueSitesHistogram.size())
543 Stats.ValueSitesHistogram.resize(NV, 0);
544 Stats.ValueSitesHistogram[NV - 1]++;
545 }
546 for (uint32_t V = 0; V < NV; V++) {
547 OS << "\t[ " << I << ", ";
548 if (Symtab == nullptr)
549 OS << VD[V].Value;
550 else
551 OS << Symtab->getFuncName(VD[V].Value);
552 OS << ", " << VD[V].Count << " ]\n";
553 }
554 }
555 }
556
showValueSitesStats(raw_fd_ostream & OS,uint32_t VK,ValueSitesStats & Stats)557 static void showValueSitesStats(raw_fd_ostream &OS, uint32_t VK,
558 ValueSitesStats &Stats) {
559 OS << " Total number of sites: " << Stats.TotalNumValueSites << "\n";
560 OS << " Total number of sites with values: "
561 << Stats.TotalNumValueSitesWithValueProfile << "\n";
562 OS << " Total number of profiled values: " << Stats.TotalNumValues << "\n";
563
564 OS << " Value sites histogram:\n\tNumTargets, SiteCount\n";
565 for (unsigned I = 0; I < Stats.ValueSitesHistogram.size(); I++) {
566 if (Stats.ValueSitesHistogram[I] > 0)
567 OS << "\t" << I + 1 << ", " << Stats.ValueSitesHistogram[I] << "\n";
568 }
569 }
570
showInstrProfile(const std::string & Filename,bool ShowCounts,uint32_t TopN,bool ShowIndirectCallTargets,bool ShowMemOPSizes,bool ShowDetailedSummary,std::vector<uint32_t> DetailedSummaryCutoffs,bool ShowAllFunctions,const std::string & ShowFunction,bool TextFormat,raw_fd_ostream & OS)571 static int showInstrProfile(const std::string &Filename, bool ShowCounts,
572 uint32_t TopN, bool ShowIndirectCallTargets,
573 bool ShowMemOPSizes, bool ShowDetailedSummary,
574 std::vector<uint32_t> DetailedSummaryCutoffs,
575 bool ShowAllFunctions,
576 const std::string &ShowFunction, bool TextFormat,
577 raw_fd_ostream &OS) {
578 auto ReaderOrErr = InstrProfReader::create(Filename);
579 std::vector<uint32_t> Cutoffs = std::move(DetailedSummaryCutoffs);
580 if (ShowDetailedSummary && Cutoffs.empty()) {
581 Cutoffs = {800000, 900000, 950000, 990000, 999000, 999900, 999990};
582 }
583 InstrProfSummaryBuilder Builder(std::move(Cutoffs));
584 if (Error E = ReaderOrErr.takeError())
585 exitWithError(std::move(E), Filename);
586
587 auto Reader = std::move(ReaderOrErr.get());
588 bool IsIRInstr = Reader->isIRLevelProfile();
589 size_t ShownFunctions = 0;
590 int NumVPKind = IPVK_Last - IPVK_First + 1;
591 std::vector<ValueSitesStats> VPStats(NumVPKind);
592
593 auto MinCmp = [](const std::pair<std::string, uint64_t> &v1,
594 const std::pair<std::string, uint64_t> &v2) {
595 return v1.second > v2.second;
596 };
597
598 std::priority_queue<std::pair<std::string, uint64_t>,
599 std::vector<std::pair<std::string, uint64_t>>,
600 decltype(MinCmp)>
601 HottestFuncs(MinCmp);
602
603 for (const auto &Func : *Reader) {
604 bool Show =
605 ShowAllFunctions || (!ShowFunction.empty() &&
606 Func.Name.find(ShowFunction) != Func.Name.npos);
607
608 bool doTextFormatDump = (Show && ShowCounts && TextFormat);
609
610 if (doTextFormatDump) {
611 InstrProfSymtab &Symtab = Reader->getSymtab();
612 InstrProfWriter::writeRecordInText(Func.Name, Func.Hash, Func, Symtab,
613 OS);
614 continue;
615 }
616
617 assert(Func.Counts.size() > 0 && "function missing entry counter");
618 Builder.addRecord(Func);
619
620 if (TopN) {
621 uint64_t FuncMax = 0;
622 for (size_t I = 0, E = Func.Counts.size(); I < E; ++I)
623 FuncMax = std::max(FuncMax, Func.Counts[I]);
624
625 if (HottestFuncs.size() == TopN) {
626 if (HottestFuncs.top().second < FuncMax) {
627 HottestFuncs.pop();
628 HottestFuncs.emplace(std::make_pair(std::string(Func.Name), FuncMax));
629 }
630 } else
631 HottestFuncs.emplace(std::make_pair(std::string(Func.Name), FuncMax));
632 }
633
634 if (Show) {
635
636 if (!ShownFunctions)
637 OS << "Counters:\n";
638
639 ++ShownFunctions;
640
641 OS << " " << Func.Name << ":\n"
642 << " Hash: " << format("0x%016" PRIx64, Func.Hash) << "\n"
643 << " Counters: " << Func.Counts.size() << "\n";
644 if (!IsIRInstr)
645 OS << " Function count: " << Func.Counts[0] << "\n";
646
647 if (ShowIndirectCallTargets)
648 OS << " Indirect Call Site Count: "
649 << Func.getNumValueSites(IPVK_IndirectCallTarget) << "\n";
650
651 uint32_t NumMemOPCalls = Func.getNumValueSites(IPVK_MemOPSize);
652 if (ShowMemOPSizes && NumMemOPCalls > 0)
653 OS << " Number of Memory Intrinsics Calls: " << NumMemOPCalls
654 << "\n";
655
656 if (ShowCounts) {
657 OS << " Block counts: [";
658 size_t Start = (IsIRInstr ? 0 : 1);
659 for (size_t I = Start, E = Func.Counts.size(); I < E; ++I) {
660 OS << (I == Start ? "" : ", ") << Func.Counts[I];
661 }
662 OS << "]\n";
663 }
664
665 if (ShowIndirectCallTargets) {
666 OS << " Indirect Target Results:\n";
667 traverseAllValueSites(Func, IPVK_IndirectCallTarget,
668 VPStats[IPVK_IndirectCallTarget], OS,
669 &(Reader->getSymtab()));
670 }
671
672 if (ShowMemOPSizes && NumMemOPCalls > 0) {
673 OS << " Memory Intrinsic Size Results:\n";
674 traverseAllValueSites(Func, IPVK_MemOPSize, VPStats[IPVK_MemOPSize], OS,
675 nullptr);
676 }
677 }
678 }
679 if (Reader->hasError())
680 exitWithError(Reader->getError(), Filename);
681
682 if (ShowCounts && TextFormat)
683 return 0;
684 std::unique_ptr<ProfileSummary> PS(Builder.getSummary());
685 OS << "Instrumentation level: "
686 << (Reader->isIRLevelProfile() ? "IR" : "Front-end") << "\n";
687 if (ShowAllFunctions || !ShowFunction.empty())
688 OS << "Functions shown: " << ShownFunctions << "\n";
689 OS << "Total functions: " << PS->getNumFunctions() << "\n";
690 OS << "Maximum function count: " << PS->getMaxFunctionCount() << "\n";
691 OS << "Maximum internal block count: " << PS->getMaxInternalCount() << "\n";
692
693 if (TopN) {
694 std::vector<std::pair<std::string, uint64_t>> SortedHottestFuncs;
695 while (!HottestFuncs.empty()) {
696 SortedHottestFuncs.emplace_back(HottestFuncs.top());
697 HottestFuncs.pop();
698 }
699 OS << "Top " << TopN
700 << " functions with the largest internal block counts: \n";
701 for (auto &hotfunc : llvm::reverse(SortedHottestFuncs))
702 OS << " " << hotfunc.first << ", max count = " << hotfunc.second << "\n";
703 }
704
705 if (ShownFunctions && ShowIndirectCallTargets) {
706 OS << "Statistics for indirect call sites profile:\n";
707 showValueSitesStats(OS, IPVK_IndirectCallTarget,
708 VPStats[IPVK_IndirectCallTarget]);
709 }
710
711 if (ShownFunctions && ShowMemOPSizes) {
712 OS << "Statistics for memory intrinsic calls sizes profile:\n";
713 showValueSitesStats(OS, IPVK_MemOPSize, VPStats[IPVK_MemOPSize]);
714 }
715
716 if (ShowDetailedSummary) {
717 OS << "Detailed summary:\n";
718 OS << "Total number of blocks: " << PS->getNumCounts() << "\n";
719 OS << "Total count: " << PS->getTotalCount() << "\n";
720 for (auto Entry : PS->getDetailedSummary()) {
721 OS << Entry.NumCounts << " blocks with count >= " << Entry.MinCount
722 << " account for "
723 << format("%0.6g", (float)Entry.Cutoff / ProfileSummary::Scale * 100)
724 << " percentage of the total counts.\n";
725 }
726 }
727 return 0;
728 }
729
showSampleProfile(const std::string & Filename,bool ShowCounts,bool ShowAllFunctions,const std::string & ShowFunction,raw_fd_ostream & OS)730 static int showSampleProfile(const std::string &Filename, bool ShowCounts,
731 bool ShowAllFunctions,
732 const std::string &ShowFunction,
733 raw_fd_ostream &OS) {
734 using namespace sampleprof;
735 LLVMContext Context;
736 auto ReaderOrErr = SampleProfileReader::create(Filename, Context);
737 if (std::error_code EC = ReaderOrErr.getError())
738 exitWithErrorCode(EC, Filename);
739
740 auto Reader = std::move(ReaderOrErr.get());
741 if (std::error_code EC = Reader->read())
742 exitWithErrorCode(EC, Filename);
743
744 if (ShowAllFunctions || ShowFunction.empty())
745 Reader->dump(OS);
746 else
747 Reader->dumpFunctionProfile(ShowFunction, OS);
748
749 return 0;
750 }
751
show_main(int argc,const char * argv[])752 static int show_main(int argc, const char *argv[]) {
753 cl::opt<std::string> Filename(cl::Positional, cl::Required,
754 cl::desc("<profdata-file>"));
755
756 cl::opt<bool> ShowCounts("counts", cl::init(false),
757 cl::desc("Show counter values for shown functions"));
758 cl::opt<bool> TextFormat(
759 "text", cl::init(false),
760 cl::desc("Show instr profile data in text dump format"));
761 cl::opt<bool> ShowIndirectCallTargets(
762 "ic-targets", cl::init(false),
763 cl::desc("Show indirect call site target values for shown functions"));
764 cl::opt<bool> ShowMemOPSizes(
765 "memop-sizes", cl::init(false),
766 cl::desc("Show the profiled sizes of the memory intrinsic calls "
767 "for shown functions"));
768 cl::opt<bool> ShowDetailedSummary("detailed-summary", cl::init(false),
769 cl::desc("Show detailed profile summary"));
770 cl::list<uint32_t> DetailedSummaryCutoffs(
771 cl::CommaSeparated, "detailed-summary-cutoffs",
772 cl::desc(
773 "Cutoff percentages (times 10000) for generating detailed summary"),
774 cl::value_desc("800000,901000,999999"));
775 cl::opt<bool> ShowAllFunctions("all-functions", cl::init(false),
776 cl::desc("Details for every function"));
777 cl::opt<std::string> ShowFunction("function",
778 cl::desc("Details for matching functions"));
779
780 cl::opt<std::string> OutputFilename("output", cl::value_desc("output"),
781 cl::init("-"), cl::desc("Output file"));
782 cl::alias OutputFilenameA("o", cl::desc("Alias for --output"),
783 cl::aliasopt(OutputFilename));
784 cl::opt<ProfileKinds> ProfileKind(
785 cl::desc("Profile kind:"), cl::init(instr),
786 cl::values(clEnumVal(instr, "Instrumentation profile (default)"),
787 clEnumVal(sample, "Sample profile")));
788 cl::opt<uint32_t> TopNFunctions(
789 "topn", cl::init(0),
790 cl::desc("Show the list of functions with the largest internal counts"));
791
792 cl::ParseCommandLineOptions(argc, argv, "LLVM profile data summary\n");
793
794 if (OutputFilename.empty())
795 OutputFilename = "-";
796
797 std::error_code EC;
798 raw_fd_ostream OS(OutputFilename.data(), EC, sys::fs::F_Text);
799 if (EC)
800 exitWithErrorCode(EC, OutputFilename);
801
802 if (ShowAllFunctions && !ShowFunction.empty())
803 WithColor::warning() << "-function argument ignored: showing all functions\n";
804
805 std::vector<uint32_t> Cutoffs(DetailedSummaryCutoffs.begin(),
806 DetailedSummaryCutoffs.end());
807 if (ProfileKind == instr)
808 return showInstrProfile(Filename, ShowCounts, TopNFunctions,
809 ShowIndirectCallTargets, ShowMemOPSizes,
810 ShowDetailedSummary, DetailedSummaryCutoffs,
811 ShowAllFunctions, ShowFunction, TextFormat, OS);
812 else
813 return showSampleProfile(Filename, ShowCounts, ShowAllFunctions,
814 ShowFunction, OS);
815 }
816
main(int argc,const char * argv[])817 int main(int argc, const char *argv[]) {
818 InitLLVM X(argc, argv);
819
820 StringRef ProgName(sys::path::filename(argv[0]));
821 if (argc > 1) {
822 int (*func)(int, const char *[]) = nullptr;
823
824 if (strcmp(argv[1], "merge") == 0)
825 func = merge_main;
826 else if (strcmp(argv[1], "show") == 0)
827 func = show_main;
828
829 if (func) {
830 std::string Invocation(ProgName.str() + " " + argv[1]);
831 argv[1] = Invocation.c_str();
832 return func(argc - 1, argv + 1);
833 }
834
835 if (strcmp(argv[1], "-h") == 0 || strcmp(argv[1], "-help") == 0 ||
836 strcmp(argv[1], "--help") == 0) {
837
838 errs() << "OVERVIEW: LLVM profile data tools\n\n"
839 << "USAGE: " << ProgName << " <command> [args...]\n"
840 << "USAGE: " << ProgName << " <command> -help\n\n"
841 << "See each individual command --help for more details.\n"
842 << "Available commands: merge, show\n";
843 return 0;
844 }
845 }
846
847 if (argc < 2)
848 errs() << ProgName << ": No command specified!\n";
849 else
850 errs() << ProgName << ": Unknown command!\n";
851
852 errs() << "USAGE: " << ProgName << " <merge|show> [args...]\n";
853 return 1;
854 }
855