[yaml2obj][obj2yaml] - Do not create a symbol table by default.
[llvm-complete.git] / tools / llvm-profdata / llvm-profdata.cpp
blob1470442c38b6181a952f832f5b9f5b174e1dcdbc
1 //===- llvm-profdata.cpp - LLVM profile data tool -------------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // llvm-profdata merges .profdata files.
11 //===----------------------------------------------------------------------===//
13 #include "llvm/ADT/SmallSet.h"
14 #include "llvm/ADT/SmallVector.h"
15 #include "llvm/ADT/StringRef.h"
16 #include "llvm/IR/LLVMContext.h"
17 #include "llvm/ProfileData/InstrProfReader.h"
18 #include "llvm/ProfileData/InstrProfWriter.h"
19 #include "llvm/ProfileData/ProfileCommon.h"
20 #include "llvm/ProfileData/SampleProfReader.h"
21 #include "llvm/ProfileData/SampleProfWriter.h"
22 #include "llvm/Support/CommandLine.h"
23 #include "llvm/Support/Errc.h"
24 #include "llvm/Support/FileSystem.h"
25 #include "llvm/Support/Format.h"
26 #include "llvm/Support/InitLLVM.h"
27 #include "llvm/Support/MemoryBuffer.h"
28 #include "llvm/Support/Path.h"
29 #include "llvm/Support/ThreadPool.h"
30 #include "llvm/Support/WithColor.h"
31 #include "llvm/Support/raw_ostream.h"
32 #include <algorithm>
34 using namespace llvm;
/// Output encodings selectable for a merged profile. The enumerators are used
/// as array indices elsewhere in this file, so their numeric values are
/// spelled out explicitly.
enum ProfileFormat {
  PF_None = 0,
  PF_Text = 1,
  PF_Compact_Binary = 2,
  PF_Ext_Binary = 3,
  PF_GCC = 4,
  PF_Binary = 5
};
45 static void warn(Twine Message, std::string Whence = "",
46 std::string Hint = "") {
47 WithColor::warning();
48 if (!Whence.empty())
49 errs() << Whence << ": ";
50 errs() << Message << "\n";
51 if (!Hint.empty())
52 WithColor::note() << Hint << "\n";
55 static void exitWithError(Twine Message, std::string Whence = "",
56 std::string Hint = "") {
57 WithColor::error();
58 if (!Whence.empty())
59 errs() << Whence << ": ";
60 errs() << Message << "\n";
61 if (!Hint.empty())
62 WithColor::note() << Hint << "\n";
63 ::exit(1);
66 static void exitWithError(Error E, StringRef Whence = "") {
67 if (E.isA<InstrProfError>()) {
68 handleAllErrors(std::move(E), [&](const InstrProfError &IPE) {
69 instrprof_error instrError = IPE.get();
70 StringRef Hint = "";
71 if (instrError == instrprof_error::unrecognized_format) {
72 // Hint for common error of forgetting -sample for sample profiles.
73 Hint = "Perhaps you forgot to use the -sample option?";
75 exitWithError(IPE.message(), Whence, Hint);
76 });
79 exitWithError(toString(std::move(E)), Whence);
82 static void exitWithErrorCode(std::error_code EC, StringRef Whence = "") {
83 exitWithError(EC.message(), Whence);
namespace {
/// Family of profile data a command operates on.
enum ProfileKinds {
  instr,
  sample
};

/// Policy deciding when unreadable inputs abort a merge.
enum FailureMode {
  failIfAnyAreInvalid,
  failIfAllAreInvalid
};
} // namespace
91 static void warnOrExitGivenError(FailureMode FailMode, std::error_code EC,
92 StringRef Whence = "") {
93 if (FailMode == failIfAnyAreInvalid)
94 exitWithErrorCode(EC, Whence);
95 else
96 warn(EC.message(), Whence);
99 static void handleMergeWriterError(Error E, StringRef WhenceFile = "",
100 StringRef WhenceFunction = "",
101 bool ShowHint = true) {
102 if (!WhenceFile.empty())
103 errs() << WhenceFile << ": ";
104 if (!WhenceFunction.empty())
105 errs() << WhenceFunction << ": ";
107 auto IPE = instrprof_error::success;
108 E = handleErrors(std::move(E),
109 [&IPE](std::unique_ptr<InstrProfError> E) -> Error {
110 IPE = E->get();
111 return Error(std::move(E));
113 errs() << toString(std::move(E)) << "\n";
115 if (ShowHint) {
116 StringRef Hint = "";
117 if (IPE != instrprof_error::success) {
118 switch (IPE) {
119 case instrprof_error::hash_mismatch:
120 case instrprof_error::count_mismatch:
121 case instrprof_error::value_site_count_mismatch:
122 Hint = "Make sure that all profile data to be merged is generated "
123 "from the same binary.";
124 break;
125 default:
126 break;
130 if (!Hint.empty())
131 errs() << Hint << "\n";
135 namespace {
136 /// A remapper from original symbol names to new symbol names based on a file
137 /// containing a list of mappings from old name to new name.
138 class SymbolRemapper {
139 std::unique_ptr<MemoryBuffer> File;
140 DenseMap<StringRef, StringRef> RemappingTable;
142 public:
143 /// Build a SymbolRemapper from a file containing a list of old/new symbols.
144 static std::unique_ptr<SymbolRemapper> create(StringRef InputFile) {
145 auto BufOrError = MemoryBuffer::getFileOrSTDIN(InputFile);
146 if (!BufOrError)
147 exitWithErrorCode(BufOrError.getError(), InputFile);
149 auto Remapper = std::make_unique<SymbolRemapper>();
150 Remapper->File = std::move(BufOrError.get());
152 for (line_iterator LineIt(*Remapper->File, /*SkipBlanks=*/true, '#');
153 !LineIt.is_at_eof(); ++LineIt) {
154 std::pair<StringRef, StringRef> Parts = LineIt->split(' ');
155 if (Parts.first.empty() || Parts.second.empty() ||
156 Parts.second.count(' ')) {
157 exitWithError("unexpected line in remapping file",
158 (InputFile + ":" + Twine(LineIt.line_number())).str(),
159 "expected 'old_symbol new_symbol'");
161 Remapper->RemappingTable.insert(Parts);
163 return Remapper;
166 /// Attempt to map the given old symbol into a new symbol.
168 /// \return The new symbol, or \p Name if no such symbol was found.
169 StringRef operator()(StringRef Name) {
170 StringRef New = RemappingTable.lookup(Name);
171 return New.empty() ? Name : New;
176 struct WeightedFile {
177 std::string Filename;
178 uint64_t Weight;
180 typedef SmallVector<WeightedFile, 5> WeightedFileVector;
182 /// Keep track of merged data and reported errors.
183 struct WriterContext {
184 std::mutex Lock;
185 InstrProfWriter Writer;
186 std::vector<std::pair<Error, std::string>> Errors;
187 std::mutex &ErrLock;
188 SmallSet<instrprof_error, 4> &WriterErrorCodes;
190 WriterContext(bool IsSparse, std::mutex &ErrLock,
191 SmallSet<instrprof_error, 4> &WriterErrorCodes)
192 : Lock(), Writer(IsSparse), Errors(), ErrLock(ErrLock),
193 WriterErrorCodes(WriterErrorCodes) {}
196 /// Computer the overlap b/w profile BaseFilename and TestFileName,
197 /// and store the program level result to Overlap.
198 static void overlapInput(const std::string &BaseFilename,
199 const std::string &TestFilename, WriterContext *WC,
200 OverlapStats &Overlap,
201 const OverlapFuncFilters &FuncFilter,
202 raw_fd_ostream &OS, bool IsCS) {
203 auto ReaderOrErr = InstrProfReader::create(TestFilename);
204 if (Error E = ReaderOrErr.takeError()) {
205 // Skip the empty profiles by returning sliently.
206 instrprof_error IPE = InstrProfError::take(std::move(E));
207 if (IPE != instrprof_error::empty_raw_profile)
208 WC->Errors.emplace_back(make_error<InstrProfError>(IPE), TestFilename);
209 return;
212 auto Reader = std::move(ReaderOrErr.get());
213 for (auto &I : *Reader) {
214 OverlapStats FuncOverlap(OverlapStats::FunctionLevel);
215 FuncOverlap.setFuncInfo(I.Name, I.Hash);
217 WC->Writer.overlapRecord(std::move(I), Overlap, FuncOverlap, FuncFilter);
218 FuncOverlap.dump(OS);
222 /// Load an input into a writer context.
223 static void loadInput(const WeightedFile &Input, SymbolRemapper *Remapper,
224 WriterContext *WC) {
225 std::unique_lock<std::mutex> CtxGuard{WC->Lock};
227 // Copy the filename, because llvm::ThreadPool copied the input "const
228 // WeightedFile &" by value, making a reference to the filename within it
229 // invalid outside of this packaged task.
230 std::string Filename = Input.Filename;
232 auto ReaderOrErr = InstrProfReader::create(Input.Filename);
233 if (Error E = ReaderOrErr.takeError()) {
234 // Skip the empty profiles by returning sliently.
235 instrprof_error IPE = InstrProfError::take(std::move(E));
236 if (IPE != instrprof_error::empty_raw_profile)
237 WC->Errors.emplace_back(make_error<InstrProfError>(IPE), Filename);
238 return;
241 auto Reader = std::move(ReaderOrErr.get());
242 bool IsIRProfile = Reader->isIRLevelProfile();
243 bool HasCSIRProfile = Reader->hasCSIRLevelProfile();
244 if (WC->Writer.setIsIRLevelProfile(IsIRProfile, HasCSIRProfile)) {
245 WC->Errors.emplace_back(
246 make_error<StringError>(
247 "Merge IR generated profile with Clang generated profile.",
248 std::error_code()),
249 Filename);
250 return;
253 for (auto &I : *Reader) {
254 if (Remapper)
255 I.Name = (*Remapper)(I.Name);
256 const StringRef FuncName = I.Name;
257 bool Reported = false;
258 WC->Writer.addRecord(std::move(I), Input.Weight, [&](Error E) {
259 if (Reported) {
260 consumeError(std::move(E));
261 return;
263 Reported = true;
264 // Only show hint the first time an error occurs.
265 instrprof_error IPE = InstrProfError::take(std::move(E));
266 std::unique_lock<std::mutex> ErrGuard{WC->ErrLock};
267 bool firstTime = WC->WriterErrorCodes.insert(IPE).second;
268 handleMergeWriterError(make_error<InstrProfError>(IPE), Input.Filename,
269 FuncName, firstTime);
272 if (Reader->hasError())
273 if (Error E = Reader->getError())
274 WC->Errors.emplace_back(std::move(E), Filename);
277 /// Merge the \p Src writer context into \p Dst.
278 static void mergeWriterContexts(WriterContext *Dst, WriterContext *Src) {
279 for (auto &ErrorPair : Src->Errors)
280 Dst->Errors.push_back(std::move(ErrorPair));
281 Src->Errors.clear();
283 Dst->Writer.mergeRecordsFromWriter(std::move(Src->Writer), [&](Error E) {
284 instrprof_error IPE = InstrProfError::take(std::move(E));
285 std::unique_lock<std::mutex> ErrGuard{Dst->ErrLock};
286 bool firstTime = Dst->WriterErrorCodes.insert(IPE).second;
287 if (firstTime)
288 warn(toString(make_error<InstrProfError>(IPE)));
292 static void mergeInstrProfile(const WeightedFileVector &Inputs,
293 SymbolRemapper *Remapper,
294 StringRef OutputFilename,
295 ProfileFormat OutputFormat, bool OutputSparse,
296 unsigned NumThreads, FailureMode FailMode) {
297 if (OutputFilename.compare("-") == 0)
298 exitWithError("Cannot write indexed profdata format to stdout.");
300 if (OutputFormat != PF_Binary && OutputFormat != PF_Compact_Binary &&
301 OutputFormat != PF_Ext_Binary && OutputFormat != PF_Text)
302 exitWithError("Unknown format is specified.");
304 std::mutex ErrorLock;
305 SmallSet<instrprof_error, 4> WriterErrorCodes;
307 // If NumThreads is not specified, auto-detect a good default.
308 if (NumThreads == 0)
309 NumThreads =
310 std::min(hardware_concurrency(), unsigned((Inputs.size() + 1) / 2));
312 // Initialize the writer contexts.
313 SmallVector<std::unique_ptr<WriterContext>, 4> Contexts;
314 for (unsigned I = 0; I < NumThreads; ++I)
315 Contexts.emplace_back(std::make_unique<WriterContext>(
316 OutputSparse, ErrorLock, WriterErrorCodes));
318 if (NumThreads == 1) {
319 for (const auto &Input : Inputs)
320 loadInput(Input, Remapper, Contexts[0].get());
321 } else {
322 ThreadPool Pool(NumThreads);
324 // Load the inputs in parallel (N/NumThreads serial steps).
325 unsigned Ctx = 0;
326 for (const auto &Input : Inputs) {
327 Pool.async(loadInput, Input, Remapper, Contexts[Ctx].get());
328 Ctx = (Ctx + 1) % NumThreads;
330 Pool.wait();
332 // Merge the writer contexts together (~ lg(NumThreads) serial steps).
333 unsigned Mid = Contexts.size() / 2;
334 unsigned End = Contexts.size();
335 assert(Mid > 0 && "Expected more than one context");
336 do {
337 for (unsigned I = 0; I < Mid; ++I)
338 Pool.async(mergeWriterContexts, Contexts[I].get(),
339 Contexts[I + Mid].get());
340 Pool.wait();
341 if (End & 1) {
342 Pool.async(mergeWriterContexts, Contexts[0].get(),
343 Contexts[End - 1].get());
344 Pool.wait();
346 End = Mid;
347 Mid /= 2;
348 } while (Mid > 0);
351 // Handle deferred errors encountered during merging. If the number of errors
352 // is equal to the number of inputs the merge failed.
353 unsigned NumErrors = 0;
354 for (std::unique_ptr<WriterContext> &WC : Contexts) {
355 for (auto &ErrorPair : WC->Errors) {
356 ++NumErrors;
357 warn(toString(std::move(ErrorPair.first)), ErrorPair.second);
360 if (NumErrors == Inputs.size() ||
361 (NumErrors > 0 && FailMode == failIfAnyAreInvalid))
362 exitWithError("No profiles could be merged.");
364 std::error_code EC;
365 raw_fd_ostream Output(OutputFilename.data(), EC, sys::fs::OF_None);
366 if (EC)
367 exitWithErrorCode(EC, OutputFilename);
369 InstrProfWriter &Writer = Contexts[0]->Writer;
370 if (OutputFormat == PF_Text) {
371 if (Error E = Writer.writeText(Output))
372 exitWithError(std::move(E));
373 } else {
374 Writer.write(Output);
378 /// Make a copy of the given function samples with all symbol names remapped
379 /// by the provided symbol remapper.
380 static sampleprof::FunctionSamples
381 remapSamples(const sampleprof::FunctionSamples &Samples,
382 SymbolRemapper &Remapper, sampleprof_error &Error) {
383 sampleprof::FunctionSamples Result;
384 Result.setName(Remapper(Samples.getName()));
385 Result.addTotalSamples(Samples.getTotalSamples());
386 Result.addHeadSamples(Samples.getHeadSamples());
387 for (const auto &BodySample : Samples.getBodySamples()) {
388 Result.addBodySamples(BodySample.first.LineOffset,
389 BodySample.first.Discriminator,
390 BodySample.second.getSamples());
391 for (const auto &Target : BodySample.second.getCallTargets()) {
392 Result.addCalledTargetSamples(BodySample.first.LineOffset,
393 BodySample.first.Discriminator,
394 Remapper(Target.first()), Target.second);
397 for (const auto &CallsiteSamples : Samples.getCallsiteSamples()) {
398 sampleprof::FunctionSamplesMap &Target =
399 Result.functionSamplesAt(CallsiteSamples.first);
400 for (const auto &Callsite : CallsiteSamples.second) {
401 sampleprof::FunctionSamples Remapped =
402 remapSamples(Callsite.second, Remapper, Error);
403 MergeResult(Error, Target[Remapped.getName()].merge(Remapped));
406 return Result;
409 static sampleprof::SampleProfileFormat FormatMap[] = {
410 sampleprof::SPF_None,
411 sampleprof::SPF_Text,
412 sampleprof::SPF_Compact_Binary,
413 sampleprof::SPF_Ext_Binary,
414 sampleprof::SPF_GCC,
415 sampleprof::SPF_Binary};
417 static std::unique_ptr<MemoryBuffer>
418 getInputFileBuf(const StringRef &InputFile) {
419 if (InputFile == "")
420 return {};
422 auto BufOrError = MemoryBuffer::getFileOrSTDIN(InputFile);
423 if (!BufOrError)
424 exitWithErrorCode(BufOrError.getError(), InputFile);
426 return std::move(*BufOrError);
429 static void populateProfileSymbolList(MemoryBuffer *Buffer,
430 sampleprof::ProfileSymbolList &PSL) {
431 if (!Buffer)
432 return;
434 SmallVector<StringRef, 32> SymbolVec;
435 StringRef Data = Buffer->getBuffer();
436 Data.split(SymbolVec, '\n', /*MaxSplit=*/-1, /*KeepEmpty=*/false);
438 for (StringRef symbol : SymbolVec)
439 PSL.add(symbol);
442 static void handleExtBinaryWriter(sampleprof::SampleProfileWriter &Writer,
443 ProfileFormat OutputFormat,
444 MemoryBuffer *Buffer,
445 sampleprof::ProfileSymbolList &WriterList,
446 bool CompressAllSections) {
447 populateProfileSymbolList(Buffer, WriterList);
448 if (WriterList.size() > 0 && OutputFormat != PF_Ext_Binary)
449 warn("Profile Symbol list is not empty but the output format is not "
450 "ExtBinary format. The list will be lost in the output. ");
452 Writer.setProfileSymbolList(&WriterList);
454 if (CompressAllSections) {
455 if (OutputFormat != PF_Ext_Binary) {
456 warn("-compress-all-section is ignored. Specify -extbinary to enable it");
457 } else {
458 auto ExtBinaryWriter =
459 static_cast<sampleprof::SampleProfileWriterExtBinary *>(&Writer);
460 ExtBinaryWriter->setToCompressAllSections();
465 static void mergeSampleProfile(const WeightedFileVector &Inputs,
466 SymbolRemapper *Remapper,
467 StringRef OutputFilename,
468 ProfileFormat OutputFormat,
469 StringRef ProfileSymbolListFile,
470 bool CompressAllSections, FailureMode FailMode) {
471 using namespace sampleprof;
472 StringMap<FunctionSamples> ProfileMap;
473 SmallVector<std::unique_ptr<sampleprof::SampleProfileReader>, 5> Readers;
474 LLVMContext Context;
475 sampleprof::ProfileSymbolList WriterList;
476 for (const auto &Input : Inputs) {
477 auto ReaderOrErr = SampleProfileReader::create(Input.Filename, Context);
478 if (std::error_code EC = ReaderOrErr.getError()) {
479 warnOrExitGivenError(FailMode, EC, Input.Filename);
480 continue;
483 // We need to keep the readers around until after all the files are
484 // read so that we do not lose the function names stored in each
485 // reader's memory. The function names are needed to write out the
486 // merged profile map.
487 Readers.push_back(std::move(ReaderOrErr.get()));
488 const auto Reader = Readers.back().get();
489 if (std::error_code EC = Reader->read()) {
490 warnOrExitGivenError(FailMode, EC, Input.Filename);
491 Readers.pop_back();
492 continue;
495 StringMap<FunctionSamples> &Profiles = Reader->getProfiles();
496 for (StringMap<FunctionSamples>::iterator I = Profiles.begin(),
497 E = Profiles.end();
498 I != E; ++I) {
499 sampleprof_error Result = sampleprof_error::success;
500 FunctionSamples Remapped =
501 Remapper ? remapSamples(I->second, *Remapper, Result)
502 : FunctionSamples();
503 FunctionSamples &Samples = Remapper ? Remapped : I->second;
504 StringRef FName = Samples.getName();
505 MergeResult(Result, ProfileMap[FName].merge(Samples, Input.Weight));
506 if (Result != sampleprof_error::success) {
507 std::error_code EC = make_error_code(Result);
508 handleMergeWriterError(errorCodeToError(EC), Input.Filename, FName);
512 std::unique_ptr<sampleprof::ProfileSymbolList> ReaderList =
513 Reader->getProfileSymbolList();
514 if (ReaderList)
515 WriterList.merge(*ReaderList);
517 auto WriterOrErr =
518 SampleProfileWriter::create(OutputFilename, FormatMap[OutputFormat]);
519 if (std::error_code EC = WriterOrErr.getError())
520 exitWithErrorCode(EC, OutputFilename);
522 auto Writer = std::move(WriterOrErr.get());
523 // WriterList will have StringRef refering to string in Buffer.
524 // Make sure Buffer lives as long as WriterList.
525 auto Buffer = getInputFileBuf(ProfileSymbolListFile);
526 handleExtBinaryWriter(*Writer, OutputFormat, Buffer.get(), WriterList,
527 CompressAllSections);
528 Writer->write(ProfileMap);
531 static WeightedFile parseWeightedFile(const StringRef &WeightedFilename) {
532 StringRef WeightStr, FileName;
533 std::tie(WeightStr, FileName) = WeightedFilename.split(',');
535 uint64_t Weight;
536 if (WeightStr.getAsInteger(10, Weight) || Weight < 1)
537 exitWithError("Input weight must be a positive integer.");
539 return {FileName, Weight};
542 static void addWeightedInput(WeightedFileVector &WNI, const WeightedFile &WF) {
543 StringRef Filename = WF.Filename;
544 uint64_t Weight = WF.Weight;
546 // If it's STDIN just pass it on.
547 if (Filename == "-") {
548 WNI.push_back({Filename, Weight});
549 return;
552 llvm::sys::fs::file_status Status;
553 llvm::sys::fs::status(Filename, Status);
554 if (!llvm::sys::fs::exists(Status))
555 exitWithErrorCode(make_error_code(errc::no_such_file_or_directory),
556 Filename);
557 // If it's a source file, collect it.
558 if (llvm::sys::fs::is_regular_file(Status)) {
559 WNI.push_back({Filename, Weight});
560 return;
563 if (llvm::sys::fs::is_directory(Status)) {
564 std::error_code EC;
565 for (llvm::sys::fs::recursive_directory_iterator F(Filename, EC), E;
566 F != E && !EC; F.increment(EC)) {
567 if (llvm::sys::fs::is_regular_file(F->path())) {
568 addWeightedInput(WNI, {F->path(), Weight});
571 if (EC)
572 exitWithErrorCode(EC, Filename);
576 static void parseInputFilenamesFile(MemoryBuffer *Buffer,
577 WeightedFileVector &WFV) {
578 if (!Buffer)
579 return;
581 SmallVector<StringRef, 8> Entries;
582 StringRef Data = Buffer->getBuffer();
583 Data.split(Entries, '\n', /*MaxSplit=*/-1, /*KeepEmpty=*/false);
584 for (const StringRef &FileWeightEntry : Entries) {
585 StringRef SanitizedEntry = FileWeightEntry.trim(" \t\v\f\r");
586 // Skip comments.
587 if (SanitizedEntry.startswith("#"))
588 continue;
589 // If there's no comma, it's an unweighted profile.
590 else if (SanitizedEntry.find(',') == StringRef::npos)
591 addWeightedInput(WFV, {SanitizedEntry, 1});
592 else
593 addWeightedInput(WFV, parseWeightedFile(SanitizedEntry));
597 static int merge_main(int argc, const char *argv[]) {
598 cl::list<std::string> InputFilenames(cl::Positional,
599 cl::desc("<filename...>"));
600 cl::list<std::string> WeightedInputFilenames("weighted-input",
601 cl::desc("<weight>,<filename>"));
602 cl::opt<std::string> InputFilenamesFile(
603 "input-files", cl::init(""),
604 cl::desc("Path to file containing newline-separated "
605 "[<weight>,]<filename> entries"));
606 cl::alias InputFilenamesFileA("f", cl::desc("Alias for --input-files"),
607 cl::aliasopt(InputFilenamesFile));
608 cl::opt<bool> DumpInputFileList(
609 "dump-input-file-list", cl::init(false), cl::Hidden,
610 cl::desc("Dump the list of input files and their weights, then exit"));
611 cl::opt<std::string> RemappingFile("remapping-file", cl::value_desc("file"),
612 cl::desc("Symbol remapping file"));
613 cl::alias RemappingFileA("r", cl::desc("Alias for --remapping-file"),
614 cl::aliasopt(RemappingFile));
615 cl::opt<std::string> OutputFilename("output", cl::value_desc("output"),
616 cl::init("-"), cl::Required,
617 cl::desc("Output file"));
618 cl::alias OutputFilenameA("o", cl::desc("Alias for --output"),
619 cl::aliasopt(OutputFilename));
620 cl::opt<ProfileKinds> ProfileKind(
621 cl::desc("Profile kind:"), cl::init(instr),
622 cl::values(clEnumVal(instr, "Instrumentation profile (default)"),
623 clEnumVal(sample, "Sample profile")));
624 cl::opt<ProfileFormat> OutputFormat(
625 cl::desc("Format of output profile"), cl::init(PF_Binary),
626 cl::values(
627 clEnumValN(PF_Binary, "binary", "Binary encoding (default)"),
628 clEnumValN(PF_Compact_Binary, "compbinary",
629 "Compact binary encoding"),
630 clEnumValN(PF_Ext_Binary, "extbinary", "Extensible binary encoding"),
631 clEnumValN(PF_Text, "text", "Text encoding"),
632 clEnumValN(PF_GCC, "gcc",
633 "GCC encoding (only meaningful for -sample)")));
634 cl::opt<FailureMode> FailureMode(
635 "failure-mode", cl::init(failIfAnyAreInvalid), cl::desc("Failure mode:"),
636 cl::values(clEnumValN(failIfAnyAreInvalid, "any",
637 "Fail if any profile is invalid."),
638 clEnumValN(failIfAllAreInvalid, "all",
639 "Fail only if all profiles are invalid.")));
640 cl::opt<bool> OutputSparse("sparse", cl::init(false),
641 cl::desc("Generate a sparse profile (only meaningful for -instr)"));
642 cl::opt<unsigned> NumThreads(
643 "num-threads", cl::init(0),
644 cl::desc("Number of merge threads to use (default: autodetect)"));
645 cl::alias NumThreadsA("j", cl::desc("Alias for --num-threads"),
646 cl::aliasopt(NumThreads));
647 cl::opt<std::string> ProfileSymbolListFile(
648 "prof-sym-list", cl::init(""),
649 cl::desc("Path to file containing the list of function symbols "
650 "used to populate profile symbol list"));
651 cl::opt<bool> CompressAllSections(
652 "compress-all-sections", cl::init(false), cl::Hidden,
653 cl::desc("Compress all sections when writing the profile (only "
654 "meaningful for -extbinary)"));
656 cl::ParseCommandLineOptions(argc, argv, "LLVM profile data merger\n");
658 WeightedFileVector WeightedInputs;
659 for (StringRef Filename : InputFilenames)
660 addWeightedInput(WeightedInputs, {Filename, 1});
661 for (StringRef WeightedFilename : WeightedInputFilenames)
662 addWeightedInput(WeightedInputs, parseWeightedFile(WeightedFilename));
664 // Make sure that the file buffer stays alive for the duration of the
665 // weighted input vector's lifetime.
666 auto Buffer = getInputFileBuf(InputFilenamesFile);
667 parseInputFilenamesFile(Buffer.get(), WeightedInputs);
669 if (WeightedInputs.empty())
670 exitWithError("No input files specified. See " +
671 sys::path::filename(argv[0]) + " -help");
673 if (DumpInputFileList) {
674 for (auto &WF : WeightedInputs)
675 outs() << WF.Weight << "," << WF.Filename << "\n";
676 return 0;
679 std::unique_ptr<SymbolRemapper> Remapper;
680 if (!RemappingFile.empty())
681 Remapper = SymbolRemapper::create(RemappingFile);
683 if (ProfileKind == instr)
684 mergeInstrProfile(WeightedInputs, Remapper.get(), OutputFilename,
685 OutputFormat, OutputSparse, NumThreads, FailureMode);
686 else
687 mergeSampleProfile(WeightedInputs, Remapper.get(), OutputFilename,
688 OutputFormat, ProfileSymbolListFile, CompressAllSections,
689 FailureMode);
691 return 0;
694 /// Computer the overlap b/w profile BaseFilename and profile TestFilename.
695 static void overlapInstrProfile(const std::string &BaseFilename,
696 const std::string &TestFilename,
697 const OverlapFuncFilters &FuncFilter,
698 raw_fd_ostream &OS, bool IsCS) {
699 std::mutex ErrorLock;
700 SmallSet<instrprof_error, 4> WriterErrorCodes;
701 WriterContext Context(false, ErrorLock, WriterErrorCodes);
702 WeightedFile WeightedInput{BaseFilename, 1};
703 OverlapStats Overlap;
704 Error E = Overlap.accumulateCounts(BaseFilename, TestFilename, IsCS);
705 if (E)
706 exitWithError(std::move(E), "Error in getting profile count sums");
707 if (Overlap.Base.CountSum < 1.0f) {
708 OS << "Sum of edge counts for profile " << BaseFilename << " is 0.\n";
709 exit(0);
711 if (Overlap.Test.CountSum < 1.0f) {
712 OS << "Sum of edge counts for profile " << TestFilename << " is 0.\n";
713 exit(0);
715 loadInput(WeightedInput, nullptr, &Context);
716 overlapInput(BaseFilename, TestFilename, &Context, Overlap, FuncFilter, OS,
717 IsCS);
718 Overlap.dump(OS);
721 static int overlap_main(int argc, const char *argv[]) {
722 cl::opt<std::string> BaseFilename(cl::Positional, cl::Required,
723 cl::desc("<base profile file>"));
724 cl::opt<std::string> TestFilename(cl::Positional, cl::Required,
725 cl::desc("<test profile file>"));
726 cl::opt<std::string> Output("output", cl::value_desc("output"), cl::init("-"),
727 cl::desc("Output file"));
728 cl::alias OutputA("o", cl::desc("Alias for --output"), cl::aliasopt(Output));
729 cl::opt<bool> IsCS("cs", cl::init(false),
730 cl::desc("For context sensitive counts"));
731 cl::opt<unsigned long long> ValueCutoff(
732 "value-cutoff", cl::init(-1),
733 cl::desc(
734 "Function level overlap information for every function in test "
735 "profile with max count value greater then the parameter value"));
736 cl::opt<std::string> FuncNameFilter(
737 "function",
738 cl::desc("Function level overlap information for matching functions"));
739 cl::ParseCommandLineOptions(argc, argv, "LLVM profile data overlap tool\n");
741 std::error_code EC;
742 raw_fd_ostream OS(Output.data(), EC, sys::fs::OF_Text);
743 if (EC)
744 exitWithErrorCode(EC, Output);
746 overlapInstrProfile(BaseFilename, TestFilename,
747 OverlapFuncFilters{ValueCutoff, FuncNameFilter}, OS,
748 IsCS);
750 return 0;
/// Running totals gathered while walking the value sites of one value kind.
/// A default-constructed object has all counters at zero and an empty
/// histogram.
struct ValueSitesStats {
  uint64_t TotalNumValueSites = 0;
  uint64_t TotalNumValueSitesWithValueProfile = 0;
  uint64_t TotalNumValues = 0;
  // Entry I counts the sites that recorded exactly I + 1 values.
  std::vector<unsigned> ValueSitesHistogram;
};
763 static void traverseAllValueSites(const InstrProfRecord &Func, uint32_t VK,
764 ValueSitesStats &Stats, raw_fd_ostream &OS,
765 InstrProfSymtab *Symtab) {
766 uint32_t NS = Func.getNumValueSites(VK);
767 Stats.TotalNumValueSites += NS;
768 for (size_t I = 0; I < NS; ++I) {
769 uint32_t NV = Func.getNumValueDataForSite(VK, I);
770 std::unique_ptr<InstrProfValueData[]> VD = Func.getValueForSite(VK, I);
771 Stats.TotalNumValues += NV;
772 if (NV) {
773 Stats.TotalNumValueSitesWithValueProfile++;
774 if (NV > Stats.ValueSitesHistogram.size())
775 Stats.ValueSitesHistogram.resize(NV, 0);
776 Stats.ValueSitesHistogram[NV - 1]++;
779 uint64_t SiteSum = 0;
780 for (uint32_t V = 0; V < NV; V++)
781 SiteSum += VD[V].Count;
782 if (SiteSum == 0)
783 SiteSum = 1;
785 for (uint32_t V = 0; V < NV; V++) {
786 OS << "\t[ " << format("%2u", I) << ", ";
787 if (Symtab == nullptr)
788 OS << format("%4" PRIu64, VD[V].Value);
789 else
790 OS << Symtab->getFuncName(VD[V].Value);
791 OS << ", " << format("%10" PRId64, VD[V].Count) << " ] ("
792 << format("%.2f%%", (VD[V].Count * 100.0 / SiteSum)) << ")\n";
797 static void showValueSitesStats(raw_fd_ostream &OS, uint32_t VK,
798 ValueSitesStats &Stats) {
799 OS << " Total number of sites: " << Stats.TotalNumValueSites << "\n";
800 OS << " Total number of sites with values: "
801 << Stats.TotalNumValueSitesWithValueProfile << "\n";
802 OS << " Total number of profiled values: " << Stats.TotalNumValues << "\n";
804 OS << " Value sites histogram:\n\tNumTargets, SiteCount\n";
805 for (unsigned I = 0; I < Stats.ValueSitesHistogram.size(); I++) {
806 if (Stats.ValueSitesHistogram[I] > 0)
807 OS << "\t" << I + 1 << ", " << Stats.ValueSitesHistogram[I] << "\n";
811 static int showInstrProfile(const std::string &Filename, bool ShowCounts,
812 uint32_t TopN, bool ShowIndirectCallTargets,
813 bool ShowMemOPSizes, bool ShowDetailedSummary,
814 std::vector<uint32_t> DetailedSummaryCutoffs,
815 bool ShowAllFunctions, bool ShowCS,
816 uint64_t ValueCutoff, bool OnlyListBelow,
817 const std::string &ShowFunction, bool TextFormat,
818 raw_fd_ostream &OS) {
819 auto ReaderOrErr = InstrProfReader::create(Filename);
820 std::vector<uint32_t> Cutoffs = std::move(DetailedSummaryCutoffs);
821 if (ShowDetailedSummary && Cutoffs.empty()) {
822 Cutoffs = {800000, 900000, 950000, 990000, 999000, 999900, 999990};
824 InstrProfSummaryBuilder Builder(std::move(Cutoffs));
825 if (Error E = ReaderOrErr.takeError())
826 exitWithError(std::move(E), Filename);
828 auto Reader = std::move(ReaderOrErr.get());
829 bool IsIRInstr = Reader->isIRLevelProfile();
830 size_t ShownFunctions = 0;
831 size_t BelowCutoffFunctions = 0;
832 int NumVPKind = IPVK_Last - IPVK_First + 1;
833 std::vector<ValueSitesStats> VPStats(NumVPKind);
835 auto MinCmp = [](const std::pair<std::string, uint64_t> &v1,
836 const std::pair<std::string, uint64_t> &v2) {
837 return v1.second > v2.second;
840 std::priority_queue<std::pair<std::string, uint64_t>,
841 std::vector<std::pair<std::string, uint64_t>>,
842 decltype(MinCmp)>
843 HottestFuncs(MinCmp);
845 if (!TextFormat && OnlyListBelow) {
846 OS << "The list of functions with the maximum counter less than "
847 << ValueCutoff << ":\n";
850 // Add marker so that IR-level instrumentation round-trips properly.
851 if (TextFormat && IsIRInstr)
852 OS << ":ir\n";
854 for (const auto &Func : *Reader) {
855 if (Reader->isIRLevelProfile()) {
856 bool FuncIsCS = NamedInstrProfRecord::hasCSFlagInHash(Func.Hash);
857 if (FuncIsCS != ShowCS)
858 continue;
860 bool Show =
861 ShowAllFunctions || (!ShowFunction.empty() &&
862 Func.Name.find(ShowFunction) != Func.Name.npos);
864 bool doTextFormatDump = (Show && TextFormat);
866 if (doTextFormatDump) {
867 InstrProfSymtab &Symtab = Reader->getSymtab();
868 InstrProfWriter::writeRecordInText(Func.Name, Func.Hash, Func, Symtab,
869 OS);
870 continue;
873 assert(Func.Counts.size() > 0 && "function missing entry counter");
874 Builder.addRecord(Func);
876 uint64_t FuncMax = 0;
877 uint64_t FuncSum = 0;
878 for (size_t I = 0, E = Func.Counts.size(); I < E; ++I) {
879 FuncMax = std::max(FuncMax, Func.Counts[I]);
880 FuncSum += Func.Counts[I];
883 if (FuncMax < ValueCutoff) {
884 ++BelowCutoffFunctions;
885 if (OnlyListBelow) {
886 OS << " " << Func.Name << ": (Max = " << FuncMax
887 << " Sum = " << FuncSum << ")\n";
889 continue;
890 } else if (OnlyListBelow)
891 continue;
893 if (TopN) {
894 if (HottestFuncs.size() == TopN) {
895 if (HottestFuncs.top().second < FuncMax) {
896 HottestFuncs.pop();
897 HottestFuncs.emplace(std::make_pair(std::string(Func.Name), FuncMax));
899 } else
900 HottestFuncs.emplace(std::make_pair(std::string(Func.Name), FuncMax));
903 if (Show) {
904 if (!ShownFunctions)
905 OS << "Counters:\n";
907 ++ShownFunctions;
909 OS << " " << Func.Name << ":\n"
910 << " Hash: " << format("0x%016" PRIx64, Func.Hash) << "\n"
911 << " Counters: " << Func.Counts.size() << "\n";
912 if (!IsIRInstr)
913 OS << " Function count: " << Func.Counts[0] << "\n";
915 if (ShowIndirectCallTargets)
916 OS << " Indirect Call Site Count: "
917 << Func.getNumValueSites(IPVK_IndirectCallTarget) << "\n";
919 uint32_t NumMemOPCalls = Func.getNumValueSites(IPVK_MemOPSize);
920 if (ShowMemOPSizes && NumMemOPCalls > 0)
921 OS << " Number of Memory Intrinsics Calls: " << NumMemOPCalls
922 << "\n";
924 if (ShowCounts) {
925 OS << " Block counts: [";
926 size_t Start = (IsIRInstr ? 0 : 1);
927 for (size_t I = Start, E = Func.Counts.size(); I < E; ++I) {
928 OS << (I == Start ? "" : ", ") << Func.Counts[I];
930 OS << "]\n";
933 if (ShowIndirectCallTargets) {
934 OS << " Indirect Target Results:\n";
935 traverseAllValueSites(Func, IPVK_IndirectCallTarget,
936 VPStats[IPVK_IndirectCallTarget], OS,
937 &(Reader->getSymtab()));
940 if (ShowMemOPSizes && NumMemOPCalls > 0) {
941 OS << " Memory Intrinsic Size Results:\n";
942 traverseAllValueSites(Func, IPVK_MemOPSize, VPStats[IPVK_MemOPSize], OS,
943 nullptr);
947 if (Reader->hasError())
948 exitWithError(Reader->getError(), Filename);
950 if (TextFormat)
951 return 0;
952 std::unique_ptr<ProfileSummary> PS(Builder.getSummary());
953 OS << "Instrumentation level: "
954 << (Reader->isIRLevelProfile() ? "IR" : "Front-end") << "\n";
955 if (ShowAllFunctions || !ShowFunction.empty())
956 OS << "Functions shown: " << ShownFunctions << "\n";
957 OS << "Total functions: " << PS->getNumFunctions() << "\n";
958 if (ValueCutoff > 0) {
959 OS << "Number of functions with maximum count (< " << ValueCutoff
960 << "): " << BelowCutoffFunctions << "\n";
961 OS << "Number of functions with maximum count (>= " << ValueCutoff
962 << "): " << PS->getNumFunctions() - BelowCutoffFunctions << "\n";
964 OS << "Maximum function count: " << PS->getMaxFunctionCount() << "\n";
965 OS << "Maximum internal block count: " << PS->getMaxInternalCount() << "\n";
967 if (TopN) {
968 std::vector<std::pair<std::string, uint64_t>> SortedHottestFuncs;
969 while (!HottestFuncs.empty()) {
970 SortedHottestFuncs.emplace_back(HottestFuncs.top());
971 HottestFuncs.pop();
973 OS << "Top " << TopN
974 << " functions with the largest internal block counts: \n";
975 for (auto &hotfunc : llvm::reverse(SortedHottestFuncs))
976 OS << " " << hotfunc.first << ", max count = " << hotfunc.second << "\n";
979 if (ShownFunctions && ShowIndirectCallTargets) {
980 OS << "Statistics for indirect call sites profile:\n";
981 showValueSitesStats(OS, IPVK_IndirectCallTarget,
982 VPStats[IPVK_IndirectCallTarget]);
985 if (ShownFunctions && ShowMemOPSizes) {
986 OS << "Statistics for memory intrinsic calls sizes profile:\n";
987 showValueSitesStats(OS, IPVK_MemOPSize, VPStats[IPVK_MemOPSize]);
990 if (ShowDetailedSummary) {
991 OS << "Detailed summary:\n";
992 OS << "Total number of blocks: " << PS->getNumCounts() << "\n";
993 OS << "Total count: " << PS->getTotalCount() << "\n";
994 for (auto Entry : PS->getDetailedSummary()) {
995 OS << Entry.NumCounts << " blocks with count >= " << Entry.MinCount
996 << " account for "
997 << format("%0.6g", (float)Entry.Cutoff / ProfileSummary::Scale * 100)
998 << " percentage of the total counts.\n";
1001 return 0;
1004 static void showSectionInfo(sampleprof::SampleProfileReader *Reader,
1005 raw_fd_ostream &OS) {
1006 if (!Reader->dumpSectionInfo(OS)) {
1007 WithColor::warning() << "-show-sec-info-only is only supported for "
1008 << "sample profile in extbinary format and is "
1009 << "ignored for other formats.\n";
1010 return;
1014 static int showSampleProfile(const std::string &Filename, bool ShowCounts,
1015 bool ShowAllFunctions,
1016 const std::string &ShowFunction,
1017 bool ShowProfileSymbolList,
1018 bool ShowSectionInfoOnly, raw_fd_ostream &OS) {
1019 using namespace sampleprof;
1020 LLVMContext Context;
1021 auto ReaderOrErr = SampleProfileReader::create(Filename, Context);
1022 if (std::error_code EC = ReaderOrErr.getError())
1023 exitWithErrorCode(EC, Filename);
1025 auto Reader = std::move(ReaderOrErr.get());
1027 if (ShowSectionInfoOnly) {
1028 showSectionInfo(Reader.get(), OS);
1029 return 0;
1032 if (std::error_code EC = Reader->read())
1033 exitWithErrorCode(EC, Filename);
1035 if (ShowAllFunctions || ShowFunction.empty())
1036 Reader->dump(OS);
1037 else
1038 Reader->dumpFunctionProfile(ShowFunction, OS);
1040 if (ShowProfileSymbolList) {
1041 std::unique_ptr<sampleprof::ProfileSymbolList> ReaderList =
1042 Reader->getProfileSymbolList();
1043 ReaderList->dump(OS);
1046 return 0;
1049 static int show_main(int argc, const char *argv[]) {
1050 cl::opt<std::string> Filename(cl::Positional, cl::Required,
1051 cl::desc("<profdata-file>"));
1053 cl::opt<bool> ShowCounts("counts", cl::init(false),
1054 cl::desc("Show counter values for shown functions"));
1055 cl::opt<bool> TextFormat(
1056 "text", cl::init(false),
1057 cl::desc("Show instr profile data in text dump format"));
1058 cl::opt<bool> ShowIndirectCallTargets(
1059 "ic-targets", cl::init(false),
1060 cl::desc("Show indirect call site target values for shown functions"));
1061 cl::opt<bool> ShowMemOPSizes(
1062 "memop-sizes", cl::init(false),
1063 cl::desc("Show the profiled sizes of the memory intrinsic calls "
1064 "for shown functions"));
1065 cl::opt<bool> ShowDetailedSummary("detailed-summary", cl::init(false),
1066 cl::desc("Show detailed profile summary"));
1067 cl::list<uint32_t> DetailedSummaryCutoffs(
1068 cl::CommaSeparated, "detailed-summary-cutoffs",
1069 cl::desc(
1070 "Cutoff percentages (times 10000) for generating detailed summary"),
1071 cl::value_desc("800000,901000,999999"));
1072 cl::opt<bool> ShowAllFunctions("all-functions", cl::init(false),
1073 cl::desc("Details for every function"));
1074 cl::opt<bool> ShowCS("showcs", cl::init(false),
1075 cl::desc("Show context sensitive counts"));
1076 cl::opt<std::string> ShowFunction("function",
1077 cl::desc("Details for matching functions"));
1079 cl::opt<std::string> OutputFilename("output", cl::value_desc("output"),
1080 cl::init("-"), cl::desc("Output file"));
1081 cl::alias OutputFilenameA("o", cl::desc("Alias for --output"),
1082 cl::aliasopt(OutputFilename));
1083 cl::opt<ProfileKinds> ProfileKind(
1084 cl::desc("Profile kind:"), cl::init(instr),
1085 cl::values(clEnumVal(instr, "Instrumentation profile (default)"),
1086 clEnumVal(sample, "Sample profile")));
1087 cl::opt<uint32_t> TopNFunctions(
1088 "topn", cl::init(0),
1089 cl::desc("Show the list of functions with the largest internal counts"));
1090 cl::opt<uint32_t> ValueCutoff(
1091 "value-cutoff", cl::init(0),
1092 cl::desc("Set the count value cutoff. Functions with the maximum count "
1093 "less than this value will not be printed out. (Default is 0)"));
1094 cl::opt<bool> OnlyListBelow(
1095 "list-below-cutoff", cl::init(false),
1096 cl::desc("Only output names of functions whose max count values are "
1097 "below the cutoff value"));
1098 cl::opt<bool> ShowProfileSymbolList(
1099 "show-prof-sym-list", cl::init(false),
1100 cl::desc("Show profile symbol list if it exists in the profile. "));
1101 cl::opt<bool> ShowSectionInfoOnly(
1102 "show-sec-info-only", cl::init(false),
1103 cl::desc("Show the information of each section in the sample profile. "
1104 "The flag is only usable when the sample profile is in "
1105 "extbinary format"));
1107 cl::ParseCommandLineOptions(argc, argv, "LLVM profile data summary\n");
1109 if (OutputFilename.empty())
1110 OutputFilename = "-";
1112 if (!Filename.compare(OutputFilename)) {
1113 errs() << sys::path::filename(argv[0])
1114 << ": Input file name cannot be the same as the output file name!\n";
1115 return 1;
1118 std::error_code EC;
1119 raw_fd_ostream OS(OutputFilename.data(), EC, sys::fs::OF_Text);
1120 if (EC)
1121 exitWithErrorCode(EC, OutputFilename);
1123 if (ShowAllFunctions && !ShowFunction.empty())
1124 WithColor::warning() << "-function argument ignored: showing all functions\n";
1126 if (ProfileKind == instr)
1127 return showInstrProfile(Filename, ShowCounts, TopNFunctions,
1128 ShowIndirectCallTargets, ShowMemOPSizes,
1129 ShowDetailedSummary, DetailedSummaryCutoffs,
1130 ShowAllFunctions, ShowCS, ValueCutoff,
1131 OnlyListBelow, ShowFunction, TextFormat, OS);
1132 else
1133 return showSampleProfile(Filename, ShowCounts, ShowAllFunctions,
1134 ShowFunction, ShowProfileSymbolList,
1135 ShowSectionInfoOnly, OS);
1138 int main(int argc, const char *argv[]) {
1139 InitLLVM X(argc, argv);
1141 StringRef ProgName(sys::path::filename(argv[0]));
1142 if (argc > 1) {
1143 int (*func)(int, const char *[]) = nullptr;
1145 if (strcmp(argv[1], "merge") == 0)
1146 func = merge_main;
1147 else if (strcmp(argv[1], "show") == 0)
1148 func = show_main;
1149 else if (strcmp(argv[1], "overlap") == 0)
1150 func = overlap_main;
1152 if (func) {
1153 std::string Invocation(ProgName.str() + " " + argv[1]);
1154 argv[1] = Invocation.c_str();
1155 return func(argc - 1, argv + 1);
1158 if (strcmp(argv[1], "-h") == 0 || strcmp(argv[1], "-help") == 0 ||
1159 strcmp(argv[1], "--help") == 0) {
1161 errs() << "OVERVIEW: LLVM profile data tools\n\n"
1162 << "USAGE: " << ProgName << " <command> [args...]\n"
1163 << "USAGE: " << ProgName << " <command> -help\n\n"
1164 << "See each individual command --help for more details.\n"
1165 << "Available commands: merge, show, overlap\n";
1166 return 0;
1170 if (argc < 2)
1171 errs() << ProgName << ": No command specified!\n";
1172 else
1173 errs() << ProgName << ": Unknown command!\n";
1175 errs() << "USAGE: " << ProgName << " <merge|show|overlap> [args...]\n";
1176 return 1;