[ORC] Add std::tuple support to SimplePackedSerialization.
[llvm-project.git] / llvm / lib / Transforms / Instrumentation / GCOVProfiling.cpp
blobd029a0ca8abf977491bde4233880d2823e3e2d64
1 //===- GCOVProfiling.cpp - Insert edge counters for gcov profiling --------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This pass implements GCOV-style profiling. When this pass is run it emits
10 // "gcno" files next to the existing source, and instruments the code that runs
11 // to records the edges between blocks that run and emit a complementary "gcda"
12 // file on exit.
14 //===----------------------------------------------------------------------===//
16 #include "CFGMST.h"
17 #include "llvm/ADT/DenseMap.h"
18 #include "llvm/ADT/Hashing.h"
19 #include "llvm/ADT/MapVector.h"
20 #include "llvm/ADT/STLExtras.h"
21 #include "llvm/ADT/Sequence.h"
22 #include "llvm/ADT/Statistic.h"
23 #include "llvm/ADT/StringExtras.h"
24 #include "llvm/ADT/StringMap.h"
25 #include "llvm/Analysis/BlockFrequencyInfo.h"
26 #include "llvm/Analysis/BranchProbabilityInfo.h"
27 #include "llvm/Analysis/EHPersonalities.h"
28 #include "llvm/Analysis/TargetLibraryInfo.h"
29 #include "llvm/IR/CFG.h"
30 #include "llvm/IR/DebugInfo.h"
31 #include "llvm/IR/DebugLoc.h"
32 #include "llvm/IR/IRBuilder.h"
33 #include "llvm/IR/InstIterator.h"
34 #include "llvm/IR/Instructions.h"
35 #include "llvm/IR/IntrinsicInst.h"
36 #include "llvm/IR/Module.h"
37 #include "llvm/InitializePasses.h"
38 #include "llvm/Pass.h"
39 #include "llvm/Support/CRC.h"
40 #include "llvm/Support/CommandLine.h"
41 #include "llvm/Support/Debug.h"
42 #include "llvm/Support/FileSystem.h"
43 #include "llvm/Support/Path.h"
44 #include "llvm/Support/Regex.h"
45 #include "llvm/Support/raw_ostream.h"
46 #include "llvm/Transforms/Instrumentation.h"
47 #include "llvm/Transforms/Instrumentation/GCOVProfiler.h"
48 #include "llvm/Transforms/Utils/ModuleUtils.h"
49 #include <algorithm>
50 #include <memory>
51 #include <string>
52 #include <utility>
54 using namespace llvm;
55 namespace endian = llvm::support::endian;
57 #define DEBUG_TYPE "insert-gcov-profiling"
59 enum : uint32_t {
60 GCOV_ARC_ON_TREE = 1 << 0,
62 GCOV_TAG_FUNCTION = 0x01000000,
63 GCOV_TAG_BLOCKS = 0x01410000,
64 GCOV_TAG_ARCS = 0x01430000,
65 GCOV_TAG_LINES = 0x01450000,
68 static cl::opt<std::string> DefaultGCOVVersion("default-gcov-version",
69 cl::init("408*"), cl::Hidden,
70 cl::ValueRequired);
72 static cl::opt<bool> AtomicCounter("gcov-atomic-counter", cl::Hidden,
73 cl::desc("Make counter updates atomic"));
75 // Returns the number of words which will be used to represent this string.
76 static unsigned wordsOfString(StringRef s) {
77 // Length + NUL-terminated string + 0~3 padding NULs.
78 return (s.size() / 4) + 2;
81 GCOVOptions GCOVOptions::getDefault() {
82 GCOVOptions Options;
83 Options.EmitNotes = true;
84 Options.EmitData = true;
85 Options.NoRedZone = false;
86 Options.Atomic = AtomicCounter;
88 if (DefaultGCOVVersion.size() != 4) {
89 llvm::report_fatal_error(std::string("Invalid -default-gcov-version: ") +
90 DefaultGCOVVersion);
92 memcpy(Options.Version, DefaultGCOVVersion.c_str(), 4);
93 return Options;
96 namespace {
97 class GCOVFunction;
99 class GCOVProfiler {
100 public:
101 GCOVProfiler() : GCOVProfiler(GCOVOptions::getDefault()) {}
102 GCOVProfiler(const GCOVOptions &Opts) : Options(Opts) {}
103 bool
104 runOnModule(Module &M, function_ref<BlockFrequencyInfo *(Function &F)> GetBFI,
105 function_ref<BranchProbabilityInfo *(Function &F)> GetBPI,
106 std::function<const TargetLibraryInfo &(Function &F)> GetTLI);
108 void write(uint32_t i) {
109 char Bytes[4];
110 endian::write32(Bytes, i, Endian);
111 os->write(Bytes, 4);
113 void writeString(StringRef s) {
114 write(wordsOfString(s) - 1);
115 os->write(s.data(), s.size());
116 os->write_zeros(4 - s.size() % 4);
118 void writeBytes(const char *Bytes, int Size) { os->write(Bytes, Size); }
120 private:
121 // Create the .gcno files for the Module based on DebugInfo.
122 bool
123 emitProfileNotes(NamedMDNode *CUNode, bool HasExecOrFork,
124 function_ref<BlockFrequencyInfo *(Function &F)> GetBFI,
125 function_ref<BranchProbabilityInfo *(Function &F)> GetBPI,
126 function_ref<const TargetLibraryInfo &(Function &F)> GetTLI);
128 Function *createInternalFunction(FunctionType *FTy, StringRef Name);
129 void emitGlobalConstructor(
130 SmallVectorImpl<std::pair<GlobalVariable *, MDNode *>> &CountersBySP);
132 bool isFunctionInstrumented(const Function &F);
133 std::vector<Regex> createRegexesFromString(StringRef RegexesStr);
134 static bool doesFilenameMatchARegex(StringRef Filename,
135 std::vector<Regex> &Regexes);
137 // Get pointers to the functions in the runtime library.
138 FunctionCallee getStartFileFunc(const TargetLibraryInfo *TLI);
139 FunctionCallee getEmitFunctionFunc(const TargetLibraryInfo *TLI);
140 FunctionCallee getEmitArcsFunc(const TargetLibraryInfo *TLI);
141 FunctionCallee getSummaryInfoFunc();
142 FunctionCallee getEndFileFunc();
144 // Add the function to write out all our counters to the global destructor
145 // list.
146 Function *
147 insertCounterWriteout(ArrayRef<std::pair<GlobalVariable *, MDNode *>>);
148 Function *insertReset(ArrayRef<std::pair<GlobalVariable *, MDNode *>>);
150 bool AddFlushBeforeForkAndExec();
152 enum class GCovFileType { GCNO, GCDA };
153 std::string mangleName(const DICompileUnit *CU, GCovFileType FileType);
155 GCOVOptions Options;
156 support::endianness Endian;
157 raw_ostream *os;
159 // Checksum, produced by hash of EdgeDestinations
160 SmallVector<uint32_t, 4> FileChecksums;
162 Module *M = nullptr;
163 std::function<const TargetLibraryInfo &(Function &F)> GetTLI;
164 LLVMContext *Ctx = nullptr;
165 SmallVector<std::unique_ptr<GCOVFunction>, 16> Funcs;
166 std::vector<Regex> FilterRe;
167 std::vector<Regex> ExcludeRe;
168 DenseSet<const BasicBlock *> ExecBlocks;
169 StringMap<bool> InstrumentedFiles;
172 class GCOVProfilerLegacyPass : public ModulePass {
173 public:
174 static char ID;
175 GCOVProfilerLegacyPass()
176 : GCOVProfilerLegacyPass(GCOVOptions::getDefault()) {}
177 GCOVProfilerLegacyPass(const GCOVOptions &Opts)
178 : ModulePass(ID), Profiler(Opts) {
179 initializeGCOVProfilerLegacyPassPass(*PassRegistry::getPassRegistry());
181 StringRef getPassName() const override { return "GCOV Profiler"; }
183 bool runOnModule(Module &M) override {
184 auto GetBFI = [this](Function &F) {
185 return &this->getAnalysis<BlockFrequencyInfoWrapperPass>(F).getBFI();
187 auto GetBPI = [this](Function &F) {
188 return &this->getAnalysis<BranchProbabilityInfoWrapperPass>(F).getBPI();
190 auto GetTLI = [this](Function &F) -> const TargetLibraryInfo & {
191 return this->getAnalysis<TargetLibraryInfoWrapperPass>().getTLI(F);
193 return Profiler.runOnModule(M, GetBFI, GetBPI, GetTLI);
196 void getAnalysisUsage(AnalysisUsage &AU) const override {
197 AU.addRequired<BlockFrequencyInfoWrapperPass>();
198 AU.addRequired<TargetLibraryInfoWrapperPass>();
201 private:
202 GCOVProfiler Profiler;
205 struct BBInfo {
206 BBInfo *Group;
207 uint32_t Index;
208 uint32_t Rank = 0;
210 BBInfo(unsigned Index) : Group(this), Index(Index) {}
211 std::string infoString() const {
212 return (Twine("Index=") + Twine(Index)).str();
216 struct Edge {
217 // This class implements the CFG edges. Note the CFG can be a multi-graph.
218 // So there might be multiple edges with same SrcBB and DestBB.
219 const BasicBlock *SrcBB;
220 const BasicBlock *DestBB;
221 uint64_t Weight;
222 BasicBlock *Place = nullptr;
223 uint32_t SrcNumber, DstNumber;
224 bool InMST = false;
225 bool Removed = false;
226 bool IsCritical = false;
228 Edge(const BasicBlock *Src, const BasicBlock *Dest, uint64_t W = 1)
229 : SrcBB(Src), DestBB(Dest), Weight(W) {}
231 // Return the information string of an edge.
232 std::string infoString() const {
233 return (Twine(Removed ? "-" : " ") + (InMST ? " " : "*") +
234 (IsCritical ? "c" : " ") + " W=" + Twine(Weight))
235 .str();
240 char GCOVProfilerLegacyPass::ID = 0;
241 INITIALIZE_PASS_BEGIN(
242 GCOVProfilerLegacyPass, "insert-gcov-profiling",
243 "Insert instrumentation for GCOV profiling", false, false)
244 INITIALIZE_PASS_DEPENDENCY(BlockFrequencyInfoWrapperPass)
245 INITIALIZE_PASS_DEPENDENCY(BranchProbabilityInfoWrapperPass)
246 INITIALIZE_PASS_DEPENDENCY(TargetLibraryInfoWrapperPass)
247 INITIALIZE_PASS_END(
248 GCOVProfilerLegacyPass, "insert-gcov-profiling",
249 "Insert instrumentation for GCOV profiling", false, false)
251 ModulePass *llvm::createGCOVProfilerPass(const GCOVOptions &Options) {
252 return new GCOVProfilerLegacyPass(Options);
255 static StringRef getFunctionName(const DISubprogram *SP) {
256 if (!SP->getLinkageName().empty())
257 return SP->getLinkageName();
258 return SP->getName();
261 /// Extract a filename for a DISubprogram.
263 /// Prefer relative paths in the coverage notes. Clang also may split
264 /// up absolute paths into a directory and filename component. When
265 /// the relative path doesn't exist, reconstruct the absolute path.
266 static SmallString<128> getFilename(const DISubprogram *SP) {
267 SmallString<128> Path;
268 StringRef RelPath = SP->getFilename();
269 if (sys::fs::exists(RelPath))
270 Path = RelPath;
271 else
272 sys::path::append(Path, SP->getDirectory(), SP->getFilename());
273 return Path;
276 namespace {
277 class GCOVRecord {
278 protected:
279 GCOVProfiler *P;
281 GCOVRecord(GCOVProfiler *P) : P(P) {}
283 void write(uint32_t i) { P->write(i); }
284 void writeString(StringRef s) { P->writeString(s); }
285 void writeBytes(const char *Bytes, int Size) { P->writeBytes(Bytes, Size); }
288 class GCOVFunction;
289 class GCOVBlock;
291 // Constructed only by requesting it from a GCOVBlock, this object stores a
292 // list of line numbers and a single filename, representing lines that belong
293 // to the block.
294 class GCOVLines : public GCOVRecord {
295 public:
296 void addLine(uint32_t Line) {
297 assert(Line != 0 && "Line zero is not a valid real line number.");
298 Lines.push_back(Line);
301 uint32_t length() const {
302 return 1 + wordsOfString(Filename) + Lines.size();
305 void writeOut() {
306 write(0);
307 writeString(Filename);
308 for (int i = 0, e = Lines.size(); i != e; ++i)
309 write(Lines[i]);
312 GCOVLines(GCOVProfiler *P, StringRef F)
313 : GCOVRecord(P), Filename(std::string(F)) {}
315 private:
316 std::string Filename;
317 SmallVector<uint32_t, 32> Lines;
321 // Represent a basic block in GCOV. Each block has a unique number in the
322 // function, number of lines belonging to each block, and a set of edges to
323 // other blocks.
324 class GCOVBlock : public GCOVRecord {
325 public:
326 GCOVLines &getFile(StringRef Filename) {
327 return LinesByFile.try_emplace(Filename, P, Filename).first->second;
330 void addEdge(GCOVBlock &Successor, uint32_t Flags) {
331 OutEdges.emplace_back(&Successor, Flags);
334 void writeOut() {
335 uint32_t Len = 3;
336 SmallVector<StringMapEntry<GCOVLines> *, 32> SortedLinesByFile;
337 for (auto &I : LinesByFile) {
338 Len += I.second.length();
339 SortedLinesByFile.push_back(&I);
342 write(GCOV_TAG_LINES);
343 write(Len);
344 write(Number);
346 llvm::sort(SortedLinesByFile, [](StringMapEntry<GCOVLines> *LHS,
347 StringMapEntry<GCOVLines> *RHS) {
348 return LHS->getKey() < RHS->getKey();
350 for (auto &I : SortedLinesByFile)
351 I->getValue().writeOut();
352 write(0);
353 write(0);
356 GCOVBlock(const GCOVBlock &RHS) : GCOVRecord(RHS), Number(RHS.Number) {
357 // Only allow copy before edges and lines have been added. After that,
358 // there are inter-block pointers (eg: edges) that won't take kindly to
359 // blocks being copied or moved around.
360 assert(LinesByFile.empty());
361 assert(OutEdges.empty());
364 uint32_t Number;
365 SmallVector<std::pair<GCOVBlock *, uint32_t>, 4> OutEdges;
367 private:
368 friend class GCOVFunction;
370 GCOVBlock(GCOVProfiler *P, uint32_t Number)
371 : GCOVRecord(P), Number(Number) {}
373 StringMap<GCOVLines> LinesByFile;
376 // A function has a unique identifier, a checksum (we leave as zero) and a
377 // set of blocks and a map of edges between blocks. This is the only GCOV
378 // object users can construct, the blocks and lines will be rooted here.
379 class GCOVFunction : public GCOVRecord {
380 public:
381 GCOVFunction(GCOVProfiler *P, Function *F, const DISubprogram *SP,
382 unsigned EndLine, uint32_t Ident, int Version)
383 : GCOVRecord(P), SP(SP), EndLine(EndLine), Ident(Ident),
384 Version(Version), EntryBlock(P, 0), ReturnBlock(P, 1) {
385 LLVM_DEBUG(dbgs() << "Function: " << getFunctionName(SP) << "\n");
386 bool ExitBlockBeforeBody = Version >= 48;
387 uint32_t i = ExitBlockBeforeBody ? 2 : 1;
388 for (BasicBlock &BB : *F)
389 Blocks.insert(std::make_pair(&BB, GCOVBlock(P, i++)));
390 if (!ExitBlockBeforeBody)
391 ReturnBlock.Number = i;
393 std::string FunctionNameAndLine;
394 raw_string_ostream FNLOS(FunctionNameAndLine);
395 FNLOS << getFunctionName(SP) << SP->getLine();
396 FNLOS.flush();
397 FuncChecksum = hash_value(FunctionNameAndLine);
400 GCOVBlock &getBlock(const BasicBlock *BB) {
401 return Blocks.find(const_cast<BasicBlock *>(BB))->second;
404 GCOVBlock &getEntryBlock() { return EntryBlock; }
405 GCOVBlock &getReturnBlock() {
406 return ReturnBlock;
409 uint32_t getFuncChecksum() const {
410 return FuncChecksum;
413 void writeOut(uint32_t CfgChecksum) {
414 write(GCOV_TAG_FUNCTION);
415 SmallString<128> Filename = getFilename(SP);
416 uint32_t BlockLen =
417 2 + (Version >= 47) + wordsOfString(getFunctionName(SP));
418 if (Version < 80)
419 BlockLen += wordsOfString(Filename) + 1;
420 else
421 BlockLen += 1 + wordsOfString(Filename) + 3 + (Version >= 90);
423 write(BlockLen);
424 write(Ident);
425 write(FuncChecksum);
426 if (Version >= 47)
427 write(CfgChecksum);
428 writeString(getFunctionName(SP));
429 if (Version < 80) {
430 writeString(Filename);
431 write(SP->getLine());
432 } else {
433 write(SP->isArtificial()); // artificial
434 writeString(Filename);
435 write(SP->getLine()); // start_line
436 write(0); // start_column
437 // EndLine is the last line with !dbg. It is not the } line as in GCC,
438 // but good enough.
439 write(EndLine);
440 if (Version >= 90)
441 write(0); // end_column
444 // Emit count of blocks.
445 write(GCOV_TAG_BLOCKS);
446 if (Version < 80) {
447 write(Blocks.size() + 2);
448 for (int i = Blocks.size() + 2; i; --i)
449 write(0);
450 } else {
451 write(1);
452 write(Blocks.size() + 2);
454 LLVM_DEBUG(dbgs() << (Blocks.size() + 1) << " blocks\n");
456 // Emit edges between blocks.
457 const uint32_t Outgoing = EntryBlock.OutEdges.size();
458 if (Outgoing) {
459 write(GCOV_TAG_ARCS);
460 write(Outgoing * 2 + 1);
461 write(EntryBlock.Number);
462 for (const auto &E : EntryBlock.OutEdges) {
463 write(E.first->Number);
464 write(E.second);
467 for (auto &It : Blocks) {
468 const GCOVBlock &Block = It.second;
469 if (Block.OutEdges.empty()) continue;
471 write(GCOV_TAG_ARCS);
472 write(Block.OutEdges.size() * 2 + 1);
473 write(Block.Number);
474 for (const auto &E : Block.OutEdges) {
475 write(E.first->Number);
476 write(E.second);
480 // Emit lines for each block.
481 for (auto &It : Blocks)
482 It.second.writeOut();
485 public:
486 const DISubprogram *SP;
487 unsigned EndLine;
488 uint32_t Ident;
489 uint32_t FuncChecksum;
490 int Version;
491 MapVector<BasicBlock *, GCOVBlock> Blocks;
492 GCOVBlock EntryBlock;
493 GCOVBlock ReturnBlock;
497 // RegexesStr is a string containing differents regex separated by a semi-colon.
498 // For example "foo\..*$;bar\..*$".
499 std::vector<Regex> GCOVProfiler::createRegexesFromString(StringRef RegexesStr) {
500 std::vector<Regex> Regexes;
501 while (!RegexesStr.empty()) {
502 std::pair<StringRef, StringRef> HeadTail = RegexesStr.split(';');
503 if (!HeadTail.first.empty()) {
504 Regex Re(HeadTail.first);
505 std::string Err;
506 if (!Re.isValid(Err)) {
507 Ctx->emitError(Twine("Regex ") + HeadTail.first +
508 " is not valid: " + Err);
510 Regexes.emplace_back(std::move(Re));
512 RegexesStr = HeadTail.second;
514 return Regexes;
517 bool GCOVProfiler::doesFilenameMatchARegex(StringRef Filename,
518 std::vector<Regex> &Regexes) {
519 for (Regex &Re : Regexes)
520 if (Re.match(Filename))
521 return true;
522 return false;
525 bool GCOVProfiler::isFunctionInstrumented(const Function &F) {
526 if (FilterRe.empty() && ExcludeRe.empty()) {
527 return true;
529 SmallString<128> Filename = getFilename(F.getSubprogram());
530 auto It = InstrumentedFiles.find(Filename);
531 if (It != InstrumentedFiles.end()) {
532 return It->second;
535 SmallString<256> RealPath;
536 StringRef RealFilename;
538 // Path can be
539 // /usr/lib/gcc/x86_64-linux-gnu/8/../../../../include/c++/8/bits/*.h so for
540 // such a case we must get the real_path.
541 if (sys::fs::real_path(Filename, RealPath)) {
542 // real_path can fail with path like "foo.c".
543 RealFilename = Filename;
544 } else {
545 RealFilename = RealPath;
548 bool ShouldInstrument;
549 if (FilterRe.empty()) {
550 ShouldInstrument = !doesFilenameMatchARegex(RealFilename, ExcludeRe);
551 } else if (ExcludeRe.empty()) {
552 ShouldInstrument = doesFilenameMatchARegex(RealFilename, FilterRe);
553 } else {
554 ShouldInstrument = doesFilenameMatchARegex(RealFilename, FilterRe) &&
555 !doesFilenameMatchARegex(RealFilename, ExcludeRe);
557 InstrumentedFiles[Filename] = ShouldInstrument;
558 return ShouldInstrument;
561 std::string GCOVProfiler::mangleName(const DICompileUnit *CU,
562 GCovFileType OutputType) {
563 bool Notes = OutputType == GCovFileType::GCNO;
565 if (NamedMDNode *GCov = M->getNamedMetadata("llvm.gcov")) {
566 for (int i = 0, e = GCov->getNumOperands(); i != e; ++i) {
567 MDNode *N = GCov->getOperand(i);
568 bool ThreeElement = N->getNumOperands() == 3;
569 if (!ThreeElement && N->getNumOperands() != 2)
570 continue;
571 if (dyn_cast<MDNode>(N->getOperand(ThreeElement ? 2 : 1)) != CU)
572 continue;
574 if (ThreeElement) {
575 // These nodes have no mangling to apply, it's stored mangled in the
576 // bitcode.
577 MDString *NotesFile = dyn_cast<MDString>(N->getOperand(0));
578 MDString *DataFile = dyn_cast<MDString>(N->getOperand(1));
579 if (!NotesFile || !DataFile)
580 continue;
581 return std::string(Notes ? NotesFile->getString()
582 : DataFile->getString());
585 MDString *GCovFile = dyn_cast<MDString>(N->getOperand(0));
586 if (!GCovFile)
587 continue;
589 SmallString<128> Filename = GCovFile->getString();
590 sys::path::replace_extension(Filename, Notes ? "gcno" : "gcda");
591 return std::string(Filename.str());
595 SmallString<128> Filename = CU->getFilename();
596 sys::path::replace_extension(Filename, Notes ? "gcno" : "gcda");
597 StringRef FName = sys::path::filename(Filename);
598 SmallString<128> CurPath;
599 if (sys::fs::current_path(CurPath))
600 return std::string(FName);
601 sys::path::append(CurPath, FName);
602 return std::string(CurPath.str());
605 bool GCOVProfiler::runOnModule(
606 Module &M, function_ref<BlockFrequencyInfo *(Function &F)> GetBFI,
607 function_ref<BranchProbabilityInfo *(Function &F)> GetBPI,
608 std::function<const TargetLibraryInfo &(Function &F)> GetTLI) {
609 this->M = &M;
610 this->GetTLI = std::move(GetTLI);
611 Ctx = &M.getContext();
613 NamedMDNode *CUNode = M.getNamedMetadata("llvm.dbg.cu");
614 if (!CUNode || (!Options.EmitNotes && !Options.EmitData))
615 return false;
617 bool HasExecOrFork = AddFlushBeforeForkAndExec();
619 FilterRe = createRegexesFromString(Options.Filter);
620 ExcludeRe = createRegexesFromString(Options.Exclude);
621 emitProfileNotes(CUNode, HasExecOrFork, GetBFI, GetBPI, this->GetTLI);
622 return true;
625 PreservedAnalyses GCOVProfilerPass::run(Module &M,
626 ModuleAnalysisManager &AM) {
628 GCOVProfiler Profiler(GCOVOpts);
629 FunctionAnalysisManager &FAM =
630 AM.getResult<FunctionAnalysisManagerModuleProxy>(M).getManager();
632 auto GetBFI = [&FAM](Function &F) {
633 return &FAM.getResult<BlockFrequencyAnalysis>(F);
635 auto GetBPI = [&FAM](Function &F) {
636 return &FAM.getResult<BranchProbabilityAnalysis>(F);
638 auto GetTLI = [&FAM](Function &F) -> const TargetLibraryInfo & {
639 return FAM.getResult<TargetLibraryAnalysis>(F);
642 if (!Profiler.runOnModule(M, GetBFI, GetBPI, GetTLI))
643 return PreservedAnalyses::all();
645 return PreservedAnalyses::none();
648 static bool functionHasLines(const Function &F, unsigned &EndLine) {
649 // Check whether this function actually has any source lines. Not only
650 // do these waste space, they also can crash gcov.
651 EndLine = 0;
652 for (auto &BB : F) {
653 for (auto &I : BB) {
654 // Debug intrinsic locations correspond to the location of the
655 // declaration, not necessarily any statements or expressions.
656 if (isa<DbgInfoIntrinsic>(&I)) continue;
658 const DebugLoc &Loc = I.getDebugLoc();
659 if (!Loc)
660 continue;
662 // Artificial lines such as calls to the global constructors.
663 if (Loc.getLine() == 0) continue;
664 EndLine = std::max(EndLine, Loc.getLine());
666 return true;
669 return false;
672 static bool isUsingScopeBasedEH(Function &F) {
673 if (!F.hasPersonalityFn()) return false;
675 EHPersonality Personality = classifyEHPersonality(F.getPersonalityFn());
676 return isScopedEHPersonality(Personality);
679 bool GCOVProfiler::AddFlushBeforeForkAndExec() {
680 SmallVector<CallInst *, 2> Forks;
681 SmallVector<CallInst *, 2> Execs;
682 for (auto &F : M->functions()) {
683 auto *TLI = &GetTLI(F);
684 for (auto &I : instructions(F)) {
685 if (CallInst *CI = dyn_cast<CallInst>(&I)) {
686 if (Function *Callee = CI->getCalledFunction()) {
687 LibFunc LF;
688 if (TLI->getLibFunc(*Callee, LF)) {
689 if (LF == LibFunc_fork) {
690 #if !defined(_WIN32)
691 Forks.push_back(CI);
692 #endif
693 } else if (LF == LibFunc_execl || LF == LibFunc_execle ||
694 LF == LibFunc_execlp || LF == LibFunc_execv ||
695 LF == LibFunc_execvp || LF == LibFunc_execve ||
696 LF == LibFunc_execvpe || LF == LibFunc_execvP) {
697 Execs.push_back(CI);
705 for (auto F : Forks) {
706 IRBuilder<> Builder(F);
707 BasicBlock *Parent = F->getParent();
708 auto NextInst = ++F->getIterator();
710 // We've a fork so just reset the counters in the child process
711 FunctionType *FTy = FunctionType::get(Builder.getInt32Ty(), {}, false);
712 FunctionCallee GCOVFork = M->getOrInsertFunction("__gcov_fork", FTy);
713 F->setCalledFunction(GCOVFork);
715 // We split just after the fork to have a counter for the lines after
716 // Anyway there's a bug:
717 // void foo() { fork(); }
718 // void bar() { foo(); blah(); }
719 // then "blah();" will be called 2 times but showed as 1
720 // because "blah()" belongs to the same block as "foo();"
721 Parent->splitBasicBlock(NextInst);
723 // back() is a br instruction with a debug location
724 // equals to the one from NextAfterFork
725 // So to avoid to have two debug locs on two blocks just change it
726 DebugLoc Loc = F->getDebugLoc();
727 Parent->back().setDebugLoc(Loc);
730 for (auto E : Execs) {
731 IRBuilder<> Builder(E);
732 BasicBlock *Parent = E->getParent();
733 auto NextInst = ++E->getIterator();
735 // Since the process is replaced by a new one we need to write out gcdas
736 // No need to reset the counters since they'll be lost after the exec**
737 FunctionType *FTy = FunctionType::get(Builder.getVoidTy(), {}, false);
738 FunctionCallee WriteoutF =
739 M->getOrInsertFunction("llvm_writeout_files", FTy);
740 Builder.CreateCall(WriteoutF);
742 DebugLoc Loc = E->getDebugLoc();
743 Builder.SetInsertPoint(&*NextInst);
744 // If the exec** fails we must reset the counters since they've been
745 // dumped
746 FunctionCallee ResetF = M->getOrInsertFunction("llvm_reset_counters", FTy);
747 Builder.CreateCall(ResetF)->setDebugLoc(Loc);
748 ExecBlocks.insert(Parent);
749 Parent->splitBasicBlock(NextInst);
750 Parent->back().setDebugLoc(Loc);
753 return !Forks.empty() || !Execs.empty();
756 static BasicBlock *getInstrBB(CFGMST<Edge, BBInfo> &MST, Edge &E,
757 const DenseSet<const BasicBlock *> &ExecBlocks) {
758 if (E.InMST || E.Removed)
759 return nullptr;
761 BasicBlock *SrcBB = const_cast<BasicBlock *>(E.SrcBB);
762 BasicBlock *DestBB = const_cast<BasicBlock *>(E.DestBB);
763 // For a fake edge, instrument the real BB.
764 if (SrcBB == nullptr)
765 return DestBB;
766 if (DestBB == nullptr)
767 return SrcBB;
769 auto CanInstrument = [](BasicBlock *BB) -> BasicBlock * {
770 // There are basic blocks (such as catchswitch) cannot be instrumented.
771 // If the returned first insertion point is the end of BB, skip this BB.
772 if (BB->getFirstInsertionPt() == BB->end())
773 return nullptr;
774 return BB;
777 // Instrument the SrcBB if it has a single successor,
778 // otherwise, the DestBB if this is not a critical edge.
779 Instruction *TI = SrcBB->getTerminator();
780 if (TI->getNumSuccessors() <= 1 && !ExecBlocks.count(SrcBB))
781 return CanInstrument(SrcBB);
782 if (!E.IsCritical)
783 return CanInstrument(DestBB);
785 // Some IndirectBr critical edges cannot be split by the previous
786 // SplitIndirectBrCriticalEdges call. Bail out.
787 const unsigned SuccNum = GetSuccessorNumber(SrcBB, DestBB);
788 BasicBlock *InstrBB =
789 isa<IndirectBrInst>(TI) ? nullptr : SplitCriticalEdge(TI, SuccNum);
790 if (!InstrBB)
791 return nullptr;
793 MST.addEdge(SrcBB, InstrBB, 0);
794 MST.addEdge(InstrBB, DestBB, 0).InMST = true;
795 E.Removed = true;
797 return CanInstrument(InstrBB);
800 #ifndef NDEBUG
801 static void dumpEdges(CFGMST<Edge, BBInfo> &MST, GCOVFunction &GF) {
802 size_t ID = 0;
803 for (auto &E : make_pointee_range(MST.AllEdges)) {
804 GCOVBlock &Src = E.SrcBB ? GF.getBlock(E.SrcBB) : GF.getEntryBlock();
805 GCOVBlock &Dst = E.DestBB ? GF.getBlock(E.DestBB) : GF.getReturnBlock();
806 dbgs() << " Edge " << ID++ << ": " << Src.Number << "->" << Dst.Number
807 << E.infoString() << "\n";
810 #endif
812 bool GCOVProfiler::emitProfileNotes(
813 NamedMDNode *CUNode, bool HasExecOrFork,
814 function_ref<BlockFrequencyInfo *(Function &F)> GetBFI,
815 function_ref<BranchProbabilityInfo *(Function &F)> GetBPI,
816 function_ref<const TargetLibraryInfo &(Function &F)> GetTLI) {
817 int Version;
819 uint8_t c3 = Options.Version[0];
820 uint8_t c2 = Options.Version[1];
821 uint8_t c1 = Options.Version[2];
822 Version = c3 >= 'A' ? (c3 - 'A') * 100 + (c2 - '0') * 10 + c1 - '0'
823 : (c3 - '0') * 10 + c1 - '0';
826 bool EmitGCDA = Options.EmitData;
827 for (unsigned i = 0, e = CUNode->getNumOperands(); i != e; ++i) {
828 // Each compile unit gets its own .gcno file. This means that whether we run
829 // this pass over the original .o's as they're produced, or run it after
830 // LTO, we'll generate the same .gcno files.
832 auto *CU = cast<DICompileUnit>(CUNode->getOperand(i));
834 // Skip module skeleton (and module) CUs.
835 if (CU->getDWOId())
836 continue;
838 std::vector<uint8_t> EdgeDestinations;
839 SmallVector<std::pair<GlobalVariable *, MDNode *>, 8> CountersBySP;
841 Endian = M->getDataLayout().isLittleEndian() ? support::endianness::little
842 : support::endianness::big;
843 unsigned FunctionIdent = 0;
844 for (auto &F : M->functions()) {
845 DISubprogram *SP = F.getSubprogram();
846 unsigned EndLine;
847 if (!SP) continue;
848 if (!functionHasLines(F, EndLine) || !isFunctionInstrumented(F))
849 continue;
850 // TODO: Functions using scope-based EH are currently not supported.
851 if (isUsingScopeBasedEH(F)) continue;
852 if (F.hasFnAttribute(llvm::Attribute::NoProfile))
853 continue;
855 // Add the function line number to the lines of the entry block
856 // to have a counter for the function definition.
857 uint32_t Line = SP->getLine();
858 auto Filename = getFilename(SP);
860 BranchProbabilityInfo *BPI = GetBPI(F);
861 BlockFrequencyInfo *BFI = GetBFI(F);
863 // Split indirectbr critical edges here before computing the MST rather
864 // than later in getInstrBB() to avoid invalidating it.
865 SplitIndirectBrCriticalEdges(F, BPI, BFI);
867 CFGMST<Edge, BBInfo> MST(F, /*InstrumentFuncEntry_=*/false, BPI, BFI);
869 // getInstrBB can split basic blocks and push elements to AllEdges.
870 for (size_t I : llvm::seq<size_t>(0, MST.AllEdges.size())) {
871 auto &E = *MST.AllEdges[I];
872 // For now, disable spanning tree optimization when fork or exec* is
873 // used.
874 if (HasExecOrFork)
875 E.InMST = false;
876 E.Place = getInstrBB(MST, E, ExecBlocks);
878 // Basic blocks in F are finalized at this point.
879 BasicBlock &EntryBlock = F.getEntryBlock();
880 Funcs.push_back(std::make_unique<GCOVFunction>(this, &F, SP, EndLine,
881 FunctionIdent++, Version));
882 GCOVFunction &Func = *Funcs.back();
884 // Some non-tree edges are IndirectBr which cannot be split. Ignore them
885 // as well.
886 llvm::erase_if(MST.AllEdges, [](std::unique_ptr<Edge> &E) {
887 return E->Removed || (!E->InMST && !E->Place);
889 const size_t Measured =
890 std::stable_partition(
891 MST.AllEdges.begin(), MST.AllEdges.end(),
892 [](std::unique_ptr<Edge> &E) { return E->Place; }) -
893 MST.AllEdges.begin();
894 for (size_t I : llvm::seq<size_t>(0, Measured)) {
895 Edge &E = *MST.AllEdges[I];
896 GCOVBlock &Src =
897 E.SrcBB ? Func.getBlock(E.SrcBB) : Func.getEntryBlock();
898 GCOVBlock &Dst =
899 E.DestBB ? Func.getBlock(E.DestBB) : Func.getReturnBlock();
900 E.SrcNumber = Src.Number;
901 E.DstNumber = Dst.Number;
903 std::stable_sort(
904 MST.AllEdges.begin(), MST.AllEdges.begin() + Measured,
905 [](const std::unique_ptr<Edge> &L, const std::unique_ptr<Edge> &R) {
906 return L->SrcNumber != R->SrcNumber ? L->SrcNumber < R->SrcNumber
907 : L->DstNumber < R->DstNumber;
910 for (const Edge &E : make_pointee_range(MST.AllEdges)) {
911 GCOVBlock &Src =
912 E.SrcBB ? Func.getBlock(E.SrcBB) : Func.getEntryBlock();
913 GCOVBlock &Dst =
914 E.DestBB ? Func.getBlock(E.DestBB) : Func.getReturnBlock();
915 Src.addEdge(Dst, E.Place ? 0 : uint32_t(GCOV_ARC_ON_TREE));
918 // Artificial functions such as global initializers
919 if (!SP->isArtificial())
920 Func.getBlock(&EntryBlock).getFile(Filename).addLine(Line);
922 LLVM_DEBUG(dumpEdges(MST, Func));
924 for (auto &GB : Func.Blocks) {
925 const BasicBlock &BB = *GB.first;
926 auto &Block = GB.second;
927 for (auto Succ : Block.OutEdges) {
928 uint32_t Idx = Succ.first->Number;
929 do EdgeDestinations.push_back(Idx & 255);
930 while ((Idx >>= 8) > 0);
933 for (auto &I : BB) {
934 // Debug intrinsic locations correspond to the location of the
935 // declaration, not necessarily any statements or expressions.
936 if (isa<DbgInfoIntrinsic>(&I)) continue;
938 const DebugLoc &Loc = I.getDebugLoc();
939 if (!Loc)
940 continue;
942 // Artificial lines such as calls to the global constructors.
943 if (Loc.getLine() == 0 || Loc.isImplicitCode())
944 continue;
946 if (Line == Loc.getLine()) continue;
947 Line = Loc.getLine();
948 if (SP != getDISubprogram(Loc.getScope()))
949 continue;
951 GCOVLines &Lines = Block.getFile(Filename);
952 Lines.addLine(Loc.getLine());
954 Line = 0;
956 if (EmitGCDA) {
957 DISubprogram *SP = F.getSubprogram();
958 ArrayType *CounterTy = ArrayType::get(Type::getInt64Ty(*Ctx), Measured);
959 GlobalVariable *Counters = new GlobalVariable(
960 *M, CounterTy, false, GlobalValue::InternalLinkage,
961 Constant::getNullValue(CounterTy), "__llvm_gcov_ctr");
962 CountersBySP.emplace_back(Counters, SP);
964 for (size_t I : llvm::seq<size_t>(0, Measured)) {
965 const Edge &E = *MST.AllEdges[I];
966 IRBuilder<> Builder(E.Place, E.Place->getFirstInsertionPt());
967 Value *V = Builder.CreateConstInBoundsGEP2_64(
968 Counters->getValueType(), Counters, 0, I);
969 if (Options.Atomic) {
970 Builder.CreateAtomicRMW(AtomicRMWInst::Add, V, Builder.getInt64(1),
971 MaybeAlign(), AtomicOrdering::Monotonic);
972 } else {
973 Value *Count =
974 Builder.CreateLoad(Builder.getInt64Ty(), V, "gcov_ctr");
975 Count = Builder.CreateAdd(Count, Builder.getInt64(1));
976 Builder.CreateStore(Count, V);
982 char Tmp[4];
983 JamCRC JC;
984 JC.update(EdgeDestinations);
985 uint32_t Stamp = JC.getCRC();
986 FileChecksums.push_back(Stamp);
988 if (Options.EmitNotes) {
989 std::error_code EC;
990 raw_fd_ostream out(mangleName(CU, GCovFileType::GCNO), EC,
991 sys::fs::OF_None);
992 if (EC) {
993 Ctx->emitError(
994 Twine("failed to open coverage notes file for writing: ") +
995 EC.message());
996 continue;
998 os = &out;
999 if (Endian == support::endianness::big) {
1000 out.write("gcno", 4);
1001 out.write(Options.Version, 4);
1002 } else {
1003 out.write("oncg", 4);
1004 std::reverse_copy(Options.Version, Options.Version + 4, Tmp);
1005 out.write(Tmp, 4);
1007 write(Stamp);
1008 if (Version >= 90)
1009 writeString(""); // unuseful current_working_directory
1010 if (Version >= 80)
1011 write(0); // unuseful has_unexecuted_blocks
1013 for (auto &Func : Funcs)
1014 Func->writeOut(Stamp);
1016 write(0);
1017 write(0);
1018 out.close();
1021 if (EmitGCDA) {
1022 emitGlobalConstructor(CountersBySP);
1023 EmitGCDA = false;
1026 return true;
1029 Function *GCOVProfiler::createInternalFunction(FunctionType *FTy,
1030 StringRef Name) {
1031 Function *F = Function::createWithDefaultAttr(
1032 FTy, GlobalValue::InternalLinkage, 0, Name, M);
1033 F->setUnnamedAddr(GlobalValue::UnnamedAddr::Global);
1034 F->addFnAttr(Attribute::NoUnwind);
1035 if (Options.NoRedZone)
1036 F->addFnAttr(Attribute::NoRedZone);
1037 return F;
1040 void GCOVProfiler::emitGlobalConstructor(
1041 SmallVectorImpl<std::pair<GlobalVariable *, MDNode *>> &CountersBySP) {
1042 Function *WriteoutF = insertCounterWriteout(CountersBySP);
1043 Function *ResetF = insertReset(CountersBySP);
1045 // Create a small bit of code that registers the "__llvm_gcov_writeout" to
1046 // be executed at exit and the "__llvm_gcov_reset" function to be executed
1047 // when "__gcov_flush" is called.
1048 FunctionType *FTy = FunctionType::get(Type::getVoidTy(*Ctx), false);
1049 Function *F = createInternalFunction(FTy, "__llvm_gcov_init");
1050 F->addFnAttr(Attribute::NoInline);
1052 BasicBlock *BB = BasicBlock::Create(*Ctx, "entry", F);
1053 IRBuilder<> Builder(BB);
1055 FTy = FunctionType::get(Type::getVoidTy(*Ctx), false);
1056 auto *PFTy = PointerType::get(FTy, 0);
1057 FTy = FunctionType::get(Builder.getVoidTy(), {PFTy, PFTy}, false);
1059 // Initialize the environment and register the local writeout, flush and
1060 // reset functions.
1061 FunctionCallee GCOVInit = M->getOrInsertFunction("llvm_gcov_init", FTy);
1062 Builder.CreateCall(GCOVInit, {WriteoutF, ResetF});
1063 Builder.CreateRetVoid();
1065 appendToGlobalCtors(*M, F, 0);
1068 FunctionCallee GCOVProfiler::getStartFileFunc(const TargetLibraryInfo *TLI) {
1069 Type *Args[] = {
1070 Type::getInt8PtrTy(*Ctx), // const char *orig_filename
1071 Type::getInt32Ty(*Ctx), // uint32_t version
1072 Type::getInt32Ty(*Ctx), // uint32_t checksum
1074 FunctionType *FTy = FunctionType::get(Type::getVoidTy(*Ctx), Args, false);
1075 AttributeList AL;
1076 if (auto AK = TLI->getExtAttrForI32Param(false))
1077 AL = AL.addParamAttribute(*Ctx, 2, AK);
1078 FunctionCallee Res = M->getOrInsertFunction("llvm_gcda_start_file", FTy, AL);
1079 return Res;
1082 FunctionCallee GCOVProfiler::getEmitFunctionFunc(const TargetLibraryInfo *TLI) {
1083 Type *Args[] = {
1084 Type::getInt32Ty(*Ctx), // uint32_t ident
1085 Type::getInt32Ty(*Ctx), // uint32_t func_checksum
1086 Type::getInt32Ty(*Ctx), // uint32_t cfg_checksum
1088 FunctionType *FTy = FunctionType::get(Type::getVoidTy(*Ctx), Args, false);
1089 AttributeList AL;
1090 if (auto AK = TLI->getExtAttrForI32Param(false)) {
1091 AL = AL.addParamAttribute(*Ctx, 0, AK);
1092 AL = AL.addParamAttribute(*Ctx, 1, AK);
1093 AL = AL.addParamAttribute(*Ctx, 2, AK);
1095 return M->getOrInsertFunction("llvm_gcda_emit_function", FTy);
1098 FunctionCallee GCOVProfiler::getEmitArcsFunc(const TargetLibraryInfo *TLI) {
1099 Type *Args[] = {
1100 Type::getInt32Ty(*Ctx), // uint32_t num_counters
1101 Type::getInt64PtrTy(*Ctx), // uint64_t *counters
1103 FunctionType *FTy = FunctionType::get(Type::getVoidTy(*Ctx), Args, false);
1104 AttributeList AL;
1105 if (auto AK = TLI->getExtAttrForI32Param(false))
1106 AL = AL.addParamAttribute(*Ctx, 0, AK);
1107 return M->getOrInsertFunction("llvm_gcda_emit_arcs", FTy, AL);
1110 FunctionCallee GCOVProfiler::getSummaryInfoFunc() {
1111 FunctionType *FTy = FunctionType::get(Type::getVoidTy(*Ctx), false);
1112 return M->getOrInsertFunction("llvm_gcda_summary_info", FTy);
1115 FunctionCallee GCOVProfiler::getEndFileFunc() {
1116 FunctionType *FTy = FunctionType::get(Type::getVoidTy(*Ctx), false);
1117 return M->getOrInsertFunction("llvm_gcda_end_file", FTy);
1120 Function *GCOVProfiler::insertCounterWriteout(
1121 ArrayRef<std::pair<GlobalVariable *, MDNode *> > CountersBySP) {
1122 FunctionType *WriteoutFTy = FunctionType::get(Type::getVoidTy(*Ctx), false);
1123 Function *WriteoutF = M->getFunction("__llvm_gcov_writeout");
1124 if (!WriteoutF)
1125 WriteoutF = createInternalFunction(WriteoutFTy, "__llvm_gcov_writeout");
1126 WriteoutF->addFnAttr(Attribute::NoInline);
1128 BasicBlock *BB = BasicBlock::Create(*Ctx, "entry", WriteoutF);
1129 IRBuilder<> Builder(BB);
1131 auto *TLI = &GetTLI(*WriteoutF);
1133 FunctionCallee StartFile = getStartFileFunc(TLI);
1134 FunctionCallee EmitFunction = getEmitFunctionFunc(TLI);
1135 FunctionCallee EmitArcs = getEmitArcsFunc(TLI);
1136 FunctionCallee SummaryInfo = getSummaryInfoFunc();
1137 FunctionCallee EndFile = getEndFileFunc();
1139 NamedMDNode *CUNodes = M->getNamedMetadata("llvm.dbg.cu");
1140 if (!CUNodes) {
1141 Builder.CreateRetVoid();
1142 return WriteoutF;
1145 // Collect the relevant data into a large constant data structure that we can
1146 // walk to write out everything.
1147 StructType *StartFileCallArgsTy = StructType::create(
1148 {Builder.getInt8PtrTy(), Builder.getInt32Ty(), Builder.getInt32Ty()},
1149 "start_file_args_ty");
1150 StructType *EmitFunctionCallArgsTy = StructType::create(
1151 {Builder.getInt32Ty(), Builder.getInt32Ty(), Builder.getInt32Ty()},
1152 "emit_function_args_ty");
1153 StructType *EmitArcsCallArgsTy = StructType::create(
1154 {Builder.getInt32Ty(), Builder.getInt64Ty()->getPointerTo()},
1155 "emit_arcs_args_ty");
1156 StructType *FileInfoTy =
1157 StructType::create({StartFileCallArgsTy, Builder.getInt32Ty(),
1158 EmitFunctionCallArgsTy->getPointerTo(),
1159 EmitArcsCallArgsTy->getPointerTo()},
1160 "file_info");
1162 Constant *Zero32 = Builder.getInt32(0);
1163 // Build an explicit array of two zeros for use in ConstantExpr GEP building.
1164 Constant *TwoZero32s[] = {Zero32, Zero32};
1166 SmallVector<Constant *, 8> FileInfos;
1167 for (int i : llvm::seq<int>(0, CUNodes->getNumOperands())) {
1168 auto *CU = cast<DICompileUnit>(CUNodes->getOperand(i));
1170 // Skip module skeleton (and module) CUs.
1171 if (CU->getDWOId())
1172 continue;
1174 std::string FilenameGcda = mangleName(CU, GCovFileType::GCDA);
1175 uint32_t CfgChecksum = FileChecksums.empty() ? 0 : FileChecksums[i];
1176 auto *StartFileCallArgs = ConstantStruct::get(
1177 StartFileCallArgsTy,
1178 {Builder.CreateGlobalStringPtr(FilenameGcda),
1179 Builder.getInt32(endian::read32be(Options.Version)),
1180 Builder.getInt32(CfgChecksum)});
1182 SmallVector<Constant *, 8> EmitFunctionCallArgsArray;
1183 SmallVector<Constant *, 8> EmitArcsCallArgsArray;
1184 for (int j : llvm::seq<int>(0, CountersBySP.size())) {
1185 uint32_t FuncChecksum = Funcs.empty() ? 0 : Funcs[j]->getFuncChecksum();
1186 EmitFunctionCallArgsArray.push_back(ConstantStruct::get(
1187 EmitFunctionCallArgsTy,
1188 {Builder.getInt32(j),
1189 Builder.getInt32(FuncChecksum),
1190 Builder.getInt32(CfgChecksum)}));
1192 GlobalVariable *GV = CountersBySP[j].first;
1193 unsigned Arcs = cast<ArrayType>(GV->getValueType())->getNumElements();
1194 EmitArcsCallArgsArray.push_back(ConstantStruct::get(
1195 EmitArcsCallArgsTy,
1196 {Builder.getInt32(Arcs), ConstantExpr::getInBoundsGetElementPtr(
1197 GV->getValueType(), GV, TwoZero32s)}));
1199 // Create global arrays for the two emit calls.
1200 int CountersSize = CountersBySP.size();
1201 assert(CountersSize == (int)EmitFunctionCallArgsArray.size() &&
1202 "Mismatched array size!");
1203 assert(CountersSize == (int)EmitArcsCallArgsArray.size() &&
1204 "Mismatched array size!");
1205 auto *EmitFunctionCallArgsArrayTy =
1206 ArrayType::get(EmitFunctionCallArgsTy, CountersSize);
1207 auto *EmitFunctionCallArgsArrayGV = new GlobalVariable(
1208 *M, EmitFunctionCallArgsArrayTy, /*isConstant*/ true,
1209 GlobalValue::InternalLinkage,
1210 ConstantArray::get(EmitFunctionCallArgsArrayTy,
1211 EmitFunctionCallArgsArray),
1212 Twine("__llvm_internal_gcov_emit_function_args.") + Twine(i));
1213 auto *EmitArcsCallArgsArrayTy =
1214 ArrayType::get(EmitArcsCallArgsTy, CountersSize);
1215 EmitFunctionCallArgsArrayGV->setUnnamedAddr(
1216 GlobalValue::UnnamedAddr::Global);
1217 auto *EmitArcsCallArgsArrayGV = new GlobalVariable(
1218 *M, EmitArcsCallArgsArrayTy, /*isConstant*/ true,
1219 GlobalValue::InternalLinkage,
1220 ConstantArray::get(EmitArcsCallArgsArrayTy, EmitArcsCallArgsArray),
1221 Twine("__llvm_internal_gcov_emit_arcs_args.") + Twine(i));
1222 EmitArcsCallArgsArrayGV->setUnnamedAddr(GlobalValue::UnnamedAddr::Global);
1224 FileInfos.push_back(ConstantStruct::get(
1225 FileInfoTy,
1226 {StartFileCallArgs, Builder.getInt32(CountersSize),
1227 ConstantExpr::getInBoundsGetElementPtr(EmitFunctionCallArgsArrayTy,
1228 EmitFunctionCallArgsArrayGV,
1229 TwoZero32s),
1230 ConstantExpr::getInBoundsGetElementPtr(
1231 EmitArcsCallArgsArrayTy, EmitArcsCallArgsArrayGV, TwoZero32s)}));
1234 // If we didn't find anything to actually emit, bail on out.
1235 if (FileInfos.empty()) {
1236 Builder.CreateRetVoid();
1237 return WriteoutF;
1240 // To simplify code, we cap the number of file infos we write out to fit
1241 // easily in a 32-bit signed integer. This gives consistent behavior between
1242 // 32-bit and 64-bit systems without requiring (potentially very slow) 64-bit
1243 // operations on 32-bit systems. It also seems unreasonable to try to handle
1244 // more than 2 billion files.
1245 if ((int64_t)FileInfos.size() > (int64_t)INT_MAX)
1246 FileInfos.resize(INT_MAX);
1248 // Create a global for the entire data structure so we can walk it more
1249 // easily.
1250 auto *FileInfoArrayTy = ArrayType::get(FileInfoTy, FileInfos.size());
1251 auto *FileInfoArrayGV = new GlobalVariable(
1252 *M, FileInfoArrayTy, /*isConstant*/ true, GlobalValue::InternalLinkage,
1253 ConstantArray::get(FileInfoArrayTy, FileInfos),
1254 "__llvm_internal_gcov_emit_file_info");
1255 FileInfoArrayGV->setUnnamedAddr(GlobalValue::UnnamedAddr::Global);
1257 // Create the CFG for walking this data structure.
1258 auto *FileLoopHeader =
1259 BasicBlock::Create(*Ctx, "file.loop.header", WriteoutF);
1260 auto *CounterLoopHeader =
1261 BasicBlock::Create(*Ctx, "counter.loop.header", WriteoutF);
1262 auto *FileLoopLatch = BasicBlock::Create(*Ctx, "file.loop.latch", WriteoutF);
1263 auto *ExitBB = BasicBlock::Create(*Ctx, "exit", WriteoutF);
1265 // We always have at least one file, so just branch to the header.
1266 Builder.CreateBr(FileLoopHeader);
1268 // The index into the files structure is our loop induction variable.
1269 Builder.SetInsertPoint(FileLoopHeader);
1270 PHINode *IV = Builder.CreatePHI(Builder.getInt32Ty(), /*NumReservedValues*/ 2,
1271 "file_idx");
1272 IV->addIncoming(Builder.getInt32(0), BB);
1273 auto *FileInfoPtr = Builder.CreateInBoundsGEP(
1274 FileInfoArrayTy, FileInfoArrayGV, {Builder.getInt32(0), IV});
1275 auto *StartFileCallArgsPtr =
1276 Builder.CreateStructGEP(FileInfoTy, FileInfoPtr, 0, "start_file_args");
1277 auto *StartFileCall = Builder.CreateCall(
1278 StartFile,
1279 {Builder.CreateLoad(StartFileCallArgsTy->getElementType(0),
1280 Builder.CreateStructGEP(StartFileCallArgsTy,
1281 StartFileCallArgsPtr, 0),
1282 "filename"),
1283 Builder.CreateLoad(StartFileCallArgsTy->getElementType(1),
1284 Builder.CreateStructGEP(StartFileCallArgsTy,
1285 StartFileCallArgsPtr, 1),
1286 "version"),
1287 Builder.CreateLoad(StartFileCallArgsTy->getElementType(2),
1288 Builder.CreateStructGEP(StartFileCallArgsTy,
1289 StartFileCallArgsPtr, 2),
1290 "stamp")});
1291 if (auto AK = TLI->getExtAttrForI32Param(false))
1292 StartFileCall->addParamAttr(2, AK);
1293 auto *NumCounters = Builder.CreateLoad(
1294 FileInfoTy->getElementType(1),
1295 Builder.CreateStructGEP(FileInfoTy, FileInfoPtr, 1), "num_ctrs");
1296 auto *EmitFunctionCallArgsArray =
1297 Builder.CreateLoad(FileInfoTy->getElementType(2),
1298 Builder.CreateStructGEP(FileInfoTy, FileInfoPtr, 2),
1299 "emit_function_args");
1300 auto *EmitArcsCallArgsArray = Builder.CreateLoad(
1301 FileInfoTy->getElementType(3),
1302 Builder.CreateStructGEP(FileInfoTy, FileInfoPtr, 3), "emit_arcs_args");
1303 auto *EnterCounterLoopCond =
1304 Builder.CreateICmpSLT(Builder.getInt32(0), NumCounters);
1305 Builder.CreateCondBr(EnterCounterLoopCond, CounterLoopHeader, FileLoopLatch);
1307 Builder.SetInsertPoint(CounterLoopHeader);
1308 auto *JV = Builder.CreatePHI(Builder.getInt32Ty(), /*NumReservedValues*/ 2,
1309 "ctr_idx");
1310 JV->addIncoming(Builder.getInt32(0), FileLoopHeader);
1311 auto *EmitFunctionCallArgsPtr = Builder.CreateInBoundsGEP(
1312 EmitFunctionCallArgsTy, EmitFunctionCallArgsArray, JV);
1313 auto *EmitFunctionCall = Builder.CreateCall(
1314 EmitFunction,
1315 {Builder.CreateLoad(EmitFunctionCallArgsTy->getElementType(0),
1316 Builder.CreateStructGEP(EmitFunctionCallArgsTy,
1317 EmitFunctionCallArgsPtr, 0),
1318 "ident"),
1319 Builder.CreateLoad(EmitFunctionCallArgsTy->getElementType(1),
1320 Builder.CreateStructGEP(EmitFunctionCallArgsTy,
1321 EmitFunctionCallArgsPtr, 1),
1322 "func_checkssum"),
1323 Builder.CreateLoad(EmitFunctionCallArgsTy->getElementType(2),
1324 Builder.CreateStructGEP(EmitFunctionCallArgsTy,
1325 EmitFunctionCallArgsPtr, 2),
1326 "cfg_checksum")});
1327 if (auto AK = TLI->getExtAttrForI32Param(false)) {
1328 EmitFunctionCall->addParamAttr(0, AK);
1329 EmitFunctionCall->addParamAttr(1, AK);
1330 EmitFunctionCall->addParamAttr(2, AK);
1332 auto *EmitArcsCallArgsPtr =
1333 Builder.CreateInBoundsGEP(EmitArcsCallArgsTy, EmitArcsCallArgsArray, JV);
1334 auto *EmitArcsCall = Builder.CreateCall(
1335 EmitArcs,
1336 {Builder.CreateLoad(
1337 EmitArcsCallArgsTy->getElementType(0),
1338 Builder.CreateStructGEP(EmitArcsCallArgsTy, EmitArcsCallArgsPtr, 0),
1339 "num_counters"),
1340 Builder.CreateLoad(
1341 EmitArcsCallArgsTy->getElementType(1),
1342 Builder.CreateStructGEP(EmitArcsCallArgsTy, EmitArcsCallArgsPtr, 1),
1343 "counters")});
1344 if (auto AK = TLI->getExtAttrForI32Param(false))
1345 EmitArcsCall->addParamAttr(0, AK);
1346 auto *NextJV = Builder.CreateAdd(JV, Builder.getInt32(1));
1347 auto *CounterLoopCond = Builder.CreateICmpSLT(NextJV, NumCounters);
1348 Builder.CreateCondBr(CounterLoopCond, CounterLoopHeader, FileLoopLatch);
1349 JV->addIncoming(NextJV, CounterLoopHeader);
1351 Builder.SetInsertPoint(FileLoopLatch);
1352 Builder.CreateCall(SummaryInfo, {});
1353 Builder.CreateCall(EndFile, {});
1354 auto *NextIV = Builder.CreateAdd(IV, Builder.getInt32(1), "next_file_idx");
1355 auto *FileLoopCond =
1356 Builder.CreateICmpSLT(NextIV, Builder.getInt32(FileInfos.size()));
1357 Builder.CreateCondBr(FileLoopCond, FileLoopHeader, ExitBB);
1358 IV->addIncoming(NextIV, FileLoopLatch);
1360 Builder.SetInsertPoint(ExitBB);
1361 Builder.CreateRetVoid();
1363 return WriteoutF;
1366 Function *GCOVProfiler::insertReset(
1367 ArrayRef<std::pair<GlobalVariable *, MDNode *>> CountersBySP) {
1368 FunctionType *FTy = FunctionType::get(Type::getVoidTy(*Ctx), false);
1369 Function *ResetF = M->getFunction("__llvm_gcov_reset");
1370 if (!ResetF)
1371 ResetF = createInternalFunction(FTy, "__llvm_gcov_reset");
1372 ResetF->addFnAttr(Attribute::NoInline);
1374 BasicBlock *Entry = BasicBlock::Create(*Ctx, "entry", ResetF);
1375 IRBuilder<> Builder(Entry);
1376 LLVMContext &C = Entry->getContext();
1378 // Zero out the counters.
1379 for (const auto &I : CountersBySP) {
1380 GlobalVariable *GV = I.first;
1381 auto *GVTy = cast<ArrayType>(GV->getValueType());
1382 Builder.CreateMemSet(GV, Constant::getNullValue(Type::getInt8Ty(C)),
1383 GVTy->getNumElements() *
1384 GVTy->getElementType()->getScalarSizeInBits() / 8,
1385 GV->getAlign());
1388 Type *RetTy = ResetF->getReturnType();
1389 if (RetTy->isVoidTy())
1390 Builder.CreateRetVoid();
1391 else if (RetTy->isIntegerTy())
1392 // Used if __llvm_gcov_reset was implicitly declared.
1393 Builder.CreateRet(ConstantInt::get(RetTy, 0));
1394 else
1395 report_fatal_error("invalid return type for __llvm_gcov_reset");
1397 return ResetF;