[clang] StmtPrinter: Handle DeclRefExpr to a Decomposition (#125001)
[llvm-project.git] / llvm / lib / DebugInfo / GSYM / FunctionInfo.cpp
blobb6dcaeb323f59a7e47661ca2e9099d6bba636852
1 //===- FunctionInfo.cpp ---------------------------------------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
9 #include "llvm/DebugInfo/GSYM/FunctionInfo.h"
10 #include "llvm/DebugInfo/GSYM/FileWriter.h"
11 #include "llvm/DebugInfo/GSYM/GsymReader.h"
12 #include "llvm/DebugInfo/GSYM/LineTable.h"
13 #include "llvm/DebugInfo/GSYM/InlineInfo.h"
14 #include "llvm/Support/DataExtractor.h"
15 #include <optional>
17 using namespace llvm;
18 using namespace gsym;
/// Tags identifying each optional data chunk that can follow the fixed
/// FunctionInfo header. Every chunk is stored as a uint32_t tag, a uint32_t
/// payload length and then the payload bytes.
enum InfoType : uint32_t {
  /// Terminates the list of chunks.
  EndOfList = 0,
  /// Payload is an encoded LineTable.
  LineTableInfo = 1,
  /// Payload is an encoded InlineInfo.
  InlineInfo = 2,
  /// Payload is an encoded MergedFunctionsInfo.
  MergedFunctionsInfo = 3,
  /// Payload is an encoded CallSiteInfoCollection.
  CallSiteInfo = 4,
};
30 raw_ostream &llvm::gsym::operator<<(raw_ostream &OS, const FunctionInfo &FI) {
31 OS << FI.Range << ": " << "Name=" << HEX32(FI.Name) << '\n';
32 if (FI.OptLineTable)
33 OS << FI.OptLineTable << '\n';
34 if (FI.Inline)
35 OS << FI.Inline << '\n';
36 if (FI.CallSites)
37 OS << *FI.CallSites << '\n';
38 return OS;
41 llvm::Expected<FunctionInfo> FunctionInfo::decode(DataExtractor &Data,
42 uint64_t BaseAddr) {
43 FunctionInfo FI;
44 uint64_t Offset = 0;
45 if (!Data.isValidOffsetForDataOfSize(Offset, 4))
46 return createStringError(std::errc::io_error,
47 "0x%8.8" PRIx64 ": missing FunctionInfo Size", Offset);
48 FI.Range = {BaseAddr, BaseAddr + Data.getU32(&Offset)};
49 if (!Data.isValidOffsetForDataOfSize(Offset, 4))
50 return createStringError(std::errc::io_error,
51 "0x%8.8" PRIx64 ": missing FunctionInfo Name", Offset);
52 FI.Name = Data.getU32(&Offset);
53 if (FI.Name == 0)
54 return createStringError(std::errc::io_error,
55 "0x%8.8" PRIx64 ": invalid FunctionInfo Name value 0x%8.8x",
56 Offset - 4, FI.Name);
57 bool Done = false;
58 while (!Done) {
59 if (!Data.isValidOffsetForDataOfSize(Offset, 4))
60 return createStringError(std::errc::io_error,
61 "0x%8.8" PRIx64 ": missing FunctionInfo InfoType value", Offset);
62 const uint32_t IT = Data.getU32(&Offset);
63 if (!Data.isValidOffsetForDataOfSize(Offset, 4))
64 return createStringError(std::errc::io_error,
65 "0x%8.8" PRIx64 ": missing FunctionInfo InfoType length", Offset);
66 const uint32_t InfoLength = Data.getU32(&Offset);
67 if (!Data.isValidOffsetForDataOfSize(Offset, InfoLength))
68 return createStringError(std::errc::io_error,
69 "0x%8.8" PRIx64 ": missing FunctionInfo data for InfoType %u",
70 Offset, IT);
71 DataExtractor InfoData(Data.getData().substr(Offset, InfoLength),
72 Data.isLittleEndian(),
73 Data.getAddressSize());
74 switch (IT) {
75 case InfoType::EndOfList:
76 Done = true;
77 break;
79 case InfoType::LineTableInfo:
80 if (Expected<LineTable> LT = LineTable::decode(InfoData, BaseAddr))
81 FI.OptLineTable = std::move(LT.get());
82 else
83 return LT.takeError();
84 break;
86 case InfoType::InlineInfo:
87 if (Expected<InlineInfo> II = InlineInfo::decode(InfoData, BaseAddr))
88 FI.Inline = std::move(II.get());
89 else
90 return II.takeError();
91 break;
93 case InfoType::MergedFunctionsInfo:
94 if (Expected<MergedFunctionsInfo> MI =
95 MergedFunctionsInfo::decode(InfoData, BaseAddr))
96 FI.MergedFunctions = std::move(MI.get());
97 else
98 return MI.takeError();
99 break;
101 case InfoType::CallSiteInfo:
102 if (Expected<llvm::gsym::CallSiteInfoCollection> CI =
103 llvm::gsym::CallSiteInfoCollection::decode(InfoData))
104 FI.CallSites = std::move(CI.get());
105 else
106 return CI.takeError();
107 break;
109 default:
110 return createStringError(std::errc::io_error,
111 "0x%8.8" PRIx64 ": unsupported InfoType %u",
112 Offset-8, IT);
114 Offset += InfoLength;
116 return std::move(FI);
119 uint64_t FunctionInfo::cacheEncoding() {
120 EncodingCache.clear();
121 if (!isValid())
122 return 0;
123 raw_svector_ostream OutStrm(EncodingCache);
124 FileWriter FW(OutStrm, llvm::endianness::native);
125 llvm::Expected<uint64_t> Result = encode(FW);
126 if (!Result) {
127 EncodingCache.clear();
128 consumeError(Result.takeError());
129 return 0;
131 return EncodingCache.size();
134 llvm::Expected<uint64_t> FunctionInfo::encode(FileWriter &Out,
135 bool NoPadding) const {
136 if (!isValid())
137 return createStringError(std::errc::invalid_argument,
138 "attempted to encode invalid FunctionInfo object");
139 // Align FunctionInfo data to a 4 byte alignment, if padding is allowed
140 if (NoPadding == false)
141 Out.alignTo(4);
142 const uint64_t FuncInfoOffset = Out.tell();
143 // Check if we have already encoded this function info into EncodingCache.
144 // This will be non empty when creating segmented GSYM files as we need to
145 // precompute exactly how big FunctionInfo objects encode into so we can
146 // accurately make segments of a specific size.
147 if (!EncodingCache.empty() &&
148 llvm::endianness::native == Out.getByteOrder()) {
149 // We already encoded this object, just write out the bytes.
150 Out.writeData(llvm::ArrayRef<uint8_t>((const uint8_t *)EncodingCache.data(),
151 EncodingCache.size()));
152 return FuncInfoOffset;
154 // Write the size in bytes of this function as a uint32_t. This can be zero
155 // if we just have a symbol from a symbol table and that symbol has no size.
156 Out.writeU32(size());
157 // Write the name of this function as a uint32_t string table offset.
158 Out.writeU32(Name);
160 if (OptLineTable) {
161 Out.writeU32(InfoType::LineTableInfo);
162 // Write a uint32_t length as zero for now, we will fix this up after
163 // writing the LineTable out with the number of bytes that were written.
164 Out.writeU32(0);
165 const auto StartOffset = Out.tell();
166 llvm::Error err = OptLineTable->encode(Out, Range.start());
167 if (err)
168 return std::move(err);
169 const auto Length = Out.tell() - StartOffset;
170 if (Length > UINT32_MAX)
171 return createStringError(std::errc::invalid_argument,
172 "LineTable length is greater than UINT32_MAX");
173 // Fixup the size of the LineTable data with the correct size.
174 Out.fixup32(static_cast<uint32_t>(Length), StartOffset - 4);
177 // Write out the inline function info if we have any and if it is valid.
178 if (Inline) {
179 Out.writeU32(InfoType::InlineInfo);
180 // Write a uint32_t length as zero for now, we will fix this up after
181 // writing the LineTable out with the number of bytes that were written.
182 Out.writeU32(0);
183 const auto StartOffset = Out.tell();
184 llvm::Error err = Inline->encode(Out, Range.start());
185 if (err)
186 return std::move(err);
187 const auto Length = Out.tell() - StartOffset;
188 if (Length > UINT32_MAX)
189 return createStringError(std::errc::invalid_argument,
190 "InlineInfo length is greater than UINT32_MAX");
191 // Fixup the size of the InlineInfo data with the correct size.
192 Out.fixup32(static_cast<uint32_t>(Length), StartOffset - 4);
195 // Write out the merged functions info if we have any and if it is valid.
196 if (MergedFunctions) {
197 Out.writeU32(InfoType::MergedFunctionsInfo);
198 // Write a uint32_t length as zero for now, we will fix this up after
199 // writing the LineTable out with the number of bytes that were written.
200 Out.writeU32(0);
201 const auto StartOffset = Out.tell();
202 llvm::Error err = MergedFunctions->encode(Out);
203 if (err)
204 return std::move(err);
205 const auto Length = Out.tell() - StartOffset;
206 if (Length > UINT32_MAX)
207 return createStringError(
208 std::errc::invalid_argument,
209 "MergedFunctionsInfo length is greater than UINT32_MAX");
210 // Fixup the size of the MergedFunctionsInfo data with the correct size.
211 Out.fixup32(static_cast<uint32_t>(Length), StartOffset - 4);
214 // Write out the call sites if we have any and if they are valid.
215 if (CallSites) {
216 Out.writeU32(InfoType::CallSiteInfo);
217 // Write a uint32_t length as zero for now, we will fix this up after
218 // writing the CallSites out with the number of bytes that were written.
219 Out.writeU32(0);
220 const auto StartOffset = Out.tell();
221 Error Err = CallSites->encode(Out);
222 if (Err)
223 return std::move(Err);
224 const auto Length = Out.tell() - StartOffset;
225 if (Length > UINT32_MAX)
226 return createStringError(std::errc::invalid_argument,
227 "CallSites length is greater than UINT32_MAX");
228 // Fixup the size of the CallSites data with the correct size.
229 Out.fixup32(static_cast<uint32_t>(Length), StartOffset - 4);
232 // Terminate the data chunks with an end of list with zero size.
233 Out.writeU32(InfoType::EndOfList);
234 Out.writeU32(0);
235 return FuncInfoOffset;
238 llvm::Expected<LookupResult>
239 FunctionInfo::lookup(DataExtractor &Data, const GsymReader &GR,
240 uint64_t FuncAddr, uint64_t Addr,
241 std::optional<DataExtractor> *MergedFuncsData) {
242 LookupResult LR;
243 LR.LookupAddr = Addr;
244 uint64_t Offset = 0;
245 LR.FuncRange = {FuncAddr, FuncAddr + Data.getU32(&Offset)};
246 uint32_t NameOffset = Data.getU32(&Offset);
247 // The "lookup" functions doesn't report errors as accurately as the "decode"
248 // function as it is meant to be fast. For more accurage errors we could call
249 // "decode".
250 if (!Data.isValidOffset(Offset))
251 return createStringError(std::errc::io_error,
252 "FunctionInfo data is truncated");
253 // This function will be called with the result of a binary search of the
254 // address table, we must still make sure the address does not fall into a
255 // gap between functions are after the last function.
256 if (LR.FuncRange.size() > 0 && !LR.FuncRange.contains(Addr))
257 return createStringError(std::errc::io_error,
258 "address 0x%" PRIx64 " is not in GSYM", Addr);
260 if (NameOffset == 0)
261 return createStringError(std::errc::io_error,
262 "0x%8.8" PRIx64 ": invalid FunctionInfo Name value 0x00000000",
263 Offset - 4);
264 LR.FuncName = GR.getString(NameOffset);
265 bool Done = false;
266 std::optional<LineEntry> LineEntry;
267 std::optional<DataExtractor> InlineInfoData;
268 while (!Done) {
269 if (!Data.isValidOffsetForDataOfSize(Offset, 8))
270 return createStringError(std::errc::io_error,
271 "FunctionInfo data is truncated");
272 const uint32_t IT = Data.getU32(&Offset);
273 const uint32_t InfoLength = Data.getU32(&Offset);
274 const StringRef InfoBytes = Data.getData().substr(Offset, InfoLength);
275 if (InfoLength != InfoBytes.size())
276 return createStringError(std::errc::io_error,
277 "FunctionInfo data is truncated");
278 DataExtractor InfoData(InfoBytes, Data.isLittleEndian(),
279 Data.getAddressSize());
280 switch (IT) {
281 case InfoType::EndOfList:
282 Done = true;
283 break;
285 case InfoType::LineTableInfo:
286 if (auto ExpectedLE = LineTable::lookup(InfoData, FuncAddr, Addr))
287 LineEntry = ExpectedLE.get();
288 else
289 return ExpectedLE.takeError();
290 break;
292 case InfoType::MergedFunctionsInfo:
293 // Store the merged functions data for later parsing, if needed.
294 if (MergedFuncsData)
295 *MergedFuncsData = InfoData;
296 break;
298 case InfoType::InlineInfo:
299 // We will parse the inline info after our line table, but only if
300 // we have a line entry.
301 InlineInfoData = InfoData;
302 break;
304 case InfoType::CallSiteInfo:
305 if (auto CSIC = CallSiteInfoCollection::decode(InfoData)) {
306 // Find matching call site based on relative offset
307 for (const auto &CS : CSIC->CallSites) {
308 // Check if the call site matches the lookup address
309 if (CS.ReturnOffset == Addr - FuncAddr) {
310 // Get regex patterns
311 for (uint32_t RegexOffset : CS.MatchRegex) {
312 LR.CallSiteFuncRegex.push_back(GR.getString(RegexOffset));
314 break;
317 } else {
318 return CSIC.takeError();
320 break;
322 default:
323 break;
325 Offset += InfoLength;
328 if (!LineEntry) {
329 // We don't have a valid line entry for our address, fill in our source
330 // location as best we can and return.
331 SourceLocation SrcLoc;
332 SrcLoc.Name = LR.FuncName;
333 SrcLoc.Offset = Addr - FuncAddr;
334 LR.Locations.push_back(SrcLoc);
335 return LR;
338 std::optional<FileEntry> LineEntryFile = GR.getFile(LineEntry->File);
339 if (!LineEntryFile)
340 return createStringError(std::errc::invalid_argument,
341 "failed to extract file[%" PRIu32 "]",
342 LineEntry->File);
344 SourceLocation SrcLoc;
345 SrcLoc.Name = LR.FuncName;
346 SrcLoc.Offset = Addr - FuncAddr;
347 SrcLoc.Dir = GR.getString(LineEntryFile->Dir);
348 SrcLoc.Base = GR.getString(LineEntryFile->Base);
349 SrcLoc.Line = LineEntry->Line;
350 LR.Locations.push_back(SrcLoc);
351 // If we don't have inline information, we are done.
352 if (!InlineInfoData)
353 return LR;
354 // We have inline information. Try to augment the lookup result with this
355 // data.
356 llvm::Error Err = InlineInfo::lookup(GR, *InlineInfoData, FuncAddr, Addr,
357 LR.Locations);
358 if (Err)
359 return std::move(Err);
360 return LR;