LLVM 20.0.0git
GsymCreator.cpp
Go to the documentation of this file.
1//===- GsymCreator.cpp ----------------------------------------------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//===----------------------------------------------------------------------===//
7
15
16#include <algorithm>
17#include <cassert>
18#include <functional>
19#include <vector>
20
21using namespace llvm;
22using namespace gsym;
23
25 : StrTab(StringTableBuilder::ELF), Quiet(Quiet) {
27}
28
30 llvm::StringRef directory = llvm::sys::path::parent_path(Path, Style);
31 llvm::StringRef filename = llvm::sys::path::filename(Path, Style);
32 // We must insert the strings first, then call the FileEntry constructor.
33 // If we inline the insertString() function call into the constructor, the
34 // call order is undefined due to parameter lists not having any ordering
35 // requirements.
36 const uint32_t Dir = insertString(directory);
37 const uint32_t Base = insertString(filename);
38 return insertFileEntry(FileEntry(Dir, Base));
39}
40
41uint32_t GsymCreator::insertFileEntry(FileEntry FE) {
42 std::lock_guard<std::mutex> Guard(Mutex);
43 const auto NextIndex = Files.size();
44 // Find FE in hash map and insert if not present.
45 auto R = FileEntryToIndex.insert(std::make_pair(FE, NextIndex));
46 if (R.second)
47 Files.emplace_back(FE);
48 return R.first->second;
49}
50
51uint32_t GsymCreator::copyFile(const GsymCreator &SrcGC, uint32_t FileIdx) {
52 // File index zero is reserved for a FileEntry with no directory and no
53 // filename. Any other file and we need to copy the strings for the directory
54 // and filename.
55 if (FileIdx == 0)
56 return 0;
57 const FileEntry SrcFE = SrcGC.Files[FileIdx];
58 // Copy the strings for the file and then add the newly converted file entry.
59 uint32_t Dir =
60 SrcFE.Dir == 0
61 ? 0
62 : StrTab.add(SrcGC.StringOffsetMap.find(SrcFE.Dir)->second);
63 uint32_t Base = StrTab.add(SrcGC.StringOffsetMap.find(SrcFE.Base)->second);
64 FileEntry DstFE(Dir, Base);
65 return insertFileEntry(DstFE);
66}
67
69 std::optional<uint64_t> SegmentSize) const {
70 if (SegmentSize)
71 return saveSegments(Path, ByteOrder, *SegmentSize);
72 std::error_code EC;
73 raw_fd_ostream OutStrm(Path, EC);
74 if (EC)
75 return llvm::errorCodeToError(EC);
76 FileWriter O(OutStrm, ByteOrder);
77 return encode(O);
78}
79
81 std::lock_guard<std::mutex> Guard(Mutex);
82 if (Funcs.empty())
83 return createStringError(std::errc::invalid_argument,
84 "no functions to encode");
85 if (!Finalized)
86 return createStringError(std::errc::invalid_argument,
87 "GsymCreator wasn't finalized prior to encoding");
88
89 if (Funcs.size() > UINT32_MAX)
90 return createStringError(std::errc::invalid_argument,
91 "too many FunctionInfos");
92
93 std::optional<uint64_t> BaseAddress = getBaseAddress();
94 // Base address should be valid if we have any functions.
95 if (!BaseAddress)
96 return createStringError(std::errc::invalid_argument,
97 "invalid base address");
98 Header Hdr;
99 Hdr.Magic = GSYM_MAGIC;
100 Hdr.Version = GSYM_VERSION;
101 Hdr.AddrOffSize = getAddressOffsetSize();
102 Hdr.UUIDSize = static_cast<uint8_t>(UUID.size());
103 Hdr.BaseAddress = *BaseAddress;
104 Hdr.NumAddresses = static_cast<uint32_t>(Funcs.size());
105 Hdr.StrtabOffset = 0; // We will fix this up later.
106 Hdr.StrtabSize = 0; // We will fix this up later.
107 memset(Hdr.UUID, 0, sizeof(Hdr.UUID));
108 if (UUID.size() > sizeof(Hdr.UUID))
109 return createStringError(std::errc::invalid_argument,
110 "invalid UUID size %u", (uint32_t)UUID.size());
111 // Copy the UUID value if we have one.
112 if (UUID.size() > 0)
113 memcpy(Hdr.UUID, UUID.data(), UUID.size());
114 // Write out the header.
115 llvm::Error Err = Hdr.encode(O);
116 if (Err)
117 return Err;
118
119 const uint64_t MaxAddressOffset = getMaxAddressOffset();
120 // Write out the address offsets.
121 O.alignTo(Hdr.AddrOffSize);
122 for (const auto &FuncInfo : Funcs) {
123 uint64_t AddrOffset = FuncInfo.startAddress() - Hdr.BaseAddress;
124 // Make sure we calculated the address offsets byte size correctly by
125 // verifying the current address offset is within ranges. We have seen bugs
126 // introduced when the code changes that can cause problems here so it is
127 // good to catch this during testing.
128 assert(AddrOffset <= MaxAddressOffset);
129 (void)MaxAddressOffset;
130 switch (Hdr.AddrOffSize) {
131 case 1:
132 O.writeU8(static_cast<uint8_t>(AddrOffset));
133 break;
134 case 2:
135 O.writeU16(static_cast<uint16_t>(AddrOffset));
136 break;
137 case 4:
138 O.writeU32(static_cast<uint32_t>(AddrOffset));
139 break;
140 case 8:
141 O.writeU64(AddrOffset);
142 break;
143 }
144 }
145
146 // Write out all zeros for the AddrInfoOffsets.
147 O.alignTo(4);
148 const off_t AddrInfoOffsetsOffset = O.tell();
149 for (size_t i = 0, n = Funcs.size(); i < n; ++i)
150 O.writeU32(0);
151
152 // Write out the file table
153 O.alignTo(4);
154 assert(!Files.empty());
155 assert(Files[0].Dir == 0);
156 assert(Files[0].Base == 0);
157 size_t NumFiles = Files.size();
158 if (NumFiles > UINT32_MAX)
159 return createStringError(std::errc::invalid_argument, "too many files");
160 O.writeU32(static_cast<uint32_t>(NumFiles));
161 for (auto File : Files) {
162 O.writeU32(File.Dir);
163 O.writeU32(File.Base);
164 }
165
166 // Write out the string table.
167 const off_t StrtabOffset = O.tell();
168 StrTab.write(O.get_stream());
169 const off_t StrtabSize = O.tell() - StrtabOffset;
170 std::vector<uint32_t> AddrInfoOffsets;
171
172 // Write out the address infos for each function info.
173 for (const auto &FuncInfo : Funcs) {
174 if (Expected<uint64_t> OffsetOrErr = FuncInfo.encode(O))
175 AddrInfoOffsets.push_back(OffsetOrErr.get());
176 else
177 return OffsetOrErr.takeError();
178 }
179 // Fixup the string table offset and size in the header
180 O.fixup32((uint32_t)StrtabOffset, offsetof(Header, StrtabOffset));
181 O.fixup32((uint32_t)StrtabSize, offsetof(Header, StrtabSize));
182
183 // Fixup all address info offsets
184 uint64_t Offset = 0;
185 for (auto AddrInfoOffset : AddrInfoOffsets) {
186 O.fixup32(AddrInfoOffset, AddrInfoOffsetsOffset + Offset);
187 Offset += 4;
188 }
189 return ErrorSuccess();
190}
191
193 // Use the loader to load call site information from the YAML file.
194 CallSiteInfoLoader Loader(*this, Funcs);
195 return Loader.loadYAML(YAMLFile);
196}
197
199 // Nothing to do if we have less than 2 functions.
200 if (Funcs.size() < 2)
201 return;
202
203 // Sort the function infos by address range first, preserving input order
204 llvm::stable_sort(Funcs);
205 std::vector<FunctionInfo> TopLevelFuncs;
206
207 // Add the first function info to the top level functions
208 TopLevelFuncs.emplace_back(std::move(Funcs.front()));
209
210 // Now if the next function info has the same address range as the top level,
211 // then merge it into the top level function, otherwise add it to the top
212 // level.
213 for (size_t Idx = 1; Idx < Funcs.size(); ++Idx) {
214 FunctionInfo &TopFunc = TopLevelFuncs.back();
215 FunctionInfo &MatchFunc = Funcs[Idx];
216 if (TopFunc.Range == MatchFunc.Range) {
217 // Both have the same range - add the 2nd func as a child of the 1st func
218 if (!TopFunc.MergedFunctions)
220 // Avoid adding duplicate functions to MergedFunctions. Since functions
221 // are already ordered within the Funcs array, we can just check equality
222 // against the last function in the merged array.
223 else if (TopFunc.MergedFunctions->MergedFunctions.back() == MatchFunc)
224 continue;
225 TopFunc.MergedFunctions->MergedFunctions.emplace_back(
226 std::move(MatchFunc));
227 } else
228 // No match, add the function as a top-level function
229 TopLevelFuncs.emplace_back(std::move(MatchFunc));
230 }
231
232 uint32_t mergedCount = Funcs.size() - TopLevelFuncs.size();
233 // If any functions were merged, print a message about it.
234 if (mergedCount != 0)
235 Out << "Have " << mergedCount
236 << " merged functions as children of other functions\n";
237
238 std::swap(Funcs, TopLevelFuncs);
239}
240
242 std::lock_guard<std::mutex> Guard(Mutex);
243 if (Finalized)
244 return createStringError(std::errc::invalid_argument, "already finalized");
245 Finalized = true;
246
247 // Don't let the string table indexes change by finalizing in order.
248 StrTab.finalizeInOrder();
249
250 // Remove duplicates function infos that have both entries from debug info
251 // (DWARF or Breakpad) and entries from the SymbolTable.
252 //
253 // Also handle overlapping function. Usually there shouldn't be any, but they
254 // can and do happen in some rare cases.
255 //
256 // (a) (b) (c)
257 // ^ ^ ^ ^
258 // |X |Y |X ^ |X
259 // | | | |Y | ^
260 // | | | v v |Y
261 // v v v v
262 //
263 // In (a) and (b), Y is ignored and X will be reported for the full range.
264 // In (c), both functions will be included in the result and lookups for an
265 // address in the intersection will return Y because of binary search.
266 //
267 // Note that in case of (b), we cannot include Y in the result because then
268 // we wouldn't find any function for range (end of Y, end of X)
269 // with binary search
270
271 const auto NumBefore = Funcs.size();
272 // Only sort and unique if this isn't a segment. If this is a segment we
273 // already finalized the main GsymCreator with all of the function infos
274 // and then the already sorted and uniqued function infos were added to this
275 // object.
276 if (!IsSegment) {
277 if (NumBefore > 1) {
278 // Sort function infos so we can emit sorted functions. Use stable sort to
279 // ensure determinism.
280 llvm::stable_sort(Funcs);
281 std::vector<FunctionInfo> FinalizedFuncs;
282 FinalizedFuncs.reserve(Funcs.size());
283 FinalizedFuncs.emplace_back(std::move(Funcs.front()));
284 for (size_t Idx=1; Idx < NumBefore; ++Idx) {
285 FunctionInfo &Prev = FinalizedFuncs.back();
286 FunctionInfo &Curr = Funcs[Idx];
287 // Empty ranges won't intersect, but we still need to
288 // catch the case where we have multiple symbols at the
289 // same address and coalesce them.
290 const bool ranges_equal = Prev.Range == Curr.Range;
291 if (ranges_equal || Prev.Range.intersects(Curr.Range)) {
292 // Overlapping ranges or empty identical ranges.
293 if (ranges_equal) {
294 // Same address range. Check if one is from debug
295 // info and the other is from a symbol table. If
296 // so, then keep the one with debug info. Our
297 // sorting guarantees that entries with matching
298 // address ranges that have debug info are last in
299 // the sort.
300 if (!(Prev == Curr)) {
301 if (Prev.hasRichInfo() && Curr.hasRichInfo())
302 Out.Report(
303 "Duplicate address ranges with different debug info.",
304 [&](raw_ostream &OS) {
305 OS << "warning: same address range contains "
306 "different debug "
307 << "info. Removing:\n"
308 << Prev << "\nIn favor of this one:\n"
309 << Curr << "\n";
310 });
311
312 // We want to swap the current entry with the previous since
313 // later entries with the same range always have more debug info
314 // or different debug info.
315 std::swap(Prev, Curr);
316 }
317 } else {
318 Out.Report("Overlapping function ranges", [&](raw_ostream &OS) {
319 // print warnings about overlaps
320 OS << "warning: function ranges overlap:\n"
321 << Prev << "\n"
322 << Curr << "\n";
323 });
324 FinalizedFuncs.emplace_back(std::move(Curr));
325 }
326 } else {
327 if (Prev.Range.size() == 0 && Curr.Range.contains(Prev.Range.start())) {
328 // Symbols on macOS don't have address ranges, so if the range
329 // doesn't match and the size is zero, then we replace the empty
330 // symbol function info with the current one.
331 std::swap(Prev, Curr);
332 } else {
333 FinalizedFuncs.emplace_back(std::move(Curr));
334 }
335 }
336 }
337 std::swap(Funcs, FinalizedFuncs);
338 }
339 // If our last function info entry doesn't have a size and if we have valid
340 // text ranges, we should set the size of the last entry since any search for
341 // a high address might match our last entry. By fixing up this size, we can
342 // help ensure we don't cause lookups to always return the last symbol that
343 // has no size when doing lookups.
344 if (!Funcs.empty() && Funcs.back().Range.size() == 0 && ValidTextRanges) {
345 if (auto Range =
346 ValidTextRanges->getRangeThatContains(Funcs.back().Range.start())) {
347 Funcs.back().Range = {Funcs.back().Range.start(), Range->end()};
348 }
349 }
350 Out << "Pruned " << NumBefore - Funcs.size() << " functions, ended with "
351 << Funcs.size() << " total\n";
352 }
353 return Error::success();
354}
355
356uint32_t GsymCreator::copyString(const GsymCreator &SrcGC, uint32_t StrOff) {
357 // String offset at zero is always the empty string, no copying needed.
358 if (StrOff == 0)
359 return 0;
360 return StrTab.add(SrcGC.StringOffsetMap.find(StrOff)->second);
361}
362
364 if (S.empty())
365 return 0;
366
367 // The hash can be calculated outside the lock.
368 CachedHashStringRef CHStr(S);
369 std::lock_guard<std::mutex> Guard(Mutex);
370 if (Copy) {
371 // We need to provide backing storage for the string if requested
372 // since StringTableBuilder stores references to strings. Any string
373 // that comes from a section in an object file doesn't need to be
374 // copied, but any string created by code will need to be copied.
375 // This allows GsymCreator to be really fast when parsing DWARF and
376 // other object files as most strings don't need to be copied.
377 if (!StrTab.contains(CHStr))
378 CHStr = CachedHashStringRef{StringStorage.insert(S).first->getKey(),
379 CHStr.hash()};
380 }
381 const uint32_t StrOff = StrTab.add(CHStr);
382 // Save a mapping of string offsets to the cached string reference in case
383 // we need to segment the GSYM file and copy string from one string table to
384 // another.
385 StringOffsetMap.try_emplace(StrOff, CHStr);
386 return StrOff;
387}
388
390 auto I = StringOffsetMap.find(Offset);
391 assert(I != StringOffsetMap.end() &&
392 "GsymCreator::getString expects a valid offset as parameter.");
393 return I->second.val();
394}
395
397 std::lock_guard<std::mutex> Guard(Mutex);
398 Funcs.emplace_back(std::move(FI));
399}
400
402 std::function<bool(FunctionInfo &)> const &Callback) {
403 std::lock_guard<std::mutex> Guard(Mutex);
404 for (auto &FI : Funcs) {
405 if (!Callback(FI))
406 break;
407 }
408}
409
411 std::function<bool(const FunctionInfo &)> const &Callback) const {
412 std::lock_guard<std::mutex> Guard(Mutex);
413 for (const auto &FI : Funcs) {
414 if (!Callback(FI))
415 break;
416 }
417}
418
420 std::lock_guard<std::mutex> Guard(Mutex);
421 return Funcs.size();
422}
423
425 if (ValidTextRanges)
426 return ValidTextRanges->contains(Addr);
427 return true; // No valid text ranges has been set, so accept all ranges.
428}
429
430std::optional<uint64_t> GsymCreator::getFirstFunctionAddress() const {
431 // If we have finalized then Funcs are sorted. If we are a segment then
432 // Funcs will be sorted as well since function infos get added from an
433 // already finalized GsymCreator object where its functions were sorted and
434 // uniqued.
435 if ((Finalized || IsSegment) && !Funcs.empty())
436 return std::optional<uint64_t>(Funcs.front().startAddress());
437 return std::nullopt;
438}
439
440std::optional<uint64_t> GsymCreator::getLastFunctionAddress() const {
441 // If we have finalized then Funcs are sorted. If we are a segment then
442 // Funcs will be sorted as well since function infos get added from an
443 // already finalized GsymCreator object where its functions were sorted and
444 // uniqued.
445 if ((Finalized || IsSegment) && !Funcs.empty())
446 return std::optional<uint64_t>(Funcs.back().startAddress());
447 return std::nullopt;
448}
449
450std::optional<uint64_t> GsymCreator::getBaseAddress() const {
451 if (BaseAddress)
452 return BaseAddress;
453 return getFirstFunctionAddress();
454}
455
456uint64_t GsymCreator::getMaxAddressOffset() const {
457 switch (getAddressOffsetSize()) {
458 case 1: return UINT8_MAX;
459 case 2: return UINT16_MAX;
460 case 4: return UINT32_MAX;
461 case 8: return UINT64_MAX;
462 }
463 llvm_unreachable("invalid address offset");
464}
465
466uint8_t GsymCreator::getAddressOffsetSize() const {
467 const std::optional<uint64_t> BaseAddress = getBaseAddress();
468 const std::optional<uint64_t> LastFuncAddr = getLastFunctionAddress();
469 if (BaseAddress && LastFuncAddr) {
470 const uint64_t AddrDelta = *LastFuncAddr - *BaseAddress;
471 if (AddrDelta <= UINT8_MAX)
472 return 1;
473 else if (AddrDelta <= UINT16_MAX)
474 return 2;
475 else if (AddrDelta <= UINT32_MAX)
476 return 4;
477 return 8;
478 }
479 return 1;
480}
481
482uint64_t GsymCreator::calculateHeaderAndTableSize() const {
483 uint64_t Size = sizeof(Header);
484 const size_t NumFuncs = Funcs.size();
485 // Add size of address offset table
486 Size += NumFuncs * getAddressOffsetSize();
487 // Add size of address info offsets which are 32 bit integers in version 1.
488 Size += NumFuncs * sizeof(uint32_t);
489 // Add file table size
490 Size += Files.size() * sizeof(FileEntry);
491 // Add string table size
492 Size += StrTab.getSize();
493
494 return Size;
495}
496
497// This function takes a InlineInfo class that was copy constructed from an
498// InlineInfo from the \a SrcGC and updates all members that point to strings
499// and files to point to strings and files from this GsymCreator.
500void GsymCreator::fixupInlineInfo(const GsymCreator &SrcGC, InlineInfo &II) {
501 II.Name = copyString(SrcGC, II.Name);
502 II.CallFile = copyFile(SrcGC, II.CallFile);
503 for (auto &ChildII: II.Children)
504 fixupInlineInfo(SrcGC, ChildII);
505}
506
507uint64_t GsymCreator::copyFunctionInfo(const GsymCreator &SrcGC, size_t FuncIdx) {
508 // To copy a function info we need to copy any files and strings over into
509 // this GsymCreator and then copy the function info and update the string
510 // table offsets to match the new offsets.
511 const FunctionInfo &SrcFI = SrcGC.Funcs[FuncIdx];
512
513 FunctionInfo DstFI;
514 DstFI.Range = SrcFI.Range;
515 DstFI.Name = copyString(SrcGC, SrcFI.Name);
516 // Copy the line table if there is one.
517 if (SrcFI.OptLineTable) {
518 // Copy the entire line table.
519 DstFI.OptLineTable = LineTable(SrcFI.OptLineTable.value());
520 // Fixup all LineEntry::File entries which are indexes in the the file table
521 // from SrcGC and must be converted to file indexes from this GsymCreator.
522 LineTable &DstLT = DstFI.OptLineTable.value();
523 const size_t NumLines = DstLT.size();
524 for (size_t I=0; I<NumLines; ++I) {
525 LineEntry &LE = DstLT.get(I);
526 LE.File = copyFile(SrcGC, LE.File);
527 }
528 }
529 // Copy the inline information if needed.
530 if (SrcFI.Inline) {
531 // Make a copy of the source inline information.
532 DstFI.Inline = SrcFI.Inline.value();
533 // Fixup all strings and files in the copied inline information.
534 fixupInlineInfo(SrcGC, *DstFI.Inline);
535 }
536 std::lock_guard<std::mutex> Guard(Mutex);
537 Funcs.emplace_back(DstFI);
538 return Funcs.back().cacheEncoding();
539}
540
541llvm::Error GsymCreator::saveSegments(StringRef Path,
542 llvm::endianness ByteOrder,
543 uint64_t SegmentSize) const {
544 if (SegmentSize == 0)
545 return createStringError(std::errc::invalid_argument,
546 "invalid segment size zero");
547
548 size_t FuncIdx = 0;
549 const size_t NumFuncs = Funcs.size();
550 while (FuncIdx < NumFuncs) {
552 createSegment(SegmentSize, FuncIdx);
553 if (ExpectedGC) {
554 GsymCreator *GC = ExpectedGC->get();
555 if (GC == NULL)
556 break; // We had not more functions to encode.
557 // Don't collect any messages at all
558 OutputAggregator Out(nullptr);
559 llvm::Error Err = GC->finalize(Out);
560 if (Err)
561 return Err;
562 std::string SegmentedGsymPath;
563 raw_string_ostream SGP(SegmentedGsymPath);
564 std::optional<uint64_t> FirstFuncAddr = GC->getFirstFunctionAddress();
565 if (FirstFuncAddr) {
566 SGP << Path << "-" << llvm::format_hex(*FirstFuncAddr, 1);
567 SGP.flush();
568 Err = GC->save(SegmentedGsymPath, ByteOrder, std::nullopt);
569 if (Err)
570 return Err;
571 }
572 } else {
573 return ExpectedGC.takeError();
574 }
575 }
576 return Error::success();
577}
578
580GsymCreator::createSegment(uint64_t SegmentSize, size_t &FuncIdx) const {
581 // No function entries, return empty unique pointer
582 if (FuncIdx >= Funcs.size())
583 return std::unique_ptr<GsymCreator>();
584
585 std::unique_ptr<GsymCreator> GC(new GsymCreator(/*Quiet=*/true));
586
587 // Tell the creator that this is a segment.
588 GC->setIsSegment();
589
590 // Set the base address if there is one.
591 if (BaseAddress)
592 GC->setBaseAddress(*BaseAddress);
593 // Copy the UUID value from this object into the new creator.
594 GC->setUUID(UUID);
595 const size_t NumFuncs = Funcs.size();
596 // Track how big the function infos are for the current segment so we can
597 // emit segments that are close to the requested size. It is quick math to
598 // determine the current header and tables sizes, so we can do that each loop.
599 uint64_t SegmentFuncInfosSize = 0;
600 for (; FuncIdx < NumFuncs; ++FuncIdx) {
601 const uint64_t HeaderAndTableSize = GC->calculateHeaderAndTableSize();
602 if (HeaderAndTableSize + SegmentFuncInfosSize >= SegmentSize) {
603 if (SegmentFuncInfosSize == 0)
604 return createStringError(std::errc::invalid_argument,
605 "a segment size of %" PRIu64 " is to small to "
606 "fit any function infos, specify a larger value",
607 SegmentSize);
608
609 break;
610 }
611 SegmentFuncInfosSize += alignTo(GC->copyFunctionInfo(*this, FuncIdx), 4);
612 }
613 return std::move(GC);
614}
#define offsetof(TYPE, MEMBER)
Returns the sub type a function will return at a given Idx Should correspond to the result type of an ExtractValue instruction executed with just that one unsigned Idx
uint64_t Addr
uint64_t Size
#define I(x, y, z)
Definition: MD5.cpp:58
ConstantRange Range(APInt(BitWidth, Low), APInt(BitWidth, High))
uint64_t IntrinsicInst * II
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())
raw_pwrite_stream & OS
std::pair< llvm::MachO::Target, std::string > UUID
uint64_t start() const
Definition: AddressRanges.h:28
bool intersects(const AddressRange &R) const
Definition: AddressRanges.h:36
bool contains(uint64_t Addr) const
Definition: AddressRanges.h:32
uint64_t size() const
Definition: AddressRanges.h:30
A container which contains a StringRef plus a precomputed hash.
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
Definition: DenseMap.h:211
Subclass of Error for the sole purpose of identifying the success path in the type system.
Definition: Error.h:335
Lightweight error class with error context and mandatory checking.
Definition: Error.h:160
static ErrorSuccess success()
Create a success value.
Definition: Error.h:337
Tagged union holding either a T or a Error.
Definition: Error.h:481
Error takeError()
Take ownership of the stored error.
Definition: Error.h:608
reference get()
Returns a reference to the stored T value.
Definition: Error.h:578
StringRef - Represent a constant reference to a string, i.e.
Definition: StringRef.h:51
constexpr bool empty() const
empty - Check if the string is empty.
Definition: StringRef.h:147
std::pair< typename Base::iterator, bool > insert(StringRef key)
Definition: StringSet.h:38
Utility for building string tables with deduplicated suffixes.
void finalizeInOrder()
Finalize the string table without reording it.
bool contains(StringRef S) const
Check if a string is contained in the string table.
void write(raw_ostream &OS) const
size_t add(CachedHashStringRef S)
Add a string to the builder.
llvm::Error loadYAML(StringRef YAMLFile)
This method reads the specified YAML file, parses its content, and updates the Funcs vector with call...
A simplified binary data writer class that doesn't require targets, target definitions,...
Definition: FileWriter.h:29
GsymCreator is used to emit GSYM data to a stand alone file or section within a file.
Definition: GsymCreator.h:134
void addFunctionInfo(FunctionInfo &&FI)
Add a function info to this GSYM creator.
uint32_t insertString(StringRef S, bool Copy=true)
Insert a string into the GSYM string table.
llvm::Expected< std::unique_ptr< GsymCreator > > createSegment(uint64_t SegmentSize, size_t &FuncIdx) const
Create a segmented GSYM creator starting with function info index FuncIdx.
llvm::Error save(StringRef Path, llvm::endianness ByteOrder, std::optional< uint64_t > SegmentSize=std::nullopt) const
Save a GSYM file to a stand alone file.
Definition: GsymCreator.cpp:68
void prepareMergedFunctions(OutputAggregator &Out)
Organize merged FunctionInfo's.
StringRef getString(uint32_t Offset)
Retrieve a string from the GSYM string table given its offset.
llvm::Error loadCallSitesFromYAML(StringRef YAMLFile)
Load call site information from a YAML file.
llvm::Error encode(FileWriter &O) const
Encode a GSYM into the file writer stream at the current position.
Definition: GsymCreator.cpp:80
llvm::Error finalize(OutputAggregator &OS)
Finalize the data in the GSYM creator prior to saving the data out.
uint32_t insertFile(StringRef Path, sys::path::Style Style=sys::path::Style::native)
Insert a file into this GSYM creator.
Definition: GsymCreator.cpp:29
size_t getNumFunctionInfos() const
Get the current number of FunctionInfo objects contained in this object.
bool IsValidTextAddress(uint64_t Addr) const
Check if an address is a valid code address.
void forEachFunctionInfo(std::function< bool(FunctionInfo &)> const &Callback)
Thread safe iteration over all function infos.
GsymCreator(bool Quiet=false)
Definition: GsymCreator.cpp:24
LineTable class contains deserialized versions of line tables for each function's address ranges.
Definition: LineTable.h:118
size_t size() const
Definition: LineTable.h:193
LineEntry & get(size_t i)
Definition: LineTable.h:196
void Report(StringRef s, std::function< void(raw_ostream &o)> detailCallback)
A raw_ostream that writes to a file descriptor.
Definition: raw_ostream.h:460
This class implements an extremely fast bulk output stream that can only output to a stream.
Definition: raw_ostream.h:52
A raw_ostream that writes to an std::string.
Definition: raw_ostream.h:661
#define UINT64_MAX
Definition: DataTypes.h:77
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
constexpr uint32_t GSYM_MAGIC
Definition: Header.h:24
constexpr uint32_t GSYM_VERSION
Definition: Header.h:26
StringRef parent_path(StringRef path LLVM_LIFETIME_BOUND, Style style=Style::native)
Get parent path.
Definition: Path.cpp:467
StringRef filename(StringRef path LLVM_LIFETIME_BOUND, Style style=Style::native)
Get filename.
Definition: Path.cpp:577
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18
@ Offset
Definition: DWP.cpp:480
void stable_sort(R &&Range)
Definition: STLExtras.h:2037
Error createStringError(std::error_code EC, char const *Fmt, const Ts &... Vals)
Create formatted StringError object.
Definition: Error.h:1291
FormattedNumber format_hex(uint64_t N, unsigned Width, bool Upper=false)
format_hex - Output N as a fixed width hexadecimal.
Definition: Format.h:187
uint64_t alignTo(uint64_t Size, Align A)
Returns a multiple of A needed to store Size bytes.
Definition: Alignment.h:155
Error errorCodeToError(std::error_code EC)
Helper for converting an std::error_code to a Error.
Definition: Error.cpp:111
endianness
Definition: bit.h:70
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
Definition: BitVector.h:860
Files in GSYM are contained in FileEntry structs where we split the directory and basename into two d...
Definition: FileEntry.h:24
uint32_t Dir
Offsets in the string table.
Definition: FileEntry.h:28
Function information in GSYM files encodes information for one contiguous address range.
Definition: FunctionInfo.h:92
std::optional< InlineInfo > Inline
Definition: FunctionInfo.h:96
std::optional< MergedFunctionsInfo > MergedFunctions
Definition: FunctionInfo.h:97
bool hasRichInfo() const
Query if a FunctionInfo has rich debug info.
Definition: FunctionInfo.h:114
uint32_t Name
String table offset in the string table.
Definition: FunctionInfo.h:94
std::optional< LineTable > OptLineTable
Definition: FunctionInfo.h:95
The GSYM header.
Definition: Header.h:45
uint16_t Version
The version can number determines how the header is decoded and how each InfoType in FunctionInfo is ...
Definition: Header.h:54
uint8_t AddrOffSize
The size in bytes of each address offset in the address offsets table.
Definition: Header.h:56
uint32_t Magic
The magic bytes should be set to GSYM_MAGIC.
Definition: Header.h:49
llvm::Error encode(FileWriter &O) const
Encode this object into FileWriter stream.
Definition: Header.cpp:85
uint32_t StrtabOffset
The file relative offset of the start of the string table for strings contained in the GSYM file.
Definition: Header.h:72
uint8_t UUID[GSYM_MAX_UUID_SIZE]
The UUID of the original executable file.
Definition: Header.h:86
uint32_t StrtabSize
The size in bytes of the string table.
Definition: Header.h:80
uint8_t UUIDSize
The size in bytes of the UUID encoded in the "UUID" member.
Definition: Header.h:58
uint32_t NumAddresses
The number of addresses stored in the address offsets table.
Definition: Header.h:64
uint64_t BaseAddress
The 64 bit base address that all address offsets in the address offsets table are relative to.
Definition: Header.h:62
Inline information stores the name of the inline function along with an array of address ranges.
Definition: InlineInfo.h:59
Line entries are used to encode the line tables in FunctionInfo objects.
Definition: LineEntry.h:22