LLVM 20.0.0git
LVBinaryReader.h
Go to the documentation of this file.
1//===-- LVBinaryReader.h ----------------------------------------*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file defines the LVBinaryReader class, which is used to describe a
10// binary reader.
11//
12//===----------------------------------------------------------------------===//
13
14#ifndef LLVM_DEBUGINFO_LOGICALVIEW_READERS_LVBINARYREADER_H
15#define LLVM_DEBUGINFO_LOGICALVIEW_READERS_LVBINARYREADER_H
16
18#include "llvm/MC/MCAsmInfo.h"
19#include "llvm/MC/MCContext.h"
22#include "llvm/MC/MCInstrInfo.h"
27#include "llvm/Object/COFF.h"
29
30namespace llvm {
31namespace logicalview {
32
33constexpr bool UpdateHighAddress = false;
34
35// Logical scope, Section address, Section index, IsComdat.
36struct LVSymbolTableEntry final {
37 LVScope *Scope = nullptr;
40 bool IsComdat = false;
41 LVSymbolTableEntry() = default;
46};
47
48// Function names extracted from the object symbol table.
49class LVSymbolTable final {
50 using LVSymbolNames = std::map<std::string, LVSymbolTableEntry, std::less<>>;
51 LVSymbolNames SymbolNames;
52
53public:
54 LVSymbolTable() = default;
55
56 void add(StringRef Name, LVScope *Function, LVSectionIndex SectionIndex = 0);
58 bool IsComdat);
60
65
66 void print(raw_ostream &OS);
67};
68
69class LVBinaryReader : public LVReader {
70 // Function names extracted from the object symbol table.
71 LVSymbolTable SymbolTable;
72
73 // It contains the LVLineDebug elements representing the inlined logical
74 // lines for the current compile unit, created by parsing the CodeView
75 // S_INLINESITE symbol annotation data.
76 using LVInlineeLine = std::map<LVScope *, std::unique_ptr<LVLines>>;
77 LVInlineeLine CUInlineeLines;
78
79 // Instruction lines for a logical scope. These instructions are fetched
80 // during its merge with the debug lines.
82
83 // Links the scope with its first assembler address line.
85
86 // Mapping from virtual address to section.
87 // The virtual address refers to the address where the section is loaded.
88 using LVSectionAddresses = std::map<LVSectionIndex, object::SectionRef>;
89 LVSectionAddresses SectionAddresses;
90
91 void addSectionAddress(const object::SectionRef &Section) {
92 if (SectionAddresses.find(Section.getAddress()) == SectionAddresses.end())
93 SectionAddresses.emplace(Section.getAddress(), Section);
94 }
95
96 // Scopes with ranges for current compile unit. It is used to find a line
97 // giving its exact or closest address. To support comdat functions, all
98 // addresses for the same section are recorded in the same map.
99 using LVSectionRanges = std::map<LVSectionIndex, std::unique_ptr<LVRange>>;
100 LVSectionRanges SectionRanges;
101
102 // Image base and virtual address for Executable file.
103 uint64_t ImageBaseAddress = 0;
104 uint64_t VirtualAddress = 0;
105
106 // Object sections with machine code.
107 using LVSections = std::map<LVSectionIndex, object::SectionRef>;
108 LVSections Sections;
109
110 std::vector<std::unique_ptr<LVLines>> DiscoveredLines;
111
112protected:
113 // It contains the LVLineDebug elements representing the logical lines for
114 // the current compile unit, created by parsing the debug line section.
116
117 std::unique_ptr<const MCRegisterInfo> MRI;
118 std::unique_ptr<const MCAsmInfo> MAI;
119 std::unique_ptr<const MCSubtargetInfo> STI;
120 std::unique_ptr<const MCInstrInfo> MII;
121 std::unique_ptr<const MCDisassembler> MD;
122 std::unique_ptr<MCContext> MC;
123 std::unique_ptr<MCInstPrinter> MIP;
124
125 // https://yurydelendik.github.io/webassembly-dwarf/
126 // 2. Consuming and Generating DWARF for WebAssembly Code
127 // Note: Some DWARF constructs don't map one-to-one onto WebAssembly
128 // constructs. We strive to enumerate and resolve any ambiguities here.
129 //
130 // 2.1. Code Addresses
131 // Note: DWARF associates various bits of debug info
132 // with particular locations in the program via its code address (instruction
133 // pointer or PC). However, WebAssembly's linear memory address space does not
134 // contain WebAssembly instructions.
135 //
136 // Wherever a code address (see 2.17 of [DWARF]) is used in DWARF for
137 // WebAssembly, it must be the offset of an instruction relative within the
138 // Code section of the WebAssembly file. The DWARF is considered malformed if
139 // a PC offset is between instruction boundaries within the Code section.
140 //
141 // Note: It is expected that a DWARF consumer does not know how to decode
142 // WebAssembly instructions. The instruction pointer is selected as the offset
143 // in the binary file of the first byte of the instruction, and it is
144 // consistent with the WebAssembly Web API conventions definition of the code
145 // location.
146 //
147 // EXAMPLE: .DEBUG_LINE INSTRUCTION POINTERS
148 // The .debug_line DWARF section maps instruction pointers to source
149 // locations. With WebAssembly, the .debug_line section maps Code
150 // section-relative instruction offsets to source locations.
151 //
152 // EXAMPLE: DW_AT_* ATTRIBUTES
153 // For entities with a single associated code address, DWARF uses
154 // the DW_AT_low_pc attribute to specify the associated code address value.
155 // For WebAssembly, the DW_AT_low_pc's value is a Code section-relative
156 // instruction offset.
157 //
158 // For entities with a single contiguous range of code, DWARF uses a
159 // pair of DW_AT_low_pc and DW_AT_high_pc attributes to specify the associated
160 // contiguous range of code address values. For WebAssembly, these attributes
161 // are Code section-relative instruction offsets.
162 //
163 // For entities with multiple ranges of code, DWARF uses the DW_AT_ranges
164 // attribute, which refers to the array located at the .debug_ranges section.
166
167 // Loads all info for the architecture of the provided object file.
168 Error loadGenericTargetInfo(StringRef TheTriple, StringRef TheFeatures);
169
170 virtual void mapRangeAddress(const object::ObjectFile &Obj) {}
171 virtual void mapRangeAddress(const object::ObjectFile &Obj,
172 const object::SectionRef &Section,
173 bool IsComdat) {}
174
175 // Create a mapping from virtual address to section.
176 void mapVirtualAddress(const object::ObjectFile &Obj);
177 void mapVirtualAddress(const object::COFFObjectFile &COFFObj);
178
180 getSection(LVScope *Scope, LVAddress Address, LVSectionIndex SectionIndex);
181
182 void addSectionRange(LVSectionIndex SectionIndex, LVScope *Scope);
183 void addSectionRange(LVSectionIndex SectionIndex, LVScope *Scope,
184 LVAddress LowerAddress, LVAddress UpperAddress);
186
188
192 const LVNameInfo &NameInfo);
193
194 void processLines(LVLines *DebugLines, LVSectionIndex SectionIndex);
195 void processLines(LVLines *DebugLines, LVSectionIndex SectionIndex,
197
198public:
199 LVBinaryReader() = delete;
201 LVBinaryType BinaryType)
202 : LVReader(Filename, FileFormatName, W, BinaryType) {}
205 virtual ~LVBinaryReader() = default;
206
207 void addInlineeLines(LVScope *Scope, LVLines &Lines) {
208 CUInlineeLines.emplace(Scope, std::make_unique<LVLines>(std::move(Lines)));
209 }
210
211 // Convert Segment::Offset pair to absolute address.
213 LVAddress Addendum = 0) {
214 return ImageBaseAddress + (Segment * VirtualAddress) + Offset + Addendum;
215 }
216
218 LVSectionIndex SectionIndex = 0);
220 LVSectionIndex SectionIndex, bool IsComdat);
222
227
229 return Scope ? getSymbolTableIndex(Scope->getLinkageName())
231 }
232
233 void print(raw_ostream &OS) const;
234
235#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
236 void dump() const { print(dbgs()); }
237#endif
238};
239
240} // end namespace logicalview
241} // end namespace llvm
242
243#endif // LLVM_DEBUGINFO_LOGICALVIEW_READERS_LVBINARYREADER_H
raw_pwrite_stream & OS
Lightweight error class with error context and mandatory checking.
Definition: Error.h:160
Tagged union holding either a T or a Error.
Definition: Error.h:481
StringRef - Represent a constant reference to a string, i.e.
Definition: StringRef.h:51
const LVSymbolTableEntry & getSymbolTableEntry(StringRef Name)
LVSectionIndex updateSymbolTable(LVScope *Function)
Expected< std::pair< LVSectionIndex, object::SectionRef > > getSection(LVScope *Scope, LVAddress Address, LVSectionIndex SectionIndex)
LVSectionIndex getSectionIndex(LVScope *Scope) override
std::unique_ptr< MCContext > MC
void includeInlineeLines(LVSectionIndex SectionIndex, LVScope *Function)
std::unique_ptr< const MCInstrInfo > MII
void addInlineeLines(LVScope *Scope, LVLines &Lines)
LVBinaryReader(const LVBinaryReader &)=delete
LVAddress getSymbolTableAddress(StringRef Name)
void print(raw_ostream &OS) const
std::unique_ptr< const MCSubtargetInfo > STI
LVAddress linearAddress(uint16_t Segment, uint32_t Offset, LVAddress Addendum=0)
void addToSymbolTable(StringRef Name, LVScope *Function, LVSectionIndex SectionIndex=0)
virtual void mapRangeAddress(const object::ObjectFile &Obj)
void processLines(LVLines *DebugLines, LVSectionIndex SectionIndex)
void mapVirtualAddress(const object::ObjectFile &Obj)
std::unique_ptr< const MCAsmInfo > MAI
LVSectionIndex getSymbolTableIndex(StringRef Name)
LVBinaryReader & operator=(const LVBinaryReader &)=delete
virtual void mapRangeAddress(const object::ObjectFile &Obj, const object::SectionRef &Section, bool IsComdat)
bool getSymbolTableIsComdat(StringRef Name)
std::unique_ptr< const MCRegisterInfo > MRI
LVBinaryReader(StringRef Filename, StringRef FileFormatName, ScopedPrinter &W, LVBinaryType BinaryType)
std::unique_ptr< const MCDisassembler > MD
LVRange * getSectionRanges(LVSectionIndex SectionIndex)
Error loadGenericTargetInfo(StringRef TheTriple, StringRef TheFeatures)
void addSectionRange(LVSectionIndex SectionIndex, LVScope *Scope)
std::unique_ptr< MCInstPrinter > MIP
The logical reader owns of all the logical elements created during the debug information parsing.
Definition: LVReader.h:60
std::string FileFormatName
Definition: LVReader.h:127
LVSectionIndex DotTextSectionIndex
Definition: LVReader.h:133
LVSectionIndex getIndex(StringRef Name)
LVAddress getAddress(StringRef Name)
void add(StringRef Name, LVScope *Function, LVSectionIndex SectionIndex=0)
LVSectionIndex update(LVScope *Function)
const LVSymbolTableEntry & getEntry(StringRef Name)
This class is the base class for all object file types.
Definition: ObjectFile.h:229
This is a value type class that represents a single section in the list of sections in the object fil...
Definition: ObjectFile.h:81
This class implements an extremely fast bulk output stream that can only output to a stream.
Definition: raw_ostream.h:52
std::pair< LVAddress, uint64_t > LVNameInfo
Definition: LVScope.h:29
constexpr bool UpdateHighAddress
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18
raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition: Debug.cpp:163
LVSymbolTableEntry(LVScope *Scope, LVAddress Address, LVSectionIndex SectionIndex, bool IsComdat)