docs/doxygen/DWARFGdbIndex_8cpp_source.html

//===- DWARFGdbIndex.cpp --------------------------------------------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//


#include "llvm/DebugInfo/DWARF/DWARFGdbIndex.h"

#include "llvm/ADT/SmallVector.h"

#include "llvm/ADT/StringRef.h"

#include "llvm/Support/DataExtractor.h"

#include "llvm/Support/Format.h"

#include "llvm/Support/FormatVariadic.h"

#include "llvm/Support/raw_ostream.h"

#include <cassert>

#include <cinttypes>

#include <cstdint>

#include <set>


using namespace llvm;


// .gdb_index section format reference:

// https://sourceware.org/gdb/onlinedocs/gdb/Index-Section-Format.html


// Prints the CU list: a header line with the list's section offset and entry
// count, followed by one line per entry giving its index, Offset and Length.
void DWARFGdbIndex::dumpCUList(raw_ostream &OS) const {
  // The entry count is unsigned, so it is printed with PRIu64.
  OS << format("\n  CU list offset = 0x%x, has %" PRIu64 " entries:",
               CuListOffset, static_cast<uint64_t>(CuList.size()))
     << '\n';
  uint32_t I = 0;
  // Offset and Length are 64-bit values; PRIx64 selects the correct length
  // modifier regardless of whether uint64_t is 'unsigned long' or
  // 'unsigned long long' on the host.
  for (const CompUnitEntry &CU : CuList)
    OS << format("    %u: Offset = 0x%" PRIx64 ", Length = 0x%" PRIx64 "\n",
                 I++, CU.Offset, CU.Length);
}


// Prints the types CU list: a header line with the list's section offset and
// entry count, then one line per entry with its index, offset, type offset
// and type signature.
void DWARFGdbIndex::dumpTUList(raw_ostream &OS) const {
  OS << formatv("\n  Types CU list offset = {0:x}, has {1} entries:\n",
                TuListOffset, TuList.size());

  for (size_t Idx = 0, NumEntries = TuList.size(); Idx != NumEntries; ++Idx) {
    const TypeUnitEntry &Entry = TuList[Idx];
    OS << formatv("    {0}: offset = {1:x8}, type_offset = {2:x8}, "
                  "type_signature = {3:x16}\n",
                  Idx, Entry.Offset, Entry.TypeOffset, Entry.TypeSignature);
  }
}


// Prints the address area: a header line with the area's section offset and
// entry count, then one line per entry with its [low, high) address range,
// the size of that range, and the index of the CU it belongs to.
void DWARFGdbIndex::dumpAddressArea(raw_ostream &OS) const {
  // The entry count is unsigned, so it is printed with PRIu64.
  OS << format("\n  Address area offset = 0x%x, has %" PRIu64 " entries:",
               AddressAreaOffset, static_cast<uint64_t>(AddressArea.size()))
     << '\n';
  // Addresses are 64-bit (PRIx64) and the CU index is an unsigned 32-bit
  // value (%u); the specifiers must match the argument types exactly because
  // format() forwards them to a printf-style formatter.
  for (const AddressEntry &Addr : AddressArea)
    OS << format("    Low/High address = [0x%" PRIx64 ", 0x%" PRIx64
                 ") (Size: 0x%" PRIx64 "), CU id = %u\n",
                 Addr.LowAddress, Addr.HighAddress,
                 Addr.HighAddress - Addr.LowAddress, Addr.CuIndex);
}


// Prints the symbol hash table: a header line with the table's section offset
// and slot count, then, for every non-empty slot, its slot number, raw name
// and CU vector offsets, the symbol name, and the index of its CU vector
// within ConstantPoolVectors.
void DWARFGdbIndex::dumpSymbolTable(raw_ostream &OS) const {
  OS << format("\n  Symbol table offset = 0x%x, size = %" PRIu64
               ", filled slots:",
               SymbolTableOffset, static_cast<uint64_t>(SymbolTable.size()))
     << '\n';

  const auto FindCuVectorId = [&](uint32_t VecOffset) {
    // Entries in ConstantPoolVectors are sorted by their offset in constant
    // pool, see how ConstantPoolVectors is populated in parseImpl.
    const auto *It =
        llvm::lower_bound(ConstantPoolVectors, VecOffset,
                          [](const auto &ConstantPoolEntry, uint32_t Offset) {
                            return ConstantPoolEntry.first < Offset;
                          });
    assert(It != ConstantPoolVectors.end() && It->first == VecOffset &&
           "Invalid symbol table");
    return It - ConstantPoolVectors.begin();
  };

  uint32_t NextSlot = 0;
  for (const SymTableEntry &E : SymbolTable) {
    // Slot numbers count every slot, including the empty ones that are
    // skipped below.
    const uint32_t Slot = NextSlot++;
    if (!E.NameOffset && !E.VecOffset)
      continue;

    OS << format("    %u: Name offset = 0x%x, CU vector offset = 0x%x\n", Slot,
                 E.NameOffset, E.VecOffset);

    // NameOffset is relative to the start of the constant pool, whereas
    // ConstantPoolStrings starts at StringPoolOffset, so rebase the offset
    // before indexing into the string data.
    StringRef Name = ConstantPoolStrings.substr(
        ConstantPoolOffset - StringPoolOffset + E.NameOffset);
    // Cut the name at its NUL terminator. If the section is malformed and no
    // terminator exists, the name simply runs to the end of the string data
    // instead of being read past it, which a "%s" on Name.data() would do.
    Name = Name.substr(0, Name.find('\0'));

    const uint32_t CuVectorId = FindCuVectorId(E.VecOffset);
    OS << "      String name: " << Name
       << format(", CU vector index: %u\n", CuVectorId);
  }
}


// Prints the CU vectors of the constant pool: a header with the pool's section
// offset and the number of vectors, then one line per vector showing its
// index, its offset within the constant pool, and its values in hex.
void DWARFGdbIndex::dumpConstantPool(raw_ostream &OS) const {
  // The vector count is unsigned, so it is printed with PRIu64.
  OS << format("\n  Constant pool offset = 0x%x, has %" PRIu64 " CU vectors:",
               ConstantPoolOffset,
               static_cast<uint64_t>(ConstantPoolVectors.size()));
  uint32_t I = 0;
  for (const auto &V : ConstantPoolVectors) {
    // Each vector starts on a fresh line; the index is unsigned (%u).
    OS << format("\n    %u(0x%x): ", I++, V.first);
    for (uint32_t Val : V.second)
      OS << format("0x%x ", Val);
  }
  OS << '\n';
}


// Writes a textual dump of the parsed index to OS. A failed parse prints only
// an error marker; an index with no content prints nothing.
void DWARFGdbIndex::dump(raw_ostream &OS) {
  if (HasError) {
    OS << "\n<error parsing>\n";
    return;
  }

  // Nothing was parsed, so there is nothing to show.
  if (!HasContent)
    return;

  OS << "  Version = " << Version << '\n';
  dumpCUList(OS);
  dumpTUList(OS);
  dumpAddressArea(OS);
  dumpSymbolTable(OS);
  dumpConstantPool(OS);
}


// Parses a .gdb_index section from Data into this object's tables (CU list,
// types CU list, address area, symbol table, constant pool CU vectors and the
// string data that follows them).
//
// Returns true on success. Returns false if the version is unsupported, if the
// header offsets are inconsistent (the CU list does not start right after the
// header, the areas are out of order, or they extend past the end of the
// data), or if a CU vector referenced by the symbol table does not fit in the
// data. On failure the tables may be partially populated.
bool DWARFGdbIndex::parseImpl(DataExtractor Data) {
  uint64_t Offset = 0;

  // Only version 7 and 8 are supported at this moment.
  Version = Data.getU32(&Offset);
  if (Version != 7 && Version != 8)
    return false;

  CuListOffset = Data.getU32(&Offset);
  TuListOffset = Data.getU32(&Offset);
  AddressAreaOffset = Data.getU32(&Offset);
  SymbolTableOffset = Data.getU32(&Offset);
  ConstantPoolOffset = Data.getU32(&Offset);

  if (Offset != CuListOffset)
    return false;

  // The areas must appear in order and lie within the data. Without this
  // check the unsigned subtractions below wrap around on a malformed header
  // and yield enormous entry counts.
  const uint64_t DataSize = Data.getData().size();
  if (CuListOffset > TuListOffset || TuListOffset > AddressAreaOffset ||
      AddressAreaOffset > SymbolTableOffset ||
      SymbolTableOffset > ConstantPoolOffset || ConstantPoolOffset > DataSize)
    return false;

  // Each CU list entry is a pair of 64-bit values: offset and length.
  const uint32_t CuListSize = (TuListOffset - CuListOffset) / 16;
  CuList.reserve(CuListSize);
  for (uint32_t I = 0; I < CuListSize; ++I) {
    uint64_t CuOffset = Data.getU64(&Offset);
    uint64_t CuLength = Data.getU64(&Offset);
    CuList.push_back({CuOffset, CuLength});
  }

  // CU Types are no longer needed as DWARF skeleton type units never made it
  // into the standard.
  // Each entry is three 64-bit values: CU offset, type offset and signature.
  const uint32_t TuListSize = (AddressAreaOffset - TuListOffset) / 24;
  TuList.resize(TuListSize);
  for (uint32_t I = 0; I < TuListSize; ++I) {
    uint64_t CuOffset = Data.getU64(&Offset);
    uint64_t TypeOffset = Data.getU64(&Offset);
    uint64_t Signature = Data.getU64(&Offset);
    TuList[I] = {CuOffset, TypeOffset, Signature};
  }

  // Each address area entry is two 64-bit addresses followed by a 32-bit CU
  // index.
  const uint32_t AddressAreaSize = (SymbolTableOffset - AddressAreaOffset) / 20;
  AddressArea.reserve(AddressAreaSize);
  for (uint32_t I = 0; I < AddressAreaSize; ++I) {
    uint64_t LowAddress = Data.getU64(&Offset);
    uint64_t HighAddress = Data.getU64(&Offset);
    uint32_t CuIndex = Data.getU32(&Offset);
    AddressArea.push_back({LowAddress, HighAddress, CuIndex});
  }

  // The symbol table. This is an open addressed hash table. The size of the
  // hash table is always a power of 2.
  // Each slot in the hash table consists of a pair of offset_type values. The
  // first value is the offset of the symbol's name in the constant pool. The
  // second value is the offset of the CU vector in the constant pool.
  // If both values are 0, then this slot in the hash table is empty. This is ok
  // because while 0 is a valid constant pool index, it cannot be a valid index
  // for both a string and a CU vector.
  const uint32_t SymTableSize = (ConstantPoolOffset - SymbolTableOffset) / 8;
  SymbolTable.reserve(SymTableSize);
  // Distinct CU vector offsets referenced by non-empty slots. std::set keeps
  // them in ascending order, so ConstantPoolVectors ends up sorted by offset,
  // which the lookup in dumpSymbolTable relies on.
  std::set<uint32_t> CUOffsets;
  for (uint32_t I = 0; I < SymTableSize; ++I) {
    uint32_t NameOffset = Data.getU32(&Offset);
    uint32_t CuVecOffset = Data.getU32(&Offset);
    SymbolTable.push_back({NameOffset, CuVecOffset});
    if (NameOffset || CuVecOffset)
      CUOffsets.insert(CuVecOffset);
  }

  // The constant pool. CU vectors are stored first, followed by strings.
  // The first value is the number of CU indices in the vector. Each subsequent
  // value is the index and symbol attributes of a CU in the CU list.
  for (uint32_t CUOffset : CUOffsets) {
    // Compute the absolute position in 64 bits so that a bogus offset cannot
    // wrap around and alias earlier data.
    Offset = static_cast<uint64_t>(ConstantPoolOffset) + CUOffset;

    // The element count itself must be readable.
    if (Offset > DataSize || DataSize - Offset < sizeof(uint32_t))
      return false;
    const uint32_t Num = Data.getU32(&Offset);

    // All Num elements must fit in the remaining data; otherwise a corrupt
    // count would make the loop below push up to 2^32 zero values.
    if ((DataSize - Offset) / sizeof(uint32_t) < Num)
      return false;

    ConstantPoolVectors.emplace_back(CUOffset, SmallVector<uint32_t, 0>());
    auto &Vec = ConstantPoolVectors.back();
    Vec.second.reserve(Num);
    for (uint32_t J = 0; J < Num; ++J)
      Vec.second.push_back(Data.getU32(&Offset));
  }

  // Everything after the last CU vector read is treated as string data. The
  // checks above guarantee Offset does not exceed the data size here.
  ConstantPoolStrings = Data.getData().drop_front(Offset);
  StringPoolOffset = Offset;
  return true;
}


// Entry point for parsing: records whether the section has any content and,
// if it does, whether parsing that content failed. An empty section is not an
// error and is never handed to parseImpl.
void DWARFGdbIndex::parse(DataExtractor Data) {
  const bool IsEmpty = Data.getData().empty();
  HasContent = !IsEmpty;
  HasError = !IsEmpty && !parseImpl(Data);
}


assert
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")

E
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")

DWARFGdbIndex.h

DataExtractor.h

FormatVariadic.h

Format.h

I
#define I(x, y, z)
Definition MD5.cpp:57

SmallVector.h
This file defines the SmallVector class.

StringRef.h

llvm::DWARFGdbIndex::dump
void dump(raw_ostream &OS)
Definition DWARFGdbIndex.cpp:106

llvm::DWARFGdbIndex::HasError
bool HasError
Definition DWARFGdbIndex.h:77

llvm::DWARFGdbIndex::HasContent
bool HasContent
Definition DWARFGdbIndex.h:76

llvm::DWARFGdbIndex::parse
void parse(DataExtractor Data)
Definition DWARFGdbIndex.cpp:205

llvm::DataExtractor
Definition DataExtractor.h:38

llvm::SmallVectorImpl::reserve
void reserve(size_type N)
Definition SmallVector.h:666

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition SmallVector.h:419

llvm::raw_ostream
This class implements an extremely fast bulk output stream that can only output to a stream.
Definition raw_ostream.h:53

uint32_t

uint64_t

llvm::GraphProgram::Name
Name
Definition GraphWriter.h:51

llvm::M68k::MemAddrModeKind::V
@ V
Definition M68kBaseInfo.h:63

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition Types.h:26

llvm::Offset
@ Offset
Definition DWP.cpp:532

llvm::formatv
auto formatv(bool Validate, const char *Fmt, Ts &&...Vals)
Definition FormatVariadic.h:249

llvm::Version
FunctionAddr VTableAddr uintptr_t uintptr_t Version
Definition InstrProf.h:302

llvm::format
format_object< Ts... > format(const char *Fmt, const Ts &... Vals)
These are helper functions used to produce formatted output.
Definition Format.h:129

llvm::Data
FunctionAddr VTableAddr uintptr_t uintptr_t Data
Definition InstrProf.h:189

llvm::lower_bound
auto lower_bound(R &&Range, T &&Value)
Provide wrappers to std::lower_bound which take ranges instead of having to pass begin/end explicitly...
Definition STLExtras.h:2042

raw_ostream.h