LLVM  6.0.0svn
DWARFDebugLine.cpp
Go to the documentation of this file.
1 //===- DWARFDebugLine.cpp -------------------------------------------------===//
2 //
3 // The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 
11 #include "llvm/ADT/SmallString.h"
12 #include "llvm/ADT/SmallVector.h"
13 #include "llvm/ADT/StringRef.h"
18 #include "llvm/Support/Format.h"
19 #include "llvm/Support/Path.h"
21 #include <algorithm>
22 #include <cassert>
23 #include <cinttypes>
24 #include <cstdint>
25 #include <cstdio>
26 #include <utility>
27 
28 using namespace llvm;
29 using namespace dwarf;
30 
32 
33 namespace {
34 
35 struct ContentDescriptor {
38 };
39 
40 using ContentDescriptors = SmallVector<ContentDescriptor, 4>;
41 
42 } // end anonymous namespace
43 
45 
47  TotalLength = PrologueLength = 0;
48  SegSelectorSize = 0;
49  MinInstLength = MaxOpsPerInst = DefaultIsStmt = LineBase = LineRange = 0;
50  OpcodeBase = 0;
51  FormParams = DWARFFormParams({0, 0, DWARF32});
52  StandardOpcodeLengths.clear();
53  IncludeDirectories.clear();
54  FileNames.clear();
55 }
56 
58  OS << "Line table prologue:\n"
59  << format(" total_length: 0x%8.8" PRIx64 "\n", TotalLength)
60  << format(" version: %u\n", getVersion());
61  if (getVersion() >= 5)
62  OS << format(" address_size: %u\n", getAddressSize())
63  << format(" seg_select_size: %u\n", SegSelectorSize);
64  OS << format(" prologue_length: 0x%8.8" PRIx64 "\n", PrologueLength)
65  << format(" min_inst_length: %u\n", MinInstLength)
66  << format(getVersion() >= 4 ? "max_ops_per_inst: %u\n" : "", MaxOpsPerInst)
67  << format(" default_is_stmt: %u\n", DefaultIsStmt)
68  << format(" line_base: %i\n", LineBase)
69  << format(" line_range: %u\n", LineRange)
70  << format(" opcode_base: %u\n", OpcodeBase);
71 
72  for (uint32_t I = 0; I != StandardOpcodeLengths.size(); ++I)
73  OS << format("standard_opcode_lengths[%s] = %u\n",
74  LNStandardString(I + 1).data(), StandardOpcodeLengths[I]);
75 
76  if (!IncludeDirectories.empty())
77  for (uint32_t I = 0; I != IncludeDirectories.size(); ++I)
78  OS << format("include_directories[%3u] = '", I + 1)
79  << IncludeDirectories[I] << "'\n";
80 
81  if (!FileNames.empty()) {
82  OS << " Dir Mod Time File Len File Name\n"
83  << " ---- ---------- ---------- -----------"
84  "----------------\n";
85  for (uint32_t I = 0; I != FileNames.size(); ++I) {
86  const FileNameEntry &FileEntry = FileNames[I];
87  OS << format("file_names[%3u] %4" PRIu64 " ", I + 1, FileEntry.DirIdx)
88  << format("0x%8.8" PRIx64 " 0x%8.8" PRIx64 " ", FileEntry.ModTime,
89  FileEntry.Length)
90  << FileEntry.Name << '\n';
91  }
92  }
93 }
94 
95 // Parse v2-v4 directory and file tables.
96 static void
98  uint32_t *OffsetPtr, uint64_t EndPrologueOffset,
99  std::vector<StringRef> &IncludeDirectories,
100  std::vector<DWARFDebugLine::FileNameEntry> &FileNames) {
101  while (*OffsetPtr < EndPrologueOffset) {
102  StringRef S = DebugLineData.getCStrRef(OffsetPtr);
103  if (S.empty())
104  break;
105  IncludeDirectories.push_back(S);
106  }
107 
108  while (*OffsetPtr < EndPrologueOffset) {
109  StringRef Name = DebugLineData.getCStrRef(OffsetPtr);
110  if (Name.empty())
111  break;
113  FileEntry.Name = Name;
114  FileEntry.DirIdx = DebugLineData.getULEB128(OffsetPtr);
115  FileEntry.ModTime = DebugLineData.getULEB128(OffsetPtr);
116  FileEntry.Length = DebugLineData.getULEB128(OffsetPtr);
117  FileNames.push_back(FileEntry);
118  }
119 }
120 
121 // Parse v5 directory/file entry content descriptions.
122 // Returns the descriptors, or an empty vector if we did not find a path or
123 // ran off the end of the prologue.
124 static ContentDescriptors
125 parseV5EntryFormat(const DWARFDataExtractor &DebugLineData, uint32_t *OffsetPtr,
126  uint64_t EndPrologueOffset) {
127  ContentDescriptors Descriptors;
128  int FormatCount = DebugLineData.getU8(OffsetPtr);
129  bool HasPath = false;
130  for (int I = 0; I != FormatCount; ++I) {
131  if (*OffsetPtr >= EndPrologueOffset)
132  return ContentDescriptors();
133  ContentDescriptor Descriptor;
134  Descriptor.Type =
135  dwarf::LineNumberEntryFormat(DebugLineData.getULEB128(OffsetPtr));
136  Descriptor.Form = dwarf::Form(DebugLineData.getULEB128(OffsetPtr));
137  if (Descriptor.Type == dwarf::DW_LNCT_path)
138  HasPath = true;
139  Descriptors.push_back(Descriptor);
140  }
141  return HasPath ? Descriptors : ContentDescriptors();
142 }
143 
144 static bool
146  uint32_t *OffsetPtr, uint64_t EndPrologueOffset,
147  const DWARFFormParams &FormParams,
148  std::vector<StringRef> &IncludeDirectories,
149  std::vector<DWARFDebugLine::FileNameEntry> &FileNames) {
150  // Get the directory entry description.
151  ContentDescriptors DirDescriptors =
152  parseV5EntryFormat(DebugLineData, OffsetPtr, EndPrologueOffset);
153  if (DirDescriptors.empty())
154  return false;
155 
156  // Get the directory entries, according to the format described above.
157  int DirEntryCount = DebugLineData.getU8(OffsetPtr);
158  for (int I = 0; I != DirEntryCount; ++I) {
159  if (*OffsetPtr >= EndPrologueOffset)
160  return false;
161  for (auto Descriptor : DirDescriptors) {
162  DWARFFormValue Value(Descriptor.Form);
163  switch (Descriptor.Type) {
164  case DW_LNCT_path:
165  if (!Value.extractValue(DebugLineData, OffsetPtr, nullptr))
166  return false;
167  IncludeDirectories.push_back(Value.getAsCString().getValue());
168  break;
169  default:
170  if (!Value.skipValue(DebugLineData, OffsetPtr, FormParams))
171  return false;
172  }
173  }
174  }
175 
176  // Get the file entry description.
177  ContentDescriptors FileDescriptors =
178  parseV5EntryFormat(DebugLineData, OffsetPtr, EndPrologueOffset);
179  if (FileDescriptors.empty())
180  return false;
181 
182  // Get the file entries, according to the format described above.
183  int FileEntryCount = DebugLineData.getU8(OffsetPtr);
184  for (int I = 0; I != FileEntryCount; ++I) {
185  if (*OffsetPtr >= EndPrologueOffset)
186  return false;
188  for (auto Descriptor : FileDescriptors) {
189  DWARFFormValue Value(Descriptor.Form);
190  if (!Value.extractValue(DebugLineData, OffsetPtr, nullptr))
191  return false;
192  switch (Descriptor.Type) {
193  case DW_LNCT_path:
194  FileEntry.Name = Value.getAsCString().getValue();
195  break;
196  case DW_LNCT_directory_index:
197  FileEntry.DirIdx = Value.getAsUnsignedConstant().getValue();
198  break;
199  case DW_LNCT_timestamp:
200  FileEntry.ModTime = Value.getAsUnsignedConstant().getValue();
201  break;
202  case DW_LNCT_size:
203  FileEntry.Length = Value.getAsUnsignedConstant().getValue();
204  break;
205  // FIXME: Add MD5
206  default:
207  break;
208  }
209  }
210  FileNames.push_back(FileEntry);
211  }
212  return true;
213 }
214 
216  uint32_t *OffsetPtr) {
217  const uint64_t PrologueOffset = *OffsetPtr;
218 
219  clear();
220  TotalLength = DebugLineData.getU32(OffsetPtr);
221  if (TotalLength == UINT32_MAX) {
222  FormParams.Format = dwarf::DWARF64;
223  TotalLength = DebugLineData.getU64(OffsetPtr);
224  } else if (TotalLength >= 0xffffff00) {
225  return false;
226  }
227  FormParams.Version = DebugLineData.getU16(OffsetPtr);
228  if (getVersion() < 2)
229  return false;
230 
231  if (getVersion() >= 5) {
232  FormParams.AddrSize = DebugLineData.getU8(OffsetPtr);
233  assert(getAddressSize() == DebugLineData.getAddressSize() &&
234  "Line table header and data extractor disagree");
235  SegSelectorSize = DebugLineData.getU8(OffsetPtr);
236  }
237 
238  PrologueLength = DebugLineData.getUnsigned(OffsetPtr, sizeofPrologueLength());
239  const uint64_t EndPrologueOffset = PrologueLength + *OffsetPtr;
240  MinInstLength = DebugLineData.getU8(OffsetPtr);
241  if (getVersion() >= 4)
242  MaxOpsPerInst = DebugLineData.getU8(OffsetPtr);
243  DefaultIsStmt = DebugLineData.getU8(OffsetPtr);
244  LineBase = DebugLineData.getU8(OffsetPtr);
245  LineRange = DebugLineData.getU8(OffsetPtr);
246  OpcodeBase = DebugLineData.getU8(OffsetPtr);
247 
248  StandardOpcodeLengths.reserve(OpcodeBase - 1);
249  for (uint32_t I = 1; I < OpcodeBase; ++I) {
250  uint8_t OpLen = DebugLineData.getU8(OffsetPtr);
251  StandardOpcodeLengths.push_back(OpLen);
252  }
253 
254  if (getVersion() >= 5) {
255  if (!parseV5DirFileTables(DebugLineData, OffsetPtr, EndPrologueOffset,
256  getFormParams(), IncludeDirectories, FileNames)) {
257  fprintf(stderr,
258  "warning: parsing line table prologue at 0x%8.8" PRIx64
259  " found an invalid directory or file table description at"
260  " 0x%8.8" PRIx64 "\n", PrologueOffset, (uint64_t)*OffsetPtr);
261  return false;
262  }
263  } else
264  parseV2DirFileTables(DebugLineData, OffsetPtr, EndPrologueOffset,
265  IncludeDirectories, FileNames);
266 
267  if (*OffsetPtr != EndPrologueOffset) {
268  fprintf(stderr,
269  "warning: parsing line table prologue at 0x%8.8" PRIx64
270  " should have ended at 0x%8.8" PRIx64
271  " but it ended at 0x%8.8" PRIx64 "\n",
272  PrologueOffset, EndPrologueOffset, (uint64_t)*OffsetPtr);
273  return false;
274  }
275  return true;
276 }
277 
278 DWARFDebugLine::Row::Row(bool DefaultIsStmt) { reset(DefaultIsStmt); }
279 
281  BasicBlock = false;
282  PrologueEnd = false;
283  EpilogueBegin = false;
284 }
285 
286 void DWARFDebugLine::Row::reset(bool DefaultIsStmt) {
287  Address = 0;
288  Line = 1;
289  Column = 0;
290  File = 1;
291  Isa = 0;
292  Discriminator = 0;
293  IsStmt = DefaultIsStmt;
294  BasicBlock = false;
295  EndSequence = false;
296  PrologueEnd = false;
297  EpilogueBegin = false;
298 }
299 
301  OS << "Address Line Column File ISA Discriminator Flags\n"
302  << "------------------ ------ ------ ------ --- ------------- "
303  "-------------\n";
304 }
305 
307  OS << format("0x%16.16" PRIx64 " %6u %6u", Address, Line, Column)
308  << format(" %6u %3u %13u ", File, Isa, Discriminator)
309  << (IsStmt ? " is_stmt" : "") << (BasicBlock ? " basic_block" : "")
310  << (PrologueEnd ? " prologue_end" : "")
311  << (EpilogueBegin ? " epilogue_begin" : "")
312  << (EndSequence ? " end_sequence" : "") << '\n';
313 }
314 
316 
318  LowPC = 0;
319  HighPC = 0;
320  FirstRowIndex = 0;
321  LastRowIndex = 0;
322  Empty = true;
323 }
324 
326 
328  Prologue.dump(OS);
329  OS << '\n';
330 
331  if (!Rows.empty()) {
332  Row::dumpTableHeader(OS);
333  for (const Row &R : Rows) {
334  R.dump(OS);
335  }
336  }
337 }
338 
340  Prologue.clear();
341  Rows.clear();
342  Sequences.clear();
343 }
344 
345 DWARFDebugLine::ParsingState::ParsingState(struct LineTable *LT)
346  : LineTable(LT) {
347  resetRowAndSequence();
348 }
349 
350 void DWARFDebugLine::ParsingState::resetRowAndSequence() {
352  Sequence.reset();
353 }
354 
355 void DWARFDebugLine::ParsingState::appendRowToMatrix(uint32_t Offset) {
356  if (Sequence.Empty) {
357  // Record the beginning of instruction sequence.
358  Sequence.Empty = false;
360  Sequence.FirstRowIndex = RowNumber;
361  }
362  ++RowNumber;
364  if (Row.EndSequence) {
365  // Record the end of instruction sequence.
367  Sequence.LastRowIndex = RowNumber;
368  if (Sequence.isValid())
370  Sequence.reset();
371  }
372  Row.postAppend();
373 }
374 
377  LineTableConstIter Pos = LineTableMap.find(Offset);
378  if (Pos != LineTableMap.end())
379  return &Pos->second;
380  return nullptr;
381 }
382 
385  uint32_t Offset) {
386  std::pair<LineTableIter, bool> Pos =
387  LineTableMap.insert(LineTableMapTy::value_type(Offset, LineTable()));
388  LineTable *LT = &Pos.first->second;
389  if (Pos.second) {
390  if (!LT->parse(DebugLineData, &Offset))
391  return nullptr;
392  }
393  return LT;
394 }
395 
397  uint32_t *OffsetPtr) {
398  const uint32_t DebugLineOffset = *OffsetPtr;
399 
400  clear();
401 
402  if (!Prologue.parse(DebugLineData, OffsetPtr)) {
403  // Restore our offset and return false to indicate failure!
404  *OffsetPtr = DebugLineOffset;
405  return false;
406  }
407 
408  const uint32_t EndOffset =
409  DebugLineOffset + Prologue.TotalLength + Prologue.sizeofTotalLength();
410 
411  ParsingState State(this);
412 
413  while (*OffsetPtr < EndOffset) {
414  uint8_t Opcode = DebugLineData.getU8(OffsetPtr);
415 
416  if (Opcode == 0) {
417  // Extended Opcodes always start with a zero opcode followed by
418  // a uleb128 length so you can skip ones you don't know about
419  uint32_t ExtOffset = *OffsetPtr;
420  uint64_t Len = DebugLineData.getULEB128(OffsetPtr);
421  uint32_t ArgSize = Len - (*OffsetPtr - ExtOffset);
422 
423  uint8_t SubOpcode = DebugLineData.getU8(OffsetPtr);
424  switch (SubOpcode) {
425  case DW_LNE_end_sequence:
426  // Set the end_sequence register of the state machine to true and
427  // append a row to the matrix using the current values of the
428  // state-machine registers. Then reset the registers to the initial
429  // values specified above. Every statement program sequence must end
430  // with a DW_LNE_end_sequence instruction which creates a row whose
431  // address is that of the byte after the last target machine instruction
432  // of the sequence.
433  State.Row.EndSequence = true;
434  State.appendRowToMatrix(*OffsetPtr);
435  State.resetRowAndSequence();
436  break;
437 
438  case DW_LNE_set_address:
439  // Takes a single relocatable address as an operand. The size of the
440  // operand is the size appropriate to hold an address on the target
441  // machine. Set the address register to the value given by the
442  // relocatable address. All of the other statement program opcodes
443  // that affect the address register add a delta to it. This instruction
444  // stores a relocatable value into it instead.
445  State.Row.Address = DebugLineData.getRelocatedAddress(OffsetPtr);
446  break;
447 
448  case DW_LNE_define_file:
449  // Takes 4 arguments. The first is a null terminated string containing
450  // a source file name. The second is an unsigned LEB128 number
451  // representing the directory index of the directory in which the file
452  // was found. The third is an unsigned LEB128 number representing the
453  // time of last modification of the file. The fourth is an unsigned
454  // LEB128 number representing the length in bytes of the file. The time
455  // and length fields may contain LEB128(0) if the information is not
456  // available.
457  //
458  // The directory index represents an entry in the include_directories
459  // section of the statement program prologue. The index is LEB128(0)
460  // if the file was found in the current directory of the compilation,
461  // LEB128(1) if it was found in the first directory in the
462  // include_directories section, and so on. The directory index is
463  // ignored for file names that represent full path names.
464  //
465  // The files are numbered, starting at 1, in the order in which they
466  // appear; the names in the prologue come before names defined by
467  // the DW_LNE_define_file instruction. These numbers are used in the
468  // file register of the state machine.
469  {
470  FileNameEntry FileEntry;
471  FileEntry.Name = DebugLineData.getCStr(OffsetPtr);
472  FileEntry.DirIdx = DebugLineData.getULEB128(OffsetPtr);
473  FileEntry.ModTime = DebugLineData.getULEB128(OffsetPtr);
474  FileEntry.Length = DebugLineData.getULEB128(OffsetPtr);
475  Prologue.FileNames.push_back(FileEntry);
476  }
477  break;
478 
479  case DW_LNE_set_discriminator:
480  State.Row.Discriminator = DebugLineData.getULEB128(OffsetPtr);
481  break;
482 
483  default:
484  // Length doesn't include the zero opcode byte or the length itself, but
485  // it does include the sub_opcode, so we have to adjust for that below
486  (*OffsetPtr) += ArgSize;
487  break;
488  }
489  } else if (Opcode < Prologue.OpcodeBase) {
490  switch (Opcode) {
491  // Standard Opcodes
492  case DW_LNS_copy:
493  // Takes no arguments. Append a row to the matrix using the
494  // current values of the state-machine registers. Then set
495  // the basic_block register to false.
496  State.appendRowToMatrix(*OffsetPtr);
497  break;
498 
499  case DW_LNS_advance_pc:
500  // Takes a single unsigned LEB128 operand, multiplies it by the
501  // min_inst_length field of the prologue, and adds the
502  // result to the address register of the state machine.
503  State.Row.Address +=
504  DebugLineData.getULEB128(OffsetPtr) * Prologue.MinInstLength;
505  break;
506 
507  case DW_LNS_advance_line:
508  // Takes a single signed LEB128 operand and adds that value to
509  // the line register of the state machine.
510  State.Row.Line += DebugLineData.getSLEB128(OffsetPtr);
511  break;
512 
513  case DW_LNS_set_file:
514  // Takes a single unsigned LEB128 operand and stores it in the file
515  // register of the state machine.
516  State.Row.File = DebugLineData.getULEB128(OffsetPtr);
517  break;
518 
519  case DW_LNS_set_column:
520  // Takes a single unsigned LEB128 operand and stores it in the
521  // column register of the state machine.
522  State.Row.Column = DebugLineData.getULEB128(OffsetPtr);
523  break;
524 
525  case DW_LNS_negate_stmt:
526  // Takes no arguments. Set the is_stmt register of the state
527  // machine to the logical negation of its current value.
528  State.Row.IsStmt = !State.Row.IsStmt;
529  break;
530 
531  case DW_LNS_set_basic_block:
532  // Takes no arguments. Set the basic_block register of the
533  // state machine to true
534  State.Row.BasicBlock = true;
535  break;
536 
537  case DW_LNS_const_add_pc:
538  // Takes no arguments. Add to the address register of the state
539  // machine the address increment value corresponding to special
540  // opcode 255. The motivation for DW_LNS_const_add_pc is this:
541  // when the statement program needs to advance the address by a
542  // small amount, it can use a single special opcode, which occupies
543  // a single byte. When it needs to advance the address by up to
544  // twice the range of the last special opcode, it can use
545  // DW_LNS_const_add_pc followed by a special opcode, for a total
546  // of two bytes. Only if it needs to advance the address by more
547  // than twice that range will it need to use both DW_LNS_advance_pc
548  // and a special opcode, requiring three or more bytes.
549  {
550  uint8_t AdjustOpcode = 255 - Prologue.OpcodeBase;
551  uint64_t AddrOffset =
552  (AdjustOpcode / Prologue.LineRange) * Prologue.MinInstLength;
553  State.Row.Address += AddrOffset;
554  }
555  break;
556 
557  case DW_LNS_fixed_advance_pc:
558  // Takes a single uhalf operand. Add to the address register of
559  // the state machine the value of the (unencoded) operand. This
560  // is the only standard opcode that takes an argument that is not
561  // a variable length number. The motivation for DW_LNS_fixed_advance_pc
562  // is this: existing assemblers cannot emit DW_LNS_advance_pc or
563  // special opcodes because they cannot encode LEB128 numbers or
564  // judge when the computation of a special opcode overflows and
565  // requires the use of DW_LNS_advance_pc. Such assemblers, however,
566  // can use DW_LNS_fixed_advance_pc instead, sacrificing compression.
567  State.Row.Address += DebugLineData.getU16(OffsetPtr);
568  break;
569 
570  case DW_LNS_set_prologue_end:
571  // Takes no arguments. Set the prologue_end register of the
572  // state machine to true
573  State.Row.PrologueEnd = true;
574  break;
575 
576  case DW_LNS_set_epilogue_begin:
577  // Takes no arguments. Set the epilogue_begin register of the
578  // state machine to true
579  State.Row.EpilogueBegin = true;
580  break;
581 
582  case DW_LNS_set_isa:
583  // Takes a single unsigned LEB128 operand and stores it in the
584  // isa register of the state machine.
585  State.Row.Isa = DebugLineData.getULEB128(OffsetPtr);
586  break;
587 
588  default:
589  // Handle any unknown standard opcodes here. We know the lengths
590  // of such opcodes because they are specified in the prologue
591  // as a multiple of LEB128 operands for each opcode.
592  {
593  assert(Opcode - 1U < Prologue.StandardOpcodeLengths.size());
594  uint8_t OpcodeLength = Prologue.StandardOpcodeLengths[Opcode - 1];
595  for (uint8_t I = 0; I < OpcodeLength; ++I)
596  DebugLineData.getULEB128(OffsetPtr);
597  }
598  break;
599  }
600  } else {
601  // Special Opcodes
602 
603  // A special opcode value is chosen based on the amount that needs
604  // to be added to the line and address registers. The maximum line
605  // increment for a special opcode is the value of the line_base
606  // field in the header, plus the value of the line_range field,
607  // minus 1 (line base + line range - 1). If the desired line
608  // increment is greater than the maximum line increment, a standard
609  // opcode must be used instead of a special opcode. The "address
610  // advance" is calculated by dividing the desired address increment
611  // by the minimum_instruction_length field from the header. The
612  // special opcode is then calculated using the following formula:
613  //
614  // opcode = (desired line increment - line_base) +
615  // (line_range * address advance) + opcode_base
616  //
617  // If the resulting opcode is greater than 255, a standard opcode
618  // must be used instead.
619  //
620  // To decode a special opcode, subtract the opcode_base from the
621  // opcode itself to give the adjusted opcode. The amount to
622  // increment the address register is the result of the adjusted
623  // opcode divided by the line_range multiplied by the
624  // minimum_instruction_length field from the header. That is:
625  //
626  // address increment = (adjusted opcode / line_range) *
627  // minimum_instruction_length
628  //
629  // The amount to increment the line register is the line_base plus
630  // the result of the adjusted opcode modulo the line_range. That is:
631  //
632  // line increment = line_base + (adjusted opcode % line_range)
633 
634  uint8_t AdjustOpcode = Opcode - Prologue.OpcodeBase;
635  uint64_t AddrOffset =
636  (AdjustOpcode / Prologue.LineRange) * Prologue.MinInstLength;
637  int32_t LineOffset =
638  Prologue.LineBase + (AdjustOpcode % Prologue.LineRange);
639  State.Row.Line += LineOffset;
640  State.Row.Address += AddrOffset;
641  State.appendRowToMatrix(*OffsetPtr);
642  // Reset discriminator to 0.
643  State.Row.Discriminator = 0;
644  }
645  }
646 
647  if (!State.Sequence.Empty) {
648  fprintf(stderr, "warning: last sequence in debug line table is not"
649  "terminated!\n");
650  }
651 
652  // Sort all sequences so that address lookup will work faster.
653  if (!Sequences.empty()) {
654  std::sort(Sequences.begin(), Sequences.end(), Sequence::orderByLowPC);
655  // Note: actually, instruction address ranges of sequences should not
656  // overlap (in shared objects and executables). If they do, the address
657  // lookup would still work, though, but result would be ambiguous.
658  // We don't report warning in this case. For example,
659  // sometimes .so compiled from multiple object files contains a few
660  // rudimentary sequences for address ranges [0x0, 0xsomething).
661  }
662 
663  return EndOffset;
664 }
665 
666 uint32_t
667 DWARFDebugLine::LineTable::findRowInSeq(const DWARFDebugLine::Sequence &Seq,
668  uint64_t Address) const {
669  if (!Seq.containsPC(Address))
670  return UnknownRowIndex;
671  // Search for instruction address in the rows describing the sequence.
672  // Rows are stored in a vector, so we may use arithmetical operations with
673  // iterators.
675  Row.Address = Address;
676  RowIter FirstRow = Rows.begin() + Seq.FirstRowIndex;
677  RowIter LastRow = Rows.begin() + Seq.LastRowIndex;
678  LineTable::RowIter RowPos = std::lower_bound(
679  FirstRow, LastRow, Row, DWARFDebugLine::Row::orderByAddress);
680  if (RowPos == LastRow) {
681  return Seq.LastRowIndex - 1;
682  }
683  uint32_t Index = Seq.FirstRowIndex + (RowPos - FirstRow);
684  if (RowPos->Address > Address) {
685  if (RowPos == FirstRow)
686  return UnknownRowIndex;
687  else
688  Index--;
689  }
690  return Index;
691 }
692 
694  if (Sequences.empty())
695  return UnknownRowIndex;
696  // First, find an instruction sequence containing the given address.
698  Sequence.LowPC = Address;
699  SequenceIter FirstSeq = Sequences.begin();
700  SequenceIter LastSeq = Sequences.end();
701  SequenceIter SeqPos = std::lower_bound(
702  FirstSeq, LastSeq, Sequence, DWARFDebugLine::Sequence::orderByLowPC);
703  DWARFDebugLine::Sequence FoundSeq;
704  if (SeqPos == LastSeq) {
705  FoundSeq = Sequences.back();
706  } else if (SeqPos->LowPC == Address) {
707  FoundSeq = *SeqPos;
708  } else {
709  if (SeqPos == FirstSeq)
710  return UnknownRowIndex;
711  FoundSeq = *(SeqPos - 1);
712  }
713  return findRowInSeq(FoundSeq, Address);
714 }
715 
717  uint64_t Address, uint64_t Size, std::vector<uint32_t> &Result) const {
718  if (Sequences.empty())
719  return false;
720  uint64_t EndAddr = Address + Size;
721  // First, find an instruction sequence containing the given address.
723  Sequence.LowPC = Address;
724  SequenceIter FirstSeq = Sequences.begin();
725  SequenceIter LastSeq = Sequences.end();
726  SequenceIter SeqPos = std::lower_bound(
727  FirstSeq, LastSeq, Sequence, DWARFDebugLine::Sequence::orderByLowPC);
728  if (SeqPos == LastSeq || SeqPos->LowPC != Address) {
729  if (SeqPos == FirstSeq)
730  return false;
731  SeqPos--;
732  }
733  if (!SeqPos->containsPC(Address))
734  return false;
735 
736  SequenceIter StartPos = SeqPos;
737 
738  // Add the rows from the first sequence to the vector, starting with the
739  // index we just calculated
740 
741  while (SeqPos != LastSeq && SeqPos->LowPC < EndAddr) {
742  const DWARFDebugLine::Sequence &CurSeq = *SeqPos;
743  // For the first sequence, we need to find which row in the sequence is the
744  // first in our range.
745  uint32_t FirstRowIndex = CurSeq.FirstRowIndex;
746  if (SeqPos == StartPos)
747  FirstRowIndex = findRowInSeq(CurSeq, Address);
748 
749  // Figure out the last row in the range.
750  uint32_t LastRowIndex = findRowInSeq(CurSeq, EndAddr - 1);
751  if (LastRowIndex == UnknownRowIndex)
752  LastRowIndex = CurSeq.LastRowIndex - 1;
753 
754  assert(FirstRowIndex != UnknownRowIndex);
755  assert(LastRowIndex != UnknownRowIndex);
756 
757  for (uint32_t I = FirstRowIndex; I <= LastRowIndex; ++I) {
758  Result.push_back(I);
759  }
760 
761  ++SeqPos;
762  }
763 
764  return true;
765 }
766 
767 bool DWARFDebugLine::LineTable::hasFileAtIndex(uint64_t FileIndex) const {
768  return FileIndex != 0 && FileIndex <= Prologue.FileNames.size();
769 }
770 
772  const char *CompDir,
774  std::string &Result) const {
775  if (Kind == FileLineInfoKind::None || !hasFileAtIndex(FileIndex))
776  return false;
777  const FileNameEntry &Entry = Prologue.FileNames[FileIndex - 1];
778  StringRef FileName = Entry.Name;
779  if (Kind != FileLineInfoKind::AbsoluteFilePath ||
780  sys::path::is_absolute(FileName)) {
781  Result = FileName;
782  return true;
783  }
784 
785  SmallString<16> FilePath;
786  uint64_t IncludeDirIndex = Entry.DirIdx;
787  StringRef IncludeDir;
788  // Be defensive about the contents of Entry.
789  if (IncludeDirIndex > 0 &&
790  IncludeDirIndex <= Prologue.IncludeDirectories.size())
791  IncludeDir = Prologue.IncludeDirectories[IncludeDirIndex - 1];
792 
793  // We may still need to append compilation directory of compile unit.
794  // We know that FileName is not absolute, the only way to have an
795  // absolute path at this point would be if IncludeDir is absolute.
796  if (CompDir && Kind == FileLineInfoKind::AbsoluteFilePath &&
797  sys::path::is_relative(IncludeDir))
798  sys::path::append(FilePath, CompDir);
799 
800  // sys::path::append skips empty strings.
801  sys::path::append(FilePath, IncludeDir, FileName);
802  Result = FilePath.str();
803  return true;
804 }
805 
807  uint64_t Address, const char *CompDir, FileLineInfoKind Kind,
808  DILineInfo &Result) const {
809  // Get the index of row we're looking for in the line table.
810  uint32_t RowIndex = lookupAddress(Address);
811  if (RowIndex == -1U)
812  return false;
813  // Take file number and line/column from the row.
814  const auto &Row = Rows[RowIndex];
815  if (!getFileNameByIndex(Row.File, CompDir, Kind, Result.FileName))
816  return false;
817  Result.Line = Row.Line;
818  Result.Column = Row.Column;
820  return true;
821 }
SequenceVector::const_iterator SequenceIter
uint32_t Discriminator
Definition: DIContext.h:40
uint64_t LowPC
Sequence describes instructions at address range [LowPC, HighPC) and is described by line table rows ...
std::string FileName
Definition: DIContext.h:33
uint64_t getULEB128(uint32_t *offset_ptr) const
Extract an unsigned LEB128 value from *offset_ptr.
Compute iterated dominance frontiers using a linear time algorithm.
Definition: AllocatorList.h:24
Row(bool DefaultIsStmt=false)
bool parse(const DWARFDataExtractor &DebugLineData, uint32_t *OffsetPtr)
Parse prologue and all rows.
uint32_t sizeofTotalLength() const
static bool orderByAddress(const Row &LHS, const Row &RHS)
StringRef LNStandardString(unsigned Standard)
Definition: Dwarf.cpp:406
format_object< Ts... > format(const char *Fmt, const Ts &... Vals)
These are helper functions used to produce formatted output.
Definition: Format.h:124
uint8_t MinInstLength
The size in bytes of the smallest target machine instruction.
uint32_t Line
An unsigned integer indicating a source line number.
uint64_t getRelocatedAddress(uint32_t *Off, uint64_t *SecIx=nullptr) const
Extracts an address-sized value and applies a relocation to the result if one exists for the given of...
uint16_t getU16(uint32_t *offset_ptr) const
Extract a uint16_t value from *offset_ptr.
LLVM_NODISCARD LLVM_ATTRIBUTE_ALWAYS_INLINE const char * data() const
data - Get a pointer to the start of the string (which may not be null terminated).
Definition: StringRef.h:128
DILineInfo - a format-neutral container for source line information.
Definition: DIContext.h:32
void append(SmallVectorImpl< char > &path, const Twine &a, const Twine &b="", const Twine &c="", const Twine &d="")
Append to path.
Definition: Path.cpp:465
uint32_t getU32(uint32_t *offset_ptr) const
Extract a uint32_t value from *offset_ptr.
Represents a series of contiguous machine instructions.
uint64_t Address
The program-counter value corresponding to a machine instruction generated by the compiler...
bool hasFileAtIndex(uint64_t FileIndex) const
void postAppend()
Called after a row is appended to the matrix.
bool is_absolute(const Twine &path, Style style=Style::native)
Is path absolute?
Definition: Path.cpp:673
uint32_t lookupAddress(uint64_t Address) const
Returns the index of the row with file/line info for a given address, or UnknownRowIndex if there is ...
uint8_t LineRange
This parameter affects the meaning of the special opcodes. See below.
StringRef str() const
Explicit conversion to StringRef.
Definition: SmallString.h:267
uint8_t OpcodeBase
The number assigned to the first special opcode.
void reset(bool DefaultIsStmt)
const T & getValue() const LLVM_LVALUE_FUNCTION
Definition: Optional.h:129
bool parse(const DWARFDataExtractor &DebugLineData, uint32_t *OffsetPtr)
LLVM_NODISCARD LLVM_ATTRIBUTE_ALWAYS_INLINE bool empty() const
empty - Check if the string is empty.
Definition: StringRef.h:133
bool skipValue(DataExtractor DebugInfoData, uint32_t *OffsetPtr, const DWARFFormParams Params) const
Skip a form's value in DebugInfoData at the offset specified by OffsetPtr.
uint64_t TotalLength
The size in bytes of the statement information for this compilation unit (not including the total_len...
SmallString - A SmallString is just a SmallVector with methods and accessors that make it work better...
Definition: SmallString.h:26
static ContentDescriptors parseV5EntryFormat(const DWARFDataExtractor &DebugLineData, uint32_t *OffsetPtr, uint64_t EndPrologueOffset)
int64_t getSLEB128(uint32_t *offset_ptr) const
Extract a signed LEB128 value from *offset_ptr.
static void parseV2DirFileTables(const DWARFDataExtractor &DebugLineData, uint32_t *OffsetPtr, uint64_t EndPrologueOffset, std::vector< StringRef > &IncludeDirectories, std::vector< DWARFDebugLine::FileNameEntry > &FileNames)
bool extractValue(const DWARFDataExtractor &Data, uint32_t *OffsetPtr, const DWARFUnit *U)
Extracts a value in Data at offset *OffsetPtr.
const char * Name
uint8_t EndSequence
A boolean indicating that the current address is that of the first byte after the end of a sequence o...
* if(!EatIfPresent(lltok::kw_thread_local)) return false
ParseOptionalThreadLocal := /*empty.
uint32_t Column
Definition: DIContext.h:36
void dump(raw_ostream &OS) const
LLVM Basic Block Representation.
Definition: BasicBlock.h:59
uint16_t File
An unsigned integer indicating the identity of the source file corresponding to a machine instruction...
uint8_t getAddressSize() const
Get the address size for this extractor.
Definition: DataExtractor.h:59
uint8_t getU8(uint32_t *offset_ptr) const
Extract a uint8_t value from *offset_ptr.
Optional< uint64_t > getAsUnsignedConstant() const
uint64_t getU64(uint32_t *offset_ptr) const
Extract a uint64_t value from *offset_ptr.
void appendSequence(const DWARFDebugLine::Sequence &S)
Standard .debug_line state machine structure.
A DataExtractor (typically for an in-memory copy of an object-file section) plus a relocation map for...
bool lookupAddressRange(uint64_t Address, uint64_t Size, std::vector< uint32_t > &Result) const
bool containsPC(uint64_t PC) const
uint16_t Column
An unsigned integer indicating a column number within a source line.
bool getFileLineInfoForAddress(uint64_t Address, const char *CompDir, DILineInfoSpecifier::FileLineInfoKind Kind, DILineInfo &Result) const
Fills the Result argument with the file and line information corresponding to Address.
uint32_t Line
Definition: DIContext.h:35
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small...
Definition: SmallVector.h:864
void appendRow(const DWARFDebugLine::Row &R)
A helper struct for DWARFFormValue methods, providing information that allows it to know the byte siz...
static void dumpTableHeader(raw_ostream &OS)
std::vector< uint8_t > StandardOpcodeLengths
static bool parseV5DirFileTables(const DWARFDataExtractor &DebugLineData, uint32_t *OffsetPtr, uint64_t EndPrologueOffset, const DWARFFormParams &FormParams, std::vector< StringRef > &IncludeDirectories, std::vector< DWARFDebugLine::FileNameEntry > &FileNames)
static void clear(coro::Shape &Shape)
Definition: Coroutines.cpp:191
constexpr char Size[]
Key for Kernel::Arg::Metadata::mSize.
std::vector< FileNameEntry > FileNames
uint32_t Discriminator
An unsigned integer representing the DWARF path discriminator value for this location.
RowVector::const_iterator RowIter
uint64_t getUnsigned(uint32_t *offset_ptr, uint32_t byte_size) const
Extract an unsigned integer of size byte_size from *offset_ptr.
#define I(x, y, z)
Definition: MD5.cpp:58
static bool orderByLowPC(const Sequence &LHS, const Sequence &RHS)
Optional< const char * > getAsCString() const
bool is_relative(const Twine &path, Style style=Style::native)
Is path relative?
Definition: Path.cpp:684
Sequence
A sequence of states that a pointer may go through in which an objc_retain and objc_release are actua...
Definition: PtrState.h:37
const char * getCStr(uint32_t *offset_ptr) const
Extract a C string from *offset_ptr.
uint8_t DefaultIsStmt
The initial value of the is_stmt register.
const unsigned Kind
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())
int8_t LineBase
This parameter affects the meaning of the special opcodes. See below.
bool getFileNameByIndex(uint64_t FileIndex, const char *CompDir, DILineInfoSpecifier::FileLineInfoKind Kind, std::string &Result) const
Extracts filename by its index in filename table in prologue.
const LineTable * getLineTable(uint32_t Offset) const
LLVM Value Representation.
Definition: Value.h:73
StringRef getCStrRef(uint32_t *OffsetPtr) const
Extract a C string from *OffsetPtr.
void dump(raw_ostream &OS) const
This class implements an extremely fast bulk output stream that can only output to a stream...
Definition: raw_ostream.h:44
StringRef - Represent a constant reference to a string, i.e.
Definition: StringRef.h:49
void sort(Policy policy, RandomAccessIterator Start, RandomAccessIterator End, const Comparator &Comp=Comparator())
Definition: Parallel.h:201
LineNumberEntryFormat
Definition: Dwarf.h:234
const LineTable * getOrParseLineTable(const DWARFDataExtractor &DebugLineData, uint32_t Offset)
std::vector< StringRef > IncludeDirectories
void dump(raw_ostream &OS) const