52 return Addr == UINT32_MAX;
72 if (GsymFileIdx != UINT32_MAX)
77 DILineInfoSpecifier::FileLineInfoKind::AbsoluteFilePath, File))
101 if (Die.
getTag() == dwarf::DW_TAG_inlined_subroutine)
108 switch (ParentDie.
getTag()) {
109 case dwarf::DW_TAG_namespace:
110 case dwarf::DW_TAG_structure_type:
111 case dwarf::DW_TAG_union_type:
112 case dwarf::DW_TAG_class_type:
113 case dwarf::DW_TAG_subprogram:
115 case dwarf::DW_TAG_lexical_block:
131static std::optional<uint32_t>
145 if (!(Language == dwarf::DW_LANG_C_plus_plus ||
146 Language == dwarf::DW_LANG_C_plus_plus_03 ||
147 Language == dwarf::DW_LANG_C_plus_plus_11 ||
148 Language == dwarf::DW_LANG_C_plus_plus_14 ||
149 Language == dwarf::DW_LANG_ObjC_plus_plus ||
152 Language == dwarf::DW_LANG_C))
163 if (ParentDeclCtxDie) {
165 while (ParentDeclCtxDie) {
167 if (!ParentName.
empty()) {
171 if (ParentName.
front() ==
'<' && ParentName.
back() ==
'>')
187 bool CheckChildren =
true;
189 case dwarf::DW_TAG_subprogram:
191 CheckChildren =
Depth == 0;
193 case dwarf::DW_TAG_inlined_subroutine:
211 if (DwarfRange.LowPC < DwarfRange.HighPC)
212 Ranges.insert({DwarfRange.LowPC, DwarfRange.HighPC});
226 if (Tag == dwarf::DW_TAG_inlined_subroutine) {
234 for (
const AddressRange &InlineRange : AllInlineRanges) {
237 if (InlineRange.empty()) {
241 II.Ranges.insert(InlineRange);
250 if (AllParentRanges.
contains(InlineRange)) {
253 Out.
Report(
"Function DIE has uncontained address range",
255 OS <<
"error: inlined function DIE at "
257 <<
HEX64(InlineRange.start()) <<
" - "
258 <<
HEX64(InlineRange.end())
259 <<
") that isn't contained in "
260 <<
"any parent address ranges, this inline range "
270 if (EmptyCount == AllInlineRanges.size())
273 if (
II.Ranges.empty())
277 II.Name = *NameIndex;
280 std::optional<uint32_t> OptGSymFileIdx =
282 if (OptGSymFileIdx) {
283 II.CallFile = OptGSymFileIdx.value();
288 AllInlineRanges, WarnIfEmpty);
292 "Inlined function die has invlaid file index in DW_AT_call_file",
295 <<
" has an invalid file index " << DwarfFileIdx
296 <<
" in its DW_AT_call_file attribute, this inline entry and "
298 <<
"children will be removed.\n";
302 if (Tag == dwarf::DW_TAG_subprogram || Tag == dwarf::DW_TAG_lexical_block) {
306 AllParentRanges, WarnIfEmpty);
313 std::vector<uint32_t> RowVector;
316 const uint64_t RangeSize = EndAddress - StartAddress;
321 std::optional<uint64_t> StmtSeqOffset;
322 if (
auto StmtSeqAttr = Die.
find(llvm::dwarf::DW_AT_LLVM_stmt_sequence)) {
329 StmtSeqOffset = StmtSeqVal;
337 DILineInfoSpecifier::FileLineInfoKind::AbsoluteFilePath);
338 if (FilePath.empty()) {
345 <<
" has an invalid file index " << DwarfFileIdx
346 <<
" in its DW_AT_decl_file attribute, unable to create a single "
347 <<
"line entry from the DW_AT_decl_file/DW_AT_decl_line "
363 for (
uint32_t RowIndex : RowVector) {
366 std::optional<uint32_t> OptFileIdx =
370 "Invalid file index in DWARF line table", [&](
raw_ostream &
OS) {
372 <<
"a line entry with invalid DWARF file index, this entry will "
374 Row.dumpTableHeader(
OS, 0);
380 const uint32_t FileIdx = OptFileIdx.value();
381 uint64_t RowAddress = Row.Address.Address;
390 Out.
Report(
"Start address lies between valid Row table entries",
392 OS <<
"error: DIE has a start address whose LowPC is "
395 << RowIndex <<
"] with address " <<
HEX64(RowAddress)
396 <<
" and the next one.\n";
405 LineEntry LE(RowAddress, FileIdx, Row.Line);
406 if (RowIndex != RowVector[0] && Row.Address < PrevRow.
Address) {
414 if (FirstLE && *FirstLE == LE)
417 OS <<
"warning: duplicate line table detected for DIE:\n";
421 Out.
Report(
"Non-monotonically increasing addresses",
423 OS <<
"error: line table has addresses that do not "
424 <<
"monotonically increase:\n";
425 for (
uint32_t RowIndex2 : RowVector)
434 if (LastLE && LastLE->File == FileIdx && LastLE->Line == Row.Line)
439 if (Row.EndSequence) {
459 case dwarf::DW_TAG_subprogram: {
461 if (!RangesOrError) {
472 <<
" has no name\n ";
507 if (
Range.LowPC != 0) {
510 Out.
Report(
"Address range starts outside executable section",
512 OS <<
"warning: DIE has an address range whose "
514 "is not in any executable sections ("
516 <<
") and will not be processed:\n";
526 FI.
Name = *NameIndex;
532 FI.
Inline->Name = *NameIndex;
534 bool WarnIfEmpty =
true;
536 AllSubprogramRanges, WarnIfEmpty);
546 if (FI.
Inline->Children.empty()) {
547 if (WarnIfEmpty && !Gsym.
isQuiet())
548 Out.
Report(
"DIE contains inline functions with no valid ranges",
550 OS <<
"warning: DIE contains inline function "
551 "information that has no valid ranges, removing "
552 "inline information:\n";
560 if (LoadDwarfCallSites)
561 parseCallSiteInfoFromDwarf(CUI, Die, FI);
570 handleDie(Out, CUI, ChildDie);
573void DwarfTransformer::parseCallSiteInfoFromDwarf(
CUInfo &CUI,
DWARFDie Die,
585 if (Child.getTag() != dwarf::DW_TAG_call_site)
604 if (
const char *LinkName = OriginDie.getLinkageName()) {
607 }
else if (
const char *
ShortName = OriginDie.getShortName()) {
636 "warning: Unable to retrieve DWO .debug_info section for some "
637 "object files. (Remove the --quiet flag for full output)",
641 {dwarf::DW_AT_dwo_name, dwarf::DW_AT_GNU_dwo_name}),
643 OS <<
"warning: Unable to retrieve DWO .debug_info section for "
652 if (NumThreads == 1) {
657 CUInfo CUI(DICtx, dyn_cast<DWARFCompileUnit>(
CU.get()));
658 handleDie(Out, CUI, Die);
669 CU->getAbbreviations();
675 pool.
async([&
CU]() {
CU->getUnitDIE(
false ); });
683 CUInfo CUI(DICtx, dyn_cast<DWARFCompileUnit>(
CU.get()));
684 pool.
async([
this, CUI, &LogMutex, &Out, Die]()
mutable {
688 handleDie(ThreadOut, CUI, Die);
690 std::lock_guard<std::mutex> guard(LogMutex);
694 Out.
Merge(ThreadOut);
701 Out <<
"Loaded " << FunctionsAddedCount <<
" functions from DWARF.\n";
707 Out <<
"Verifying GSYM file \"" << GsymPath <<
"\":\n";
711 return Gsym.takeError();
713 auto NumAddrs = Gsym->getNumAddresses();
715 DILineInfoSpecifier::FileLineInfoKind::AbsoluteFilePath,
716 DILineInfoSpecifier::FunctionNameKind::LinkageName);
717 std::string gsymFilename;
719 auto FuncAddr = Gsym->getAddress(
I);
722 "failed to extract address[%i]",
I);
724 auto FI = Gsym->getFunctionInfo(*FuncAddr);
727 std::errc::invalid_argument,
728 "failed to extract function info for address 0x%" PRIu64, *FuncAddr);
733 auto LR = Gsym->lookup(
Addr);
735 return LR.takeError();
737 auto DwarfInlineInfos =
739 uint32_t NumDwarfInlineInfos = DwarfInlineInfos.getNumberOfFrames();
740 if (NumDwarfInlineInfos == 0) {
741 DwarfInlineInfos.addFrame(
746 if (NumDwarfInlineInfos == 1 &&
747 DwarfInlineInfos.getFrame(0).FileName ==
"<invalid>") {
749 NumDwarfInlineInfos = 0;
751 if (NumDwarfInlineInfos > 0 &&
752 NumDwarfInlineInfos != LR->Locations.size()) {
755 Log <<
"error: address " <<
HEX64(
Addr) <<
" has "
756 << NumDwarfInlineInfos <<
" DWARF inline frames and GSYM has "
757 << LR->Locations.size() <<
"\n";
758 Log <<
" " << NumDwarfInlineInfos <<
" DWARF frames:\n";
759 for (
size_t Idx = 0;
Idx < NumDwarfInlineInfos; ++
Idx) {
760 const auto &dii = DwarfInlineInfos.getFrame(
Idx);
761 Log <<
" [" <<
Idx <<
"]: " << dii.FunctionName <<
" @ "
762 << dii.FileName <<
':' << dii.Line <<
'\n';
764 Log <<
" " << LR->Locations.size() <<
" GSYM frames:\n";
767 const auto &gii = LR->Locations[
Idx];
768 Log <<
" [" <<
Idx <<
"]: " << gii.Name <<
" @ " << gii.Dir
769 <<
'/' << gii.Base <<
':' << gii.Line <<
'\n';
771 Gsym->dump(Log, *FI);
778 const auto &gii = LR->Locations[
Idx];
779 if (
Idx < NumDwarfInlineInfos) {
780 const auto &dii = DwarfInlineInfos.getFrame(
Idx);
781 gsymFilename = LR->getSourceFile(
Idx);
784 Out <<
"error: address " <<
HEX64(
Addr) <<
" DWARF function \""
785 << dii.FunctionName.c_str()
786 <<
"\" doesn't match GSYM function \"" << gii.Name <<
"\"\n";
789 if (dii.FileName != gsymFilename)
790 Out <<
"error: address " <<
HEX64(
Addr) <<
" DWARF path \""
791 << dii.FileName.c_str() <<
"\" doesn't match GSYM path \""
792 << gsymFilename.c_str() <<
"\"\n";
794 if (dii.Line != gii.Line)
795 Out <<
"error: address " <<
HEX64(
Addr) <<
" DWARF line "
796 << dii.Line <<
" != GSYM line " << gii.Line <<
"\n";
Returns the sub type a function will return at a given Idx. Should correspond to the result type of an ExtractValue instruction executed with just that one unsigned Idx.
ConstantRange Range(APInt(BitWidth, Low), APInt(BitWidth, High))
uint64_t IntrinsicInst * II
A class that represents an address range.
bool contains(uint64_t Addr) const
bool contains(uint64_t Addr) const
The AddressRanges class helps normalize address range collections.
A format-neutral container for inlined code description.
DWARFContext This data structure is the top level entity that deals with dwarf debug information pars...
DIInliningInfo getInliningInfoForAddress(object::SectionedAddress Address, DILineInfoSpecifier Specifier=DILineInfoSpecifier()) override
compile_unit_range compile_units()
Get compile units in this context.
const DWARFDebugLine::LineTable * getLineTableForUnit(DWARFUnit *U)
Get a pointer to a parsed line table corresponding to a compile unit.
std::optional< DILineInfo > getLineInfoForAddress(object::SectionedAddress Address, DILineInfoSpecifier Specifier=DILineInfoSpecifier()) override
Utility class that carries the DWARF compile/type unit and the debug info entry in an object.
uint64_t getOffset() const
Get the absolute offset into the debug info or types section.
LLVM_ABI Expected< DWARFAddressRangesVector > getAddressRanges() const
Get the address ranges for this DIE.
iterator_range< iterator > children() const
LLVM_ABI DWARFDie getAttributeValueAsReferencedDie(dwarf::Attribute Attr) const
Extract the specified attribute from this DIE as the referenced DIE.
LLVM_ABI DWARFDie getParent() const
Get the parent of this DIE object.
LLVM_ABI std::optional< DWARFFormValue > find(dwarf::Attribute Attr) const
Extract the specified attribute from this DIE.
LLVM_ABI std::optional< DWARFFormValue > findRecursively(ArrayRef< dwarf::Attribute > Attrs) const
Extract the first value of any attribute in Attrs from this DIE and recurse into any DW_AT_specificat...
LLVM_ABI const char * getName(DINameKind Kind) const
Return the DIE name resolving DW_AT_specification or DW_AT_abstract_origin references if necessary.
LLVM_ABI std::string getDeclFile(DILineInfoSpecifier::FileLineInfoKind Kind) const
dwarf::Tag getTag() const
LLVM_ABI const char * getLinkageName() const
Return the DIE linkage name resolving DW_AT_specification or DW_AT_abstract_origin references if nece...
LLVM_ABI void dump(raw_ostream &OS, unsigned indent=0, DIDumpOptions DumpOpts=DIDumpOptions()) const
Dump the DIE and all of its attributes to the supplied stream.
DWARFDie getUnitDIE(bool ExtractUnitDIEOnly=true)
This dwarf writer support class manages information associated with a source file.
Lightweight error class with error context and mandatory checking.
static ErrorSuccess success()
Create a success value.
Tagged union holding either a T or an Error.
Error takeError()
Take ownership of the stored error.
reference get()
Returns a reference to the stored T value.
A non-threaded implementation.
void wait() override
Blocking wait for all the tasks to execute first.
StringRef - Represent a constant reference to a string, i.e.
std::string str() const
str - Get the contents as an std::string.
constexpr StringRef substr(size_t Start, size_t N=npos) const
Return a reference to the substring from [Start, Start + N).
bool starts_with(StringRef Prefix) const
Check if this string starts with the given Prefix.
constexpr bool empty() const
empty - Check if the string is empty.
char back() const
back - Get the last character in the string.
constexpr size_t size() const
size - Get the string size.
char front() const
front - Get the first character in the string.
auto async(Function &&F, Args &&...ArgList)
Asynchronous submission of a task to the pool.
GsymCreator is used to emit GSYM data to a stand alone file or section within a file.
LLVM_ABI void addFunctionInfo(FunctionInfo &&FI)
Add a function info to this GSYM creator.
LLVM_ABI uint32_t insertString(StringRef S, bool Copy=true)
Insert a string into the GSYM string table.
const std::optional< AddressRanges > GetValidTextRanges() const
Get the valid text ranges.
bool isQuiet() const
Whether the transformation should be quiet, i.e. not output warnings.
LLVM_ABI uint32_t insertFile(StringRef Path, sys::path::Style Style=sys::path::Style::native)
Insert a file into this GSYM creator.
LLVM_ABI size_t getNumFunctionInfos() const
Get the current number of FunctionInfo objects contained in this object.
LLVM_ABI bool IsValidTextAddress(uint64_t Addr) const
Check if an address is a valid code address.
static LLVM_ABI llvm::Expected< GsymReader > openFile(StringRef Path)
Construct a GsymReader from a file on disk.
LineTable class contains deserialized versions of line tables for each function's address ranges.
void Report(StringRef s, std::function< void(raw_ostream &o)> detailCallback)
raw_ostream * GetOS() const
void Merge(const OutputAggregator &other)
This class implements an extremely fast bulk output stream that can only output to a stream.
A raw_ostream that writes to an std::string.
std::optional< uint64_t > toAddress(const std::optional< DWARFFormValue > &V)
Take an optional DWARFFormValue and try to extract an address.
std::optional< const char * > toString(const std::optional< DWARFFormValue > &V)
Take an optional DWARFFormValue and try to extract a string value from it.
std::optional< uint64_t > toSectionOffset(const std::optional< DWARFFormValue > &V)
Take an optional DWARFFormValue and try to extract a section offset.
std::optional< uint64_t > toUnsigned(const std::optional< DWARFFormValue > &V)
Take an optional DWARFFormValue and try to extract an unsigned constant.
This is an optimization pass for GlobalISel generic memory operations.
ThreadPoolStrategy hardware_concurrency(unsigned ThreadCount=0)
Returns a default thread strategy where all available hardware resources are to be used,...
void append_range(Container &C, Range &&R)
Wrapper function to append range R to container C.
std::vector< DWARFAddressRange > DWARFAddressRangesVector
DWARFAddressRangesVector - represents a set of absolute address ranges.
Error createStringError(std::error_code EC, char const *Fmt, const Ts &... Vals)
Create formatted StringError object.
auto count(R &&Range, const E &Element)
Wrapper function around std::count to count the number of times an element Element occurs in the give...
void consumeError(Error Err)
Consume an Error without doing anything.
static DIDumpOptions getForSingleDIE()
Return default option set for printing a single DIE without children.
Controls which fields of DILineInfo container should be filled with data.
A format-neutral container for source line information.
LLVM_ABI bool lookupAddressRange(object::SectionedAddress Address, uint64_t Size, std::vector< uint32_t > &Result, std::optional< uint64_t > StmtSequenceOffset=std::nullopt) const
Fills the Result argument with the indices of the rows that correspond to the address range specified...
Standard .debug_line state machine structure.
object::SectionedAddress Address
The program-counter value corresponding to a machine instruction generated by the compiler and sectio...
This type represents a file cache system that manages caching of files.
const DWARFDebugLine::LineTable * LineTable
std::optional< uint32_t > DWARFToGSYMFileIndex(GsymCreator &Gsym, uint32_t DwarfFileIdx)
Convert a DWARF compile unit file index into a GSYM global file index.
CUInfo(DWARFContext &DICtx, DWARFCompileUnit *CU)
bool isHighestAddress(uint64_t Addr) const
Return true if Addr is the highest address for a given compile unit.
std::vector< uint32_t > FileCache
std::vector< CallSiteInfo > CallSites
std::vector< uint32_t > MatchRegex
Offsets into the string table for function names regex patterns.
uint64_t ReturnOffset
The return offset of the call site - relative to the function start.
Function information in GSYM files encodes information for one contiguous address range.
std::optional< InlineInfo > Inline
uint64_t startAddress() const
uint64_t endAddress() const
std::optional< CallSiteInfoCollection > CallSites
uint32_t Name
String table offset in the string table.
std::optional< LineTable > OptLineTable
Inline information stores the name of the inline function along with an array of address ranges.
std::vector< InlineInfo > Children
Line entries are used to encode the line tables in FunctionInfo objects.
static const uint64_t UndefSection