LLVM 22.0.0git
Symbolize.cpp
Go to the documentation of this file.
1//===-- LLVMSymbolize.cpp -------------------------------------------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// Implementation for LLVM symbolization library.
10//
11//===----------------------------------------------------------------------===//
12
14
15#include "llvm/ADT/STLExtras.h"
24#include "llvm/Object/BuildID.h"
25#include "llvm/Object/COFF.h"
27#include "llvm/Object/MachO.h"
29#include "llvm/Support/CRC.h"
32#include "llvm/Support/Errc.h"
35#include "llvm/Support/Path.h"
36#include <cassert>
37#include <cstring>
38
39namespace llvm {
40namespace codeview {
41union DebugInfo;
42}
43namespace symbolize {
44
46
48 : Opts(Opts),
49 BIDFetcher(std::make_unique<BuildIDFetcher>(Opts.DebugFileDirectory)) {}
50
52
53template <typename T>
55LLVMSymbolizer::symbolizeCodeCommon(const T &ModuleSpecifier,
56 object::SectionedAddress ModuleOffset) {
57
58 auto InfoOrErr = getOrCreateModuleInfo(ModuleSpecifier);
59 if (!InfoOrErr)
60 return InfoOrErr.takeError();
61
62 SymbolizableModule *Info = *InfoOrErr;
63
64 // A null module means an error has already been reported. Return an empty
65 // result.
66 if (!Info)
67 return DILineInfo();
68
69 // If the user is giving us relative addresses, add the preferred base of the
70 // object to the offset before we do the query. It's what DIContext expects.
71 if (Opts.RelativeAddresses)
72 ModuleOffset.Address += Info->getModulePreferredBase();
73
74 DILineInfo LineInfo = Info->symbolizeCode(
75 ModuleOffset,
77 Opts.SkipLineZero),
78 Opts.UseSymbolTable);
79 if (Opts.Demangle)
80 LineInfo.FunctionName = DemangleName(LineInfo.FunctionName, Info);
81 return LineInfo;
82}
83
86 object::SectionedAddress ModuleOffset) {
87 return symbolizeCodeCommon(Obj, ModuleOffset);
88}
89
92 object::SectionedAddress ModuleOffset) {
93 return symbolizeCodeCommon(ModuleName, ModuleOffset);
94}
95
98 object::SectionedAddress ModuleOffset) {
99 return symbolizeCodeCommon(BuildID, ModuleOffset);
100}
101
102template <typename T>
103Expected<DIInliningInfo> LLVMSymbolizer::symbolizeInlinedCodeCommon(
104 const T &ModuleSpecifier, object::SectionedAddress ModuleOffset) {
105 auto InfoOrErr = getOrCreateModuleInfo(ModuleSpecifier);
106 if (!InfoOrErr)
107 return InfoOrErr.takeError();
108
109 SymbolizableModule *Info = *InfoOrErr;
110
111 // A null module means an error has already been reported. Return an empty
112 // result.
113 if (!Info)
114 return DIInliningInfo();
115
116 // If the user is giving us relative addresses, add the preferred base of the
117 // object to the offset before we do the query. It's what DIContext expects.
118 if (Opts.RelativeAddresses)
119 ModuleOffset.Address += Info->getModulePreferredBase();
120
121 DIInliningInfo InlinedContext = Info->symbolizeInlinedCode(
122 ModuleOffset,
124 Opts.SkipLineZero),
125 Opts.UseSymbolTable);
126 if (Opts.Demangle) {
127 for (int i = 0, n = InlinedContext.getNumberOfFrames(); i < n; i++) {
128 auto *Frame = InlinedContext.getMutableFrame(i);
129 Frame->FunctionName = DemangleName(Frame->FunctionName, Info);
130 }
131 }
132 return InlinedContext;
133}
134
135Expected<DIInliningInfo>
137 object::SectionedAddress ModuleOffset) {
138 return symbolizeInlinedCodeCommon(Obj, ModuleOffset);
139}
140
143 object::SectionedAddress ModuleOffset) {
144 return symbolizeInlinedCodeCommon(ModuleName, ModuleOffset);
145}
146
149 object::SectionedAddress ModuleOffset) {
150 return symbolizeInlinedCodeCommon(BuildID, ModuleOffset);
151}
152
153template <typename T>
155LLVMSymbolizer::symbolizeDataCommon(const T &ModuleSpecifier,
156 object::SectionedAddress ModuleOffset) {
157
158 auto InfoOrErr = getOrCreateModuleInfo(ModuleSpecifier);
159 if (!InfoOrErr)
160 return InfoOrErr.takeError();
161
162 SymbolizableModule *Info = *InfoOrErr;
163 // A null module means an error has already been reported. Return an empty
164 // result.
165 if (!Info)
166 return DIGlobal();
167
168 // If the user is giving us relative addresses, add the preferred base of
169 // the object to the offset before we do the query. It's what DIContext
170 // expects.
171 if (Opts.RelativeAddresses)
172 ModuleOffset.Address += Info->getModulePreferredBase();
173
174 DIGlobal Global = Info->symbolizeData(ModuleOffset);
175 if (Opts.Demangle)
176 Global.Name = DemangleName(Global.Name, Info);
177 return Global;
178}
179
182 object::SectionedAddress ModuleOffset) {
183 return symbolizeDataCommon(Obj, ModuleOffset);
184}
185
188 object::SectionedAddress ModuleOffset) {
189 return symbolizeDataCommon(ModuleName, ModuleOffset);
190}
191
194 object::SectionedAddress ModuleOffset) {
195 return symbolizeDataCommon(BuildID, ModuleOffset);
196}
197
198template <typename T>
200LLVMSymbolizer::symbolizeFrameCommon(const T &ModuleSpecifier,
201 object::SectionedAddress ModuleOffset) {
202 auto InfoOrErr = getOrCreateModuleInfo(ModuleSpecifier);
203 if (!InfoOrErr)
204 return InfoOrErr.takeError();
205
206 SymbolizableModule *Info = *InfoOrErr;
207 // A null module means an error has already been reported. Return an empty
208 // result.
209 if (!Info)
210 return std::vector<DILocal>();
211
212 // If the user is giving us relative addresses, add the preferred base of
213 // the object to the offset before we do the query. It's what DIContext
214 // expects.
215 if (Opts.RelativeAddresses)
216 ModuleOffset.Address += Info->getModulePreferredBase();
217
218 return Info->symbolizeFrame(ModuleOffset);
219}
220
223 object::SectionedAddress ModuleOffset) {
224 return symbolizeFrameCommon(Obj, ModuleOffset);
225}
226
229 object::SectionedAddress ModuleOffset) {
230 return symbolizeFrameCommon(ModuleName, ModuleOffset);
231}
232
235 object::SectionedAddress ModuleOffset) {
236 return symbolizeFrameCommon(BuildID, ModuleOffset);
237}
238
239template <typename T>
241LLVMSymbolizer::findSymbolCommon(const T &ModuleSpecifier, StringRef Symbol,
243 auto InfoOrErr = getOrCreateModuleInfo(ModuleSpecifier);
244 if (!InfoOrErr)
245 return InfoOrErr.takeError();
246
247 SymbolizableModule *Info = *InfoOrErr;
248 std::vector<DILineInfo> Result;
249
250 // A null module means an error has already been reported. Return an empty
251 // result.
252 if (!Info)
253 return Result;
254
255 for (object::SectionedAddress A : Info->findSymbol(Symbol, Offset)) {
256 DILineInfo LineInfo = Info->symbolizeCode(
258 Opts.UseSymbolTable);
259 if (LineInfo.FileName != DILineInfo::BadString) {
260 if (Opts.Demangle)
261 LineInfo.FunctionName = DemangleName(LineInfo.FunctionName, Info);
262 Result.push_back(std::move(LineInfo));
263 }
264 }
265
266 return Result;
267}
268
269Expected<std::vector<DILineInfo>>
272 return findSymbolCommon(Obj, Symbol, Offset);
273}
274
278 return findSymbolCommon(ModuleName, Symbol, Offset);
279}
280
284 return findSymbolCommon(BuildID, Symbol, Offset);
285}
286
288 ObjectForUBPathAndArch.clear();
289 LRUBinaries.clear();
290 CacheSize = 0;
291 BinaryForPath.clear();
292 ObjectPairForPathArch.clear();
293 Modules.clear();
294 BuildIDPaths.clear();
295}
296
297namespace {
298
299// For Path="/path/to/foo" and Basename="foo" assume that debug info is in
300// /path/to/foo.dSYM/Contents/Resources/DWARF/foo.
301// For Path="/path/to/bar.dSYM" and Basename="foo" assume that debug info is in
302// /path/to/bar.dSYM/Contents/Resources/DWARF/foo.
303std::string getDarwinDWARFResourceForPath(const std::string &Path,
304 const std::string &Basename) {
305 SmallString<16> ResourceName = StringRef(Path);
306 if (sys::path::extension(Path) != ".dSYM") {
307 ResourceName += ".dSYM";
308 }
309 sys::path::append(ResourceName, "Contents", "Resources", "DWARF");
310 sys::path::append(ResourceName, Basename);
311 return std::string(ResourceName);
312}
313
314bool checkFileCRC(StringRef Path, uint32_t CRCHash) {
315 ErrorOr<std::unique_ptr<MemoryBuffer>> MB =
317 if (!MB)
318 return false;
319 return CRCHash == llvm::crc32(arrayRefFromStringRef(MB.get()->getBuffer()));
320}
321
322bool getGNUDebuglinkContents(const ObjectFile *Obj, std::string &DebugName,
323 uint32_t &CRCHash) {
324 if (!Obj)
325 return false;
326 for (const SectionRef &Section : Obj->sections()) {
327 StringRef Name;
328 consumeError(Section.getName().moveInto(Name));
329
330 Name = Name.substr(Name.find_first_not_of("._"));
331 if (Name == "gnu_debuglink") {
332 Expected<StringRef> ContentsOrErr = Section.getContents();
333 if (!ContentsOrErr) {
334 consumeError(ContentsOrErr.takeError());
335 return false;
336 }
337 DataExtractor DE(*ContentsOrErr, Obj->isLittleEndian(), 0);
338 uint64_t Offset = 0;
339 if (const char *DebugNameStr = DE.getCStr(&Offset)) {
340 // 4-byte align the offset.
341 Offset = (Offset + 3) & ~0x3;
342 if (DE.isValidOffsetForDataOfSize(Offset, 4)) {
343 DebugName = DebugNameStr;
344 CRCHash = DE.getU32(&Offset);
345 return true;
346 }
347 }
348 break;
349 }
350 }
351 return false;
352}
353
354bool darwinDsymMatchesBinary(const MachOObjectFile *DbgObj,
355 const MachOObjectFile *Obj) {
356 ArrayRef<uint8_t> dbg_uuid = DbgObj->getUuid();
357 ArrayRef<uint8_t> bin_uuid = Obj->getUuid();
358 if (dbg_uuid.empty() || bin_uuid.empty())
359 return false;
360 return !memcmp(dbg_uuid.data(), bin_uuid.data(), dbg_uuid.size());
361}
362
363} // end anonymous namespace
364
365ObjectFile *LLVMSymbolizer::lookUpDsymFile(const std::string &ExePath,
366 const MachOObjectFile *MachExeObj,
367 const std::string &ArchName) {
368 // On Darwin we may find DWARF in separate object file in
369 // resource directory.
370 std::vector<std::string> DsymPaths;
371 StringRef Filename = sys::path::filename(ExePath);
372 DsymPaths.push_back(
373 getDarwinDWARFResourceForPath(ExePath, std::string(Filename)));
374 for (const auto &Path : Opts.DsymHints) {
375 DsymPaths.push_back(
376 getDarwinDWARFResourceForPath(Path, std::string(Filename)));
377 }
378 for (const auto &Path : DsymPaths) {
379 auto DbgObjOrErr = getOrCreateObject(Path, ArchName);
380 if (!DbgObjOrErr) {
381 // Ignore errors, the file might not exist.
382 consumeError(DbgObjOrErr.takeError());
383 continue;
384 }
385 ObjectFile *DbgObj = DbgObjOrErr.get();
386 if (!DbgObj)
387 continue;
388 const MachOObjectFile *MachDbgObj = dyn_cast<const MachOObjectFile>(DbgObj);
389 if (!MachDbgObj)
390 continue;
391 if (darwinDsymMatchesBinary(MachDbgObj, MachExeObj))
392 return DbgObj;
393 }
394 return nullptr;
395}
396
397ObjectFile *LLVMSymbolizer::lookUpDebuglinkObject(const std::string &Path,
398 const ObjectFile *Obj,
399 const std::string &ArchName) {
400 std::string DebuglinkName;
401 uint32_t CRCHash;
402 std::string DebugBinaryPath;
403 if (!getGNUDebuglinkContents(Obj, DebuglinkName, CRCHash))
404 return nullptr;
405 if (!findDebugBinary(Path, DebuglinkName, CRCHash, DebugBinaryPath))
406 return nullptr;
407 auto DbgObjOrErr = getOrCreateObject(DebugBinaryPath, ArchName);
408 if (!DbgObjOrErr) {
409 // Ignore errors, the file might not exist.
410 consumeError(DbgObjOrErr.takeError());
411 return nullptr;
412 }
413 return DbgObjOrErr.get();
414}
415
416ObjectFile *LLVMSymbolizer::lookUpBuildIDObject(const std::string &Path,
417 const ELFObjectFileBase *Obj,
418 const std::string &ArchName) {
419 auto BuildID = getBuildID(Obj);
420 if (BuildID.size() < 2)
421 return nullptr;
422 std::string DebugBinaryPath;
423 if (!getOrFindDebugBinary(BuildID, DebugBinaryPath))
424 return nullptr;
425 auto DbgObjOrErr = getOrCreateObject(DebugBinaryPath, ArchName);
426 if (!DbgObjOrErr) {
427 consumeError(DbgObjOrErr.takeError());
428 return nullptr;
429 }
430 return DbgObjOrErr.get();
431}
432
433bool LLVMSymbolizer::findDebugBinary(const std::string &OrigPath,
434 const std::string &DebuglinkName,
435 uint32_t CRCHash, std::string &Result) {
436 SmallString<16> OrigDir(OrigPath);
438 SmallString<16> DebugPath = OrigDir;
439 // Try relative/path/to/original_binary/debuglink_name
440 llvm::sys::path::append(DebugPath, DebuglinkName);
441 if (checkFileCRC(DebugPath, CRCHash)) {
442 Result = std::string(DebugPath);
443 return true;
444 }
445 // Try relative/path/to/original_binary/.debug/debuglink_name
446 DebugPath = OrigDir;
447 llvm::sys::path::append(DebugPath, ".debug", DebuglinkName);
448 if (checkFileCRC(DebugPath, CRCHash)) {
449 Result = std::string(DebugPath);
450 return true;
451 }
452 // Make the path absolute so that lookups will go to
453 // "/usr/lib/debug/full/path/to/debug", not
454 // "/usr/lib/debug/to/debug"
456 if (!Opts.FallbackDebugPath.empty()) {
457 // Try <FallbackDebugPath>/absolute/path/to/original_binary/debuglink_name
458 DebugPath = Opts.FallbackDebugPath;
459 } else {
460#if defined(__NetBSD__)
461 // Try /usr/libdata/debug/absolute/path/to/original_binary/debuglink_name
462 DebugPath = "/usr/libdata/debug";
463#else
464 // Try /usr/lib/debug/absolute/path/to/original_binary/debuglink_name
465 DebugPath = "/usr/lib/debug";
466#endif
467 }
469 DebuglinkName);
470 if (checkFileCRC(DebugPath, CRCHash)) {
471 Result = std::string(DebugPath);
472 return true;
473 }
474 return false;
475}
476
478 return StringRef(reinterpret_cast<const char *>(BuildID.data()),
479 BuildID.size());
480}
481
482bool LLVMSymbolizer::getOrFindDebugBinary(const ArrayRef<uint8_t> BuildID,
483 std::string &Result) {
484 StringRef BuildIDStr = getBuildIDStr(BuildID);
485 auto I = BuildIDPaths.find(BuildIDStr);
486 if (I != BuildIDPaths.end()) {
487 Result = I->second;
488 return true;
489 }
490 if (!BIDFetcher)
491 return false;
492 if (std::optional<std::string> Path = BIDFetcher->fetch(BuildID)) {
493 Result = *Path;
494 auto InsertResult = BuildIDPaths.insert({BuildIDStr, Result});
495 assert(InsertResult.second);
496 (void)InsertResult;
497 return true;
498 }
499
500 return false;
501}
502
503std::string LLVMSymbolizer::lookUpGsymFile(const std::string &Path) {
504 if (Opts.DisableGsym)
505 return {};
506
507 auto CheckGsymFile = [](const llvm::StringRef &GsymPath) {
508 sys::fs::file_status Status;
509 std::error_code EC = llvm::sys::fs::status(GsymPath, Status);
511 };
512
513 // First, look beside the binary file
514 if (const auto GsymPath = Path + ".gsym"; CheckGsymFile(GsymPath))
515 return GsymPath;
516
517 // Then, look in the directories specified by GsymFileDirectory
518
519 for (const auto &Directory : Opts.GsymFileDirectory) {
520 SmallString<16> GsymPath = llvm::StringRef{Directory};
522 llvm::sys::path::filename(Path) + ".gsym");
523
524 if (CheckGsymFile(GsymPath))
525 return static_cast<std::string>(GsymPath);
526 }
527
528 return {};
529}
530
531Expected<LLVMSymbolizer::ObjectPair>
532LLVMSymbolizer::getOrCreateObjectPair(const std::string &Path,
533 const std::string &ArchName) {
534 auto I = ObjectPairForPathArch.find(std::make_pair(Path, ArchName));
535 if (I != ObjectPairForPathArch.end()) {
536 recordAccess(BinaryForPath.find(Path)->second);
537 return I->second;
538 }
539
540 auto ObjOrErr = getOrCreateObject(Path, ArchName);
541 if (!ObjOrErr) {
542 ObjectPairForPathArch.emplace(std::make_pair(Path, ArchName),
543 ObjectPair(nullptr, nullptr));
544 return ObjOrErr.takeError();
545 }
546
547 ObjectFile *Obj = ObjOrErr.get();
548 assert(Obj != nullptr);
549 ObjectFile *DbgObj = nullptr;
550
551 if (auto MachObj = dyn_cast<const MachOObjectFile>(Obj))
552 DbgObj = lookUpDsymFile(Path, MachObj, ArchName);
553 else if (auto ELFObj = dyn_cast<const ELFObjectFileBase>(Obj))
554 DbgObj = lookUpBuildIDObject(Path, ELFObj, ArchName);
555 if (!DbgObj)
556 DbgObj = lookUpDebuglinkObject(Path, Obj, ArchName);
557 if (!DbgObj)
558 DbgObj = Obj;
559 ObjectPair Res = std::make_pair(Obj, DbgObj);
560 std::string DbgObjPath = DbgObj->getFileName().str();
561 auto Pair =
562 ObjectPairForPathArch.emplace(std::make_pair(Path, ArchName), Res);
563 BinaryForPath.find(DbgObjPath)->second.pushEvictor([this, I = Pair.first]() {
564 ObjectPairForPathArch.erase(I);
565 });
566 return Res;
567}
568
569Expected<ObjectFile *>
570LLVMSymbolizer::getOrCreateObject(const std::string &Path,
571 const std::string &ArchName) {
572 Binary *Bin;
573 auto Pair = BinaryForPath.emplace(Path, OwningBinary<Binary>());
574 if (!Pair.second) {
575 Bin = Pair.first->second->getBinary();
576 recordAccess(Pair.first->second);
577 } else {
578 Expected<OwningBinary<Binary>> BinOrErr = createBinary(Path);
579 if (!BinOrErr)
580 return BinOrErr.takeError();
581
582 CachedBinary &CachedBin = Pair.first->second;
583 CachedBin = std::move(BinOrErr.get());
584 CachedBin.pushEvictor([this, I = Pair.first]() { BinaryForPath.erase(I); });
585 LRUBinaries.push_back(CachedBin);
586 CacheSize += CachedBin.size();
587 Bin = CachedBin->getBinary();
588 }
589
590 if (!Bin)
591 return static_cast<ObjectFile *>(nullptr);
592
593 if (MachOUniversalBinary *UB = dyn_cast_or_null<MachOUniversalBinary>(Bin)) {
594 auto I = ObjectForUBPathAndArch.find(std::make_pair(Path, ArchName));
595 if (I != ObjectForUBPathAndArch.end())
596 return I->second.get();
597
598 Expected<std::unique_ptr<ObjectFile>> ObjOrErr =
599 UB->getMachOObjectForArch(ArchName);
600 if (!ObjOrErr) {
601 ObjectForUBPathAndArch.emplace(std::make_pair(Path, ArchName),
602 std::unique_ptr<ObjectFile>());
603 return ObjOrErr.takeError();
604 }
605 ObjectFile *Res = ObjOrErr->get();
606 auto Pair = ObjectForUBPathAndArch.emplace(std::make_pair(Path, ArchName),
607 std::move(ObjOrErr.get()));
608 BinaryForPath.find(Path)->second.pushEvictor(
609 [this, Iter = Pair.first]() { ObjectForUBPathAndArch.erase(Iter); });
610 return Res;
611 }
612 if (Bin->isObject()) {
613 return cast<ObjectFile>(Bin);
614 }
615 return errorCodeToError(object_error::arch_not_found);
616}
617
618Expected<SymbolizableModule *>
619LLVMSymbolizer::createModuleInfo(const ObjectFile *Obj,
620 std::unique_ptr<DIContext> Context,
621 StringRef ModuleName) {
622 auto InfoOrErr = SymbolizableObjectFile::create(Obj, std::move(Context),
623 Opts.UntagAddresses);
624 std::unique_ptr<SymbolizableModule> SymMod;
625 if (InfoOrErr)
626 SymMod = std::move(*InfoOrErr);
627 auto InsertResult = Modules.insert(
628 std::make_pair(std::string(ModuleName), std::move(SymMod)));
629 assert(InsertResult.second);
630 if (!InfoOrErr)
631 return InfoOrErr.takeError();
632 return InsertResult.first->second.get();
633}
634
635Expected<SymbolizableModule *>
637 StringRef BinaryName = ModuleName;
638 StringRef ArchName = Opts.DefaultArch;
639 size_t ColonPos = ModuleName.find_last_of(':');
640 // Verify that substring after colon form a valid arch name.
641 if (ColonPos != std::string::npos) {
642 StringRef ArchStr = ModuleName.substr(ColonPos + 1);
643 if (Triple(ArchStr).getArch() != Triple::UnknownArch) {
644 BinaryName = ModuleName.substr(0, ColonPos);
645 ArchName = ArchStr;
646 }
647 }
648
649 auto I = Modules.find(ModuleName);
650 if (I != Modules.end()) {
651 recordAccess(BinaryForPath.find(BinaryName)->second);
652 return I->second.get();
653 }
654
655 auto ObjectsOrErr =
656 getOrCreateObjectPair(std::string{BinaryName}, std::string{ArchName});
657 if (!ObjectsOrErr) {
658 // Failed to find valid object file.
659 Modules.emplace(ModuleName, std::unique_ptr<SymbolizableModule>());
660 return ObjectsOrErr.takeError();
661 }
662 ObjectPair Objects = ObjectsOrErr.get();
663
664 std::unique_ptr<DIContext> Context;
665 // If this is a COFF object containing PDB info and not containing DWARF
666 // section, use a PDBContext to symbolize. Otherwise, use DWARF.
667 // Create a DIContext to symbolize as follows:
668 // - If there is a GSYM file, create a GsymContext.
669 // - Otherwise, if this is a COFF object containing PDB info, create a
670 // PDBContext.
671 // - Otherwise, create a DWARFContext.
672 const auto GsymFile = lookUpGsymFile(BinaryName.str());
673 if (!GsymFile.empty()) {
674 auto ReaderOrErr = gsym::GsymReader::openFile(GsymFile);
675
676 if (ReaderOrErr) {
677 std::unique_ptr<gsym::GsymReader> Reader =
678 std::make_unique<gsym::GsymReader>(std::move(*ReaderOrErr));
679
680 Context = std::make_unique<gsym::GsymContext>(std::move(Reader));
681 }
682 }
683 if (!Context) {
684 if (auto CoffObject = dyn_cast<COFFObjectFile>(Objects.first)) {
686 StringRef PDBFileName;
687 auto EC = CoffObject->getDebugPDBInfo(DebugInfo, PDBFileName);
688 // Use DWARF if there're DWARF sections.
689 bool HasDwarf = llvm::any_of(
690 Objects.first->sections(), [](SectionRef Section) -> bool {
691 if (Expected<StringRef> SectionName = Section.getName())
692 return SectionName.get() == ".debug_info";
693 return false;
694 });
695 if (!EC && !HasDwarf && DebugInfo != nullptr && !PDBFileName.empty()) {
696 using namespace pdb;
697 std::unique_ptr<IPDBSession> Session;
698
699 PDB_ReaderType ReaderType =
700 Opts.UseDIA ? PDB_ReaderType::DIA : PDB_ReaderType::Native;
701 if (auto Err = loadDataForEXE(ReaderType, Objects.first->getFileName(),
702 Session)) {
703 Modules.emplace(ModuleName, std::unique_ptr<SymbolizableModule>());
704 // Return along the PDB filename to provide more context
705 return createFileError(PDBFileName, std::move(Err));
706 }
707 Context.reset(new PDBContext(*CoffObject, std::move(Session)));
708 }
709 }
710 }
711 if (!Context)
714 nullptr, Opts.DWPName);
715 auto ModuleOrErr =
716 createModuleInfo(Objects.first, std::move(Context), ModuleName);
717 if (ModuleOrErr) {
718 auto I = Modules.find(ModuleName);
719 BinaryForPath.find(BinaryName)->second.pushEvictor([this, I]() {
720 Modules.erase(I);
721 });
722 }
723 return ModuleOrErr;
724}
725
726// For BPF programs .BTF.ext section contains line numbers information,
727// use it if regular DWARF is not available (e.g. for stripped binary).
728static bool useBTFContext(const ObjectFile &Obj) {
729 return Obj.makeTriple().isBPF() && !Obj.hasDebugInfo() &&
731}
732
735 StringRef ObjName = Obj.getFileName();
736 auto I = Modules.find(ObjName);
737 if (I != Modules.end())
738 return I->second.get();
739
740 std::unique_ptr<DIContext> Context;
741 if (useBTFContext(Obj))
743 else
745 // FIXME: handle COFF object with PDB info to use PDBContext
746 return createModuleInfo(&Obj, std::move(Context), ObjName);
747}
748
749Expected<SymbolizableModule *>
751 std::string Path;
752 if (!getOrFindDebugBinary(BuildID, Path)) {
754 "could not find build ID");
755 }
756 return getOrCreateModuleInfo(Path);
757}
758
759namespace {
760
761// Undo these various manglings for Win32 extern "C" functions:
762// cdecl - _foo
763// stdcall - _foo@12
764// fastcall - @foo@12
765// vectorcall - foo@@12
766// These are all different linkage names for 'foo'.
767StringRef demanglePE32ExternCFunc(StringRef SymbolName) {
768 char Front = SymbolName.empty() ? '\0' : SymbolName[0];
769
770 // Remove any '@[0-9]+' suffix.
771 bool HasAtNumSuffix = false;
772 if (Front != '?') {
773 size_t AtPos = SymbolName.rfind('@');
774 if (AtPos != StringRef::npos &&
775 all_of(drop_begin(SymbolName, AtPos + 1), isDigit)) {
776 SymbolName = SymbolName.substr(0, AtPos);
777 HasAtNumSuffix = true;
778 }
779 }
780
781 // Remove any ending '@' for vectorcall.
782 bool IsVectorCall = false;
783 if (HasAtNumSuffix && SymbolName.ends_with("@")) {
784 SymbolName = SymbolName.drop_back();
785 IsVectorCall = true;
786 }
787
788 // If not vectorcall, remove any '_' or '@' prefix.
789 if (!IsVectorCall && (Front == '_' || Front == '@'))
790 SymbolName = SymbolName.drop_front();
791
792 return SymbolName;
793}
794
795} // end anonymous namespace
796
797std::string
799 const SymbolizableModule *DbiModuleDescriptor) {
800 std::string Result;
801 if (nonMicrosoftDemangle(Name, Result))
802 return Result;
803
804 if (Name.starts_with('?')) {
805 // Only do MSVC C++ demangling on symbols starting with '?'.
806 int status = 0;
807 char *DemangledName = microsoftDemangle(
808 Name, nullptr, &status,
811 if (status != 0)
812 return std::string{Name};
813 Result = DemangledName;
814 free(DemangledName);
815 return Result;
816 }
817
818 if (DbiModuleDescriptor && DbiModuleDescriptor->isWin32Module()) {
819 std::string DemangledCName(demanglePE32ExternCFunc(Name));
820 // On i386 Windows, the C name mangling for different calling conventions
821 // may also be applied on top of the Itanium or Rust name mangling.
822 if (nonMicrosoftDemangle(DemangledCName, Result))
823 return Result;
824 return DemangledCName;
825 }
826 return std::string{Name};
827}
828
829void LLVMSymbolizer::recordAccess(CachedBinary &Bin) {
830 if (Bin->getBinary())
831 LRUBinaries.splice(LRUBinaries.end(), LRUBinaries, Bin.getIterator());
832}
833
835 // Evict the LRU binary until the max cache size is reached or there's <= 1
836 // item in the cache. The MRU binary is always kept to avoid thrashing if it's
837 // larger than the cache size.
838 while (CacheSize > Opts.MaxCacheSize && !LRUBinaries.empty() &&
839 std::next(LRUBinaries.begin()) != LRUBinaries.end()) {
840 CachedBinary &Bin = LRUBinaries.front();
841 CacheSize -= Bin.size();
842 LRUBinaries.pop_front();
843 Bin.evict();
844 }
845}
846
847void CachedBinary::pushEvictor(std::function<void()> NewEvictor) {
848 if (Evictor) {
849 this->Evictor = [OldEvictor = std::move(this->Evictor),
850 NewEvictor = std::move(NewEvictor)]() {
851 NewEvictor();
852 OldEvictor();
853 };
854 } else {
855 this->Evictor = std::move(NewEvictor);
856 }
857}
858
859} // namespace symbolize
860} // namespace llvm
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
This file declares a library for handling Build IDs and using them to find debug info.
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
Analysis containing CSE Info
Definition: CSEInfo.cpp:27
std::string Name
#define I(x, y, z)
Definition: MD5.cpp:58
Merge contiguous icmps into a memcmp
Definition: MergeICmps.cpp:915
static bool isDigit(const char C)
This file contains some templates that are useful if you are working with the STL at all.
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition: ArrayRef.h:41
static std::unique_ptr< BTFContext > create(const object::ObjectFile &Obj, std::function< void(Error)> ErrorHandler=WithColor::defaultErrorHandler)
Definition: BTFContext.cpp:65
static LLVM_ABI bool hasBTFSections(const ObjectFile &Obj)
Definition: BTFParser.cpp:410
A format-neutral container for inlined code description.
Definition: DIContext.h:94
static std::unique_ptr< DWARFContext > create(const object::ObjectFile &Obj, ProcessDebugRelocations RelocAction=ProcessDebugRelocations::Process, const LoadedObjectInfo *L=nullptr, std::string DWPName="", std::function< void(Error)> RecoverableErrorHandler=WithColor::defaultErrorHandler, std::function< void(Error)> WarningHandler=WithColor::defaultWarningHandler, bool ThreadSafe=false)
Tagged union holding either a T or a Error.
Definition: Error.h:485
static ErrorOr< std::unique_ptr< MemoryBuffer > > getFileOrSTDIN(const Twine &Filename, bool IsText=false, bool RequiresNullTerminator=true, std::optional< Align > Alignment=std::nullopt)
Open the specified file as a MemoryBuffer, or open stdin if the Filename is "-".
SmallString - A SmallString is just a SmallVector with methods and accessors that make it work better...
Definition: SmallString.h:26
size_t size() const
Definition: SmallVector.h:79
pointer data()
Return a pointer to the vector's buffer, even if empty().
Definition: SmallVector.h:287
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1197
iterator end()
Definition: StringMap.h:224
iterator find(StringRef Key)
Definition: StringMap.h:235
bool insert(MapEntryTy *KeyValue)
insert - Insert the specified key/value pair into the map.
Definition: StringMap.h:310
StringRef - Represent a constant reference to a string, i.e.
Definition: StringRef.h:55
std::string str() const
str - Get the contents as an std::string.
Definition: StringRef.h:233
constexpr bool empty() const
empty - Check if the string is empty.
Definition: StringRef.h:151
static constexpr size_t npos
Definition: StringRef.h:57
Triple - Helper class for working with autoconf configuration names.
Definition: Triple.h:47
bool isBPF() const
Tests whether the target is eBPF.
Definition: Triple.h:1138
@ UnknownArch
Definition: Triple.h:50
static LLVM_ABI llvm::Expected< GsymReader > openFile(StringRef Path)
Construct a GsymReader from a file on disk.
Definition: GsymReader.cpp:32
StringRef getFileName() const
Definition: Binary.cpp:41
BuildIDFetcher searches local cache directories for debug info.
Definition: BuildID.h:40
This class is the base class for all object file types.
Definition: ObjectFile.h:231
Triple makeTriple() const
Create a triple from the data in this object file.
Definition: ObjectFile.cpp:110
virtual bool hasDebugInfo() const
Definition: ObjectFile.cpp:100
This is a value type class that represents a single section in the list of sections in the object fil...
Definition: ObjectFile.h:83
LLVM_ABI void pushEvictor(std::function< void()> Evictor)
Definition: Symbolize.cpp:847
static LLVM_ABI std::string DemangleName(StringRef Name, const SymbolizableModule *DbiModuleDescriptor)
Definition: Symbolize.cpp:798
LLVM_ABI Expected< std::vector< DILineInfo > > findSymbol(const ObjectFile &Obj, StringRef Symbol, uint64_t Offset)
Definition: Symbolize.cpp:270
LLVM_ABI Expected< DIInliningInfo > symbolizeInlinedCode(const ObjectFile &Obj, object::SectionedAddress ModuleOffset)
Definition: Symbolize.cpp:136
LLVM_ABI Expected< DILineInfo > symbolizeCode(const ObjectFile &Obj, object::SectionedAddress ModuleOffset)
Definition: Symbolize.cpp:85
LLVM_ABI Expected< DIGlobal > symbolizeData(const ObjectFile &Obj, object::SectionedAddress ModuleOffset)
Definition: Symbolize.cpp:181
LLVM_ABI Expected< std::vector< DILocal > > symbolizeFrame(const ObjectFile &Obj, object::SectionedAddress ModuleOffset)
Definition: Symbolize.cpp:222
LLVM_ABI Expected< SymbolizableModule * > getOrCreateModuleInfo(StringRef ModuleName)
Returns a SymbolizableModule or an error if loading debug info failed.
Definition: Symbolize.cpp:636
virtual bool isWin32Module() const =0
static Expected< std::unique_ptr< SymbolizableObjectFile > > create(const object::ObjectFile *Obj, std::unique_ptr< DIContext > DICtx, bool UntagAddresses)
constexpr char SymbolName[]
Key for Kernel::Metadata::mSymbolName.
SmallVector< uint8_t, 10 > BuildID
A build ID in binary form.
Definition: BuildID.h:26
LLVM_ABI BuildIDRef getBuildID(const ObjectFile *Obj)
Returns the build ID, if any, contained in the given object file.
Definition: BuildID.cpp:56
LLVM_ABI Expected< std::unique_ptr< Binary > > createBinary(MemoryBufferRef Source, LLVMContext *Context=nullptr, bool InitContent=true)
Create a Binary from Source, autodetecting the file type.
Definition: Binary.cpp:45
static bool useBTFContext(const ObjectFile &Obj)
Definition: Symbolize.cpp:728
static StringRef getBuildIDStr(ArrayRef< uint8_t > BuildID)
Definition: Symbolize.cpp:477
LLVM_ABI void make_absolute(const Twine &current_directory, SmallVectorImpl< char > &path)
Make path an absolute path.
Definition: Path.cpp:906
LLVM_ABI std::error_code status(const Twine &path, file_status &result, bool follow=true)
Get file status as if by POSIX stat().
LLVM_ABI bool is_directory(const basic_file_status &status)
Does status represent a directory?
Definition: Path.cpp:1092
LLVM_ABI void remove_filename(SmallVectorImpl< char > &path, Style style=Style::native)
Remove the last component from path unless it is the root dir.
Definition: Path.cpp:474
LLVM_ABI StringRef filename(StringRef path LLVM_LIFETIME_BOUND, Style style=Style::native)
Get filename.
Definition: Path.cpp:577
LLVM_ABI void append(SmallVectorImpl< char > &path, const Twine &a, const Twine &b="", const Twine &c="", const Twine &d="")
Append to path.
Definition: Path.cpp:456
LLVM_ABI StringRef extension(StringRef path LLVM_LIFETIME_BOUND, Style style=Style::native)
Get extension.
Definition: Path.cpp:590
LLVM_ABI StringRef relative_path(StringRef path LLVM_LIFETIME_BOUND, Style style=Style::native)
Get relative path.
Definition: Path.cpp:413
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
Definition: STLExtras.h:338
@ Offset
Definition: DWP.cpp:477
DEMANGLE_ABI bool nonMicrosoftDemangle(std::string_view MangledName, std::string &Result, bool CanHaveLeadingDot=true, bool ParseParams=true)
Definition: Demangle.cpp:50
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:1744
Error createFileError(const Twine &F, Error E)
Concatenate a source file path and/or name with an Error.
Definition: Error.h:1399
Error createStringError(std::error_code EC, char const *Fmt, const Ts &... Vals)
Create formatted StringError object.
Definition: Error.h:1305
@ no_such_file_or_directory
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:1751
@ Global
Append to llvm.global_dtors.
LLVM_ABI uint32_t crc32(ArrayRef< uint8_t > Data)
Definition: CRC.cpp:101
DEMANGLE_ABI char * microsoftDemangle(std::string_view mangled_name, size_t *n_read, int *status, MSDemangleFlags Flags=MSDF_None)
Demangles the Microsoft symbol pointed at by mangled_name and returns it.
MSDemangleFlags
Definition: Demangle.h:40
@ MSDF_NoReturnType
Definition: Demangle.h:45
@ MSDF_NoMemberType
Definition: Demangle.h:46
@ MSDF_NoCallingConvention
Definition: Demangle.h:44
@ MSDF_NoAccessSpecifier
Definition: Demangle.h:43
LLVM_ABI Error errorCodeToError(std::error_code EC)
Helper for converting an std::error_code to a Error.
Definition: Error.cpp:111
void consumeError(Error Err)
Consume a Error without doing anything.
Definition: Error.h:1083
Implement std::hash so that hash_code can be used in STL containers.
Definition: BitVector.h:851
Container for description of a global variable.
Definition: DIContext.h:120
Controls which fields of DILineInfo container should be filled with data.
Definition: DIContext.h:146
A format-neutral container for source line information.
Definition: DIContext.h:32
static constexpr const char *const BadString
Definition: DIContext.h:35
std::string FileName
Definition: DIContext.h:38
std::string FunctionName
Definition: DIContext.h:39
std::vector< std::string > GsymFileDirectory
Definition: Symbolize.h:68
std::vector< std::string > DsymHints
Definition: Symbolize.h:64