58#define DEBUG_TYPE "elf-object-writer"
63STATISTIC(ELFHeaderBytes,
"Total size of ELF headers");
64STATISTIC(SectionHeaderBytes,
"Total size of section headers table");
65STATISTIC(AllocTextBytes,
"Total size of SHF_ALLOC text sections");
66STATISTIC(AllocROBytes,
"Total size of SHF_ALLOC readonly sections");
67STATISTIC(AllocRWBytes,
"Total size of SHF_ALLOC read-write sections");
68STATISTIC(StrtabBytes,
"Total size of SHT_STRTAB sections");
69STATISTIC(SymtabBytes,
"Total size of SHT_SYMTAB sections");
70STATISTIC(RelocationBytes,
"Total size of relocation sections");
71STATISTIC(DynsymBytes,
"Total size of SHT_DYNSYM sections");
74 "Total size of debug info sections (not including those written to .dwo)");
75STATISTIC(UnwindBytes,
"Total size of unwind sections");
76STATISTIC(OtherBytes,
"Total size of uncategorized sections");
77STATISTIC(DwoBytes,
"Total size of sections written to .dwo file");
87class SymbolTableWriter {
92 std::vector<uint32_t> ShndxIndexes;
97 void createSymtabShndx();
102 SymbolTableWriter(ELFWriter &EWriter,
bool Is64Bit);
125 struct ELFSymbolData {
141 unsigned LastLocalSymbolIndex = ~0
u;
143 unsigned StringTableIndex = ~0
u;
145 unsigned SymbolTableIndex = ~0
u;
148 std::vector<MCSectionELF *> SectionTable;
162 bool IsLittleEndian, DwoMode Mode)
163 :
Asm(
Asm), OWriter(OWriter),
168 MCContext &getContext()
const {
return Asm.getContext(); }
177 template <
typename T>
void write(
T Val) {
183 void writeSymbol(SymbolTableWriter &Writer,
uint32_t StringIndex,
193 void computeSymbolTable(
const RevGroupMapTy &RevGroupMap);
195 void writeAddrsigSection();
200 void writeSectionHeaders();
220 W.OS.write_zeros(NewOffset -
Offset);
224unsigned ELFWriter::addToSectionTable(
MCSectionELF *Sec) {
225 SectionTable.push_back(Sec);
226 StrTabBuilder.add(Sec->
getName());
227 return SectionTable.size();
230void SymbolTableWriter::createSymtabShndx() {
231 if (!ShndxIndexes.empty())
234 ShndxIndexes.resize(NumWritten);
237template <
typename T>
void SymbolTableWriter::write(
T Value) {
238 EWriter.write(
Value);
241SymbolTableWriter::SymbolTableWriter(ELFWriter &EWriter,
bool Is64Bit)
242 : EWriter(EWriter), Is64Bit(Is64Bit), NumWritten(0) {}
252 if (!ShndxIndexes.empty()) {
254 ShndxIndexes.push_back(shndx);
256 ShndxIndexes.push_back(0);
280bool ELFWriter::is64Bit()
const {
285void ELFWriter::writeHeader() {
348 return Sym.getCommonAlignment()->value();
351 if (!
Asm.getSymbolOffset(
Sym, Res))
354 if (
Asm.isThumbFunc(&
Sym))
398 if (!Symbol->isVariable() ||
399 !(
Value = dyn_cast<MCSymbolRefExpr>(Symbol->getVariableValue())) ||
400 Value->getSpecifier() ||
409void ELFWriter::writeSymbol(SymbolTableWriter &Writer,
uint32_t StringIndex,
410 ELFSymbolData &MSD) {
436 const MCExpr *ESize = MSD.Symbol->getSize();
437 if (!ESize &&
Base) {
439 ESize =
Base->getSize();
446 while (
Sym->isVariable()) {
447 if (
auto *Expr = dyn_cast<MCSymbolRefExpr>(
Sym->getVariableValue())) {
451 ESize =
Sym->getSize();
465 Writer.writeSymbol(StringIndex, Info,
Value,
Size,
Other, MSD.SectionIndex,
469bool ELFWriter::isInSymtab(
const MCSymbolELF &Symbol) {
473 if (OWriter.
Renames.count(&Symbol))
476 if (
Symbol.isVariable()) {
479 if (
const auto *
T = dyn_cast<MCTargetExpr>(Expr))
480 if (
T->inlineAssignedExpr())
486 if (
Symbol.isUndefined()) {
488 Asm.getBaseSymbol(Symbol);
499void ELFWriter::computeSymbolTable(
const RevGroupMapTy &RevGroupMap) {
501 SymbolTableWriter Writer(*
this,
is64Bit());
508 SymbolTableIndex = addToSectionTable(SymtabSection);
513 Writer.writeSymbol(0, 0, 0, 0, 0, 0,
false);
515 std::vector<ELFSymbolData> LocalSymbolData;
516 std::vector<ELFSymbolData> ExternalSymbolData;
519 for (
const std::pair<std::string, size_t> &
F : FileNames)
520 StrTabBuilder.add(
F.first);
523 bool HasLargeSectionIndex =
false;
536 MSD.Order = It.index();
541 if (
Symbol.isAbsolute()) {
543 }
else if (
Symbol.isCommon()) {
544 auto Shndx =
Symbol.getIndex();
549 MSD.SectionIndex = Shndx;
550 }
else if (
Symbol.isUndefined()) {
552 MSD.SectionIndex = RevGroupMap.lookup(&Symbol);
554 HasLargeSectionIndex =
true;
564 MSD.SectionIndex =
Section.getOrdinal();
565 assert(MSD.SectionIndex &&
"Invalid section index!");
567 HasLargeSectionIndex =
true;
581 StrTabBuilder.add(
Name);
585 LocalSymbolData.push_back(MSD);
587 ExternalSymbolData.push_back(MSD);
591 unsigned SymtabShndxSectionIndex = 0;
593 if (HasLargeSectionIndex) {
596 SymtabShndxSectionIndex = addToSectionTable(SymtabShndxSection);
600 StrTabBuilder.finalize();
604 auto FileNameIt = FileNames.begin();
605 if (!FileNames.empty())
606 FileNames[0].second = 0;
608 for (ELFSymbolData &MSD : LocalSymbolData) {
610 for (; FileNameIt != FileNames.end() && FileNameIt->second <= MSD.Order;
612 Writer.writeSymbol(StrTabBuilder.getOffset(FileNameIt->first),
620 : StrTabBuilder.getOffset(MSD.Name);
621 MSD.Symbol->setIndex(Index++);
622 writeSymbol(Writer, StringIndex, MSD);
624 for (; FileNameIt != FileNames.end(); ++FileNameIt) {
625 Writer.writeSymbol(StrTabBuilder.getOffset(FileNameIt->first),
632 LastLocalSymbolIndex =
Index;
634 for (ELFSymbolData &MSD : ExternalSymbolData) {
635 unsigned StringIndex = StrTabBuilder.getOffset(MSD.Name);
636 MSD.Symbol->setIndex(Index++);
637 writeSymbol(Writer, StringIndex, MSD);
645 if (ShndxIndexes.
empty()) {
646 assert(SymtabShndxSectionIndex == 0);
649 assert(SymtabShndxSectionIndex != 0);
651 SecStart =
W.OS.tell();
652 MCSectionELF *SymtabShndxSection = SectionTable[SymtabShndxSectionIndex - 1];
655 SecEnd =
W.OS.tell();
656 SymtabShndxSection->
setOffsets(SecStart, SecEnd);
659void ELFWriter::writeAddrsigSection() {
661 if (
Sym->getIndex() != 0)
676 if (TO && TO->
Crel) {
683 const bool Rela = OWriter.
usesRela(TO, Sec);
699bool ELFWriter::maybeWriteCompression(
704 if (
Size <= HdrSize + CompressedContents.
size())
722void ELFWriter::writeSectionData(
MCSection &Sec) {
725 auto &Ctx =
Asm.getContext();
728 : DebugCompressionType::None;
729 if (CompressionType == DebugCompressionType::None ||
731 Asm.writeSectionData(
W.OS, &Section);
737 Asm.writeSectionData(VecOS, &Section);
740 UncompressedData.
size());
744 switch (CompressionType) {
745 case DebugCompressionType::None:
747 case DebugCompressionType::Zlib:
750 case DebugCompressionType::Zstd:
756 if (!maybeWriteCompression(ChType, UncompressedData.
size(), Compressed,
758 W.OS << UncompressedData;
783 writeWord(Alignment ? Alignment->value() : 0);
784 writeWord(EntrySize);
789 using uint = std::conditional_t<Is64, uint64_t, uint32_t>;
791 uint32_t SymIdx = R.Symbol ? R.Symbol->getIndex() : 0;
793 std::make_signed_t<uint>(R.Addend)};
797void ELFWriter::writeRelocations(
const MCSectionELF &Sec) {
798 std::vector<ELFRelocationEntry> &Relocs = OWriter.
Relocations[&Sec];
800 const bool Rela = OWriter.
usesRela(TO, Sec);
840 }
else if (TO && TO->
Crel) {
842 encodeCrel<true>(Relocs,
W.OS);
844 encodeCrel<false>(Relocs,
W.OS);
883 sh_link = SymbolTableIndex;
884 assert(sh_link &&
".symtab not found");
891 sh_link = StringTableIndex;
892 sh_info = LastLocalSymbolIndex;
898 sh_link = SymbolTableIndex;
902 sh_link = SymbolTableIndex;
903 sh_info = GroupSymbolIndex;
911 if (
Sym &&
Sym->isInSection())
912 sh_link =
Sym->getSection().getOrdinal();
915 writeSectionHeaderEntry(StrTabBuilder.getOffset(
Section.getName()),
921void ELFWriter::writeSectionHeaders() {
923 const unsigned NumSections = SectionTable.size();
928 writeSectionHeaderEntry(0, 0, 0, 0, 0, FirstSectionSize, 0, 0, std::nullopt,
935 GroupSymbolIndex = 0;
937 GroupSymbolIndex =
Section->getGroup()->getIndex();
942 Size =
Asm.getSectionAddressSize(*Section);
950 if (Mode == DwoOnly) {
951 stats::DwoBytes +=
Size;
952 }
else if (
Section->getName().starts_with(
".debug")) {
953 stats::DebugBytes +=
Size;
954 }
else if (
Section->getName().starts_with(
".eh_frame")) {
955 stats::UnwindBytes +=
Size;
958 stats::AllocTextBytes +=
Size;
960 stats::AllocRWBytes +=
Size;
962 stats::AllocROBytes +=
Size;
967 stats::StrtabBytes +=
Size;
970 stats::SymtabBytes +=
Size;
973 stats::DynsymBytes +=
Size;
978 stats::RelocationBytes +=
Size;
981 stats::OtherBytes +=
Size;
986 writeSectionHeader(GroupSymbolIndex,
Offsets.first,
Size, *Section);
989 stats::SectionHeaderBytes +=
W.OS.tell() - Start;
998 StringTableIndex = addToSectionTable(StrtabSection);
1000 RevGroupMapTy RevGroupMap;
1005 stats::ELFHeaderBytes +=
W.OS.tell() - StartOffset;
1023 writeSectionData(Section);
1026 Section.setOffsets(SecStart, SecEnd);
1028 MCSectionELF *RelSection = createRelocationSection(Ctx, Section);
1030 unsigned *GroupIdxEntry =
nullptr;
1031 if (SignatureSymbol) {
1032 GroupIdxEntry = &RevGroupMap[SignatureSymbol];
1033 if (!*GroupIdxEntry) {
1036 *GroupIdxEntry = addToSectionTable(Group);
1039 GroupMap.
resize(*GroupIdxEntry + 1);
1040 GroupMap[*GroupIdxEntry] =
Groups.size();
1045 Section.setOrdinal(addToSectionTable(&Section));
1047 RelSection->
setOrdinal(addToSectionTable(RelSection));
1051 if (GroupIdxEntry) {
1052 auto &Members =
Groups[GroupMap[*GroupIdxEntry]];
1053 Members.second.push_back(
Section.getOrdinal());
1055 Members.second.push_back(RelSection->
getOrdinal());
1059 for (
auto &[Group, Members] :
Groups) {
1064 W.write<
unsigned>(Members);
1070 if (Mode == DwoOnly) {
1073 StrTabBuilder.finalize();
1079 addToSectionTable(AddrsigSection);
1083 computeSymbolTable(RevGroupMap);
1098 writeAddrsigSection();
1100 AddrsigSection->
setOffsets(SecStart, SecEnd);
1106 StrTabBuilder.write(
W.OS);
1113 writeSectionHeaders();
1115 uint16_t NumSections = support::endian::byte_swap<uint16_t>(
1117 : SectionTable.size() + 1,
1119 unsigned NumSectionsOffset;
1124 support::endian::byte_swap<uint64_t>(SectionHeaderOffset,
W.Endian);
1125 Stream.pwrite(
reinterpret_cast<char *
>(&Val),
sizeof(Val),
1130 support::endian::byte_swap<uint32_t>(SectionHeaderOffset,
W.Endian);
1131 Stream.pwrite(
reinterpret_cast<char *
>(&Val),
sizeof(Val),
1135 Stream.pwrite(
reinterpret_cast<char *
>(&NumSections),
sizeof(NumSections),
1138 return W.OS.tell() - StartOffset;
1144 IsLittleEndian(IsLittleEndian) {}
1148 : TargetObjectWriter(
std::
move(MOTW)),
OS(
OS), DwoOS(&DwoOS),
1149 IsLittleEndian(IsLittleEndian) {}
1152 ELFHeaderEFlags = 0;
1177 auto &Symbol =
static_cast<const MCSymbolELF &
>(*S.Sym);
1178 size_t Pos = AliasName.
find(
'@');
1185 Tail = Rest.
substr(Symbol.isUndefined() ? 2 : 1);
1191 Alias->setVariableValue(
Value);
1195 Alias->setBinding(Symbol.getBinding());
1196 Alias->setVisibility(Symbol.getVisibility());
1197 Alias->setOther(Symbol.getOther());
1199 if (!Symbol.isUndefined() && S.KeepOriginalSym)
1202 if (Symbol.isUndefined() && Rest.
starts_with(
"@@") &&
1205 AliasName +
" must be defined");
1209 if (
auto It =
Renames.find(&Symbol);
1210 It !=
Renames.end() && It->second != Alias) {
1216 Renames.insert(std::make_pair(&Symbol, Alias));
1223 if (
Sym->isInSection() &&
Sym->getName().starts_with(
".L"))
1224 Sym =
Sym->getSection().getBeginSymbol();
1225 Sym->setUsedInReloc();
1233 if (!Alias->isRegistered())
1235 auto *Expr = Alias->getVariableValue();
1236 if (
const auto *Inner = dyn_cast<MCSymbolRefExpr>(Expr)) {
1237 auto &
Sym =
static_cast<const MCSymbolELF &
>(Inner->getSymbol());
1249 unsigned Type)
const {
1263 if (
Sym->isInSection()) {
1273 Type == ELF::R_386_GOTOFF)
1307 "A relocation may not refer to a dwo section");
1316 auto &Section =
static_cast<const MCSectionELF &
>(*
F.getParent());
1321 (SymA && SymA->isInSection())
1322 ?
static_cast<const MCSectionELF *
>(&SymA->getSection())
1327 bool IsPCRel =
Fixup.isPCRel();
1330 if (
auto *RefB =
Target.getSubSym()) {
1331 auto &SymB =
static_cast<const MCSymbolELF &
>(*RefB);
1332 if (SymB.isUndefined()) {
1334 Twine(
"symbol '") + SymB.getName() +
1335 "' can not be undefined in a subtraction expression");
1339 assert(!SymB.isAbsolute() &&
"Should have been folded");
1340 const MCSection &SecB = SymB.getSection();
1341 if (&SecB != &Section) {
1343 "Cannot represent a difference across sections");
1347 assert(!IsPCRel &&
"should have been folded");
1361 bool UseSectionSym = SymA && SymA->getBinding() ==
ELF::STB_LOCAL &&
1362 !SymA->isUndefined() &&
1371 SymA->setUsedInReloc();
1386 auto &SymA =
static_cast<const MCSymbolELF &
>(SA);
1393 return &SymA.getSection() == FB.
getParent();
1399 DwoOS ? ELFWriter::NonDwoOnly : ELFWriter::AllSections)
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
#define offsetof(TYPE, MEMBER)
BlockVerifier::State From
Analysis containing CSE Info
DXIL Resource Implicit Binding
Given that RA is a live value
This file defines the DenseMap class.
static uint8_t mergeTypeForSet(uint8_t origType, uint8_t newType)
static void encodeCrel(ArrayRef< ELFRelocationEntry > Relocs, raw_ostream &OS)
static bool isIFunc(const MCSymbolELF *Symbol)
std::optional< std::vector< StOtherPiece > > Other
PowerPC TLS Dynamic Call Fixup
This file defines the SmallVector class.
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define STATISTIC(VARNAME, DESC)
static bool isInSymtab(const MCSymbolWasm &Sym)
static bool isDwoSection(const MCSection &Sec)
static bool is64Bit(const char *name)
static const X86InstrFMA3Group Groups[]
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
bool empty() const
empty - Check if the array is empty.
std::unique_ptr< MCELFObjectTargetWriter > TargetObjectWriter
ELFObjectWriter(std::unique_ptr< MCELFObjectTargetWriter > MOTW, raw_pwrite_stream &OS, bool IsLittleEndian)
void setAssembler(MCAssembler *Asm) override
SmallVector< const MCSymbolELF *, 0 > Weakrefs
bool checkRelocation(SMLoc Loc, const MCSectionELF *From, const MCSectionELF *To)
unsigned getELFHeaderEFlags() const
void reset() override
lifetime management
std::optional< uint8_t > OverrideABIVersion
uint64_t writeObject() override
Write the object file and returns the number of bytes written.
DenseMap< const MCSectionELF *, std::vector< ELFRelocationEntry > > Relocations
void executePostLayoutBinding() override
Perform any late binding of symbols (for example, to assign symbol indices for use when generating re...
bool isSymbolRefDifferenceFullyResolvedImpl(const MCSymbol &SymA, const MCFragment &FB, bool InSet, bool IsPCRel) const override
SmallVector< Symver, 0 > Symvers
bool hasRelocationAddend() const
void recordRelocation(const MCFragment &F, const MCFixup &Fixup, MCValue Target, uint64_t &FixedValue) override
Record a relocation entry.
raw_pwrite_stream * DwoOS
bool usesRela(const MCTargetOptions *TO, const MCSectionELF &Sec) const
bool useSectionSymbol(const MCValue &Val, const MCSymbolELF *Sym, uint64_t C, unsigned Type) const
DenseMap< const MCSymbolELF *, const MCSymbolELF * > Renames
MCContext & getContext() const
LLVM_ABI bool getSymbolOffset(const MCSymbol &S, uint64_t &Val) const
LLVM_ABI bool registerSymbol(const MCSymbol &Symbol)
uint64_t getFragmentOffset(const MCFragment &F) const
Context object for machine code objects.
LLVM_ABI MCSectionELF * createELFRelSection(const Twine &Name, unsigned Type, unsigned Flags, unsigned EntrySize, const MCSymbolELF *Group, const MCSectionELF *RelInfoSection)
MCSectionELF * getELFSection(const Twine &Section, unsigned Type, unsigned Flags)
LLVM_ABI void reportError(SMLoc L, const Twine &Msg)
LLVM_ABI MCSymbol * getOrCreateSymbol(const Twine &Name)
Lookup the symbol inside with the specified Name.
const MCTargetOptions * getTargetOptions() const
LLVM_ABI MCSectionELF * createELFGroupSection(const MCSymbolELF *Group, bool IsComdat)
Base class for the full range of assembler expressions which are needed for parsing.
LLVM_ABI bool evaluateKnownAbsolute(int64_t &Res, const MCAssembler &Asm) const
Aggressive variant of evaluateAsRelocatable when relocations are unavailable (e.g.
Encode information on a single operation to perform on a byte sequence (e.g., an encoded instruction)...
MCSection * getParent() const
MutableArrayRef< std::pair< std::string, size_t > > getFileNames()
virtual void setAssembler(MCAssembler *A)
bool getEmitAddrsigSection()
std::vector< const MCSymbol * > & getAddrsigSyms()
virtual void reset()
lifetime management
std::vector< const MCSymbol * > AddrsigSyms
MCContext & getContext() const
This represents a section on linux, lots of unix variants and some bare metal systems.
const MCSection * getLinkedToSection() const
unsigned getFlags() const
void setOffsets(uint64_t Start, uint64_t End)
const MCSymbolELF * getGroup() const
Instances of this class represent a uniqued identifier for a section in the current translation unit.
void setAlignment(Align Value)
unsigned getOrdinal() const
void setOrdinal(unsigned Value)
StringRef getName() const
MCSymbol * getBeginSymbol()
Represent a reference to a symbol from inside an expression.
static const MCSymbolRefExpr * create(const MCSymbol *Symbol, MCContext &Ctx, SMLoc Loc=SMLoc())
MCSymbol - Instances of this class represent a symbol name in the MC file, and MCSymbols are created ...
DebugCompressionType CompressDebugSections
MutableArrayRef - Represent a mutable reference to an array (0 or more elements consecutively in memo...
Represents a location in source code.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void push_back(const T &Elt)
pointer data()
Return a pointer to the vector's buffer, even if empty().
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
StringRef - Represent a constant reference to a string, i.e.
constexpr StringRef substr(size_t Start, size_t N=npos) const
Return a reference to the substring from [Start, Start + N).
bool starts_with(StringRef Prefix) const
Check if this string starts with the given Prefix.
size_t find(char C, size_t From=0) const
Search for the first character C in the string.
bool ends_with(StringRef Suffix) const
Check if this string ends with the given Suffix.
static constexpr size_t npos
Utility for building string tables with deduplicated suffixes.
Target - Wrapper for Target specific information.
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
The instances of the Type class are immutable: once they are created, they are never changed.
LLVM Value Representation.
This class implements an extremely fast bulk output stream that can only output to a stream.
An abstract base class for streams implementations that also support a pwrite operation.
A raw_ostream that writes to an SmallVector or SmallString.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
@ Tail
Attemps to make calls as fast as possible while guaranteeing that tail call optimization can always b...
@ C
The default llvm calling convention, compatible with C.
static const char ElfMagic[]
@ SHT_LLVM_CALL_GRAPH_PROFILE
Flag
These should be considered private to the implementation of the MCInstrDesc class.
LLVM_ABI void compress(Params P, ArrayRef< uint8_t > Input, SmallVectorImpl< uint8_t > &Output)
StringRef toStringRef(const std::optional< DWARFFormValue > &V, StringRef Default={})
Take an optional DWARFFormValue and try to extract a string value from it.
support::ulittle32_t Word
bool isRelocRelocation(MCFixupKind FixupKind)
This is an optimization pass for GlobalISel generic memory operations.
@ FirstLiteralRelocationKind
auto enumerate(FirstRange &&First, RestRanges &&...Rest)
Given two or more input ranges, returns a new range whose values are tuples (A, B,...
LLVM_ABI Error write(MCStreamer &Out, ArrayRef< std::string > Inputs, OnCuIndexOverflow OverflowOptValue)
LLVM_ABI void report_fatal_error(Error Err, bool gen_crash_diag=true)
uint64_t alignTo(uint64_t Size, Align A)
Returns a multiple of A needed to store Size bytes.
OutputIt move(R &&Range, OutputIt Out)
Provide wrappers to std::move which take ranges instead of having to pass begin/end explicitly.
unsigned encodeULEB128(uint64_t Value, raw_ostream &OS, unsigned PadTo=0)
Utility function to encode a ULEB128 value to an output stream.
Implement std::hash so that hash_code can be used in STL containers.
This struct is a compact representation of a valid (non-zero power of two) alignment.
uint64_t value() const
This is a hole in the type system and should not be abused.
void setSymbolAndType(Elf32_Word s, unsigned char t)
void setSymbolAndType(Elf64_Word s, Elf64_Word t)
This struct is a compact representation of a valid (power of two) or undefined (0) alignment.
Adapter to write values to a stream in a particular byte order.