//===- InputSection.h -------------------------------------------*- C++ -*-===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// #ifndef LLD_ELF_INPUT_SECTION_H #define LLD_ELF_INPUT_SECTION_H #include "Relocations.h" #include "lld/Common/CommonLinkerContext.h" #include "lld/Common/LLVM.h" #include "lld/Common/Memory.h" #include "llvm/ADT/CachedHashString.h" #include "llvm/ADT/DenseSet.h" #include "llvm/ADT/TinyPtrVector.h" #include "llvm/Object/ELF.h" namespace lld { namespace elf { class InputFile; class Symbol; class Defined; struct Partition; class SyntheticSection; template class ObjFile; class OutputSection; extern std::vector partitions; // Returned by InputSectionBase::relsOrRelas. At least one member is empty. template struct RelsOrRelas { ArrayRef rels; ArrayRef relas; bool areRelocsRel() const { return rels.size(); } }; // This is the base class of all sections that lld handles. Some are sections in // input files, some are sections in the produced output file and some exist // just as a convenience for implementing special ways of combining some // sections. class SectionBase { public: enum Kind { Regular, Synthetic, EHFrame, Merge, Output }; Kind kind() const { return (Kind)sectionKind; } StringRef name; uint8_t sectionKind : 3; // The next two bit fields are only used by InputSectionBase, but we // put them here so the struct packs better. uint8_t bss : 1; // Set for sections that should not be folded by ICF. uint8_t keepUnique : 1; // The 1-indexed partition that this section is assigned to by the garbage // collector, or 0 if this section is dead. Normally there is only one // partition, so this will either be 0 or 1. uint8_t partition = 1; elf::Partition &getPartition() const; // These corresponds to the fields in Elf_Shdr. uint32_t alignment; uint64_t flags; uint32_t entsize; uint32_t type; uint32_t link; uint32_t info; OutputSection *getOutputSection(); const OutputSection *getOutputSection() const { return const_cast(this)->getOutputSection(); } // Translate an offset in the input section to an offset in the output // section. uint64_t getOffset(uint64_t offset) const; uint64_t getVA(uint64_t offset = 0) const; bool isLive() const { return partition != 0; } void markLive() { partition = 1; } void markDead() { partition = 0; } protected: constexpr SectionBase(Kind sectionKind, StringRef name, uint64_t flags, uint32_t entsize, uint32_t alignment, uint32_t type, uint32_t info, uint32_t link) : name(name), sectionKind(sectionKind), bss(false), keepUnique(false), alignment(alignment), flags(flags), entsize(entsize), type(type), link(link), info(info) {} }; struct RISCVRelaxAux; // This corresponds to a section of an input file. class InputSectionBase : public SectionBase { public: template InputSectionBase(ObjFile &file, const typename ELFT::Shdr &header, StringRef name, Kind sectionKind); InputSectionBase(InputFile *file, uint64_t flags, uint32_t type, uint64_t entsize, uint32_t link, uint32_t info, uint32_t alignment, ArrayRef data, StringRef name, Kind sectionKind); static bool classof(const SectionBase *s) { return s->kind() != Output; } // The file which contains this section. Its dynamic type is always // ObjFile, but in order to avoid ELFT, we use InputFile as // its static type. InputFile *file; // Input sections are part of an output section. Special sections // like .eh_frame and merge sections are first combined into a // synthetic section that is then added to an output section. In all // cases this points one level up. SectionBase *parent = nullptr; // Section index of the relocation section if exists. uint32_t relSecIdx = 0; template ObjFile *getFile() const { return cast_or_null>(file); } // Used by --optimize-bb-jumps and RISC-V linker relaxation temporarily to // indicate the number of bytes which is not counted in the size. This should // be reset to zero after uses. uint16_t bytesDropped = 0; // Whether the section needs to be padded with a NOP filler due to // deleteFallThruJmpInsn. bool nopFiller = false; void drop_back(unsigned num) { assert(bytesDropped + num < 256); bytesDropped += num; } void push_back(uint64_t num) { assert(bytesDropped >= num); bytesDropped -= num; } mutable ArrayRef rawData; void trim() { if (bytesDropped) { rawData = rawData.drop_back(bytesDropped); bytesDropped = 0; } } ArrayRef data() const { if (uncompressedSize >= 0) uncompress(); return rawData; } // The next member in the section group if this section is in a group. This is // used by --gc-sections. InputSectionBase *nextInSectionGroup = nullptr; template RelsOrRelas relsOrRelas() const; // InputSections that are dependent on us (reverse dependency for GC) llvm::TinyPtrVector dependentSections; // Returns the size of this section (even if this is a common or BSS.) size_t getSize() const; InputSection *getLinkOrderDep() const; // Get the function symbol that encloses this offset from within the // section. Defined *getEnclosingFunction(uint64_t offset); // Returns a source location string. Used to construct an error message. std::string getLocation(uint64_t offset); std::string getSrcMsg(const Symbol &sym, uint64_t offset); std::string getObjMsg(uint64_t offset); // Each section knows how to relocate itself. These functions apply // relocations, assuming that Buf points to this section's copy in // the mmap'ed output buffer. template void relocate(uint8_t *buf, uint8_t *bufEnd); void relocateAlloc(uint8_t *buf, uint8_t *bufEnd); static uint64_t getRelocTargetVA(const InputFile *File, RelType Type, int64_t A, uint64_t P, const Symbol &Sym, RelExpr Expr); // The native ELF reloc data type is not very convenient to handle. // So we convert ELF reloc records to our own records in Relocations.cpp. // This vector contains such "cooked" relocations. SmallVector relocations; union { // These are modifiers to jump instructions that are necessary when basic // block sections are enabled. Basic block sections creates opportunities // to relax jump instructions at basic block boundaries after reordering the // basic blocks. JumpInstrMod *jumpInstrMod = nullptr; // Auxiliary information for RISC-V linker relaxation. RISC-V does not use // jumpInstrMod. RISCVRelaxAux *relaxAux; }; // A function compiled with -fsplit-stack calling a function // compiled without -fsplit-stack needs its prologue adjusted. Find // such functions and adjust their prologues. This is very similar // to relocation. See https://gcc.gnu.org/wiki/SplitStacks for more // information. template void adjustSplitStackFunctionPrologues(uint8_t *buf, uint8_t *end); template llvm::ArrayRef getDataAs() const { size_t s = rawData.size(); assert(s % sizeof(T) == 0); return llvm::makeArrayRef((const T *)rawData.data(), s / sizeof(T)); } protected: template void parseCompressedHeader(); void uncompress() const; // This field stores the uncompressed size of the compressed data in rawData, // or -1 if rawData is not compressed (either because the section wasn't // compressed in the first place, or because we ended up uncompressing it). // Since the feature is not used often, this is usually -1. mutable int64_t uncompressedSize = -1; }; // SectionPiece represents a piece of splittable section contents. // We allocate a lot of these and binary search on them. This means that they // have to be as compact as possible, which is why we don't store the size (can // be found by looking at the next one). struct SectionPiece { SectionPiece() = default; SectionPiece(size_t off, uint32_t hash, bool live) : inputOff(off), live(live), hash(hash >> 1) {} uint32_t inputOff; uint32_t live : 1; uint32_t hash : 31; uint64_t outputOff = 0; }; static_assert(sizeof(SectionPiece) == 16, "SectionPiece is too big"); // This corresponds to a SHF_MERGE section of an input file. class MergeInputSection : public InputSectionBase { public: template MergeInputSection(ObjFile &f, const typename ELFT::Shdr &header, StringRef name); MergeInputSection(uint64_t flags, uint32_t type, uint64_t entsize, ArrayRef data, StringRef name); static bool classof(const SectionBase *s) { return s->kind() == Merge; } void splitIntoPieces(); // Translate an offset in the input section to an offset in the parent // MergeSyntheticSection. uint64_t getParentOffset(uint64_t offset) const; // Splittable sections are handled as a sequence of data // rather than a single large blob of data. SmallVector pieces; // Returns I'th piece's data. This function is very hot when // string merging is enabled, so we want to inline. LLVM_ATTRIBUTE_ALWAYS_INLINE llvm::CachedHashStringRef getData(size_t i) const { size_t begin = pieces[i].inputOff; size_t end = (pieces.size() - 1 == i) ? rawData.size() : pieces[i + 1].inputOff; return {toStringRef(rawData.slice(begin, end - begin)), pieces[i].hash}; } // Returns the SectionPiece at a given input section offset. SectionPiece &getSectionPiece(uint64_t offset); const SectionPiece &getSectionPiece(uint64_t offset) const { return const_cast(this)->getSectionPiece(offset); } SyntheticSection *getParent() const; private: void splitStrings(StringRef s, size_t size); void splitNonStrings(ArrayRef a, size_t size); }; struct EhSectionPiece { EhSectionPiece(size_t off, InputSectionBase *sec, uint32_t size, unsigned firstRelocation) : inputOff(off), sec(sec), size(size), firstRelocation(firstRelocation) {} ArrayRef data() const { return {sec->rawData.data() + this->inputOff, size}; } size_t inputOff; ssize_t outputOff = -1; InputSectionBase *sec; uint32_t size; unsigned firstRelocation; }; // This corresponds to a .eh_frame section of an input file. class EhInputSection : public InputSectionBase { public: template EhInputSection(ObjFile &f, const typename ELFT::Shdr &header, StringRef name); static bool classof(const SectionBase *s) { return s->kind() == EHFrame; } template void split(); template void split(ArrayRef rels); // Splittable sections are handled as a sequence of data // rather than a single large blob of data. SmallVector pieces; SyntheticSection *getParent() const; uint64_t getParentOffset(uint64_t offset) const; }; // This is a section that is added directly to an output section // instead of needing special combination via a synthetic section. This // includes all input sections with the exceptions of SHF_MERGE and // .eh_frame. It also includes the synthetic sections themselves. class InputSection : public InputSectionBase { public: InputSection(InputFile *f, uint64_t flags, uint32_t type, uint32_t alignment, ArrayRef data, StringRef name, Kind k = Regular); template InputSection(ObjFile &f, const typename ELFT::Shdr &header, StringRef name); static bool classof(const SectionBase *s) { return s->kind() == SectionBase::Regular || s->kind() == SectionBase::Synthetic; } // Write this section to a mmap'ed file, assuming Buf is pointing to // beginning of the output section. template void writeTo(uint8_t *buf); OutputSection *getParent() const { return reinterpret_cast(parent); } // This variable has two usages. Initially, it represents an index in the // OutputSection's InputSection list, and is used when ordering SHF_LINK_ORDER // sections. After assignAddresses is called, it represents the offset from // the beginning of the output section this section was assigned to. uint64_t outSecOff = 0; InputSectionBase *getRelocatedSection() const; template void relocateNonAlloc(uint8_t *buf, llvm::ArrayRef rels); // Points to the canonical section. If ICF folds two sections, repl pointer of // one section points to the other. InputSection *repl = this; // Used by ICF. uint32_t eqClass[2] = {0, 0}; // Called by ICF to merge two input sections. void replace(InputSection *other); static InputSection discarded; private: template void copyRelocations(uint8_t *buf, llvm::ArrayRef rels); template void copyShtGroup(uint8_t *buf); }; static_assert(sizeof(InputSection) <= 160, "InputSection is too big"); inline bool isDebugSection(const InputSectionBase &sec) { return (sec.flags & llvm::ELF::SHF_ALLOC) == 0 && sec.name.startswith(".debug"); } // The list of all input sections. extern SmallVector inputSections; // The set of TOC entries (.toc + addend) for which we should not apply // toc-indirect to toc-relative relaxation. const Symbol * refers to the // STT_SECTION symbol associated to the .toc input section. extern llvm::DenseSet> ppc64noTocRelax; } // namespace elf std::string toString(const elf::InputSectionBase *); } // namespace lld #endif