10b57cec5SDimitry Andric //===- SymbolTable.h --------------------------------------------*- C++ -*-===// 20b57cec5SDimitry Andric // 30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 60b57cec5SDimitry Andric // 70b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 80b57cec5SDimitry Andric 90b57cec5SDimitry Andric #ifndef LLD_ELF_SYMBOL_TABLE_H 100b57cec5SDimitry Andric #define LLD_ELF_SYMBOL_TABLE_H 110b57cec5SDimitry Andric 120b57cec5SDimitry Andric #include "Symbols.h" 130b57cec5SDimitry Andric #include "llvm/ADT/CachedHashString.h" 140b57cec5SDimitry Andric #include "llvm/ADT/DenseMap.h" 15bdd1243dSDimitry Andric #include "llvm/Support/Compiler.h" 160b57cec5SDimitry Andric 17bdd1243dSDimitry Andric namespace lld::elf { 180b57cec5SDimitry Andric 1981ad6265SDimitry Andric class InputFile; 2081ad6265SDimitry Andric class SharedFile; 2181ad6265SDimitry Andric 2206c3fb27SDimitry Andric struct ArmCmseEntryFunction { 2306c3fb27SDimitry Andric Symbol *acleSeSym; 2406c3fb27SDimitry Andric Symbol *sym; 2506c3fb27SDimitry Andric }; 2606c3fb27SDimitry Andric 270b57cec5SDimitry Andric // SymbolTable is a bucket of all known symbols, including defined, 280b57cec5SDimitry Andric // undefined, or lazy symbols (the last one is symbols in archive 290b57cec5SDimitry Andric // files whose archive members are not yet loaded). 300b57cec5SDimitry Andric // 310b57cec5SDimitry Andric // We put all symbols of all files to a SymbolTable, and the 320b57cec5SDimitry Andric // SymbolTable selects the "best" symbols if there are name 330b57cec5SDimitry Andric // conflicts. For example, obviously, a defined symbol is better than 340b57cec5SDimitry Andric // an undefined symbol. Or, if there's a conflict between a lazy and a 350b57cec5SDimitry Andric // undefined, it'll read an archive member to read a real definition 360b57cec5SDimitry Andric // to replace the lazy symbol. The logic is implemented in the 370b57cec5SDimitry Andric // add*() functions, which are called by input files as they are parsed. There 380b57cec5SDimitry Andric // is one add* function per symbol type. 390b57cec5SDimitry Andric class SymbolTable { 40480093f4SDimitry Andric public: getSymbols()41bdd1243dSDimitry Andric ArrayRef<Symbol *> getSymbols() const { return symVector; } 420b57cec5SDimitry Andric 43480093f4SDimitry Andric void wrap(Symbol *sym, Symbol *real, Symbol *wrap); 44480093f4SDimitry Andric 450b57cec5SDimitry Andric Symbol *insert(StringRef name); 460b57cec5SDimitry Andric addSymbol(const T & newSym)47bdd1243dSDimitry Andric template <typename T> Symbol *addSymbol(const T &newSym) { 48bdd1243dSDimitry Andric Symbol *sym = insert(newSym.getName()); 49bdd1243dSDimitry Andric sym->resolve(newSym); 50bdd1243dSDimitry Andric return sym; 51bdd1243dSDimitry Andric } 5281ad6265SDimitry Andric Symbol *addAndCheckDuplicate(const Defined &newSym); 530b57cec5SDimitry Andric 540b57cec5SDimitry Andric void scanVersionScript(); 550b57cec5SDimitry Andric 560b57cec5SDimitry Andric Symbol *find(StringRef name); 570b57cec5SDimitry Andric 580b57cec5SDimitry Andric void handleDynamicList(); 590b57cec5SDimitry Andric 60*0fca6ea1SDimitry Andric Symbol *addUnusedUndefined(StringRef name, 61*0fca6ea1SDimitry Andric uint8_t binding = llvm::ELF::STB_GLOBAL); 62*0fca6ea1SDimitry Andric 630b57cec5SDimitry Andric // Set of .so files to not link the same shared object file more than once. 6404eeddc0SDimitry Andric llvm::DenseMap<llvm::CachedHashStringRef, SharedFile *> soNames; 650b57cec5SDimitry Andric 660b57cec5SDimitry Andric // Comdat groups define "link once" sections. If two comdat groups have the 670b57cec5SDimitry Andric // same name, only one of them is linked, and the other is ignored. This map 680b57cec5SDimitry Andric // is used to uniquify them. 690b57cec5SDimitry Andric llvm::DenseMap<llvm::CachedHashStringRef, const InputFile *> comdatGroups; 700b57cec5SDimitry Andric 7106c3fb27SDimitry Andric // The Map of __acle_se_<sym>, <sym> pairs found in the input objects. 7206c3fb27SDimitry Andric // Key is the <sym> name. 7306c3fb27SDimitry Andric llvm::SmallMapVector<StringRef, ArmCmseEntryFunction, 1> cmseSymMap; 7406c3fb27SDimitry Andric 7506c3fb27SDimitry Andric // Map of symbols defined in the Arm CMSE import library. The linker must 7606c3fb27SDimitry Andric // preserve the addresses in the output objects. 7706c3fb27SDimitry Andric llvm::StringMap<Defined *> cmseImportLib; 7806c3fb27SDimitry Andric 7906c3fb27SDimitry Andric // True if <sym> from the input Arm CMSE import library is written to the 8006c3fb27SDimitry Andric // output Arm CMSE import library. 8106c3fb27SDimitry Andric llvm::StringMap<bool> inCMSEOutImpLib; 8206c3fb27SDimitry Andric 830b57cec5SDimitry Andric private: 840eae32dcSDimitry Andric SmallVector<Symbol *, 0> findByVersion(SymbolVersion ver); 850eae32dcSDimitry Andric SmallVector<Symbol *, 0> findAllByVersion(SymbolVersion ver, 866e75b2fbSDimitry Andric bool includeNonDefault); 870b57cec5SDimitry Andric 880eae32dcSDimitry Andric llvm::StringMap<SmallVector<Symbol *, 0>> &getDemangledSyms(); 896e75b2fbSDimitry Andric bool assignExactVersion(SymbolVersion ver, uint16_t versionId, 906e75b2fbSDimitry Andric StringRef versionName, bool includeNonDefault); 916e75b2fbSDimitry Andric void assignWildcardVersion(SymbolVersion ver, uint16_t versionId, 926e75b2fbSDimitry Andric bool includeNonDefault); 930b57cec5SDimitry Andric 9406c3fb27SDimitry Andric // Global symbols and a map from symbol name to the index. The order is not 9506c3fb27SDimitry Andric // defined. We can use an arbitrary order, but it has to be deterministic even 9606c3fb27SDimitry Andric // when cross linking. 970b57cec5SDimitry Andric llvm::DenseMap<llvm::CachedHashStringRef, int> symMap; 980eae32dcSDimitry Andric SmallVector<Symbol *, 0> symVector; 990b57cec5SDimitry Andric 1000b57cec5SDimitry Andric // A map from demangled symbol names to their symbol objects. 1010b57cec5SDimitry Andric // This mapping is 1:N because two symbols with different versions 1020b57cec5SDimitry Andric // can have the same name. We use this map to handle "extern C++ {}" 1030b57cec5SDimitry Andric // directive in version scripts. 104bdd1243dSDimitry Andric std::optional<llvm::StringMap<SmallVector<Symbol *, 0>>> demangledSyms; 1050b57cec5SDimitry Andric }; 1060b57cec5SDimitry Andric 107bdd1243dSDimitry Andric LLVM_LIBRARY_VISIBILITY extern SymbolTable symtab; 1080b57cec5SDimitry Andric 109bdd1243dSDimitry Andric } // namespace lld::elf 1100b57cec5SDimitry Andric 1110b57cec5SDimitry Andric #endif 112