xref: /freebsd/contrib/llvm-project/lld/ELF/SymbolTable.h (revision 0fca6ea1d4eea4c934cfff25ac9ee8ad6fe95583)
//===- SymbolTable.h --------------------------------------------*- C++ -*-===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
80b57cec5SDimitry Andric 
90b57cec5SDimitry Andric #ifndef LLD_ELF_SYMBOL_TABLE_H
100b57cec5SDimitry Andric #define LLD_ELF_SYMBOL_TABLE_H
110b57cec5SDimitry Andric 
120b57cec5SDimitry Andric #include "Symbols.h"
130b57cec5SDimitry Andric #include "llvm/ADT/CachedHashString.h"
140b57cec5SDimitry Andric #include "llvm/ADT/DenseMap.h"
15bdd1243dSDimitry Andric #include "llvm/Support/Compiler.h"
160b57cec5SDimitry Andric 
17bdd1243dSDimitry Andric namespace lld::elf {
180b57cec5SDimitry Andric 
1981ad6265SDimitry Andric class InputFile;
2081ad6265SDimitry Andric class SharedFile;
2181ad6265SDimitry Andric 
2206c3fb27SDimitry Andric struct ArmCmseEntryFunction {
2306c3fb27SDimitry Andric   Symbol *acleSeSym;
2406c3fb27SDimitry Andric   Symbol *sym;
2506c3fb27SDimitry Andric };
2606c3fb27SDimitry Andric 
270b57cec5SDimitry Andric // SymbolTable is a bucket of all known symbols, including defined,
280b57cec5SDimitry Andric // undefined, or lazy symbols (the last one is symbols in archive
290b57cec5SDimitry Andric // files whose archive members are not yet loaded).
300b57cec5SDimitry Andric //
310b57cec5SDimitry Andric // We put all symbols of all files to a SymbolTable, and the
320b57cec5SDimitry Andric // SymbolTable selects the "best" symbols if there are name
330b57cec5SDimitry Andric // conflicts. For example, obviously, a defined symbol is better than
340b57cec5SDimitry Andric // an undefined symbol. Or, if there's a conflict between a lazy and a
350b57cec5SDimitry Andric // undefined, it'll read an archive member to read a real definition
360b57cec5SDimitry Andric // to replace the lazy symbol. The logic is implemented in the
370b57cec5SDimitry Andric // add*() functions, which are called by input files as they are parsed. There
380b57cec5SDimitry Andric // is one add* function per symbol type.
390b57cec5SDimitry Andric class SymbolTable {
40480093f4SDimitry Andric public:
getSymbols()41bdd1243dSDimitry Andric   ArrayRef<Symbol *> getSymbols() const { return symVector; }
420b57cec5SDimitry Andric 
43480093f4SDimitry Andric   void wrap(Symbol *sym, Symbol *real, Symbol *wrap);
44480093f4SDimitry Andric 
450b57cec5SDimitry Andric   Symbol *insert(StringRef name);
460b57cec5SDimitry Andric 
addSymbol(const T & newSym)47bdd1243dSDimitry Andric   template <typename T> Symbol *addSymbol(const T &newSym) {
48bdd1243dSDimitry Andric     Symbol *sym = insert(newSym.getName());
49bdd1243dSDimitry Andric     sym->resolve(newSym);
50bdd1243dSDimitry Andric     return sym;
51bdd1243dSDimitry Andric   }
5281ad6265SDimitry Andric   Symbol *addAndCheckDuplicate(const Defined &newSym);
530b57cec5SDimitry Andric 
540b57cec5SDimitry Andric   void scanVersionScript();
550b57cec5SDimitry Andric 
560b57cec5SDimitry Andric   Symbol *find(StringRef name);
570b57cec5SDimitry Andric 
580b57cec5SDimitry Andric   void handleDynamicList();
590b57cec5SDimitry Andric 
60*0fca6ea1SDimitry Andric   Symbol *addUnusedUndefined(StringRef name,
61*0fca6ea1SDimitry Andric                              uint8_t binding = llvm::ELF::STB_GLOBAL);
62*0fca6ea1SDimitry Andric 
630b57cec5SDimitry Andric   // Set of .so files to not link the same shared object file more than once.
6404eeddc0SDimitry Andric   llvm::DenseMap<llvm::CachedHashStringRef, SharedFile *> soNames;
650b57cec5SDimitry Andric 
660b57cec5SDimitry Andric   // Comdat groups define "link once" sections. If two comdat groups have the
670b57cec5SDimitry Andric   // same name, only one of them is linked, and the other is ignored. This map
680b57cec5SDimitry Andric   // is used to uniquify them.
690b57cec5SDimitry Andric   llvm::DenseMap<llvm::CachedHashStringRef, const InputFile *> comdatGroups;
700b57cec5SDimitry Andric 
7106c3fb27SDimitry Andric   // The Map of __acle_se_<sym>, <sym> pairs found in the input objects.
7206c3fb27SDimitry Andric   // Key is the <sym> name.
7306c3fb27SDimitry Andric   llvm::SmallMapVector<StringRef, ArmCmseEntryFunction, 1> cmseSymMap;
7406c3fb27SDimitry Andric 
7506c3fb27SDimitry Andric   // Map of symbols defined in the Arm CMSE import library. The linker must
7606c3fb27SDimitry Andric   // preserve the addresses in the output objects.
7706c3fb27SDimitry Andric   llvm::StringMap<Defined *> cmseImportLib;
7806c3fb27SDimitry Andric 
7906c3fb27SDimitry Andric   // True if <sym> from the input Arm CMSE import library is written to the
8006c3fb27SDimitry Andric   // output Arm CMSE import library.
8106c3fb27SDimitry Andric   llvm::StringMap<bool> inCMSEOutImpLib;
8206c3fb27SDimitry Andric 
830b57cec5SDimitry Andric private:
840eae32dcSDimitry Andric   SmallVector<Symbol *, 0> findByVersion(SymbolVersion ver);
850eae32dcSDimitry Andric   SmallVector<Symbol *, 0> findAllByVersion(SymbolVersion ver,
866e75b2fbSDimitry Andric                                             bool includeNonDefault);
870b57cec5SDimitry Andric 
880eae32dcSDimitry Andric   llvm::StringMap<SmallVector<Symbol *, 0>> &getDemangledSyms();
896e75b2fbSDimitry Andric   bool assignExactVersion(SymbolVersion ver, uint16_t versionId,
906e75b2fbSDimitry Andric                           StringRef versionName, bool includeNonDefault);
916e75b2fbSDimitry Andric   void assignWildcardVersion(SymbolVersion ver, uint16_t versionId,
926e75b2fbSDimitry Andric                              bool includeNonDefault);
930b57cec5SDimitry Andric 
9406c3fb27SDimitry Andric   // Global symbols and a map from symbol name to the index. The order is not
9506c3fb27SDimitry Andric   // defined. We can use an arbitrary order, but it has to be deterministic even
9606c3fb27SDimitry Andric   // when cross linking.
970b57cec5SDimitry Andric   llvm::DenseMap<llvm::CachedHashStringRef, int> symMap;
980eae32dcSDimitry Andric   SmallVector<Symbol *, 0> symVector;
990b57cec5SDimitry Andric 
1000b57cec5SDimitry Andric   // A map from demangled symbol names to their symbol objects.
1010b57cec5SDimitry Andric   // This mapping is 1:N because two symbols with different versions
1020b57cec5SDimitry Andric   // can have the same name. We use this map to handle "extern C++ {}"
1030b57cec5SDimitry Andric   // directive in version scripts.
104bdd1243dSDimitry Andric   std::optional<llvm::StringMap<SmallVector<Symbol *, 0>>> demangledSyms;
1050b57cec5SDimitry Andric };
1060b57cec5SDimitry Andric 
107bdd1243dSDimitry Andric LLVM_LIBRARY_VISIBILITY extern SymbolTable symtab;
1080b57cec5SDimitry Andric 
109bdd1243dSDimitry Andric } // namespace lld::elf
1100b57cec5SDimitry Andric 
1110b57cec5SDimitry Andric #endif
112