xref: /freebsd/contrib/llvm-project/lld/ELF/SymbolTable.h (revision 06c3fb2749bda94cb5201f81ffdb8fa6c3161b2e)
10b57cec5SDimitry Andric //===- SymbolTable.h --------------------------------------------*- C++ -*-===//
20b57cec5SDimitry Andric //
30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
60b57cec5SDimitry Andric //
70b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
80b57cec5SDimitry Andric 
90b57cec5SDimitry Andric #ifndef LLD_ELF_SYMBOL_TABLE_H
100b57cec5SDimitry Andric #define LLD_ELF_SYMBOL_TABLE_H
110b57cec5SDimitry Andric 
120b57cec5SDimitry Andric #include "Symbols.h"
130b57cec5SDimitry Andric #include "llvm/ADT/CachedHashString.h"
140b57cec5SDimitry Andric #include "llvm/ADT/DenseMap.h"
15bdd1243dSDimitry Andric #include "llvm/Support/Compiler.h"
160b57cec5SDimitry Andric 
17bdd1243dSDimitry Andric namespace lld::elf {
180b57cec5SDimitry Andric 
1981ad6265SDimitry Andric class InputFile;
2081ad6265SDimitry Andric class SharedFile;
2181ad6265SDimitry Andric 
22*06c3fb27SDimitry Andric struct ArmCmseEntryFunction {
23*06c3fb27SDimitry Andric   Symbol *acleSeSym;
24*06c3fb27SDimitry Andric   Symbol *sym;
25*06c3fb27SDimitry Andric };
26*06c3fb27SDimitry Andric 
270b57cec5SDimitry Andric // SymbolTable is a bucket of all known symbols, including defined,
280b57cec5SDimitry Andric // undefined, or lazy symbols (the last one is symbols in archive
290b57cec5SDimitry Andric // files whose archive members are not yet loaded).
300b57cec5SDimitry Andric //
310b57cec5SDimitry Andric // We put all symbols of all files to a SymbolTable, and the
320b57cec5SDimitry Andric // SymbolTable selects the "best" symbols if there are name
330b57cec5SDimitry Andric // conflicts. For example, obviously, a defined symbol is better than
340b57cec5SDimitry Andric // an undefined symbol. Or, if there's a conflict between a lazy and an
350b57cec5SDimitry Andric // undefined symbol, it'll read an archive member to read a real definition
360b57cec5SDimitry Andric // to replace the lazy symbol. The logic is implemented in the
370b57cec5SDimitry Andric // add*() functions, which are called by input files as they are parsed. There
380b57cec5SDimitry Andric // is one add* function per symbol type.
390b57cec5SDimitry Andric class SymbolTable {
40480093f4SDimitry Andric public:
  // Returns a view (ArrayRef) over symVector, i.e. every symbol currently held
  // by this table.
41bdd1243dSDimitry Andric   ArrayRef<Symbol *> getSymbols() const { return symVector; }
420b57cec5SDimitry Andric 
  // Defined out of line.
  // NOTE(review): presumably implements symbol wrapping (e.g. --wrap) across
  // the three related symbols -- confirm against the definition.
43480093f4SDimitry Andric   void wrap(Symbol *sym, Symbol *real, Symbol *wrap);
44480093f4SDimitry Andric 
  // Defined out of line.
  // NOTE(review): presumably returns the table entry for `name`, creating it
  // if it does not exist yet -- confirm against the definition.
450b57cec5SDimitry Andric   Symbol *insert(StringRef name);
460b57cec5SDimitry Andric 
  // Obtains the table entry for newSym's name via insert(), asks that entry to
  // resolve itself against newSym, and returns the entry. T only needs to
  // provide getName() and be accepted by Symbol::resolve().
47bdd1243dSDimitry Andric   template <typename T> Symbol *addSymbol(const T &newSym) {
48bdd1243dSDimitry Andric     Symbol *sym = insert(newSym.getName());
49bdd1243dSDimitry Andric     sym->resolve(newSym);
50bdd1243dSDimitry Andric     return sym;
51bdd1243dSDimitry Andric   }
  // Defined out of line.
  // NOTE(review): judging by the name, adds a Defined symbol like addSymbol()
  // but also checks for duplicate definitions -- confirm.
5281ad6265SDimitry Andric   Symbol *addAndCheckDuplicate(const Defined &newSym);
530b57cec5SDimitry Andric 
  // Defined out of line.
  // NOTE(review): presumably applies version-script patterns to the symbols
  // using the private find*ByVersion/assign*Version helpers below -- confirm.
540b57cec5SDimitry Andric   void scanVersionScript();
550b57cec5SDimitry Andric 
  // Looks up a symbol by name. Defined out of line.
  // NOTE(review): presumably returns nullptr when `name` is absent -- confirm.
560b57cec5SDimitry Andric   Symbol *find(StringRef name);
570b57cec5SDimitry Andric 
  // Defined out of line.
  // NOTE(review): presumably processes the --dynamic-list patterns -- confirm.
580b57cec5SDimitry Andric   void handleDynamicList();
590b57cec5SDimitry Andric 
600b57cec5SDimitry Andric   // Set of .so files to not link the same shared object file more than once.
6104eeddc0SDimitry Andric   llvm::DenseMap<llvm::CachedHashStringRef, SharedFile *> soNames;
620b57cec5SDimitry Andric 
630b57cec5SDimitry Andric   // Comdat groups define "link once" sections. If two comdat groups have the
640b57cec5SDimitry Andric   // same name, only one of them is linked, and the other is ignored. This map
650b57cec5SDimitry Andric   // is used to uniquify them.
660b57cec5SDimitry Andric   llvm::DenseMap<llvm::CachedHashStringRef, const InputFile *> comdatGroups;
670b57cec5SDimitry Andric 
68*06c3fb27SDimitry Andric   // The Map of __acle_se_<sym>, <sym> pairs found in the input objects.
69*06c3fb27SDimitry Andric   // Key is the <sym> name.
70*06c3fb27SDimitry Andric   llvm::SmallMapVector<StringRef, ArmCmseEntryFunction, 1> cmseSymMap;
71*06c3fb27SDimitry Andric 
72*06c3fb27SDimitry Andric   // Map of symbols defined in the Arm CMSE import library. The linker must
73*06c3fb27SDimitry Andric   // preserve the addresses in the output objects.
74*06c3fb27SDimitry Andric   llvm::StringMap<Defined *> cmseImportLib;
75*06c3fb27SDimitry Andric 
76*06c3fb27SDimitry Andric   // True if <sym> from the input Arm CMSE import library is written to the
77*06c3fb27SDimitry Andric   // output Arm CMSE import library.
78*06c3fb27SDimitry Andric   llvm::StringMap<bool> inCMSEOutImpLib;
79*06c3fb27SDimitry Andric 
800b57cec5SDimitry Andric private:
  // Helpers that collect the symbols matching a version-script pattern.
  // Defined out of line.
  // NOTE(review): includeNonDefault presumably controls whether symbols with a
  // non-default version are also returned -- confirm.
810eae32dcSDimitry Andric   SmallVector<Symbol *, 0> findByVersion(SymbolVersion ver);
820eae32dcSDimitry Andric   SmallVector<Symbol *, 0> findAllByVersion(SymbolVersion ver,
836e75b2fbSDimitry Andric                                             bool includeNonDefault);
840b57cec5SDimitry Andric 
  // Returns a reference to the demangled-name map stored in demangledSyms.
  // NOTE(review): since the storage is a std::optional, the map is presumably
  // built lazily on first call -- confirm against the definition.
850eae32dcSDimitry Andric   llvm::StringMap<SmallVector<Symbol *, 0>> &getDemangledSyms();
  // Helpers that assign a version id to the symbols matching `ver`.
  // Defined out of line.
  // NOTE(review): the bool result of assignExactVersion presumably reports
  // whether any symbol matched -- confirm.
866e75b2fbSDimitry Andric   bool assignExactVersion(SymbolVersion ver, uint16_t versionId,
876e75b2fbSDimitry Andric                           StringRef versionName, bool includeNonDefault);
886e75b2fbSDimitry Andric   void assignWildcardVersion(SymbolVersion ver, uint16_t versionId,
896e75b2fbSDimitry Andric                              bool includeNonDefault);
900b57cec5SDimitry Andric 
91*06c3fb27SDimitry Andric   // Global symbols and a map from symbol name to the index. The order is not
92*06c3fb27SDimitry Andric   // defined. We can use an arbitrary order, but it has to be deterministic even
93*06c3fb27SDimitry Andric   // when cross linking.
940b57cec5SDimitry Andric   llvm::DenseMap<llvm::CachedHashStringRef, int> symMap;
950eae32dcSDimitry Andric   SmallVector<Symbol *, 0> symVector;
960b57cec5SDimitry Andric 
970b57cec5SDimitry Andric   // A map from demangled symbol names to their symbol objects.
980b57cec5SDimitry Andric   // This mapping is 1:N because two symbols with different versions
990b57cec5SDimitry Andric   // can have the same name. We use this map to handle "extern C++ {}"
1000b57cec5SDimitry Andric   // directive in version scripts.
101bdd1243dSDimitry Andric   std::optional<llvm::StringMap<SmallVector<Symbol *, 0>>> demangledSyms;
1020b57cec5SDimitry Andric };
1030b57cec5SDimitry Andric 
// The global SymbolTable instance. This is only a declaration (extern); the
// object itself is defined in another translation unit.
// NOTE(review): LLVM_LIBRARY_VISIBILITY presumably keeps the symbol out of the
// library's exported interface -- confirm in llvm/Support/Compiler.h.
104bdd1243dSDimitry Andric LLVM_LIBRARY_VISIBILITY extern SymbolTable symtab;
1050b57cec5SDimitry Andric 
106bdd1243dSDimitry Andric } // namespace lld::elf
1070b57cec5SDimitry Andric 
1080b57cec5SDimitry Andric #endif
109