xref: /freebsd/contrib/llvm-project/lld/COFF/SymbolTable.cpp (revision fe6060f10f634930ff71b7c50291ddc610da2475)
10b57cec5SDimitry Andric //===- SymbolTable.cpp ----------------------------------------------------===//
20b57cec5SDimitry Andric //
30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
60b57cec5SDimitry Andric //
70b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
80b57cec5SDimitry Andric 
90b57cec5SDimitry Andric #include "SymbolTable.h"
100b57cec5SDimitry Andric #include "Config.h"
110b57cec5SDimitry Andric #include "Driver.h"
120b57cec5SDimitry Andric #include "LTO.h"
130b57cec5SDimitry Andric #include "PDB.h"
140b57cec5SDimitry Andric #include "Symbols.h"
150b57cec5SDimitry Andric #include "lld/Common/ErrorHandler.h"
160b57cec5SDimitry Andric #include "lld/Common/Memory.h"
170b57cec5SDimitry Andric #include "lld/Common/Timer.h"
1885868e8aSDimitry Andric #include "llvm/DebugInfo/Symbolize/Symbolize.h"
190b57cec5SDimitry Andric #include "llvm/IR/LLVMContext.h"
20480093f4SDimitry Andric #include "llvm/LTO/LTO.h"
210b57cec5SDimitry Andric #include "llvm/Object/WindowsMachineFlag.h"
220b57cec5SDimitry Andric #include "llvm/Support/Debug.h"
230b57cec5SDimitry Andric #include "llvm/Support/raw_ostream.h"
240b57cec5SDimitry Andric #include <utility>
250b57cec5SDimitry Andric 
260b57cec5SDimitry Andric using namespace llvm;
270b57cec5SDimitry Andric 
280b57cec5SDimitry Andric namespace lld {
290b57cec5SDimitry Andric namespace coff {
300b57cec5SDimitry Andric 
31*fe6060f1SDimitry Andric StringRef ltrim1(StringRef s, const char *chars) {
32*fe6060f1SDimitry Andric   if (!s.empty() && strchr(chars, s[0]))
33*fe6060f1SDimitry Andric     return s.substr(1);
34*fe6060f1SDimitry Andric   return s;
35*fe6060f1SDimitry Andric }
36*fe6060f1SDimitry Andric 
// File-local timer labelled "LTO", constructed with Timer::root() as its
// second argument.
static Timer ltoTimer("LTO", Timer::root());

// Global pointer to the symbol table. Nothing in the code shown here assigns
// it, so it must be set elsewhere before use.
SymbolTable *symtab;
400b57cec5SDimitry Andric 
410b57cec5SDimitry Andric void SymbolTable::addFile(InputFile *file) {
420b57cec5SDimitry Andric   log("Reading " + toString(file));
430b57cec5SDimitry Andric   file->parse();
440b57cec5SDimitry Andric 
450b57cec5SDimitry Andric   MachineTypes mt = file->getMachineType();
460b57cec5SDimitry Andric   if (config->machine == IMAGE_FILE_MACHINE_UNKNOWN) {
470b57cec5SDimitry Andric     config->machine = mt;
480b57cec5SDimitry Andric   } else if (mt != IMAGE_FILE_MACHINE_UNKNOWN && config->machine != mt) {
490b57cec5SDimitry Andric     error(toString(file) + ": machine type " + machineToStr(mt) +
500b57cec5SDimitry Andric           " conflicts with " + machineToStr(config->machine));
510b57cec5SDimitry Andric     return;
520b57cec5SDimitry Andric   }
530b57cec5SDimitry Andric 
540b57cec5SDimitry Andric   if (auto *f = dyn_cast<ObjFile>(file)) {
550b57cec5SDimitry Andric     ObjFile::instances.push_back(f);
560b57cec5SDimitry Andric   } else if (auto *f = dyn_cast<BitcodeFile>(file)) {
570b57cec5SDimitry Andric     BitcodeFile::instances.push_back(f);
580b57cec5SDimitry Andric   } else if (auto *f = dyn_cast<ImportFile>(file)) {
590b57cec5SDimitry Andric     ImportFile::instances.push_back(f);
600b57cec5SDimitry Andric   }
610b57cec5SDimitry Andric 
620b57cec5SDimitry Andric   driver->parseDirectives(file);
630b57cec5SDimitry Andric }
640b57cec5SDimitry Andric 
650b57cec5SDimitry Andric static void errorOrWarn(const Twine &s) {
660b57cec5SDimitry Andric   if (config->forceUnresolved)
670b57cec5SDimitry Andric     warn(s);
680b57cec5SDimitry Andric   else
690b57cec5SDimitry Andric     error(s);
700b57cec5SDimitry Andric }
710b57cec5SDimitry Andric 
7285868e8aSDimitry Andric // Causes the file associated with a lazy symbol to be linked in.
7385868e8aSDimitry Andric static void forceLazy(Symbol *s) {
7485868e8aSDimitry Andric   s->pendingArchiveLoad = true;
7585868e8aSDimitry Andric   switch (s->kind()) {
7685868e8aSDimitry Andric   case Symbol::Kind::LazyArchiveKind: {
7785868e8aSDimitry Andric     auto *l = cast<LazyArchive>(s);
7885868e8aSDimitry Andric     l->file->addMember(l->sym);
7985868e8aSDimitry Andric     break;
8085868e8aSDimitry Andric   }
8185868e8aSDimitry Andric   case Symbol::Kind::LazyObjectKind:
8285868e8aSDimitry Andric     cast<LazyObject>(s)->file->fetch();
8385868e8aSDimitry Andric     break;
84*fe6060f1SDimitry Andric   case Symbol::Kind::LazyDLLSymbolKind: {
85*fe6060f1SDimitry Andric     auto *l = cast<LazyDLLSymbol>(s);
86*fe6060f1SDimitry Andric     l->file->makeImport(l->sym);
87*fe6060f1SDimitry Andric     break;
88*fe6060f1SDimitry Andric   }
8985868e8aSDimitry Andric   default:
9085868e8aSDimitry Andric     llvm_unreachable(
9185868e8aSDimitry Andric         "symbol passed to forceLazy is not a LazyArchive or LazyObject");
9285868e8aSDimitry Andric   }
9385868e8aSDimitry Andric }
9485868e8aSDimitry Andric 
950b57cec5SDimitry Andric // Returns the symbol in SC whose value is <= Addr that is closest to Addr.
960b57cec5SDimitry Andric // This is generally the global variable or function whose definition contains
970b57cec5SDimitry Andric // Addr.
980b57cec5SDimitry Andric static Symbol *getSymbol(SectionChunk *sc, uint32_t addr) {
990b57cec5SDimitry Andric   DefinedRegular *candidate = nullptr;
1000b57cec5SDimitry Andric 
1010b57cec5SDimitry Andric   for (Symbol *s : sc->file->getSymbols()) {
1020b57cec5SDimitry Andric     auto *d = dyn_cast_or_null<DefinedRegular>(s);
10385868e8aSDimitry Andric     if (!d || !d->data || d->file != sc->file || d->getChunk() != sc ||
10485868e8aSDimitry Andric         d->getValue() > addr ||
1050b57cec5SDimitry Andric         (candidate && d->getValue() < candidate->getValue()))
1060b57cec5SDimitry Andric       continue;
1070b57cec5SDimitry Andric 
1080b57cec5SDimitry Andric     candidate = d;
1090b57cec5SDimitry Andric   }
1100b57cec5SDimitry Andric 
1110b57cec5SDimitry Andric   return candidate;
1120b57cec5SDimitry Andric }
1130b57cec5SDimitry Andric 
11485868e8aSDimitry Andric static std::vector<std::string> getSymbolLocations(BitcodeFile *file) {
11585868e8aSDimitry Andric   std::string res("\n>>> referenced by ");
11685868e8aSDimitry Andric   StringRef source = file->obj->getSourceFileName();
11785868e8aSDimitry Andric   if (!source.empty())
11885868e8aSDimitry Andric     res += source.str() + "\n>>>               ";
11985868e8aSDimitry Andric   res += toString(file);
12085868e8aSDimitry Andric   return {res};
12185868e8aSDimitry Andric }
12285868e8aSDimitry Andric 
12385868e8aSDimitry Andric static Optional<std::pair<StringRef, uint32_t>>
12485868e8aSDimitry Andric getFileLineDwarf(const SectionChunk *c, uint32_t addr) {
12585868e8aSDimitry Andric   Optional<DILineInfo> optionalLineInfo =
12685868e8aSDimitry Andric       c->file->getDILineInfo(addr, c->getSectionNumber() - 1);
12785868e8aSDimitry Andric   if (!optionalLineInfo)
12885868e8aSDimitry Andric     return None;
12985868e8aSDimitry Andric   const DILineInfo &lineInfo = *optionalLineInfo;
13085868e8aSDimitry Andric   if (lineInfo.FileName == DILineInfo::BadString)
13185868e8aSDimitry Andric     return None;
13285868e8aSDimitry Andric   return std::make_pair(saver.save(lineInfo.FileName), lineInfo.Line);
13385868e8aSDimitry Andric }
13485868e8aSDimitry Andric 
13585868e8aSDimitry Andric static Optional<std::pair<StringRef, uint32_t>>
13685868e8aSDimitry Andric getFileLine(const SectionChunk *c, uint32_t addr) {
13785868e8aSDimitry Andric   // MinGW can optionally use codeview, even if the default is dwarf.
13885868e8aSDimitry Andric   Optional<std::pair<StringRef, uint32_t>> fileLine =
13985868e8aSDimitry Andric       getFileLineCodeView(c, addr);
14085868e8aSDimitry Andric   // If codeview didn't yield any result, check dwarf in MinGW mode.
14185868e8aSDimitry Andric   if (!fileLine && config->mingw)
14285868e8aSDimitry Andric     fileLine = getFileLineDwarf(c, addr);
14385868e8aSDimitry Andric   return fileLine;
14485868e8aSDimitry Andric }
14585868e8aSDimitry Andric 
1460b57cec5SDimitry Andric // Given a file and the index of a symbol in that file, returns a description
1470b57cec5SDimitry Andric // of all references to that symbol from that file. If no debug information is
1480b57cec5SDimitry Andric // available, returns just the name of the file, else one string per actual
1490b57cec5SDimitry Andric // reference as described in the debug info.
150590d96feSDimitry Andric // Returns up to maxStrings string descriptions, along with the total number of
151590d96feSDimitry Andric // locations found.
152590d96feSDimitry Andric static std::pair<std::vector<std::string>, size_t>
153590d96feSDimitry Andric getSymbolLocations(ObjFile *file, uint32_t symIndex, size_t maxStrings) {
1540b57cec5SDimitry Andric   struct Location {
1550b57cec5SDimitry Andric     Symbol *sym;
1560b57cec5SDimitry Andric     std::pair<StringRef, uint32_t> fileLine;
1570b57cec5SDimitry Andric   };
1580b57cec5SDimitry Andric   std::vector<Location> locations;
159590d96feSDimitry Andric   size_t numLocations = 0;
1600b57cec5SDimitry Andric 
1610b57cec5SDimitry Andric   for (Chunk *c : file->getChunks()) {
1620b57cec5SDimitry Andric     auto *sc = dyn_cast<SectionChunk>(c);
1630b57cec5SDimitry Andric     if (!sc)
1640b57cec5SDimitry Andric       continue;
1650b57cec5SDimitry Andric     for (const coff_relocation &r : sc->getRelocs()) {
1660b57cec5SDimitry Andric       if (r.SymbolTableIndex != symIndex)
1670b57cec5SDimitry Andric         continue;
168590d96feSDimitry Andric       numLocations++;
169590d96feSDimitry Andric       if (locations.size() >= maxStrings)
170590d96feSDimitry Andric         continue;
171590d96feSDimitry Andric 
17285868e8aSDimitry Andric       Optional<std::pair<StringRef, uint32_t>> fileLine =
1730b57cec5SDimitry Andric           getFileLine(sc, r.VirtualAddress);
1740b57cec5SDimitry Andric       Symbol *sym = getSymbol(sc, r.VirtualAddress);
17585868e8aSDimitry Andric       if (fileLine)
17685868e8aSDimitry Andric         locations.push_back({sym, *fileLine});
17785868e8aSDimitry Andric       else if (sym)
17885868e8aSDimitry Andric         locations.push_back({sym, {"", 0}});
1790b57cec5SDimitry Andric     }
1800b57cec5SDimitry Andric   }
1810b57cec5SDimitry Andric 
182590d96feSDimitry Andric   if (maxStrings == 0)
183590d96feSDimitry Andric     return std::make_pair(std::vector<std::string>(), numLocations);
184590d96feSDimitry Andric 
185590d96feSDimitry Andric   if (numLocations == 0)
186590d96feSDimitry Andric     return std::make_pair(
187590d96feSDimitry Andric         std::vector<std::string>{"\n>>> referenced by " + toString(file)}, 1);
1880b57cec5SDimitry Andric 
1890b57cec5SDimitry Andric   std::vector<std::string> symbolLocations(locations.size());
1900b57cec5SDimitry Andric   size_t i = 0;
1910b57cec5SDimitry Andric   for (Location loc : locations) {
1920b57cec5SDimitry Andric     llvm::raw_string_ostream os(symbolLocations[i++]);
1930b57cec5SDimitry Andric     os << "\n>>> referenced by ";
1940b57cec5SDimitry Andric     if (!loc.fileLine.first.empty())
1950b57cec5SDimitry Andric       os << loc.fileLine.first << ":" << loc.fileLine.second
1960b57cec5SDimitry Andric          << "\n>>>               ";
1970b57cec5SDimitry Andric     os << toString(file);
1980b57cec5SDimitry Andric     if (loc.sym)
1990b57cec5SDimitry Andric       os << ":(" << toString(*loc.sym) << ')';
2000b57cec5SDimitry Andric   }
201590d96feSDimitry Andric   return std::make_pair(symbolLocations, numLocations);
2020b57cec5SDimitry Andric }
2030b57cec5SDimitry Andric 
204590d96feSDimitry Andric std::vector<std::string> getSymbolLocations(ObjFile *file, uint32_t symIndex) {
205590d96feSDimitry Andric   return getSymbolLocations(file, symIndex, SIZE_MAX).first;
206590d96feSDimitry Andric }
207590d96feSDimitry Andric 
208590d96feSDimitry Andric static std::pair<std::vector<std::string>, size_t>
209590d96feSDimitry Andric getSymbolLocations(InputFile *file, uint32_t symIndex, size_t maxStrings) {
21085868e8aSDimitry Andric   if (auto *o = dyn_cast<ObjFile>(file))
211590d96feSDimitry Andric     return getSymbolLocations(o, symIndex, maxStrings);
212590d96feSDimitry Andric   if (auto *b = dyn_cast<BitcodeFile>(file)) {
213590d96feSDimitry Andric     std::vector<std::string> symbolLocations = getSymbolLocations(b);
214590d96feSDimitry Andric     size_t numLocations = symbolLocations.size();
215590d96feSDimitry Andric     if (symbolLocations.size() > maxStrings)
216590d96feSDimitry Andric       symbolLocations.resize(maxStrings);
217590d96feSDimitry Andric     return std::make_pair(symbolLocations, numLocations);
218590d96feSDimitry Andric   }
21985868e8aSDimitry Andric   llvm_unreachable("unsupported file type passed to getSymbolLocations");
220590d96feSDimitry Andric   return std::make_pair(std::vector<std::string>(), (size_t)0);
22185868e8aSDimitry Andric }
22285868e8aSDimitry Andric 
// For an undefined symbol, stores all files referencing it and the index of
// the undefined symbol in each file.
struct UndefinedDiag {
  // The undefined symbol this diagnostic is about.
  Symbol *sym;
  // One referencing file together with the symbol's position in it.
  struct File {
    // File whose symbol list contains sym.
    InputFile *file;
    // Zero-based position of sym within that file's symbol list.
    uint32_t symIndex;
  };
  // All referencing files, in the order they were recorded.
  std::vector<File> files;
};
2330b57cec5SDimitry Andric 
2340b57cec5SDimitry Andric static void reportUndefinedSymbol(const UndefinedDiag &undefDiag) {
2350b57cec5SDimitry Andric   std::string out;
2360b57cec5SDimitry Andric   llvm::raw_string_ostream os(out);
2370b57cec5SDimitry Andric   os << "undefined symbol: " << toString(*undefDiag.sym);
2380b57cec5SDimitry Andric 
2395ffd83dbSDimitry Andric   const size_t maxUndefReferences = 3;
240590d96feSDimitry Andric   size_t numDisplayedRefs = 0, numRefs = 0;
2410b57cec5SDimitry Andric   for (const UndefinedDiag::File &ref : undefDiag.files) {
242590d96feSDimitry Andric     std::vector<std::string> symbolLocations;
243590d96feSDimitry Andric     size_t totalLocations = 0;
244590d96feSDimitry Andric     std::tie(symbolLocations, totalLocations) = getSymbolLocations(
245590d96feSDimitry Andric         ref.file, ref.symIndex, maxUndefReferences - numDisplayedRefs);
246590d96feSDimitry Andric 
247590d96feSDimitry Andric     numRefs += totalLocations;
248590d96feSDimitry Andric     numDisplayedRefs += symbolLocations.size();
2490b57cec5SDimitry Andric     for (const std::string &s : symbolLocations) {
2500b57cec5SDimitry Andric       os << s;
2510b57cec5SDimitry Andric     }
2520b57cec5SDimitry Andric   }
253590d96feSDimitry Andric   if (numDisplayedRefs < numRefs)
254590d96feSDimitry Andric     os << "\n>>> referenced " << numRefs - numDisplayedRefs << " more times";
2550b57cec5SDimitry Andric   errorOrWarn(os.str());
2560b57cec5SDimitry Andric }
2570b57cec5SDimitry Andric 
258*fe6060f1SDimitry Andric void SymbolTable::loadMinGWSymbols() {
2590b57cec5SDimitry Andric   for (auto &i : symMap) {
2600b57cec5SDimitry Andric     Symbol *sym = i.second;
2610b57cec5SDimitry Andric     auto *undef = dyn_cast<Undefined>(sym);
2620b57cec5SDimitry Andric     if (!undef)
2630b57cec5SDimitry Andric       continue;
26485868e8aSDimitry Andric     if (undef->getWeakAlias())
26585868e8aSDimitry Andric       continue;
2660b57cec5SDimitry Andric 
2670b57cec5SDimitry Andric     StringRef name = undef->getName();
2680b57cec5SDimitry Andric 
269*fe6060f1SDimitry Andric     if (config->machine == I386 && config->stdcallFixup) {
270*fe6060f1SDimitry Andric       // Check if we can resolve an undefined decorated symbol by finding
271*fe6060f1SDimitry Andric       // the indended target as an undecorated symbol (only with a leading
272*fe6060f1SDimitry Andric       // underscore).
273*fe6060f1SDimitry Andric       StringRef origName = name;
274*fe6060f1SDimitry Andric       StringRef baseName = name;
275*fe6060f1SDimitry Andric       // Trim down stdcall/fastcall/vectorcall symbols to the base name.
276*fe6060f1SDimitry Andric       baseName = ltrim1(baseName, "_@");
277*fe6060f1SDimitry Andric       baseName = baseName.substr(0, baseName.find('@'));
278*fe6060f1SDimitry Andric       // Add a leading underscore, as it would be in cdecl form.
279*fe6060f1SDimitry Andric       std::string newName = ("_" + baseName).str();
280*fe6060f1SDimitry Andric       Symbol *l;
281*fe6060f1SDimitry Andric       if (newName != origName && (l = find(newName)) != nullptr) {
282*fe6060f1SDimitry Andric         // If we found a symbol and it is lazy; load it.
283*fe6060f1SDimitry Andric         if (l->isLazy() && !l->pendingArchiveLoad) {
284*fe6060f1SDimitry Andric           log("Loading lazy " + l->getName() + " from " +
285*fe6060f1SDimitry Andric               l->getFile()->getName() + " for stdcall fixup");
286*fe6060f1SDimitry Andric           forceLazy(l);
287*fe6060f1SDimitry Andric         }
288*fe6060f1SDimitry Andric         // If it's lazy or already defined, hook it up as weak alias.
289*fe6060f1SDimitry Andric         if (l->isLazy() || isa<Defined>(l)) {
290*fe6060f1SDimitry Andric           if (config->warnStdcallFixup)
291*fe6060f1SDimitry Andric             warn("Resolving " + origName + " by linking to " + newName);
292*fe6060f1SDimitry Andric           else
293*fe6060f1SDimitry Andric             log("Resolving " + origName + " by linking to " + newName);
294*fe6060f1SDimitry Andric           undef->weakAlias = l;
295*fe6060f1SDimitry Andric           continue;
296*fe6060f1SDimitry Andric         }
297*fe6060f1SDimitry Andric       }
298*fe6060f1SDimitry Andric     }
299*fe6060f1SDimitry Andric 
300*fe6060f1SDimitry Andric     if (config->autoImport) {
3010b57cec5SDimitry Andric       if (name.startswith("__imp_"))
3020b57cec5SDimitry Andric         continue;
30385868e8aSDimitry Andric       // If we have an undefined symbol, but we have a lazy symbol we could
30485868e8aSDimitry Andric       // load, load it.
30585868e8aSDimitry Andric       Symbol *l = find(("__imp_" + name).str());
30685868e8aSDimitry Andric       if (!l || l->pendingArchiveLoad || !l->isLazy())
3070b57cec5SDimitry Andric         continue;
3080b57cec5SDimitry Andric 
30985868e8aSDimitry Andric       log("Loading lazy " + l->getName() + " from " + l->getFile()->getName() +
3100b57cec5SDimitry Andric           " for automatic import");
31185868e8aSDimitry Andric       forceLazy(l);
3120b57cec5SDimitry Andric     }
3130b57cec5SDimitry Andric   }
314*fe6060f1SDimitry Andric }
3150b57cec5SDimitry Andric 
31685868e8aSDimitry Andric Defined *SymbolTable::impSymbol(StringRef name) {
31785868e8aSDimitry Andric   if (name.startswith("__imp_"))
31885868e8aSDimitry Andric     return nullptr;
31985868e8aSDimitry Andric   return dyn_cast_or_null<Defined>(find(("__imp_" + name).str()));
32085868e8aSDimitry Andric }
32185868e8aSDimitry Andric 
3220b57cec5SDimitry Andric bool SymbolTable::handleMinGWAutomaticImport(Symbol *sym, StringRef name) {
32385868e8aSDimitry Andric   Defined *imp = impSymbol(name);
3240b57cec5SDimitry Andric   if (!imp)
3250b57cec5SDimitry Andric     return false;
3260b57cec5SDimitry Andric 
3270b57cec5SDimitry Andric   // Replace the reference directly to a variable with a reference
3280b57cec5SDimitry Andric   // to the import address table instead. This obviously isn't right,
3290b57cec5SDimitry Andric   // but we mark the symbol as isRuntimePseudoReloc, and a later pass
3300b57cec5SDimitry Andric   // will add runtime pseudo relocations for every relocation against
3310b57cec5SDimitry Andric   // this Symbol. The runtime pseudo relocation framework expects the
3320b57cec5SDimitry Andric   // reference itself to point at the IAT entry.
3330b57cec5SDimitry Andric   size_t impSize = 0;
3340b57cec5SDimitry Andric   if (isa<DefinedImportData>(imp)) {
3350b57cec5SDimitry Andric     log("Automatically importing " + name + " from " +
3360b57cec5SDimitry Andric         cast<DefinedImportData>(imp)->getDLLName());
3370b57cec5SDimitry Andric     impSize = sizeof(DefinedImportData);
3380b57cec5SDimitry Andric   } else if (isa<DefinedRegular>(imp)) {
3390b57cec5SDimitry Andric     log("Automatically importing " + name + " from " +
3400b57cec5SDimitry Andric         toString(cast<DefinedRegular>(imp)->file));
3410b57cec5SDimitry Andric     impSize = sizeof(DefinedRegular);
3420b57cec5SDimitry Andric   } else {
3430b57cec5SDimitry Andric     warn("unable to automatically import " + name + " from " + imp->getName() +
3440b57cec5SDimitry Andric          " from " + toString(cast<DefinedRegular>(imp)->file) +
3450b57cec5SDimitry Andric          "; unexpected symbol type");
3460b57cec5SDimitry Andric     return false;
3470b57cec5SDimitry Andric   }
3480b57cec5SDimitry Andric   sym->replaceKeepingName(imp, impSize);
3490b57cec5SDimitry Andric   sym->isRuntimePseudoReloc = true;
3500b57cec5SDimitry Andric 
3510b57cec5SDimitry Andric   // There may exist symbols named .refptr.<name> which only consist
3520b57cec5SDimitry Andric   // of a single pointer to <name>. If it turns out <name> is
3530b57cec5SDimitry Andric   // automatically imported, we don't need to keep the .refptr.<name>
3540b57cec5SDimitry Andric   // pointer at all, but redirect all accesses to it to the IAT entry
3550b57cec5SDimitry Andric   // for __imp_<name> instead, and drop the whole .refptr.<name> chunk.
3560b57cec5SDimitry Andric   DefinedRegular *refptr =
3570b57cec5SDimitry Andric       dyn_cast_or_null<DefinedRegular>(find((".refptr." + name).str()));
3580b57cec5SDimitry Andric   if (refptr && refptr->getChunk()->getSize() == config->wordsize) {
3590b57cec5SDimitry Andric     SectionChunk *sc = dyn_cast_or_null<SectionChunk>(refptr->getChunk());
3600b57cec5SDimitry Andric     if (sc && sc->getRelocs().size() == 1 && *sc->symbols().begin() == sym) {
3610b57cec5SDimitry Andric       log("Replacing .refptr." + name + " with " + imp->getName());
3620b57cec5SDimitry Andric       refptr->getChunk()->live = false;
3630b57cec5SDimitry Andric       refptr->replaceKeepingName(imp, impSize);
3640b57cec5SDimitry Andric     }
3650b57cec5SDimitry Andric   }
3660b57cec5SDimitry Andric   return true;
3670b57cec5SDimitry Andric }
3680b57cec5SDimitry Andric 
36985868e8aSDimitry Andric /// Helper function for reportUnresolvable and resolveRemainingUndefines.
37085868e8aSDimitry Andric /// This function emits an "undefined symbol" diagnostic for each symbol in
37185868e8aSDimitry Andric /// undefs. If localImports is not nullptr, it also emits a "locally
37285868e8aSDimitry Andric /// defined symbol imported" diagnostic for symbols in localImports.
37385868e8aSDimitry Andric /// objFiles and bitcodeFiles (if not nullptr) are used to report where
37485868e8aSDimitry Andric /// undefined symbols are referenced.
37585868e8aSDimitry Andric static void
37685868e8aSDimitry Andric reportProblemSymbols(const SmallPtrSetImpl<Symbol *> &undefs,
37785868e8aSDimitry Andric                      const DenseMap<Symbol *, Symbol *> *localImports,
37885868e8aSDimitry Andric                      const std::vector<ObjFile *> objFiles,
37985868e8aSDimitry Andric                      const std::vector<BitcodeFile *> *bitcodeFiles) {
38085868e8aSDimitry Andric 
38185868e8aSDimitry Andric   // Return early if there is nothing to report (which should be
38285868e8aSDimitry Andric   // the common case).
38385868e8aSDimitry Andric   if (undefs.empty() && (!localImports || localImports->empty()))
38485868e8aSDimitry Andric     return;
38585868e8aSDimitry Andric 
38685868e8aSDimitry Andric   for (Symbol *b : config->gcroot) {
38785868e8aSDimitry Andric     if (undefs.count(b))
38885868e8aSDimitry Andric       errorOrWarn("<root>: undefined symbol: " + toString(*b));
38985868e8aSDimitry Andric     if (localImports)
39085868e8aSDimitry Andric       if (Symbol *imp = localImports->lookup(b))
39185868e8aSDimitry Andric         warn("<root>: locally defined symbol imported: " + toString(*imp) +
39285868e8aSDimitry Andric              " (defined in " + toString(imp->getFile()) + ") [LNK4217]");
39385868e8aSDimitry Andric   }
39485868e8aSDimitry Andric 
39585868e8aSDimitry Andric   std::vector<UndefinedDiag> undefDiags;
39685868e8aSDimitry Andric   DenseMap<Symbol *, int> firstDiag;
39785868e8aSDimitry Andric 
39885868e8aSDimitry Andric   auto processFile = [&](InputFile *file, ArrayRef<Symbol *> symbols) {
39985868e8aSDimitry Andric     uint32_t symIndex = (uint32_t)-1;
40085868e8aSDimitry Andric     for (Symbol *sym : symbols) {
40185868e8aSDimitry Andric       ++symIndex;
40285868e8aSDimitry Andric       if (!sym)
40385868e8aSDimitry Andric         continue;
40485868e8aSDimitry Andric       if (undefs.count(sym)) {
40585868e8aSDimitry Andric         auto it = firstDiag.find(sym);
40685868e8aSDimitry Andric         if (it == firstDiag.end()) {
40785868e8aSDimitry Andric           firstDiag[sym] = undefDiags.size();
40885868e8aSDimitry Andric           undefDiags.push_back({sym, {{file, symIndex}}});
40985868e8aSDimitry Andric         } else {
41085868e8aSDimitry Andric           undefDiags[it->second].files.push_back({file, symIndex});
41185868e8aSDimitry Andric         }
41285868e8aSDimitry Andric       }
41385868e8aSDimitry Andric       if (localImports)
41485868e8aSDimitry Andric         if (Symbol *imp = localImports->lookup(sym))
41585868e8aSDimitry Andric           warn(toString(file) +
41685868e8aSDimitry Andric                ": locally defined symbol imported: " + toString(*imp) +
41785868e8aSDimitry Andric                " (defined in " + toString(imp->getFile()) + ") [LNK4217]");
41885868e8aSDimitry Andric     }
41985868e8aSDimitry Andric   };
42085868e8aSDimitry Andric 
42185868e8aSDimitry Andric   for (ObjFile *file : objFiles)
42285868e8aSDimitry Andric     processFile(file, file->getSymbols());
42385868e8aSDimitry Andric 
42485868e8aSDimitry Andric   if (bitcodeFiles)
42585868e8aSDimitry Andric     for (BitcodeFile *file : *bitcodeFiles)
42685868e8aSDimitry Andric       processFile(file, file->getSymbols());
42785868e8aSDimitry Andric 
42885868e8aSDimitry Andric   for (const UndefinedDiag &undefDiag : undefDiags)
42985868e8aSDimitry Andric     reportUndefinedSymbol(undefDiag);
43085868e8aSDimitry Andric }
43185868e8aSDimitry Andric 
43285868e8aSDimitry Andric void SymbolTable::reportUnresolvable() {
43385868e8aSDimitry Andric   SmallPtrSet<Symbol *, 8> undefs;
43485868e8aSDimitry Andric   for (auto &i : symMap) {
43585868e8aSDimitry Andric     Symbol *sym = i.second;
43685868e8aSDimitry Andric     auto *undef = dyn_cast<Undefined>(sym);
437e8d8bef9SDimitry Andric     if (!undef || sym->deferUndefined)
43885868e8aSDimitry Andric       continue;
43985868e8aSDimitry Andric     if (undef->getWeakAlias())
44085868e8aSDimitry Andric       continue;
44185868e8aSDimitry Andric     StringRef name = undef->getName();
44285868e8aSDimitry Andric     if (name.startswith("__imp_")) {
44385868e8aSDimitry Andric       Symbol *imp = find(name.substr(strlen("__imp_")));
44485868e8aSDimitry Andric       if (imp && isa<Defined>(imp))
44585868e8aSDimitry Andric         continue;
44685868e8aSDimitry Andric     }
44785868e8aSDimitry Andric     if (name.contains("_PchSym_"))
44885868e8aSDimitry Andric       continue;
449e8d8bef9SDimitry Andric     if (config->autoImport && impSymbol(name))
45085868e8aSDimitry Andric       continue;
45185868e8aSDimitry Andric     undefs.insert(sym);
45285868e8aSDimitry Andric   }
45385868e8aSDimitry Andric 
45485868e8aSDimitry Andric   reportProblemSymbols(undefs,
45585868e8aSDimitry Andric                        /* localImports */ nullptr, ObjFile::instances,
45685868e8aSDimitry Andric                        &BitcodeFile::instances);
45785868e8aSDimitry Andric }
45885868e8aSDimitry Andric 
45985868e8aSDimitry Andric void SymbolTable::resolveRemainingUndefines() {
4600b57cec5SDimitry Andric   SmallPtrSet<Symbol *, 8> undefs;
4610b57cec5SDimitry Andric   DenseMap<Symbol *, Symbol *> localImports;
4620b57cec5SDimitry Andric 
4630b57cec5SDimitry Andric   for (auto &i : symMap) {
4640b57cec5SDimitry Andric     Symbol *sym = i.second;
4650b57cec5SDimitry Andric     auto *undef = dyn_cast<Undefined>(sym);
4660b57cec5SDimitry Andric     if (!undef)
4670b57cec5SDimitry Andric       continue;
4680b57cec5SDimitry Andric     if (!sym->isUsedInRegularObj)
4690b57cec5SDimitry Andric       continue;
4700b57cec5SDimitry Andric 
4710b57cec5SDimitry Andric     StringRef name = undef->getName();
4720b57cec5SDimitry Andric 
4730b57cec5SDimitry Andric     // A weak alias may have been resolved, so check for that.
4740b57cec5SDimitry Andric     if (Defined *d = undef->getWeakAlias()) {
4750b57cec5SDimitry Andric       // We want to replace Sym with D. However, we can't just blindly
4760b57cec5SDimitry Andric       // copy sizeof(SymbolUnion) bytes from D to Sym because D may be an
4770b57cec5SDimitry Andric       // internal symbol, and internal symbols are stored as "unparented"
4780b57cec5SDimitry Andric       // Symbols. For that reason we need to check which type of symbol we
4790b57cec5SDimitry Andric       // are dealing with and copy the correct number of bytes.
4800b57cec5SDimitry Andric       if (isa<DefinedRegular>(d))
4810b57cec5SDimitry Andric         memcpy(sym, d, sizeof(DefinedRegular));
4820b57cec5SDimitry Andric       else if (isa<DefinedAbsolute>(d))
4830b57cec5SDimitry Andric         memcpy(sym, d, sizeof(DefinedAbsolute));
4840b57cec5SDimitry Andric       else
4850b57cec5SDimitry Andric         memcpy(sym, d, sizeof(SymbolUnion));
4860b57cec5SDimitry Andric       continue;
4870b57cec5SDimitry Andric     }
4880b57cec5SDimitry Andric 
4890b57cec5SDimitry Andric     // If we can resolve a symbol by removing __imp_ prefix, do that.
4900b57cec5SDimitry Andric     // This odd rule is for compatibility with MSVC linker.
4910b57cec5SDimitry Andric     if (name.startswith("__imp_")) {
4920b57cec5SDimitry Andric       Symbol *imp = find(name.substr(strlen("__imp_")));
4930b57cec5SDimitry Andric       if (imp && isa<Defined>(imp)) {
4940b57cec5SDimitry Andric         auto *d = cast<Defined>(imp);
4950b57cec5SDimitry Andric         replaceSymbol<DefinedLocalImport>(sym, name, d);
4960b57cec5SDimitry Andric         localImportChunks.push_back(cast<DefinedLocalImport>(sym)->getChunk());
4970b57cec5SDimitry Andric         localImports[sym] = d;
4980b57cec5SDimitry Andric         continue;
4990b57cec5SDimitry Andric       }
5000b57cec5SDimitry Andric     }
5010b57cec5SDimitry Andric 
5020b57cec5SDimitry Andric     // We don't want to report missing Microsoft precompiled headers symbols.
5030b57cec5SDimitry Andric     // A proper message will be emitted instead in PDBLinker::aquirePrecompObj
5040b57cec5SDimitry Andric     if (name.contains("_PchSym_"))
5050b57cec5SDimitry Andric       continue;
5060b57cec5SDimitry Andric 
5075ffd83dbSDimitry Andric     if (config->autoImport && handleMinGWAutomaticImport(sym, name))
5080b57cec5SDimitry Andric       continue;
5090b57cec5SDimitry Andric 
5100b57cec5SDimitry Andric     // Remaining undefined symbols are not fatal if /force is specified.
5110b57cec5SDimitry Andric     // They are replaced with dummy defined symbols.
5120b57cec5SDimitry Andric     if (config->forceUnresolved)
5130b57cec5SDimitry Andric       replaceSymbol<DefinedAbsolute>(sym, name, 0);
5140b57cec5SDimitry Andric     undefs.insert(sym);
5150b57cec5SDimitry Andric   }
5160b57cec5SDimitry Andric 
51785868e8aSDimitry Andric   reportProblemSymbols(
51885868e8aSDimitry Andric       undefs, config->warnLocallyDefinedImported ? &localImports : nullptr,
51985868e8aSDimitry Andric       ObjFile::instances, /* bitcode files no longer needed */ nullptr);
5200b57cec5SDimitry Andric }
5210b57cec5SDimitry Andric 
5220b57cec5SDimitry Andric std::pair<Symbol *, bool> SymbolTable::insert(StringRef name) {
5230b57cec5SDimitry Andric   bool inserted = false;
5240b57cec5SDimitry Andric   Symbol *&sym = symMap[CachedHashStringRef(name)];
5250b57cec5SDimitry Andric   if (!sym) {
5260b57cec5SDimitry Andric     sym = reinterpret_cast<Symbol *>(make<SymbolUnion>());
5270b57cec5SDimitry Andric     sym->isUsedInRegularObj = false;
5280b57cec5SDimitry Andric     sym->pendingArchiveLoad = false;
529e8d8bef9SDimitry Andric     sym->canInline = true;
5300b57cec5SDimitry Andric     inserted = true;
5310b57cec5SDimitry Andric   }
5320b57cec5SDimitry Andric   return {sym, inserted};
5330b57cec5SDimitry Andric }
5340b57cec5SDimitry Andric 
5350b57cec5SDimitry Andric std::pair<Symbol *, bool> SymbolTable::insert(StringRef name, InputFile *file) {
5360b57cec5SDimitry Andric   std::pair<Symbol *, bool> result = insert(name);
5370b57cec5SDimitry Andric   if (!file || !isa<BitcodeFile>(file))
5380b57cec5SDimitry Andric     result.first->isUsedInRegularObj = true;
5390b57cec5SDimitry Andric   return result;
5400b57cec5SDimitry Andric }
5410b57cec5SDimitry Andric 
5420b57cec5SDimitry Andric Symbol *SymbolTable::addUndefined(StringRef name, InputFile *f,
5430b57cec5SDimitry Andric                                   bool isWeakAlias) {
5440b57cec5SDimitry Andric   Symbol *s;
5450b57cec5SDimitry Andric   bool wasInserted;
5460b57cec5SDimitry Andric   std::tie(s, wasInserted) = insert(name, f);
54785868e8aSDimitry Andric   if (wasInserted || (s->isLazy() && isWeakAlias)) {
5480b57cec5SDimitry Andric     replaceSymbol<Undefined>(s, name);
5490b57cec5SDimitry Andric     return s;
5500b57cec5SDimitry Andric   }
55185868e8aSDimitry Andric   if (s->isLazy())
55285868e8aSDimitry Andric     forceLazy(s);
5530b57cec5SDimitry Andric   return s;
5540b57cec5SDimitry Andric }
5550b57cec5SDimitry Andric 
55685868e8aSDimitry Andric void SymbolTable::addLazyArchive(ArchiveFile *f, const Archive::Symbol &sym) {
5570b57cec5SDimitry Andric   StringRef name = sym.getName();
5580b57cec5SDimitry Andric   Symbol *s;
5590b57cec5SDimitry Andric   bool wasInserted;
5600b57cec5SDimitry Andric   std::tie(s, wasInserted) = insert(name);
5610b57cec5SDimitry Andric   if (wasInserted) {
56285868e8aSDimitry Andric     replaceSymbol<LazyArchive>(s, f, sym);
5630b57cec5SDimitry Andric     return;
5640b57cec5SDimitry Andric   }
5650b57cec5SDimitry Andric   auto *u = dyn_cast<Undefined>(s);
5660b57cec5SDimitry Andric   if (!u || u->weakAlias || s->pendingArchiveLoad)
5670b57cec5SDimitry Andric     return;
5680b57cec5SDimitry Andric   s->pendingArchiveLoad = true;
5690b57cec5SDimitry Andric   f->addMember(sym);
5700b57cec5SDimitry Andric }
5710b57cec5SDimitry Andric 
57285868e8aSDimitry Andric void SymbolTable::addLazyObject(LazyObjFile *f, StringRef n) {
57385868e8aSDimitry Andric   Symbol *s;
57485868e8aSDimitry Andric   bool wasInserted;
57585868e8aSDimitry Andric   std::tie(s, wasInserted) = insert(n, f);
57685868e8aSDimitry Andric   if (wasInserted) {
57785868e8aSDimitry Andric     replaceSymbol<LazyObject>(s, f, n);
57885868e8aSDimitry Andric     return;
57985868e8aSDimitry Andric   }
58085868e8aSDimitry Andric   auto *u = dyn_cast<Undefined>(s);
58185868e8aSDimitry Andric   if (!u || u->weakAlias || s->pendingArchiveLoad)
58285868e8aSDimitry Andric     return;
58385868e8aSDimitry Andric   s->pendingArchiveLoad = true;
58485868e8aSDimitry Andric   f->fetch();
58585868e8aSDimitry Andric }
58685868e8aSDimitry Andric 
587*fe6060f1SDimitry Andric void SymbolTable::addLazyDLLSymbol(DLLFile *f, DLLFile::Symbol *sym,
588*fe6060f1SDimitry Andric                                    StringRef n) {
589*fe6060f1SDimitry Andric   Symbol *s;
590*fe6060f1SDimitry Andric   bool wasInserted;
591*fe6060f1SDimitry Andric   std::tie(s, wasInserted) = insert(n);
592*fe6060f1SDimitry Andric   if (wasInserted) {
593*fe6060f1SDimitry Andric     replaceSymbol<LazyDLLSymbol>(s, f, sym, n);
594*fe6060f1SDimitry Andric     return;
595*fe6060f1SDimitry Andric   }
596*fe6060f1SDimitry Andric   auto *u = dyn_cast<Undefined>(s);
597*fe6060f1SDimitry Andric   if (!u || u->weakAlias || s->pendingArchiveLoad)
598*fe6060f1SDimitry Andric     return;
599*fe6060f1SDimitry Andric   s->pendingArchiveLoad = true;
600*fe6060f1SDimitry Andric   f->makeImport(sym);
601*fe6060f1SDimitry Andric }
602*fe6060f1SDimitry Andric 
60385868e8aSDimitry Andric static std::string getSourceLocationBitcode(BitcodeFile *file) {
60485868e8aSDimitry Andric   std::string res("\n>>> defined at ");
60585868e8aSDimitry Andric   StringRef source = file->obj->getSourceFileName();
60685868e8aSDimitry Andric   if (!source.empty())
60785868e8aSDimitry Andric     res += source.str() + "\n>>>            ";
60885868e8aSDimitry Andric   res += toString(file);
60985868e8aSDimitry Andric   return res;
61085868e8aSDimitry Andric }
61185868e8aSDimitry Andric 
61285868e8aSDimitry Andric static std::string getSourceLocationObj(ObjFile *file, SectionChunk *sc,
61385868e8aSDimitry Andric                                         uint32_t offset, StringRef name) {
61485868e8aSDimitry Andric   Optional<std::pair<StringRef, uint32_t>> fileLine;
61585868e8aSDimitry Andric   if (sc)
61685868e8aSDimitry Andric     fileLine = getFileLine(sc, offset);
61785868e8aSDimitry Andric   if (!fileLine)
61885868e8aSDimitry Andric     fileLine = file->getVariableLocation(name);
61985868e8aSDimitry Andric 
62085868e8aSDimitry Andric   std::string res;
62185868e8aSDimitry Andric   llvm::raw_string_ostream os(res);
62285868e8aSDimitry Andric   os << "\n>>> defined at ";
62385868e8aSDimitry Andric   if (fileLine)
62485868e8aSDimitry Andric     os << fileLine->first << ":" << fileLine->second << "\n>>>            ";
62585868e8aSDimitry Andric   os << toString(file);
62685868e8aSDimitry Andric   return os.str();
62785868e8aSDimitry Andric }
62885868e8aSDimitry Andric 
62985868e8aSDimitry Andric static std::string getSourceLocation(InputFile *file, SectionChunk *sc,
63085868e8aSDimitry Andric                                      uint32_t offset, StringRef name) {
631480093f4SDimitry Andric   if (!file)
632480093f4SDimitry Andric     return "";
63385868e8aSDimitry Andric   if (auto *o = dyn_cast<ObjFile>(file))
63485868e8aSDimitry Andric     return getSourceLocationObj(o, sc, offset, name);
63585868e8aSDimitry Andric   if (auto *b = dyn_cast<BitcodeFile>(file))
63685868e8aSDimitry Andric     return getSourceLocationBitcode(b);
63785868e8aSDimitry Andric   return "\n>>> defined at " + toString(file);
63885868e8aSDimitry Andric }
63985868e8aSDimitry Andric 
64085868e8aSDimitry Andric // Construct and print an error message in the form of:
64185868e8aSDimitry Andric //
64285868e8aSDimitry Andric //   lld-link: error: duplicate symbol: foo
64385868e8aSDimitry Andric //   >>> defined at bar.c:30
64485868e8aSDimitry Andric //   >>>            bar.o
64585868e8aSDimitry Andric //   >>> defined at baz.c:563
64685868e8aSDimitry Andric //   >>>            baz.o
64785868e8aSDimitry Andric void SymbolTable::reportDuplicate(Symbol *existing, InputFile *newFile,
64885868e8aSDimitry Andric                                   SectionChunk *newSc,
64985868e8aSDimitry Andric                                   uint32_t newSectionOffset) {
65085868e8aSDimitry Andric   std::string msg;
65185868e8aSDimitry Andric   llvm::raw_string_ostream os(msg);
65285868e8aSDimitry Andric   os << "duplicate symbol: " << toString(*existing);
65385868e8aSDimitry Andric 
654480093f4SDimitry Andric   DefinedRegular *d = dyn_cast<DefinedRegular>(existing);
65585868e8aSDimitry Andric   if (d && isa<ObjFile>(d->getFile())) {
65685868e8aSDimitry Andric     os << getSourceLocation(d->getFile(), d->getChunk(), d->getValue(),
65785868e8aSDimitry Andric                             existing->getName());
65885868e8aSDimitry Andric   } else {
65985868e8aSDimitry Andric     os << getSourceLocation(existing->getFile(), nullptr, 0, "");
66085868e8aSDimitry Andric   }
66185868e8aSDimitry Andric   os << getSourceLocation(newFile, newSc, newSectionOffset,
66285868e8aSDimitry Andric                           existing->getName());
6630b57cec5SDimitry Andric 
6640b57cec5SDimitry Andric   if (config->forceMultiple)
66585868e8aSDimitry Andric     warn(os.str());
6660b57cec5SDimitry Andric   else
66785868e8aSDimitry Andric     error(os.str());
6680b57cec5SDimitry Andric }
6690b57cec5SDimitry Andric 
6700b57cec5SDimitry Andric Symbol *SymbolTable::addAbsolute(StringRef n, COFFSymbolRef sym) {
6710b57cec5SDimitry Andric   Symbol *s;
6720b57cec5SDimitry Andric   bool wasInserted;
6730b57cec5SDimitry Andric   std::tie(s, wasInserted) = insert(n, nullptr);
6740b57cec5SDimitry Andric   s->isUsedInRegularObj = true;
67585868e8aSDimitry Andric   if (wasInserted || isa<Undefined>(s) || s->isLazy())
6760b57cec5SDimitry Andric     replaceSymbol<DefinedAbsolute>(s, n, sym);
677480093f4SDimitry Andric   else if (auto *da = dyn_cast<DefinedAbsolute>(s)) {
678480093f4SDimitry Andric     if (da->getVA() != sym.getValue())
679480093f4SDimitry Andric       reportDuplicate(s, nullptr);
680480093f4SDimitry Andric   } else if (!isa<DefinedCOFF>(s))
6810b57cec5SDimitry Andric     reportDuplicate(s, nullptr);
6820b57cec5SDimitry Andric   return s;
6830b57cec5SDimitry Andric }
6840b57cec5SDimitry Andric 
6850b57cec5SDimitry Andric Symbol *SymbolTable::addAbsolute(StringRef n, uint64_t va) {
6860b57cec5SDimitry Andric   Symbol *s;
6870b57cec5SDimitry Andric   bool wasInserted;
6880b57cec5SDimitry Andric   std::tie(s, wasInserted) = insert(n, nullptr);
6890b57cec5SDimitry Andric   s->isUsedInRegularObj = true;
69085868e8aSDimitry Andric   if (wasInserted || isa<Undefined>(s) || s->isLazy())
6910b57cec5SDimitry Andric     replaceSymbol<DefinedAbsolute>(s, n, va);
692480093f4SDimitry Andric   else if (auto *da = dyn_cast<DefinedAbsolute>(s)) {
693480093f4SDimitry Andric     if (da->getVA() != va)
694480093f4SDimitry Andric       reportDuplicate(s, nullptr);
695480093f4SDimitry Andric   } else if (!isa<DefinedCOFF>(s))
6960b57cec5SDimitry Andric     reportDuplicate(s, nullptr);
6970b57cec5SDimitry Andric   return s;
6980b57cec5SDimitry Andric }
6990b57cec5SDimitry Andric 
7000b57cec5SDimitry Andric Symbol *SymbolTable::addSynthetic(StringRef n, Chunk *c) {
7010b57cec5SDimitry Andric   Symbol *s;
7020b57cec5SDimitry Andric   bool wasInserted;
7030b57cec5SDimitry Andric   std::tie(s, wasInserted) = insert(n, nullptr);
7040b57cec5SDimitry Andric   s->isUsedInRegularObj = true;
70585868e8aSDimitry Andric   if (wasInserted || isa<Undefined>(s) || s->isLazy())
7060b57cec5SDimitry Andric     replaceSymbol<DefinedSynthetic>(s, n, c);
7070b57cec5SDimitry Andric   else if (!isa<DefinedCOFF>(s))
7080b57cec5SDimitry Andric     reportDuplicate(s, nullptr);
7090b57cec5SDimitry Andric   return s;
7100b57cec5SDimitry Andric }
7110b57cec5SDimitry Andric 
7120b57cec5SDimitry Andric Symbol *SymbolTable::addRegular(InputFile *f, StringRef n,
71385868e8aSDimitry Andric                                 const coff_symbol_generic *sym, SectionChunk *c,
71485868e8aSDimitry Andric                                 uint32_t sectionOffset) {
7150b57cec5SDimitry Andric   Symbol *s;
7160b57cec5SDimitry Andric   bool wasInserted;
7170b57cec5SDimitry Andric   std::tie(s, wasInserted) = insert(n, f);
7180b57cec5SDimitry Andric   if (wasInserted || !isa<DefinedRegular>(s))
7190b57cec5SDimitry Andric     replaceSymbol<DefinedRegular>(s, f, n, /*IsCOMDAT*/ false,
7200b57cec5SDimitry Andric                                   /*IsExternal*/ true, sym, c);
7210b57cec5SDimitry Andric   else
72285868e8aSDimitry Andric     reportDuplicate(s, f, c, sectionOffset);
7230b57cec5SDimitry Andric   return s;
7240b57cec5SDimitry Andric }
7250b57cec5SDimitry Andric 
7260b57cec5SDimitry Andric std::pair<DefinedRegular *, bool>
7270b57cec5SDimitry Andric SymbolTable::addComdat(InputFile *f, StringRef n,
7280b57cec5SDimitry Andric                        const coff_symbol_generic *sym) {
7290b57cec5SDimitry Andric   Symbol *s;
7300b57cec5SDimitry Andric   bool wasInserted;
7310b57cec5SDimitry Andric   std::tie(s, wasInserted) = insert(n, f);
7320b57cec5SDimitry Andric   if (wasInserted || !isa<DefinedRegular>(s)) {
7330b57cec5SDimitry Andric     replaceSymbol<DefinedRegular>(s, f, n, /*IsCOMDAT*/ true,
7340b57cec5SDimitry Andric                                   /*IsExternal*/ true, sym, nullptr);
7350b57cec5SDimitry Andric     return {cast<DefinedRegular>(s), true};
7360b57cec5SDimitry Andric   }
7370b57cec5SDimitry Andric   auto *existingSymbol = cast<DefinedRegular>(s);
7380b57cec5SDimitry Andric   if (!existingSymbol->isCOMDAT)
7390b57cec5SDimitry Andric     reportDuplicate(s, f);
7400b57cec5SDimitry Andric   return {existingSymbol, false};
7410b57cec5SDimitry Andric }
7420b57cec5SDimitry Andric 
7430b57cec5SDimitry Andric Symbol *SymbolTable::addCommon(InputFile *f, StringRef n, uint64_t size,
7440b57cec5SDimitry Andric                                const coff_symbol_generic *sym, CommonChunk *c) {
7450b57cec5SDimitry Andric   Symbol *s;
7460b57cec5SDimitry Andric   bool wasInserted;
7470b57cec5SDimitry Andric   std::tie(s, wasInserted) = insert(n, f);
7480b57cec5SDimitry Andric   if (wasInserted || !isa<DefinedCOFF>(s))
7490b57cec5SDimitry Andric     replaceSymbol<DefinedCommon>(s, f, n, size, sym, c);
7500b57cec5SDimitry Andric   else if (auto *dc = dyn_cast<DefinedCommon>(s))
7510b57cec5SDimitry Andric     if (size > dc->getSize())
7520b57cec5SDimitry Andric       replaceSymbol<DefinedCommon>(s, f, n, size, sym, c);
7530b57cec5SDimitry Andric   return s;
7540b57cec5SDimitry Andric }
7550b57cec5SDimitry Andric 
7560b57cec5SDimitry Andric Symbol *SymbolTable::addImportData(StringRef n, ImportFile *f) {
7570b57cec5SDimitry Andric   Symbol *s;
7580b57cec5SDimitry Andric   bool wasInserted;
7590b57cec5SDimitry Andric   std::tie(s, wasInserted) = insert(n, nullptr);
7600b57cec5SDimitry Andric   s->isUsedInRegularObj = true;
76185868e8aSDimitry Andric   if (wasInserted || isa<Undefined>(s) || s->isLazy()) {
7620b57cec5SDimitry Andric     replaceSymbol<DefinedImportData>(s, n, f);
7630b57cec5SDimitry Andric     return s;
7640b57cec5SDimitry Andric   }
7650b57cec5SDimitry Andric 
7660b57cec5SDimitry Andric   reportDuplicate(s, f);
7670b57cec5SDimitry Andric   return nullptr;
7680b57cec5SDimitry Andric }
7690b57cec5SDimitry Andric 
7700b57cec5SDimitry Andric Symbol *SymbolTable::addImportThunk(StringRef name, DefinedImportData *id,
7710b57cec5SDimitry Andric                                     uint16_t machine) {
7720b57cec5SDimitry Andric   Symbol *s;
7730b57cec5SDimitry Andric   bool wasInserted;
7740b57cec5SDimitry Andric   std::tie(s, wasInserted) = insert(name, nullptr);
7750b57cec5SDimitry Andric   s->isUsedInRegularObj = true;
77685868e8aSDimitry Andric   if (wasInserted || isa<Undefined>(s) || s->isLazy()) {
7770b57cec5SDimitry Andric     replaceSymbol<DefinedImportThunk>(s, name, id, machine);
7780b57cec5SDimitry Andric     return s;
7790b57cec5SDimitry Andric   }
7800b57cec5SDimitry Andric 
7810b57cec5SDimitry Andric   reportDuplicate(s, id->file);
7820b57cec5SDimitry Andric   return nullptr;
7830b57cec5SDimitry Andric }
7840b57cec5SDimitry Andric 
7850b57cec5SDimitry Andric void SymbolTable::addLibcall(StringRef name) {
7860b57cec5SDimitry Andric   Symbol *sym = findUnderscore(name);
7870b57cec5SDimitry Andric   if (!sym)
7880b57cec5SDimitry Andric     return;
7890b57cec5SDimitry Andric 
79085868e8aSDimitry Andric   if (auto *l = dyn_cast<LazyArchive>(sym)) {
7910b57cec5SDimitry Andric     MemoryBufferRef mb = l->getMemberBuffer();
79285868e8aSDimitry Andric     if (isBitcode(mb))
79385868e8aSDimitry Andric       addUndefined(sym->getName());
79485868e8aSDimitry Andric   } else if (LazyObject *o = dyn_cast<LazyObject>(sym)) {
79585868e8aSDimitry Andric     if (isBitcode(o->file->mb))
7960b57cec5SDimitry Andric       addUndefined(sym->getName());
7970b57cec5SDimitry Andric   }
7980b57cec5SDimitry Andric }
7990b57cec5SDimitry Andric 
8000b57cec5SDimitry Andric std::vector<Chunk *> SymbolTable::getChunks() {
8010b57cec5SDimitry Andric   std::vector<Chunk *> res;
8020b57cec5SDimitry Andric   for (ObjFile *file : ObjFile::instances) {
8030b57cec5SDimitry Andric     ArrayRef<Chunk *> v = file->getChunks();
8040b57cec5SDimitry Andric     res.insert(res.end(), v.begin(), v.end());
8050b57cec5SDimitry Andric   }
8060b57cec5SDimitry Andric   return res;
8070b57cec5SDimitry Andric }
8080b57cec5SDimitry Andric 
8090b57cec5SDimitry Andric Symbol *SymbolTable::find(StringRef name) {
8100b57cec5SDimitry Andric   return symMap.lookup(CachedHashStringRef(name));
8110b57cec5SDimitry Andric }
8120b57cec5SDimitry Andric 
8130b57cec5SDimitry Andric Symbol *SymbolTable::findUnderscore(StringRef name) {
8140b57cec5SDimitry Andric   if (config->machine == I386)
8150b57cec5SDimitry Andric     return find(("_" + name).str());
8160b57cec5SDimitry Andric   return find(name);
8170b57cec5SDimitry Andric }
8180b57cec5SDimitry Andric 
8190b57cec5SDimitry Andric // Return all symbols that start with Prefix, possibly ignoring the first
8200b57cec5SDimitry Andric // character of Prefix or the first character symbol.
8210b57cec5SDimitry Andric std::vector<Symbol *> SymbolTable::getSymsWithPrefix(StringRef prefix) {
8220b57cec5SDimitry Andric   std::vector<Symbol *> syms;
8230b57cec5SDimitry Andric   for (auto pair : symMap) {
8240b57cec5SDimitry Andric     StringRef name = pair.first.val();
8250b57cec5SDimitry Andric     if (name.startswith(prefix) || name.startswith(prefix.drop_front()) ||
8260b57cec5SDimitry Andric         name.drop_front().startswith(prefix) ||
8270b57cec5SDimitry Andric         name.drop_front().startswith(prefix.drop_front())) {
8280b57cec5SDimitry Andric       syms.push_back(pair.second);
8290b57cec5SDimitry Andric     }
8300b57cec5SDimitry Andric   }
8310b57cec5SDimitry Andric   return syms;
8320b57cec5SDimitry Andric }
8330b57cec5SDimitry Andric 
8340b57cec5SDimitry Andric Symbol *SymbolTable::findMangle(StringRef name) {
8350b57cec5SDimitry Andric   if (Symbol *sym = find(name))
8360b57cec5SDimitry Andric     if (!isa<Undefined>(sym))
8370b57cec5SDimitry Andric       return sym;
8380b57cec5SDimitry Andric 
8390b57cec5SDimitry Andric   // Efficient fuzzy string lookup is impossible with a hash table, so iterate
8400b57cec5SDimitry Andric   // the symbol table once and collect all possibly matching symbols into this
8410b57cec5SDimitry Andric   // vector. Then compare each possibly matching symbol with each possible
8420b57cec5SDimitry Andric   // mangling.
8430b57cec5SDimitry Andric   std::vector<Symbol *> syms = getSymsWithPrefix(name);
8440b57cec5SDimitry Andric   auto findByPrefix = [&syms](const Twine &t) -> Symbol * {
8450b57cec5SDimitry Andric     std::string prefix = t.str();
8460b57cec5SDimitry Andric     for (auto *s : syms)
8470b57cec5SDimitry Andric       if (s->getName().startswith(prefix))
8480b57cec5SDimitry Andric         return s;
8490b57cec5SDimitry Andric     return nullptr;
8500b57cec5SDimitry Andric   };
8510b57cec5SDimitry Andric 
8520b57cec5SDimitry Andric   // For non-x86, just look for C++ functions.
8530b57cec5SDimitry Andric   if (config->machine != I386)
8540b57cec5SDimitry Andric     return findByPrefix("?" + name + "@@Y");
8550b57cec5SDimitry Andric 
8560b57cec5SDimitry Andric   if (!name.startswith("_"))
8570b57cec5SDimitry Andric     return nullptr;
8580b57cec5SDimitry Andric   // Search for x86 stdcall function.
8590b57cec5SDimitry Andric   if (Symbol *s = findByPrefix(name + "@"))
8600b57cec5SDimitry Andric     return s;
8610b57cec5SDimitry Andric   // Search for x86 fastcall function.
8620b57cec5SDimitry Andric   if (Symbol *s = findByPrefix("@" + name.substr(1) + "@"))
8630b57cec5SDimitry Andric     return s;
8640b57cec5SDimitry Andric   // Search for x86 vectorcall function.
8650b57cec5SDimitry Andric   if (Symbol *s = findByPrefix(name.substr(1) + "@@"))
8660b57cec5SDimitry Andric     return s;
8670b57cec5SDimitry Andric   // Search for x86 C++ non-member function.
8680b57cec5SDimitry Andric   return findByPrefix("?" + name.substr(1) + "@@Y");
8690b57cec5SDimitry Andric }
8700b57cec5SDimitry Andric 
8710b57cec5SDimitry Andric Symbol *SymbolTable::addUndefined(StringRef name) {
8720b57cec5SDimitry Andric   return addUndefined(name, nullptr, false);
8730b57cec5SDimitry Andric }
8740b57cec5SDimitry Andric 
8750b57cec5SDimitry Andric void SymbolTable::addCombinedLTOObjects() {
8760b57cec5SDimitry Andric   if (BitcodeFile::instances.empty())
8770b57cec5SDimitry Andric     return;
8780b57cec5SDimitry Andric 
8790b57cec5SDimitry Andric   ScopedTimer t(ltoTimer);
8805ffd83dbSDimitry Andric   lto.reset(new BitcodeCompiler);
8815ffd83dbSDimitry Andric   for (BitcodeFile *f : BitcodeFile::instances)
8825ffd83dbSDimitry Andric     lto->add(*f);
8835ffd83dbSDimitry Andric   for (InputFile *newObj : lto->compile()) {
8845ffd83dbSDimitry Andric     ObjFile *obj = cast<ObjFile>(newObj);
8850b57cec5SDimitry Andric     obj->parse();
8860b57cec5SDimitry Andric     ObjFile::instances.push_back(obj);
8870b57cec5SDimitry Andric   }
8880b57cec5SDimitry Andric }
8890b57cec5SDimitry Andric 
8900b57cec5SDimitry Andric } // namespace coff
8910b57cec5SDimitry Andric } // namespace lld
892