10b57cec5SDimitry Andric //===- SymbolTable.cpp ----------------------------------------------------===// 20b57cec5SDimitry Andric // 30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 60b57cec5SDimitry Andric // 70b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 80b57cec5SDimitry Andric 90b57cec5SDimitry Andric #include "SymbolTable.h" 10349cc55cSDimitry Andric #include "COFFLinkerContext.h" 110b57cec5SDimitry Andric #include "Config.h" 120b57cec5SDimitry Andric #include "Driver.h" 130b57cec5SDimitry Andric #include "LTO.h" 140b57cec5SDimitry Andric #include "PDB.h" 150b57cec5SDimitry Andric #include "Symbols.h" 160b57cec5SDimitry Andric #include "lld/Common/ErrorHandler.h" 170b57cec5SDimitry Andric #include "lld/Common/Memory.h" 180b57cec5SDimitry Andric #include "lld/Common/Timer.h" 190eae32dcSDimitry Andric #include "llvm/DebugInfo/DIContext.h" 200b57cec5SDimitry Andric #include "llvm/IR/LLVMContext.h" 21480093f4SDimitry Andric #include "llvm/LTO/LTO.h" 220b57cec5SDimitry Andric #include "llvm/Object/WindowsMachineFlag.h" 230b57cec5SDimitry Andric #include "llvm/Support/Debug.h" 240b57cec5SDimitry Andric #include "llvm/Support/raw_ostream.h" 250b57cec5SDimitry Andric #include <utility> 260b57cec5SDimitry Andric 270b57cec5SDimitry Andric using namespace llvm; 280b57cec5SDimitry Andric 29*bdd1243dSDimitry Andric namespace lld::coff { 300b57cec5SDimitry Andric 31fe6060f1SDimitry Andric StringRef ltrim1(StringRef s, const char *chars) { 32fe6060f1SDimitry Andric if (!s.empty() && strchr(chars, s[0])) 33fe6060f1SDimitry Andric return s.substr(1); 34fe6060f1SDimitry Andric return s; 35fe6060f1SDimitry Andric } 36fe6060f1SDimitry Andric 370b57cec5SDimitry Andric void SymbolTable::addFile(InputFile *file) { 380b57cec5SDimitry Andric log("Reading " + toString(file)); 3904eeddc0SDimitry Andric if (file->lazy) { 4004eeddc0SDimitry Andric if (auto *f = dyn_cast<BitcodeFile>(file)) 4104eeddc0SDimitry Andric f->parseLazy(); 4204eeddc0SDimitry Andric else 4304eeddc0SDimitry Andric cast<ObjFile>(file)->parseLazy(); 4404eeddc0SDimitry Andric } else { 450b57cec5SDimitry Andric file->parse(); 4604eeddc0SDimitry Andric if (auto *f = dyn_cast<ObjFile>(file)) { 4704eeddc0SDimitry Andric ctx.objFileInstances.push_back(f); 4804eeddc0SDimitry Andric } else if (auto *f = dyn_cast<BitcodeFile>(file)) { 4904eeddc0SDimitry Andric ctx.bitcodeFileInstances.push_back(f); 5004eeddc0SDimitry Andric } else if (auto *f = dyn_cast<ImportFile>(file)) { 5104eeddc0SDimitry Andric ctx.importFileInstances.push_back(f); 5204eeddc0SDimitry Andric } 5304eeddc0SDimitry Andric } 540b57cec5SDimitry Andric 550b57cec5SDimitry Andric MachineTypes mt = file->getMachineType(); 56*bdd1243dSDimitry Andric if (ctx.config.machine == IMAGE_FILE_MACHINE_UNKNOWN) { 57*bdd1243dSDimitry Andric ctx.config.machine = mt; 58*bdd1243dSDimitry Andric ctx.driver.addWinSysRootLibSearchPaths(); 59*bdd1243dSDimitry Andric } else if (mt != IMAGE_FILE_MACHINE_UNKNOWN && ctx.config.machine != mt) { 600b57cec5SDimitry Andric error(toString(file) + ": machine type " + machineToStr(mt) + 61*bdd1243dSDimitry Andric " conflicts with " + machineToStr(ctx.config.machine)); 620b57cec5SDimitry Andric return; 630b57cec5SDimitry Andric } 640b57cec5SDimitry Andric 65*bdd1243dSDimitry Andric ctx.driver.parseDirectives(file); 660b57cec5SDimitry Andric } 670b57cec5SDimitry Andric 68*bdd1243dSDimitry Andric static void errorOrWarn(const Twine &s, bool forceUnresolved) { 69*bdd1243dSDimitry Andric if (forceUnresolved) 700b57cec5SDimitry Andric warn(s); 710b57cec5SDimitry Andric else 720b57cec5SDimitry Andric error(s); 730b57cec5SDimitry Andric } 740b57cec5SDimitry Andric 7585868e8aSDimitry Andric // Causes the file associated with a lazy symbol to be linked in. 7685868e8aSDimitry Andric static void forceLazy(Symbol *s) { 7785868e8aSDimitry Andric s->pendingArchiveLoad = true; 7885868e8aSDimitry Andric switch (s->kind()) { 7985868e8aSDimitry Andric case Symbol::Kind::LazyArchiveKind: { 8085868e8aSDimitry Andric auto *l = cast<LazyArchive>(s); 8185868e8aSDimitry Andric l->file->addMember(l->sym); 8285868e8aSDimitry Andric break; 8385868e8aSDimitry Andric } 8404eeddc0SDimitry Andric case Symbol::Kind::LazyObjectKind: { 8504eeddc0SDimitry Andric InputFile *file = cast<LazyObject>(s)->file; 8604eeddc0SDimitry Andric file->ctx.symtab.addFile(file); 8785868e8aSDimitry Andric break; 8804eeddc0SDimitry Andric } 89fe6060f1SDimitry Andric case Symbol::Kind::LazyDLLSymbolKind: { 90fe6060f1SDimitry Andric auto *l = cast<LazyDLLSymbol>(s); 91fe6060f1SDimitry Andric l->file->makeImport(l->sym); 92fe6060f1SDimitry Andric break; 93fe6060f1SDimitry Andric } 9485868e8aSDimitry Andric default: 9585868e8aSDimitry Andric llvm_unreachable( 9685868e8aSDimitry Andric "symbol passed to forceLazy is not a LazyArchive or LazyObject"); 9785868e8aSDimitry Andric } 9885868e8aSDimitry Andric } 9985868e8aSDimitry Andric 1000b57cec5SDimitry Andric // Returns the symbol in SC whose value is <= Addr that is closest to Addr. 1010b57cec5SDimitry Andric // This is generally the global variable or function whose definition contains 1020b57cec5SDimitry Andric // Addr. 1030b57cec5SDimitry Andric static Symbol *getSymbol(SectionChunk *sc, uint32_t addr) { 1040b57cec5SDimitry Andric DefinedRegular *candidate = nullptr; 1050b57cec5SDimitry Andric 1060b57cec5SDimitry Andric for (Symbol *s : sc->file->getSymbols()) { 1070b57cec5SDimitry Andric auto *d = dyn_cast_or_null<DefinedRegular>(s); 10885868e8aSDimitry Andric if (!d || !d->data || d->file != sc->file || d->getChunk() != sc || 10985868e8aSDimitry Andric d->getValue() > addr || 1100b57cec5SDimitry Andric (candidate && d->getValue() < candidate->getValue())) 1110b57cec5SDimitry Andric continue; 1120b57cec5SDimitry Andric 1130b57cec5SDimitry Andric candidate = d; 1140b57cec5SDimitry Andric } 1150b57cec5SDimitry Andric 1160b57cec5SDimitry Andric return candidate; 1170b57cec5SDimitry Andric } 1180b57cec5SDimitry Andric 11985868e8aSDimitry Andric static std::vector<std::string> getSymbolLocations(BitcodeFile *file) { 12085868e8aSDimitry Andric std::string res("\n>>> referenced by "); 12185868e8aSDimitry Andric StringRef source = file->obj->getSourceFileName(); 12285868e8aSDimitry Andric if (!source.empty()) 12385868e8aSDimitry Andric res += source.str() + "\n>>> "; 12485868e8aSDimitry Andric res += toString(file); 12585868e8aSDimitry Andric return {res}; 12685868e8aSDimitry Andric } 12785868e8aSDimitry Andric 128*bdd1243dSDimitry Andric static std::optional<std::pair<StringRef, uint32_t>> 12985868e8aSDimitry Andric getFileLineDwarf(const SectionChunk *c, uint32_t addr) { 130*bdd1243dSDimitry Andric std::optional<DILineInfo> optionalLineInfo = 13185868e8aSDimitry Andric c->file->getDILineInfo(addr, c->getSectionNumber() - 1); 13285868e8aSDimitry Andric if (!optionalLineInfo) 133*bdd1243dSDimitry Andric return std::nullopt; 13485868e8aSDimitry Andric const DILineInfo &lineInfo = *optionalLineInfo; 13585868e8aSDimitry Andric if (lineInfo.FileName == DILineInfo::BadString) 136*bdd1243dSDimitry Andric return std::nullopt; 13704eeddc0SDimitry Andric return std::make_pair(saver().save(lineInfo.FileName), lineInfo.Line); 13885868e8aSDimitry Andric } 13985868e8aSDimitry Andric 140*bdd1243dSDimitry Andric static std::optional<std::pair<StringRef, uint32_t>> 14185868e8aSDimitry Andric getFileLine(const SectionChunk *c, uint32_t addr) { 14285868e8aSDimitry Andric // MinGW can optionally use codeview, even if the default is dwarf. 143*bdd1243dSDimitry Andric std::optional<std::pair<StringRef, uint32_t>> fileLine = 14485868e8aSDimitry Andric getFileLineCodeView(c, addr); 14585868e8aSDimitry Andric // If codeview didn't yield any result, check dwarf in MinGW mode. 146*bdd1243dSDimitry Andric if (!fileLine && c->file->ctx.config.mingw) 14785868e8aSDimitry Andric fileLine = getFileLineDwarf(c, addr); 14885868e8aSDimitry Andric return fileLine; 14985868e8aSDimitry Andric } 15085868e8aSDimitry Andric 1510b57cec5SDimitry Andric // Given a file and the index of a symbol in that file, returns a description 1520b57cec5SDimitry Andric // of all references to that symbol from that file. If no debug information is 1530b57cec5SDimitry Andric // available, returns just the name of the file, else one string per actual 1540b57cec5SDimitry Andric // reference as described in the debug info. 155590d96feSDimitry Andric // Returns up to maxStrings string descriptions, along with the total number of 156590d96feSDimitry Andric // locations found. 157590d96feSDimitry Andric static std::pair<std::vector<std::string>, size_t> 158590d96feSDimitry Andric getSymbolLocations(ObjFile *file, uint32_t symIndex, size_t maxStrings) { 1590b57cec5SDimitry Andric struct Location { 1600b57cec5SDimitry Andric Symbol *sym; 1610b57cec5SDimitry Andric std::pair<StringRef, uint32_t> fileLine; 1620b57cec5SDimitry Andric }; 1630b57cec5SDimitry Andric std::vector<Location> locations; 164590d96feSDimitry Andric size_t numLocations = 0; 1650b57cec5SDimitry Andric 1660b57cec5SDimitry Andric for (Chunk *c : file->getChunks()) { 1670b57cec5SDimitry Andric auto *sc = dyn_cast<SectionChunk>(c); 1680b57cec5SDimitry Andric if (!sc) 1690b57cec5SDimitry Andric continue; 1700b57cec5SDimitry Andric for (const coff_relocation &r : sc->getRelocs()) { 1710b57cec5SDimitry Andric if (r.SymbolTableIndex != symIndex) 1720b57cec5SDimitry Andric continue; 173590d96feSDimitry Andric numLocations++; 174590d96feSDimitry Andric if (locations.size() >= maxStrings) 175590d96feSDimitry Andric continue; 176590d96feSDimitry Andric 177*bdd1243dSDimitry Andric std::optional<std::pair<StringRef, uint32_t>> fileLine = 1780b57cec5SDimitry Andric getFileLine(sc, r.VirtualAddress); 1790b57cec5SDimitry Andric Symbol *sym = getSymbol(sc, r.VirtualAddress); 18085868e8aSDimitry Andric if (fileLine) 18185868e8aSDimitry Andric locations.push_back({sym, *fileLine}); 18285868e8aSDimitry Andric else if (sym) 18385868e8aSDimitry Andric locations.push_back({sym, {"", 0}}); 1840b57cec5SDimitry Andric } 1850b57cec5SDimitry Andric } 1860b57cec5SDimitry Andric 187590d96feSDimitry Andric if (maxStrings == 0) 188590d96feSDimitry Andric return std::make_pair(std::vector<std::string>(), numLocations); 189590d96feSDimitry Andric 190590d96feSDimitry Andric if (numLocations == 0) 191590d96feSDimitry Andric return std::make_pair( 192590d96feSDimitry Andric std::vector<std::string>{"\n>>> referenced by " + toString(file)}, 1); 1930b57cec5SDimitry Andric 1940b57cec5SDimitry Andric std::vector<std::string> symbolLocations(locations.size()); 1950b57cec5SDimitry Andric size_t i = 0; 1960b57cec5SDimitry Andric for (Location loc : locations) { 1970b57cec5SDimitry Andric llvm::raw_string_ostream os(symbolLocations[i++]); 1980b57cec5SDimitry Andric os << "\n>>> referenced by "; 1990b57cec5SDimitry Andric if (!loc.fileLine.first.empty()) 2000b57cec5SDimitry Andric os << loc.fileLine.first << ":" << loc.fileLine.second 2010b57cec5SDimitry Andric << "\n>>> "; 2020b57cec5SDimitry Andric os << toString(file); 2030b57cec5SDimitry Andric if (loc.sym) 204*bdd1243dSDimitry Andric os << ":(" << toString(file->ctx, *loc.sym) << ')'; 2050b57cec5SDimitry Andric } 206590d96feSDimitry Andric return std::make_pair(symbolLocations, numLocations); 2070b57cec5SDimitry Andric } 2080b57cec5SDimitry Andric 209590d96feSDimitry Andric std::vector<std::string> getSymbolLocations(ObjFile *file, uint32_t symIndex) { 210590d96feSDimitry Andric return getSymbolLocations(file, symIndex, SIZE_MAX).first; 211590d96feSDimitry Andric } 212590d96feSDimitry Andric 213590d96feSDimitry Andric static std::pair<std::vector<std::string>, size_t> 214590d96feSDimitry Andric getSymbolLocations(InputFile *file, uint32_t symIndex, size_t maxStrings) { 21585868e8aSDimitry Andric if (auto *o = dyn_cast<ObjFile>(file)) 216590d96feSDimitry Andric return getSymbolLocations(o, symIndex, maxStrings); 217590d96feSDimitry Andric if (auto *b = dyn_cast<BitcodeFile>(file)) { 218590d96feSDimitry Andric std::vector<std::string> symbolLocations = getSymbolLocations(b); 219590d96feSDimitry Andric size_t numLocations = symbolLocations.size(); 220590d96feSDimitry Andric if (symbolLocations.size() > maxStrings) 221590d96feSDimitry Andric symbolLocations.resize(maxStrings); 222590d96feSDimitry Andric return std::make_pair(symbolLocations, numLocations); 223590d96feSDimitry Andric } 22485868e8aSDimitry Andric llvm_unreachable("unsupported file type passed to getSymbolLocations"); 225590d96feSDimitry Andric return std::make_pair(std::vector<std::string>(), (size_t)0); 22685868e8aSDimitry Andric } 22785868e8aSDimitry Andric 2280b57cec5SDimitry Andric // For an undefined symbol, stores all files referencing it and the index of 2290b57cec5SDimitry Andric // the undefined symbol in each file. 2300b57cec5SDimitry Andric struct UndefinedDiag { 2310b57cec5SDimitry Andric Symbol *sym; 2320b57cec5SDimitry Andric struct File { 23385868e8aSDimitry Andric InputFile *file; 23485868e8aSDimitry Andric uint32_t symIndex; 2350b57cec5SDimitry Andric }; 2360b57cec5SDimitry Andric std::vector<File> files; 2370b57cec5SDimitry Andric }; 2380b57cec5SDimitry Andric 239*bdd1243dSDimitry Andric static void reportUndefinedSymbol(const COFFLinkerContext &ctx, 240*bdd1243dSDimitry Andric const UndefinedDiag &undefDiag) { 2410b57cec5SDimitry Andric std::string out; 2420b57cec5SDimitry Andric llvm::raw_string_ostream os(out); 243*bdd1243dSDimitry Andric os << "undefined symbol: " << toString(ctx, *undefDiag.sym); 2440b57cec5SDimitry Andric 2455ffd83dbSDimitry Andric const size_t maxUndefReferences = 3; 246590d96feSDimitry Andric size_t numDisplayedRefs = 0, numRefs = 0; 2470b57cec5SDimitry Andric for (const UndefinedDiag::File &ref : undefDiag.files) { 248*bdd1243dSDimitry Andric auto [symbolLocations, totalLocations] = getSymbolLocations( 249590d96feSDimitry Andric ref.file, ref.symIndex, maxUndefReferences - numDisplayedRefs); 250590d96feSDimitry Andric 251590d96feSDimitry Andric numRefs += totalLocations; 252590d96feSDimitry Andric numDisplayedRefs += symbolLocations.size(); 2530b57cec5SDimitry Andric for (const std::string &s : symbolLocations) { 2540b57cec5SDimitry Andric os << s; 2550b57cec5SDimitry Andric } 2560b57cec5SDimitry Andric } 257590d96feSDimitry Andric if (numDisplayedRefs < numRefs) 258590d96feSDimitry Andric os << "\n>>> referenced " << numRefs - numDisplayedRefs << " more times"; 259*bdd1243dSDimitry Andric errorOrWarn(os.str(), ctx.config.forceUnresolved); 2600b57cec5SDimitry Andric } 2610b57cec5SDimitry Andric 262fe6060f1SDimitry Andric void SymbolTable::loadMinGWSymbols() { 2630b57cec5SDimitry Andric for (auto &i : symMap) { 2640b57cec5SDimitry Andric Symbol *sym = i.second; 2650b57cec5SDimitry Andric auto *undef = dyn_cast<Undefined>(sym); 2660b57cec5SDimitry Andric if (!undef) 2670b57cec5SDimitry Andric continue; 26885868e8aSDimitry Andric if (undef->getWeakAlias()) 26985868e8aSDimitry Andric continue; 2700b57cec5SDimitry Andric 2710b57cec5SDimitry Andric StringRef name = undef->getName(); 2720b57cec5SDimitry Andric 273*bdd1243dSDimitry Andric if (ctx.config.machine == I386 && ctx.config.stdcallFixup) { 274fe6060f1SDimitry Andric // Check if we can resolve an undefined decorated symbol by finding 275349cc55cSDimitry Andric // the intended target as an undecorated symbol (only with a leading 276fe6060f1SDimitry Andric // underscore). 277fe6060f1SDimitry Andric StringRef origName = name; 278fe6060f1SDimitry Andric StringRef baseName = name; 279fe6060f1SDimitry Andric // Trim down stdcall/fastcall/vectorcall symbols to the base name. 280fe6060f1SDimitry Andric baseName = ltrim1(baseName, "_@"); 281fe6060f1SDimitry Andric baseName = baseName.substr(0, baseName.find('@')); 282fe6060f1SDimitry Andric // Add a leading underscore, as it would be in cdecl form. 283fe6060f1SDimitry Andric std::string newName = ("_" + baseName).str(); 284fe6060f1SDimitry Andric Symbol *l; 285fe6060f1SDimitry Andric if (newName != origName && (l = find(newName)) != nullptr) { 286fe6060f1SDimitry Andric // If we found a symbol and it is lazy; load it. 287fe6060f1SDimitry Andric if (l->isLazy() && !l->pendingArchiveLoad) { 288fe6060f1SDimitry Andric log("Loading lazy " + l->getName() + " from " + 289fe6060f1SDimitry Andric l->getFile()->getName() + " for stdcall fixup"); 290fe6060f1SDimitry Andric forceLazy(l); 291fe6060f1SDimitry Andric } 292fe6060f1SDimitry Andric // If it's lazy or already defined, hook it up as weak alias. 293fe6060f1SDimitry Andric if (l->isLazy() || isa<Defined>(l)) { 294*bdd1243dSDimitry Andric if (ctx.config.warnStdcallFixup) 295fe6060f1SDimitry Andric warn("Resolving " + origName + " by linking to " + newName); 296fe6060f1SDimitry Andric else 297fe6060f1SDimitry Andric log("Resolving " + origName + " by linking to " + newName); 298fe6060f1SDimitry Andric undef->weakAlias = l; 299fe6060f1SDimitry Andric continue; 300fe6060f1SDimitry Andric } 301fe6060f1SDimitry Andric } 302fe6060f1SDimitry Andric } 303fe6060f1SDimitry Andric 304*bdd1243dSDimitry Andric if (ctx.config.autoImport) { 3050b57cec5SDimitry Andric if (name.startswith("__imp_")) 3060b57cec5SDimitry Andric continue; 30785868e8aSDimitry Andric // If we have an undefined symbol, but we have a lazy symbol we could 30885868e8aSDimitry Andric // load, load it. 30985868e8aSDimitry Andric Symbol *l = find(("__imp_" + name).str()); 31085868e8aSDimitry Andric if (!l || l->pendingArchiveLoad || !l->isLazy()) 3110b57cec5SDimitry Andric continue; 3120b57cec5SDimitry Andric 31385868e8aSDimitry Andric log("Loading lazy " + l->getName() + " from " + l->getFile()->getName() + 3140b57cec5SDimitry Andric " for automatic import"); 31585868e8aSDimitry Andric forceLazy(l); 3160b57cec5SDimitry Andric } 3170b57cec5SDimitry Andric } 318fe6060f1SDimitry Andric } 3190b57cec5SDimitry Andric 32085868e8aSDimitry Andric Defined *SymbolTable::impSymbol(StringRef name) { 32185868e8aSDimitry Andric if (name.startswith("__imp_")) 32285868e8aSDimitry Andric return nullptr; 32385868e8aSDimitry Andric return dyn_cast_or_null<Defined>(find(("__imp_" + name).str())); 32485868e8aSDimitry Andric } 32585868e8aSDimitry Andric 3260b57cec5SDimitry Andric bool SymbolTable::handleMinGWAutomaticImport(Symbol *sym, StringRef name) { 32785868e8aSDimitry Andric Defined *imp = impSymbol(name); 3280b57cec5SDimitry Andric if (!imp) 3290b57cec5SDimitry Andric return false; 3300b57cec5SDimitry Andric 3310b57cec5SDimitry Andric // Replace the reference directly to a variable with a reference 3320b57cec5SDimitry Andric // to the import address table instead. This obviously isn't right, 3330b57cec5SDimitry Andric // but we mark the symbol as isRuntimePseudoReloc, and a later pass 3340b57cec5SDimitry Andric // will add runtime pseudo relocations for every relocation against 3350b57cec5SDimitry Andric // this Symbol. The runtime pseudo relocation framework expects the 3360b57cec5SDimitry Andric // reference itself to point at the IAT entry. 3370b57cec5SDimitry Andric size_t impSize = 0; 3380b57cec5SDimitry Andric if (isa<DefinedImportData>(imp)) { 3390b57cec5SDimitry Andric log("Automatically importing " + name + " from " + 3400b57cec5SDimitry Andric cast<DefinedImportData>(imp)->getDLLName()); 3410b57cec5SDimitry Andric impSize = sizeof(DefinedImportData); 3420b57cec5SDimitry Andric } else if (isa<DefinedRegular>(imp)) { 3430b57cec5SDimitry Andric log("Automatically importing " + name + " from " + 3440b57cec5SDimitry Andric toString(cast<DefinedRegular>(imp)->file)); 3450b57cec5SDimitry Andric impSize = sizeof(DefinedRegular); 3460b57cec5SDimitry Andric } else { 3470b57cec5SDimitry Andric warn("unable to automatically import " + name + " from " + imp->getName() + 3480b57cec5SDimitry Andric " from " + toString(cast<DefinedRegular>(imp)->file) + 3490b57cec5SDimitry Andric "; unexpected symbol type"); 3500b57cec5SDimitry Andric return false; 3510b57cec5SDimitry Andric } 3520b57cec5SDimitry Andric sym->replaceKeepingName(imp, impSize); 3530b57cec5SDimitry Andric sym->isRuntimePseudoReloc = true; 3540b57cec5SDimitry Andric 3550b57cec5SDimitry Andric // There may exist symbols named .refptr.<name> which only consist 3560b57cec5SDimitry Andric // of a single pointer to <name>. If it turns out <name> is 3570b57cec5SDimitry Andric // automatically imported, we don't need to keep the .refptr.<name> 3580b57cec5SDimitry Andric // pointer at all, but redirect all accesses to it to the IAT entry 3590b57cec5SDimitry Andric // for __imp_<name> instead, and drop the whole .refptr.<name> chunk. 3600b57cec5SDimitry Andric DefinedRegular *refptr = 3610b57cec5SDimitry Andric dyn_cast_or_null<DefinedRegular>(find((".refptr." + name).str())); 362*bdd1243dSDimitry Andric if (refptr && refptr->getChunk()->getSize() == ctx.config.wordsize) { 3630b57cec5SDimitry Andric SectionChunk *sc = dyn_cast_or_null<SectionChunk>(refptr->getChunk()); 3640b57cec5SDimitry Andric if (sc && sc->getRelocs().size() == 1 && *sc->symbols().begin() == sym) { 3650b57cec5SDimitry Andric log("Replacing .refptr." + name + " with " + imp->getName()); 3660b57cec5SDimitry Andric refptr->getChunk()->live = false; 3670b57cec5SDimitry Andric refptr->replaceKeepingName(imp, impSize); 3680b57cec5SDimitry Andric } 3690b57cec5SDimitry Andric } 3700b57cec5SDimitry Andric return true; 3710b57cec5SDimitry Andric } 3720b57cec5SDimitry Andric 37385868e8aSDimitry Andric /// Helper function for reportUnresolvable and resolveRemainingUndefines. 37485868e8aSDimitry Andric /// This function emits an "undefined symbol" diagnostic for each symbol in 37585868e8aSDimitry Andric /// undefs. If localImports is not nullptr, it also emits a "locally 37685868e8aSDimitry Andric /// defined symbol imported" diagnostic for symbols in localImports. 37785868e8aSDimitry Andric /// objFiles and bitcodeFiles (if not nullptr) are used to report where 37885868e8aSDimitry Andric /// undefined symbols are referenced. 379349cc55cSDimitry Andric static void reportProblemSymbols( 380349cc55cSDimitry Andric const COFFLinkerContext &ctx, const SmallPtrSetImpl<Symbol *> &undefs, 381349cc55cSDimitry Andric const DenseMap<Symbol *, Symbol *> *localImports, bool needBitcodeFiles) { 38285868e8aSDimitry Andric // Return early if there is nothing to report (which should be 38385868e8aSDimitry Andric // the common case). 38485868e8aSDimitry Andric if (undefs.empty() && (!localImports || localImports->empty())) 38585868e8aSDimitry Andric return; 38685868e8aSDimitry Andric 387*bdd1243dSDimitry Andric for (Symbol *b : ctx.config.gcroot) { 38885868e8aSDimitry Andric if (undefs.count(b)) 389*bdd1243dSDimitry Andric errorOrWarn("<root>: undefined symbol: " + toString(ctx, *b), 390*bdd1243dSDimitry Andric ctx.config.forceUnresolved); 39185868e8aSDimitry Andric if (localImports) 39285868e8aSDimitry Andric if (Symbol *imp = localImports->lookup(b)) 393*bdd1243dSDimitry Andric warn("<root>: locally defined symbol imported: " + toString(ctx, *imp) + 39485868e8aSDimitry Andric " (defined in " + toString(imp->getFile()) + ") [LNK4217]"); 39585868e8aSDimitry Andric } 39685868e8aSDimitry Andric 39785868e8aSDimitry Andric std::vector<UndefinedDiag> undefDiags; 39885868e8aSDimitry Andric DenseMap<Symbol *, int> firstDiag; 39985868e8aSDimitry Andric 40085868e8aSDimitry Andric auto processFile = [&](InputFile *file, ArrayRef<Symbol *> symbols) { 40185868e8aSDimitry Andric uint32_t symIndex = (uint32_t)-1; 40285868e8aSDimitry Andric for (Symbol *sym : symbols) { 40385868e8aSDimitry Andric ++symIndex; 40485868e8aSDimitry Andric if (!sym) 40585868e8aSDimitry Andric continue; 40685868e8aSDimitry Andric if (undefs.count(sym)) { 40785868e8aSDimitry Andric auto it = firstDiag.find(sym); 40885868e8aSDimitry Andric if (it == firstDiag.end()) { 40985868e8aSDimitry Andric firstDiag[sym] = undefDiags.size(); 41085868e8aSDimitry Andric undefDiags.push_back({sym, {{file, symIndex}}}); 41185868e8aSDimitry Andric } else { 41285868e8aSDimitry Andric undefDiags[it->second].files.push_back({file, symIndex}); 41385868e8aSDimitry Andric } 41485868e8aSDimitry Andric } 41585868e8aSDimitry Andric if (localImports) 41685868e8aSDimitry Andric if (Symbol *imp = localImports->lookup(sym)) 41785868e8aSDimitry Andric warn(toString(file) + 418*bdd1243dSDimitry Andric ": locally defined symbol imported: " + toString(ctx, *imp) + 41985868e8aSDimitry Andric " (defined in " + toString(imp->getFile()) + ") [LNK4217]"); 42085868e8aSDimitry Andric } 42185868e8aSDimitry Andric }; 42285868e8aSDimitry Andric 423349cc55cSDimitry Andric for (ObjFile *file : ctx.objFileInstances) 42485868e8aSDimitry Andric processFile(file, file->getSymbols()); 42585868e8aSDimitry Andric 426349cc55cSDimitry Andric if (needBitcodeFiles) 427349cc55cSDimitry Andric for (BitcodeFile *file : ctx.bitcodeFileInstances) 42885868e8aSDimitry Andric processFile(file, file->getSymbols()); 42985868e8aSDimitry Andric 43085868e8aSDimitry Andric for (const UndefinedDiag &undefDiag : undefDiags) 431*bdd1243dSDimitry Andric reportUndefinedSymbol(ctx, undefDiag); 43285868e8aSDimitry Andric } 43385868e8aSDimitry Andric 43485868e8aSDimitry Andric void SymbolTable::reportUnresolvable() { 43585868e8aSDimitry Andric SmallPtrSet<Symbol *, 8> undefs; 43685868e8aSDimitry Andric for (auto &i : symMap) { 43785868e8aSDimitry Andric Symbol *sym = i.second; 43885868e8aSDimitry Andric auto *undef = dyn_cast<Undefined>(sym); 439e8d8bef9SDimitry Andric if (!undef || sym->deferUndefined) 44085868e8aSDimitry Andric continue; 44185868e8aSDimitry Andric if (undef->getWeakAlias()) 44285868e8aSDimitry Andric continue; 44385868e8aSDimitry Andric StringRef name = undef->getName(); 44485868e8aSDimitry Andric if (name.startswith("__imp_")) { 44585868e8aSDimitry Andric Symbol *imp = find(name.substr(strlen("__imp_"))); 44685868e8aSDimitry Andric if (imp && isa<Defined>(imp)) 44785868e8aSDimitry Andric continue; 44885868e8aSDimitry Andric } 44985868e8aSDimitry Andric if (name.contains("_PchSym_")) 45085868e8aSDimitry Andric continue; 451*bdd1243dSDimitry Andric if (ctx.config.autoImport && impSymbol(name)) 45285868e8aSDimitry Andric continue; 45385868e8aSDimitry Andric undefs.insert(sym); 45485868e8aSDimitry Andric } 45585868e8aSDimitry Andric 456349cc55cSDimitry Andric reportProblemSymbols(ctx, undefs, 457349cc55cSDimitry Andric /* localImports */ nullptr, true); 45885868e8aSDimitry Andric } 45985868e8aSDimitry Andric 46085868e8aSDimitry Andric void SymbolTable::resolveRemainingUndefines() { 4610b57cec5SDimitry Andric SmallPtrSet<Symbol *, 8> undefs; 4620b57cec5SDimitry Andric DenseMap<Symbol *, Symbol *> localImports; 4630b57cec5SDimitry Andric 4640b57cec5SDimitry Andric for (auto &i : symMap) { 4650b57cec5SDimitry Andric Symbol *sym = i.second; 4660b57cec5SDimitry Andric auto *undef = dyn_cast<Undefined>(sym); 4670b57cec5SDimitry Andric if (!undef) 4680b57cec5SDimitry Andric continue; 4690b57cec5SDimitry Andric if (!sym->isUsedInRegularObj) 4700b57cec5SDimitry Andric continue; 4710b57cec5SDimitry Andric 4720b57cec5SDimitry Andric StringRef name = undef->getName(); 4730b57cec5SDimitry Andric 4740b57cec5SDimitry Andric // A weak alias may have been resolved, so check for that. 4750b57cec5SDimitry Andric if (Defined *d = undef->getWeakAlias()) { 4760b57cec5SDimitry Andric // We want to replace Sym with D. However, we can't just blindly 4770b57cec5SDimitry Andric // copy sizeof(SymbolUnion) bytes from D to Sym because D may be an 4780b57cec5SDimitry Andric // internal symbol, and internal symbols are stored as "unparented" 4790b57cec5SDimitry Andric // Symbols. For that reason we need to check which type of symbol we 4800b57cec5SDimitry Andric // are dealing with and copy the correct number of bytes. 4810b57cec5SDimitry Andric if (isa<DefinedRegular>(d)) 4820b57cec5SDimitry Andric memcpy(sym, d, sizeof(DefinedRegular)); 4830b57cec5SDimitry Andric else if (isa<DefinedAbsolute>(d)) 4840b57cec5SDimitry Andric memcpy(sym, d, sizeof(DefinedAbsolute)); 4850b57cec5SDimitry Andric else 4860b57cec5SDimitry Andric memcpy(sym, d, sizeof(SymbolUnion)); 4870b57cec5SDimitry Andric continue; 4880b57cec5SDimitry Andric } 4890b57cec5SDimitry Andric 4900b57cec5SDimitry Andric // If we can resolve a symbol by removing __imp_ prefix, do that. 4910b57cec5SDimitry Andric // This odd rule is for compatibility with MSVC linker. 4920b57cec5SDimitry Andric if (name.startswith("__imp_")) { 4930b57cec5SDimitry Andric Symbol *imp = find(name.substr(strlen("__imp_"))); 4940b57cec5SDimitry Andric if (imp && isa<Defined>(imp)) { 4950b57cec5SDimitry Andric auto *d = cast<Defined>(imp); 496*bdd1243dSDimitry Andric replaceSymbol<DefinedLocalImport>(sym, ctx, name, d); 4970b57cec5SDimitry Andric localImportChunks.push_back(cast<DefinedLocalImport>(sym)->getChunk()); 4980b57cec5SDimitry Andric localImports[sym] = d; 4990b57cec5SDimitry Andric continue; 5000b57cec5SDimitry Andric } 5010b57cec5SDimitry Andric } 5020b57cec5SDimitry Andric 5030b57cec5SDimitry Andric // We don't want to report missing Microsoft precompiled headers symbols. 5040b57cec5SDimitry Andric // A proper message will be emitted instead in PDBLinker::aquirePrecompObj 5050b57cec5SDimitry Andric if (name.contains("_PchSym_")) 5060b57cec5SDimitry Andric continue; 5070b57cec5SDimitry Andric 508*bdd1243dSDimitry Andric if (ctx.config.autoImport && handleMinGWAutomaticImport(sym, name)) 5090b57cec5SDimitry Andric continue; 5100b57cec5SDimitry Andric 5110b57cec5SDimitry Andric // Remaining undefined symbols are not fatal if /force is specified. 5120b57cec5SDimitry Andric // They are replaced with dummy defined symbols. 513*bdd1243dSDimitry Andric if (ctx.config.forceUnresolved) 514*bdd1243dSDimitry Andric replaceSymbol<DefinedAbsolute>(sym, ctx, name, 0); 5150b57cec5SDimitry Andric undefs.insert(sym); 5160b57cec5SDimitry Andric } 5170b57cec5SDimitry Andric 51885868e8aSDimitry Andric reportProblemSymbols( 519*bdd1243dSDimitry Andric ctx, undefs, 520*bdd1243dSDimitry Andric ctx.config.warnLocallyDefinedImported ? &localImports : nullptr, false); 5210b57cec5SDimitry Andric } 5220b57cec5SDimitry Andric 5230b57cec5SDimitry Andric std::pair<Symbol *, bool> SymbolTable::insert(StringRef name) { 5240b57cec5SDimitry Andric bool inserted = false; 5250b57cec5SDimitry Andric Symbol *&sym = symMap[CachedHashStringRef(name)]; 5260b57cec5SDimitry Andric if (!sym) { 5270b57cec5SDimitry Andric sym = reinterpret_cast<Symbol *>(make<SymbolUnion>()); 5280b57cec5SDimitry Andric sym->isUsedInRegularObj = false; 5290b57cec5SDimitry Andric sym->pendingArchiveLoad = false; 530e8d8bef9SDimitry Andric sym->canInline = true; 5310b57cec5SDimitry Andric inserted = true; 5320b57cec5SDimitry Andric } 5330b57cec5SDimitry Andric return {sym, inserted}; 5340b57cec5SDimitry Andric } 5350b57cec5SDimitry Andric 5360b57cec5SDimitry Andric std::pair<Symbol *, bool> SymbolTable::insert(StringRef name, InputFile *file) { 5370b57cec5SDimitry Andric std::pair<Symbol *, bool> result = insert(name); 5380b57cec5SDimitry Andric if (!file || !isa<BitcodeFile>(file)) 5390b57cec5SDimitry Andric result.first->isUsedInRegularObj = true; 5400b57cec5SDimitry Andric return result; 5410b57cec5SDimitry Andric } 5420b57cec5SDimitry Andric 5430b57cec5SDimitry Andric Symbol *SymbolTable::addUndefined(StringRef name, InputFile *f, 5440b57cec5SDimitry Andric bool isWeakAlias) { 545*bdd1243dSDimitry Andric auto [s, wasInserted] = insert(name, f); 54685868e8aSDimitry Andric if (wasInserted || (s->isLazy() && isWeakAlias)) { 5470b57cec5SDimitry Andric replaceSymbol<Undefined>(s, name); 5480b57cec5SDimitry Andric return s; 5490b57cec5SDimitry Andric } 55085868e8aSDimitry Andric if (s->isLazy()) 55185868e8aSDimitry Andric forceLazy(s); 5520b57cec5SDimitry Andric return s; 5530b57cec5SDimitry Andric } 5540b57cec5SDimitry Andric 55585868e8aSDimitry Andric void SymbolTable::addLazyArchive(ArchiveFile *f, const Archive::Symbol &sym) { 5560b57cec5SDimitry Andric StringRef name = sym.getName(); 557*bdd1243dSDimitry Andric auto [s, wasInserted] = insert(name); 5580b57cec5SDimitry Andric if (wasInserted) { 55985868e8aSDimitry Andric replaceSymbol<LazyArchive>(s, f, sym); 5600b57cec5SDimitry Andric return; 5610b57cec5SDimitry Andric } 5620b57cec5SDimitry Andric auto *u = dyn_cast<Undefined>(s); 5630b57cec5SDimitry Andric if (!u || u->weakAlias || s->pendingArchiveLoad) 5640b57cec5SDimitry Andric return; 5650b57cec5SDimitry Andric s->pendingArchiveLoad = true; 5660b57cec5SDimitry Andric f->addMember(sym); 5670b57cec5SDimitry Andric } 5680b57cec5SDimitry Andric 56904eeddc0SDimitry Andric void SymbolTable::addLazyObject(InputFile *f, StringRef n) { 57004eeddc0SDimitry Andric assert(f->lazy); 571*bdd1243dSDimitry Andric auto [s, wasInserted] = insert(n, f); 57285868e8aSDimitry Andric if (wasInserted) { 57385868e8aSDimitry Andric replaceSymbol<LazyObject>(s, f, n); 57485868e8aSDimitry Andric return; 57585868e8aSDimitry Andric } 57685868e8aSDimitry Andric auto *u = dyn_cast<Undefined>(s); 57785868e8aSDimitry Andric if (!u || u->weakAlias || s->pendingArchiveLoad) 57885868e8aSDimitry Andric return; 57985868e8aSDimitry Andric s->pendingArchiveLoad = true; 58004eeddc0SDimitry Andric f->lazy = false; 58104eeddc0SDimitry Andric addFile(f); 58285868e8aSDimitry Andric } 58385868e8aSDimitry Andric 584fe6060f1SDimitry Andric void SymbolTable::addLazyDLLSymbol(DLLFile *f, DLLFile::Symbol *sym, 585fe6060f1SDimitry Andric StringRef n) { 586*bdd1243dSDimitry Andric auto [s, wasInserted] = insert(n); 587fe6060f1SDimitry Andric if (wasInserted) { 588fe6060f1SDimitry Andric replaceSymbol<LazyDLLSymbol>(s, f, sym, n); 589fe6060f1SDimitry Andric return; 590fe6060f1SDimitry Andric } 591fe6060f1SDimitry Andric auto *u = dyn_cast<Undefined>(s); 592fe6060f1SDimitry Andric if (!u || u->weakAlias || s->pendingArchiveLoad) 593fe6060f1SDimitry Andric return; 594fe6060f1SDimitry Andric s->pendingArchiveLoad = true; 595fe6060f1SDimitry Andric f->makeImport(sym); 596fe6060f1SDimitry Andric } 597fe6060f1SDimitry Andric 59885868e8aSDimitry Andric static std::string getSourceLocationBitcode(BitcodeFile *file) { 59985868e8aSDimitry Andric std::string res("\n>>> defined at "); 60085868e8aSDimitry Andric StringRef source = file->obj->getSourceFileName(); 60185868e8aSDimitry Andric if (!source.empty()) 60285868e8aSDimitry Andric res += source.str() + "\n>>> "; 60385868e8aSDimitry Andric res += toString(file); 60485868e8aSDimitry Andric return res; 60585868e8aSDimitry Andric } 60685868e8aSDimitry Andric 60785868e8aSDimitry Andric static std::string getSourceLocationObj(ObjFile *file, SectionChunk *sc, 60885868e8aSDimitry Andric uint32_t offset, StringRef name) { 609*bdd1243dSDimitry Andric std::optional<std::pair<StringRef, uint32_t>> fileLine; 61085868e8aSDimitry Andric if (sc) 61185868e8aSDimitry Andric fileLine = getFileLine(sc, offset); 61285868e8aSDimitry Andric if (!fileLine) 61385868e8aSDimitry Andric fileLine = file->getVariableLocation(name); 61485868e8aSDimitry Andric 61585868e8aSDimitry Andric std::string res; 61685868e8aSDimitry Andric llvm::raw_string_ostream os(res); 61785868e8aSDimitry Andric os << "\n>>> defined at "; 61885868e8aSDimitry Andric if (fileLine) 61985868e8aSDimitry Andric os << fileLine->first << ":" << fileLine->second << "\n>>> "; 62085868e8aSDimitry Andric os << toString(file); 62185868e8aSDimitry Andric return os.str(); 62285868e8aSDimitry Andric } 62385868e8aSDimitry Andric 62485868e8aSDimitry Andric static std::string getSourceLocation(InputFile *file, SectionChunk *sc, 62585868e8aSDimitry Andric uint32_t offset, StringRef name) { 626480093f4SDimitry Andric if (!file) 627480093f4SDimitry Andric return ""; 62885868e8aSDimitry Andric if (auto *o = dyn_cast<ObjFile>(file)) 62985868e8aSDimitry Andric return getSourceLocationObj(o, sc, offset, name); 63085868e8aSDimitry Andric if (auto *b = dyn_cast<BitcodeFile>(file)) 63185868e8aSDimitry Andric return getSourceLocationBitcode(b); 63285868e8aSDimitry Andric return "\n>>> defined at " + toString(file); 63385868e8aSDimitry Andric } 63485868e8aSDimitry Andric 63585868e8aSDimitry Andric // Construct and print an error message in the form of: 63685868e8aSDimitry Andric // 63785868e8aSDimitry Andric // lld-link: error: duplicate symbol: foo 63885868e8aSDimitry Andric // >>> defined at bar.c:30 63985868e8aSDimitry Andric // >>> bar.o 64085868e8aSDimitry Andric // >>> defined at baz.c:563 64185868e8aSDimitry Andric // >>> baz.o 64285868e8aSDimitry Andric void SymbolTable::reportDuplicate(Symbol *existing, InputFile *newFile, 64385868e8aSDimitry Andric SectionChunk *newSc, 64485868e8aSDimitry Andric uint32_t newSectionOffset) { 64585868e8aSDimitry Andric std::string msg; 64685868e8aSDimitry Andric llvm::raw_string_ostream os(msg); 647*bdd1243dSDimitry Andric os << "duplicate symbol: " << toString(ctx, *existing); 64885868e8aSDimitry Andric 649480093f4SDimitry Andric DefinedRegular *d = dyn_cast<DefinedRegular>(existing); 65085868e8aSDimitry Andric if (d && isa<ObjFile>(d->getFile())) { 65185868e8aSDimitry Andric os << getSourceLocation(d->getFile(), d->getChunk(), d->getValue(), 65285868e8aSDimitry Andric existing->getName()); 65385868e8aSDimitry Andric } else { 65485868e8aSDimitry Andric os << getSourceLocation(existing->getFile(), nullptr, 0, ""); 65585868e8aSDimitry Andric } 65685868e8aSDimitry Andric os << getSourceLocation(newFile, newSc, newSectionOffset, 65785868e8aSDimitry Andric existing->getName()); 6580b57cec5SDimitry Andric 659*bdd1243dSDimitry Andric if (ctx.config.forceMultiple) 66085868e8aSDimitry Andric warn(os.str()); 6610b57cec5SDimitry Andric else 66285868e8aSDimitry Andric error(os.str()); 6630b57cec5SDimitry Andric } 6640b57cec5SDimitry Andric 6650b57cec5SDimitry Andric Symbol *SymbolTable::addAbsolute(StringRef n, COFFSymbolRef sym) { 666*bdd1243dSDimitry Andric auto [s, wasInserted] = insert(n, nullptr); 6670b57cec5SDimitry Andric s->isUsedInRegularObj = true; 66885868e8aSDimitry Andric if (wasInserted || isa<Undefined>(s) || s->isLazy()) 669*bdd1243dSDimitry Andric replaceSymbol<DefinedAbsolute>(s, ctx, n, sym); 670480093f4SDimitry Andric else if (auto *da = dyn_cast<DefinedAbsolute>(s)) { 671480093f4SDimitry Andric if (da->getVA() != sym.getValue()) 672480093f4SDimitry Andric reportDuplicate(s, nullptr); 673480093f4SDimitry Andric } else if (!isa<DefinedCOFF>(s)) 6740b57cec5SDimitry Andric reportDuplicate(s, nullptr); 6750b57cec5SDimitry Andric return s; 6760b57cec5SDimitry Andric } 6770b57cec5SDimitry Andric 6780b57cec5SDimitry Andric Symbol *SymbolTable::addAbsolute(StringRef n, uint64_t va) { 679*bdd1243dSDimitry Andric auto [s, wasInserted] = insert(n, nullptr); 6800b57cec5SDimitry Andric s->isUsedInRegularObj = true; 68185868e8aSDimitry Andric if (wasInserted || isa<Undefined>(s) || s->isLazy()) 682*bdd1243dSDimitry Andric replaceSymbol<DefinedAbsolute>(s, ctx, n, va); 683480093f4SDimitry Andric else if (auto *da = dyn_cast<DefinedAbsolute>(s)) { 684480093f4SDimitry Andric if (da->getVA() != va) 685480093f4SDimitry Andric reportDuplicate(s, nullptr); 686480093f4SDimitry Andric } else if (!isa<DefinedCOFF>(s)) 6870b57cec5SDimitry Andric reportDuplicate(s, nullptr); 6880b57cec5SDimitry Andric return s; 6890b57cec5SDimitry Andric } 6900b57cec5SDimitry Andric 6910b57cec5SDimitry Andric Symbol *SymbolTable::addSynthetic(StringRef n, Chunk *c) { 692*bdd1243dSDimitry Andric auto [s, wasInserted] = insert(n, nullptr); 6930b57cec5SDimitry Andric s->isUsedInRegularObj = true; 69485868e8aSDimitry Andric if (wasInserted || isa<Undefined>(s) || s->isLazy()) 6950b57cec5SDimitry Andric replaceSymbol<DefinedSynthetic>(s, n, c); 6960b57cec5SDimitry Andric else if (!isa<DefinedCOFF>(s)) 6970b57cec5SDimitry Andric reportDuplicate(s, nullptr); 6980b57cec5SDimitry Andric return s; 6990b57cec5SDimitry Andric } 7000b57cec5SDimitry Andric 7010b57cec5SDimitry Andric Symbol *SymbolTable::addRegular(InputFile *f, StringRef n, 70285868e8aSDimitry Andric const coff_symbol_generic *sym, SectionChunk *c, 703*bdd1243dSDimitry Andric uint32_t sectionOffset, bool isWeak) { 704*bdd1243dSDimitry Andric auto [s, wasInserted] = insert(n, f); 705*bdd1243dSDimitry Andric if (wasInserted || !isa<DefinedRegular>(s) || s->isWeak) 7060b57cec5SDimitry Andric replaceSymbol<DefinedRegular>(s, f, n, /*IsCOMDAT*/ false, 707*bdd1243dSDimitry Andric /*IsExternal*/ true, sym, c, isWeak); 708*bdd1243dSDimitry Andric else if (!isWeak) 70985868e8aSDimitry Andric reportDuplicate(s, f, c, sectionOffset); 7100b57cec5SDimitry Andric return s; 7110b57cec5SDimitry Andric } 7120b57cec5SDimitry Andric 7130b57cec5SDimitry Andric std::pair<DefinedRegular *, bool> 7140b57cec5SDimitry Andric SymbolTable::addComdat(InputFile *f, StringRef n, 7150b57cec5SDimitry Andric const coff_symbol_generic *sym) { 716*bdd1243dSDimitry Andric auto [s, wasInserted] = insert(n, f); 7170b57cec5SDimitry Andric if (wasInserted || !isa<DefinedRegular>(s)) { 7180b57cec5SDimitry Andric replaceSymbol<DefinedRegular>(s, f, n, /*IsCOMDAT*/ true, 7190b57cec5SDimitry Andric /*IsExternal*/ true, sym, nullptr); 7200b57cec5SDimitry Andric return {cast<DefinedRegular>(s), true}; 7210b57cec5SDimitry Andric } 7220b57cec5SDimitry Andric auto *existingSymbol = cast<DefinedRegular>(s); 7230b57cec5SDimitry Andric if (!existingSymbol->isCOMDAT) 7240b57cec5SDimitry Andric reportDuplicate(s, f); 7250b57cec5SDimitry Andric return {existingSymbol, false}; 7260b57cec5SDimitry Andric } 7270b57cec5SDimitry Andric 7280b57cec5SDimitry Andric Symbol *SymbolTable::addCommon(InputFile *f, StringRef n, uint64_t size, 7290b57cec5SDimitry Andric const coff_symbol_generic *sym, CommonChunk *c) { 730*bdd1243dSDimitry Andric auto [s, wasInserted] = insert(n, f); 7310b57cec5SDimitry Andric if (wasInserted || !isa<DefinedCOFF>(s)) 7320b57cec5SDimitry Andric replaceSymbol<DefinedCommon>(s, f, n, size, sym, c); 7330b57cec5SDimitry Andric else if (auto *dc = dyn_cast<DefinedCommon>(s)) 7340b57cec5SDimitry Andric if (size > dc->getSize()) 7350b57cec5SDimitry Andric replaceSymbol<DefinedCommon>(s, f, n, size, sym, c); 7360b57cec5SDimitry Andric return s; 7370b57cec5SDimitry Andric } 7380b57cec5SDimitry Andric 7390b57cec5SDimitry Andric Symbol *SymbolTable::addImportData(StringRef n, ImportFile *f) { 740*bdd1243dSDimitry Andric auto [s, wasInserted] = insert(n, nullptr); 7410b57cec5SDimitry Andric s->isUsedInRegularObj = true; 74285868e8aSDimitry Andric if (wasInserted || isa<Undefined>(s) || s->isLazy()) { 7430b57cec5SDimitry Andric replaceSymbol<DefinedImportData>(s, n, f); 7440b57cec5SDimitry Andric return s; 7450b57cec5SDimitry Andric } 7460b57cec5SDimitry Andric 7470b57cec5SDimitry Andric reportDuplicate(s, f); 7480b57cec5SDimitry Andric return nullptr; 7490b57cec5SDimitry Andric } 7500b57cec5SDimitry Andric 7510b57cec5SDimitry Andric Symbol *SymbolTable::addImportThunk(StringRef name, DefinedImportData *id, 7520b57cec5SDimitry Andric uint16_t machine) { 753*bdd1243dSDimitry Andric auto [s, wasInserted] = insert(name, nullptr); 7540b57cec5SDimitry Andric s->isUsedInRegularObj = true; 75585868e8aSDimitry Andric if (wasInserted || isa<Undefined>(s) || s->isLazy()) { 756*bdd1243dSDimitry Andric replaceSymbol<DefinedImportThunk>(s, ctx, name, id, machine); 7570b57cec5SDimitry Andric return s; 7580b57cec5SDimitry Andric } 7590b57cec5SDimitry Andric 7600b57cec5SDimitry Andric reportDuplicate(s, id->file); 7610b57cec5SDimitry Andric return nullptr; 7620b57cec5SDimitry Andric } 7630b57cec5SDimitry Andric 7640b57cec5SDimitry Andric void SymbolTable::addLibcall(StringRef name) { 7650b57cec5SDimitry Andric Symbol *sym = findUnderscore(name); 7660b57cec5SDimitry Andric if (!sym) 7670b57cec5SDimitry Andric return; 7680b57cec5SDimitry Andric 76985868e8aSDimitry Andric if (auto *l = dyn_cast<LazyArchive>(sym)) { 7700b57cec5SDimitry Andric MemoryBufferRef mb = l->getMemberBuffer(); 77185868e8aSDimitry Andric if (isBitcode(mb)) 77285868e8aSDimitry Andric addUndefined(sym->getName()); 77385868e8aSDimitry Andric } else if (LazyObject *o = dyn_cast<LazyObject>(sym)) { 77485868e8aSDimitry Andric if (isBitcode(o->file->mb)) 7750b57cec5SDimitry Andric addUndefined(sym->getName()); 7760b57cec5SDimitry Andric } 7770b57cec5SDimitry Andric } 7780b57cec5SDimitry Andric 779349cc55cSDimitry Andric std::vector<Chunk *> SymbolTable::getChunks() const { 7800b57cec5SDimitry Andric std::vector<Chunk *> res; 781349cc55cSDimitry Andric for (ObjFile *file : ctx.objFileInstances) { 7820b57cec5SDimitry Andric ArrayRef<Chunk *> v = file->getChunks(); 7830b57cec5SDimitry Andric res.insert(res.end(), v.begin(), v.end()); 7840b57cec5SDimitry Andric } 7850b57cec5SDimitry Andric return res; 7860b57cec5SDimitry Andric } 7870b57cec5SDimitry Andric 788349cc55cSDimitry Andric Symbol *SymbolTable::find(StringRef name) const { 7890b57cec5SDimitry Andric return symMap.lookup(CachedHashStringRef(name)); 7900b57cec5SDimitry Andric } 7910b57cec5SDimitry Andric 792349cc55cSDimitry Andric Symbol *SymbolTable::findUnderscore(StringRef name) const { 793*bdd1243dSDimitry Andric if (ctx.config.machine == I386) 7940b57cec5SDimitry Andric return find(("_" + name).str()); 7950b57cec5SDimitry Andric return find(name); 7960b57cec5SDimitry Andric } 7970b57cec5SDimitry Andric 7980b57cec5SDimitry Andric // Return all symbols that start with Prefix, possibly ignoring the first 7990b57cec5SDimitry Andric // character of Prefix or the first character symbol. 8000b57cec5SDimitry Andric std::vector<Symbol *> SymbolTable::getSymsWithPrefix(StringRef prefix) { 8010b57cec5SDimitry Andric std::vector<Symbol *> syms; 8020b57cec5SDimitry Andric for (auto pair : symMap) { 8030b57cec5SDimitry Andric StringRef name = pair.first.val(); 8040b57cec5SDimitry Andric if (name.startswith(prefix) || name.startswith(prefix.drop_front()) || 8050b57cec5SDimitry Andric name.drop_front().startswith(prefix) || 8060b57cec5SDimitry Andric name.drop_front().startswith(prefix.drop_front())) { 8070b57cec5SDimitry Andric syms.push_back(pair.second); 8080b57cec5SDimitry Andric } 8090b57cec5SDimitry Andric } 8100b57cec5SDimitry Andric return syms; 8110b57cec5SDimitry Andric } 8120b57cec5SDimitry Andric 8130b57cec5SDimitry Andric Symbol *SymbolTable::findMangle(StringRef name) { 814*bdd1243dSDimitry Andric if (Symbol *sym = find(name)) { 815*bdd1243dSDimitry Andric if (auto *u = dyn_cast<Undefined>(sym)) { 816*bdd1243dSDimitry Andric // We're specifically looking for weak aliases that ultimately resolve to 817*bdd1243dSDimitry Andric // defined symbols, hence the call to getWeakAlias() instead of just using 818*bdd1243dSDimitry Andric // the weakAlias member variable. This matches link.exe's behavior. 819*bdd1243dSDimitry Andric if (Symbol *weakAlias = u->getWeakAlias()) 820*bdd1243dSDimitry Andric return weakAlias; 821*bdd1243dSDimitry Andric } else { 8220b57cec5SDimitry Andric return sym; 823*bdd1243dSDimitry Andric } 824*bdd1243dSDimitry Andric } 8250b57cec5SDimitry Andric 8260b57cec5SDimitry Andric // Efficient fuzzy string lookup is impossible with a hash table, so iterate 8270b57cec5SDimitry Andric // the symbol table once and collect all possibly matching symbols into this 8280b57cec5SDimitry Andric // vector. Then compare each possibly matching symbol with each possible 8290b57cec5SDimitry Andric // mangling. 8300b57cec5SDimitry Andric std::vector<Symbol *> syms = getSymsWithPrefix(name); 8310b57cec5SDimitry Andric auto findByPrefix = [&syms](const Twine &t) -> Symbol * { 8320b57cec5SDimitry Andric std::string prefix = t.str(); 8330b57cec5SDimitry Andric for (auto *s : syms) 8340b57cec5SDimitry Andric if (s->getName().startswith(prefix)) 8350b57cec5SDimitry Andric return s; 8360b57cec5SDimitry Andric return nullptr; 8370b57cec5SDimitry Andric }; 8380b57cec5SDimitry Andric 8390b57cec5SDimitry Andric // For non-x86, just look for C++ functions. 840*bdd1243dSDimitry Andric if (ctx.config.machine != I386) 8410b57cec5SDimitry Andric return findByPrefix("?" + name + "@@Y"); 8420b57cec5SDimitry Andric 8430b57cec5SDimitry Andric if (!name.startswith("_")) 8440b57cec5SDimitry Andric return nullptr; 8450b57cec5SDimitry Andric // Search for x86 stdcall function. 8460b57cec5SDimitry Andric if (Symbol *s = findByPrefix(name + "@")) 8470b57cec5SDimitry Andric return s; 8480b57cec5SDimitry Andric // Search for x86 fastcall function. 8490b57cec5SDimitry Andric if (Symbol *s = findByPrefix("@" + name.substr(1) + "@")) 8500b57cec5SDimitry Andric return s; 8510b57cec5SDimitry Andric // Search for x86 vectorcall function. 8520b57cec5SDimitry Andric if (Symbol *s = findByPrefix(name.substr(1) + "@@")) 8530b57cec5SDimitry Andric return s; 8540b57cec5SDimitry Andric // Search for x86 C++ non-member function. 8550b57cec5SDimitry Andric return findByPrefix("?" + name.substr(1) + "@@Y"); 8560b57cec5SDimitry Andric } 8570b57cec5SDimitry Andric 8580b57cec5SDimitry Andric Symbol *SymbolTable::addUndefined(StringRef name) { 8590b57cec5SDimitry Andric return addUndefined(name, nullptr, false); 8600b57cec5SDimitry Andric } 8610b57cec5SDimitry Andric 862349cc55cSDimitry Andric void SymbolTable::compileBitcodeFiles() { 863349cc55cSDimitry Andric if (ctx.bitcodeFileInstances.empty()) 8640b57cec5SDimitry Andric return; 8650b57cec5SDimitry Andric 866349cc55cSDimitry Andric ScopedTimer t(ctx.ltoTimer); 867*bdd1243dSDimitry Andric lto.reset(new BitcodeCompiler(ctx)); 868349cc55cSDimitry Andric for (BitcodeFile *f : ctx.bitcodeFileInstances) 8695ffd83dbSDimitry Andric lto->add(*f); 870*bdd1243dSDimitry Andric for (InputFile *newObj : lto->compile()) { 8715ffd83dbSDimitry Andric ObjFile *obj = cast<ObjFile>(newObj); 8720b57cec5SDimitry Andric obj->parse(); 873349cc55cSDimitry Andric ctx.objFileInstances.push_back(obj); 8740b57cec5SDimitry Andric } 8750b57cec5SDimitry Andric } 8760b57cec5SDimitry Andric 877*bdd1243dSDimitry Andric } // namespace lld::coff 878