10b57cec5SDimitry Andric //===- SymbolTable.cpp ----------------------------------------------------===// 20b57cec5SDimitry Andric // 30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 60b57cec5SDimitry Andric // 70b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 80b57cec5SDimitry Andric 90b57cec5SDimitry Andric #include "SymbolTable.h" 10349cc55cSDimitry Andric #include "COFFLinkerContext.h" 110b57cec5SDimitry Andric #include "Config.h" 120b57cec5SDimitry Andric #include "Driver.h" 130b57cec5SDimitry Andric #include "LTO.h" 140b57cec5SDimitry Andric #include "PDB.h" 150b57cec5SDimitry Andric #include "Symbols.h" 160b57cec5SDimitry Andric #include "lld/Common/ErrorHandler.h" 170b57cec5SDimitry Andric #include "lld/Common/Memory.h" 180b57cec5SDimitry Andric #include "lld/Common/Timer.h" 190eae32dcSDimitry Andric #include "llvm/DebugInfo/DIContext.h" 200b57cec5SDimitry Andric #include "llvm/IR/LLVMContext.h" 21480093f4SDimitry Andric #include "llvm/LTO/LTO.h" 220b57cec5SDimitry Andric #include "llvm/Object/WindowsMachineFlag.h" 230b57cec5SDimitry Andric #include "llvm/Support/Debug.h" 240b57cec5SDimitry Andric #include "llvm/Support/raw_ostream.h" 250b57cec5SDimitry Andric #include <utility> 260b57cec5SDimitry Andric 270b57cec5SDimitry Andric using namespace llvm; 280b57cec5SDimitry Andric 290b57cec5SDimitry Andric namespace lld { 300b57cec5SDimitry Andric namespace coff { 310b57cec5SDimitry Andric 32fe6060f1SDimitry Andric StringRef ltrim1(StringRef s, const char *chars) { 33fe6060f1SDimitry Andric if (!s.empty() && strchr(chars, s[0])) 34fe6060f1SDimitry Andric return s.substr(1); 35fe6060f1SDimitry Andric return s; 36fe6060f1SDimitry Andric } 37fe6060f1SDimitry Andric 380b57cec5SDimitry Andric void SymbolTable::addFile(InputFile *file) { 390b57cec5SDimitry Andric log("Reading " + toString(file)); 40*04eeddc0SDimitry Andric if (file->lazy) { 41*04eeddc0SDimitry Andric if (auto *f = dyn_cast<BitcodeFile>(file)) 42*04eeddc0SDimitry Andric f->parseLazy(); 43*04eeddc0SDimitry Andric else 44*04eeddc0SDimitry Andric cast<ObjFile>(file)->parseLazy(); 45*04eeddc0SDimitry Andric } else { 460b57cec5SDimitry Andric file->parse(); 47*04eeddc0SDimitry Andric if (auto *f = dyn_cast<ObjFile>(file)) { 48*04eeddc0SDimitry Andric ctx.objFileInstances.push_back(f); 49*04eeddc0SDimitry Andric } else if (auto *f = dyn_cast<BitcodeFile>(file)) { 50*04eeddc0SDimitry Andric ctx.bitcodeFileInstances.push_back(f); 51*04eeddc0SDimitry Andric } else if (auto *f = dyn_cast<ImportFile>(file)) { 52*04eeddc0SDimitry Andric ctx.importFileInstances.push_back(f); 53*04eeddc0SDimitry Andric } 54*04eeddc0SDimitry Andric } 550b57cec5SDimitry Andric 560b57cec5SDimitry Andric MachineTypes mt = file->getMachineType(); 570b57cec5SDimitry Andric if (config->machine == IMAGE_FILE_MACHINE_UNKNOWN) { 580b57cec5SDimitry Andric config->machine = mt; 590b57cec5SDimitry Andric } else if (mt != IMAGE_FILE_MACHINE_UNKNOWN && config->machine != mt) { 600b57cec5SDimitry Andric error(toString(file) + ": machine type " + machineToStr(mt) + 610b57cec5SDimitry Andric " conflicts with " + machineToStr(config->machine)); 620b57cec5SDimitry Andric return; 630b57cec5SDimitry Andric } 640b57cec5SDimitry Andric 650b57cec5SDimitry Andric driver->parseDirectives(file); 660b57cec5SDimitry Andric } 670b57cec5SDimitry Andric 680b57cec5SDimitry Andric static void errorOrWarn(const Twine &s) { 690b57cec5SDimitry Andric if (config->forceUnresolved) 700b57cec5SDimitry Andric warn(s); 710b57cec5SDimitry Andric else 720b57cec5SDimitry Andric error(s); 730b57cec5SDimitry Andric } 740b57cec5SDimitry Andric 7585868e8aSDimitry Andric // Causes the file associated with a lazy symbol to be linked in. 7685868e8aSDimitry Andric static void forceLazy(Symbol *s) { 7785868e8aSDimitry Andric s->pendingArchiveLoad = true; 7885868e8aSDimitry Andric switch (s->kind()) { 7985868e8aSDimitry Andric case Symbol::Kind::LazyArchiveKind: { 8085868e8aSDimitry Andric auto *l = cast<LazyArchive>(s); 8185868e8aSDimitry Andric l->file->addMember(l->sym); 8285868e8aSDimitry Andric break; 8385868e8aSDimitry Andric } 84*04eeddc0SDimitry Andric case Symbol::Kind::LazyObjectKind: { 85*04eeddc0SDimitry Andric InputFile *file = cast<LazyObject>(s)->file; 86*04eeddc0SDimitry Andric file->ctx.symtab.addFile(file); 8785868e8aSDimitry Andric break; 88*04eeddc0SDimitry Andric } 89fe6060f1SDimitry Andric case Symbol::Kind::LazyDLLSymbolKind: { 90fe6060f1SDimitry Andric auto *l = cast<LazyDLLSymbol>(s); 91fe6060f1SDimitry Andric l->file->makeImport(l->sym); 92fe6060f1SDimitry Andric break; 93fe6060f1SDimitry Andric } 9485868e8aSDimitry Andric default: 9585868e8aSDimitry Andric llvm_unreachable( 9685868e8aSDimitry Andric "symbol passed to forceLazy is not a LazyArchive or LazyObject"); 9785868e8aSDimitry Andric } 9885868e8aSDimitry Andric } 9985868e8aSDimitry Andric 1000b57cec5SDimitry Andric // Returns the symbol in SC whose value is <= Addr that is closest to Addr. 1010b57cec5SDimitry Andric // This is generally the global variable or function whose definition contains 1020b57cec5SDimitry Andric // Addr. 1030b57cec5SDimitry Andric static Symbol *getSymbol(SectionChunk *sc, uint32_t addr) { 1040b57cec5SDimitry Andric DefinedRegular *candidate = nullptr; 1050b57cec5SDimitry Andric 1060b57cec5SDimitry Andric for (Symbol *s : sc->file->getSymbols()) { 1070b57cec5SDimitry Andric auto *d = dyn_cast_or_null<DefinedRegular>(s); 10885868e8aSDimitry Andric if (!d || !d->data || d->file != sc->file || d->getChunk() != sc || 10985868e8aSDimitry Andric d->getValue() > addr || 1100b57cec5SDimitry Andric (candidate && d->getValue() < candidate->getValue())) 1110b57cec5SDimitry Andric continue; 1120b57cec5SDimitry Andric 1130b57cec5SDimitry Andric candidate = d; 1140b57cec5SDimitry Andric } 1150b57cec5SDimitry Andric 1160b57cec5SDimitry Andric return candidate; 1170b57cec5SDimitry Andric } 1180b57cec5SDimitry Andric 11985868e8aSDimitry Andric static std::vector<std::string> getSymbolLocations(BitcodeFile *file) { 12085868e8aSDimitry Andric std::string res("\n>>> referenced by "); 12185868e8aSDimitry Andric StringRef source = file->obj->getSourceFileName(); 12285868e8aSDimitry Andric if (!source.empty()) 12385868e8aSDimitry Andric res += source.str() + "\n>>> "; 12485868e8aSDimitry Andric res += toString(file); 12585868e8aSDimitry Andric return {res}; 12685868e8aSDimitry Andric } 12785868e8aSDimitry Andric 12885868e8aSDimitry Andric static Optional<std::pair<StringRef, uint32_t>> 12985868e8aSDimitry Andric getFileLineDwarf(const SectionChunk *c, uint32_t addr) { 13085868e8aSDimitry Andric Optional<DILineInfo> optionalLineInfo = 13185868e8aSDimitry Andric c->file->getDILineInfo(addr, c->getSectionNumber() - 1); 13285868e8aSDimitry Andric if (!optionalLineInfo) 13385868e8aSDimitry Andric return None; 13485868e8aSDimitry Andric const DILineInfo &lineInfo = *optionalLineInfo; 13585868e8aSDimitry Andric if (lineInfo.FileName == DILineInfo::BadString) 13685868e8aSDimitry Andric return None; 137*04eeddc0SDimitry Andric return std::make_pair(saver().save(lineInfo.FileName), lineInfo.Line); 13885868e8aSDimitry Andric } 13985868e8aSDimitry Andric 14085868e8aSDimitry Andric static Optional<std::pair<StringRef, uint32_t>> 14185868e8aSDimitry Andric getFileLine(const SectionChunk *c, uint32_t addr) { 14285868e8aSDimitry Andric // MinGW can optionally use codeview, even if the default is dwarf. 14385868e8aSDimitry Andric Optional<std::pair<StringRef, uint32_t>> fileLine = 14485868e8aSDimitry Andric getFileLineCodeView(c, addr); 14585868e8aSDimitry Andric // If codeview didn't yield any result, check dwarf in MinGW mode. 14685868e8aSDimitry Andric if (!fileLine && config->mingw) 14785868e8aSDimitry Andric fileLine = getFileLineDwarf(c, addr); 14885868e8aSDimitry Andric return fileLine; 14985868e8aSDimitry Andric } 15085868e8aSDimitry Andric 1510b57cec5SDimitry Andric // Given a file and the index of a symbol in that file, returns a description 1520b57cec5SDimitry Andric // of all references to that symbol from that file. If no debug information is 1530b57cec5SDimitry Andric // available, returns just the name of the file, else one string per actual 1540b57cec5SDimitry Andric // reference as described in the debug info. 155590d96feSDimitry Andric // Returns up to maxStrings string descriptions, along with the total number of 156590d96feSDimitry Andric // locations found. 157590d96feSDimitry Andric static std::pair<std::vector<std::string>, size_t> 158590d96feSDimitry Andric getSymbolLocations(ObjFile *file, uint32_t symIndex, size_t maxStrings) { 1590b57cec5SDimitry Andric struct Location { 1600b57cec5SDimitry Andric Symbol *sym; 1610b57cec5SDimitry Andric std::pair<StringRef, uint32_t> fileLine; 1620b57cec5SDimitry Andric }; 1630b57cec5SDimitry Andric std::vector<Location> locations; 164590d96feSDimitry Andric size_t numLocations = 0; 1650b57cec5SDimitry Andric 1660b57cec5SDimitry Andric for (Chunk *c : file->getChunks()) { 1670b57cec5SDimitry Andric auto *sc = dyn_cast<SectionChunk>(c); 1680b57cec5SDimitry Andric if (!sc) 1690b57cec5SDimitry Andric continue; 1700b57cec5SDimitry Andric for (const coff_relocation &r : sc->getRelocs()) { 1710b57cec5SDimitry Andric if (r.SymbolTableIndex != symIndex) 1720b57cec5SDimitry Andric continue; 173590d96feSDimitry Andric numLocations++; 174590d96feSDimitry Andric if (locations.size() >= maxStrings) 175590d96feSDimitry Andric continue; 176590d96feSDimitry Andric 17785868e8aSDimitry Andric Optional<std::pair<StringRef, uint32_t>> fileLine = 1780b57cec5SDimitry Andric getFileLine(sc, r.VirtualAddress); 1790b57cec5SDimitry Andric Symbol *sym = getSymbol(sc, r.VirtualAddress); 18085868e8aSDimitry Andric if (fileLine) 18185868e8aSDimitry Andric locations.push_back({sym, *fileLine}); 18285868e8aSDimitry Andric else if (sym) 18385868e8aSDimitry Andric locations.push_back({sym, {"", 0}}); 1840b57cec5SDimitry Andric } 1850b57cec5SDimitry Andric } 1860b57cec5SDimitry Andric 187590d96feSDimitry Andric if (maxStrings == 0) 188590d96feSDimitry Andric return std::make_pair(std::vector<std::string>(), numLocations); 189590d96feSDimitry Andric 190590d96feSDimitry Andric if (numLocations == 0) 191590d96feSDimitry Andric return std::make_pair( 192590d96feSDimitry Andric std::vector<std::string>{"\n>>> referenced by " + toString(file)}, 1); 1930b57cec5SDimitry Andric 1940b57cec5SDimitry Andric std::vector<std::string> symbolLocations(locations.size()); 1950b57cec5SDimitry Andric size_t i = 0; 1960b57cec5SDimitry Andric for (Location loc : locations) { 1970b57cec5SDimitry Andric llvm::raw_string_ostream os(symbolLocations[i++]); 1980b57cec5SDimitry Andric os << "\n>>> referenced by "; 1990b57cec5SDimitry Andric if (!loc.fileLine.first.empty()) 2000b57cec5SDimitry Andric os << loc.fileLine.first << ":" << loc.fileLine.second 2010b57cec5SDimitry Andric << "\n>>> "; 2020b57cec5SDimitry Andric os << toString(file); 2030b57cec5SDimitry Andric if (loc.sym) 2040b57cec5SDimitry Andric os << ":(" << toString(*loc.sym) << ')'; 2050b57cec5SDimitry Andric } 206590d96feSDimitry Andric return std::make_pair(symbolLocations, numLocations); 2070b57cec5SDimitry Andric } 2080b57cec5SDimitry Andric 209590d96feSDimitry Andric std::vector<std::string> getSymbolLocations(ObjFile *file, uint32_t symIndex) { 210590d96feSDimitry Andric return getSymbolLocations(file, symIndex, SIZE_MAX).first; 211590d96feSDimitry Andric } 212590d96feSDimitry Andric 213590d96feSDimitry Andric static std::pair<std::vector<std::string>, size_t> 214590d96feSDimitry Andric getSymbolLocations(InputFile *file, uint32_t symIndex, size_t maxStrings) { 21585868e8aSDimitry Andric if (auto *o = dyn_cast<ObjFile>(file)) 216590d96feSDimitry Andric return getSymbolLocations(o, symIndex, maxStrings); 217590d96feSDimitry Andric if (auto *b = dyn_cast<BitcodeFile>(file)) { 218590d96feSDimitry Andric std::vector<std::string> symbolLocations = getSymbolLocations(b); 219590d96feSDimitry Andric size_t numLocations = symbolLocations.size(); 220590d96feSDimitry Andric if (symbolLocations.size() > maxStrings) 221590d96feSDimitry Andric symbolLocations.resize(maxStrings); 222590d96feSDimitry Andric return std::make_pair(symbolLocations, numLocations); 223590d96feSDimitry Andric } 22485868e8aSDimitry Andric llvm_unreachable("unsupported file type passed to getSymbolLocations"); 225590d96feSDimitry Andric return std::make_pair(std::vector<std::string>(), (size_t)0); 22685868e8aSDimitry Andric } 22785868e8aSDimitry Andric 2280b57cec5SDimitry Andric // For an undefined symbol, stores all files referencing it and the index of 2290b57cec5SDimitry Andric // the undefined symbol in each file. 2300b57cec5SDimitry Andric struct UndefinedDiag { 2310b57cec5SDimitry Andric Symbol *sym; 2320b57cec5SDimitry Andric struct File { 23385868e8aSDimitry Andric InputFile *file; 23485868e8aSDimitry Andric uint32_t symIndex; 2350b57cec5SDimitry Andric }; 2360b57cec5SDimitry Andric std::vector<File> files; 2370b57cec5SDimitry Andric }; 2380b57cec5SDimitry Andric 2390b57cec5SDimitry Andric static void reportUndefinedSymbol(const UndefinedDiag &undefDiag) { 2400b57cec5SDimitry Andric std::string out; 2410b57cec5SDimitry Andric llvm::raw_string_ostream os(out); 2420b57cec5SDimitry Andric os << "undefined symbol: " << toString(*undefDiag.sym); 2430b57cec5SDimitry Andric 2445ffd83dbSDimitry Andric const size_t maxUndefReferences = 3; 245590d96feSDimitry Andric size_t numDisplayedRefs = 0, numRefs = 0; 2460b57cec5SDimitry Andric for (const UndefinedDiag::File &ref : undefDiag.files) { 247590d96feSDimitry Andric std::vector<std::string> symbolLocations; 248590d96feSDimitry Andric size_t totalLocations = 0; 249590d96feSDimitry Andric std::tie(symbolLocations, totalLocations) = getSymbolLocations( 250590d96feSDimitry Andric ref.file, ref.symIndex, maxUndefReferences - numDisplayedRefs); 251590d96feSDimitry Andric 252590d96feSDimitry Andric numRefs += totalLocations; 253590d96feSDimitry Andric numDisplayedRefs += symbolLocations.size(); 2540b57cec5SDimitry Andric for (const std::string &s : symbolLocations) { 2550b57cec5SDimitry Andric os << s; 2560b57cec5SDimitry Andric } 2570b57cec5SDimitry Andric } 258590d96feSDimitry Andric if (numDisplayedRefs < numRefs) 259590d96feSDimitry Andric os << "\n>>> referenced " << numRefs - numDisplayedRefs << " more times"; 2600b57cec5SDimitry Andric errorOrWarn(os.str()); 2610b57cec5SDimitry Andric } 2620b57cec5SDimitry Andric 263fe6060f1SDimitry Andric void SymbolTable::loadMinGWSymbols() { 2640b57cec5SDimitry Andric for (auto &i : symMap) { 2650b57cec5SDimitry Andric Symbol *sym = i.second; 2660b57cec5SDimitry Andric auto *undef = dyn_cast<Undefined>(sym); 2670b57cec5SDimitry Andric if (!undef) 2680b57cec5SDimitry Andric continue; 26985868e8aSDimitry Andric if (undef->getWeakAlias()) 27085868e8aSDimitry Andric continue; 2710b57cec5SDimitry Andric 2720b57cec5SDimitry Andric StringRef name = undef->getName(); 2730b57cec5SDimitry Andric 274fe6060f1SDimitry Andric if (config->machine == I386 && config->stdcallFixup) { 275fe6060f1SDimitry Andric // Check if we can resolve an undefined decorated symbol by finding 276349cc55cSDimitry Andric // the intended target as an undecorated symbol (only with a leading 277fe6060f1SDimitry Andric // underscore). 278fe6060f1SDimitry Andric StringRef origName = name; 279fe6060f1SDimitry Andric StringRef baseName = name; 280fe6060f1SDimitry Andric // Trim down stdcall/fastcall/vectorcall symbols to the base name. 281fe6060f1SDimitry Andric baseName = ltrim1(baseName, "_@"); 282fe6060f1SDimitry Andric baseName = baseName.substr(0, baseName.find('@')); 283fe6060f1SDimitry Andric // Add a leading underscore, as it would be in cdecl form. 284fe6060f1SDimitry Andric std::string newName = ("_" + baseName).str(); 285fe6060f1SDimitry Andric Symbol *l; 286fe6060f1SDimitry Andric if (newName != origName && (l = find(newName)) != nullptr) { 287fe6060f1SDimitry Andric // If we found a symbol and it is lazy; load it. 288fe6060f1SDimitry Andric if (l->isLazy() && !l->pendingArchiveLoad) { 289fe6060f1SDimitry Andric log("Loading lazy " + l->getName() + " from " + 290fe6060f1SDimitry Andric l->getFile()->getName() + " for stdcall fixup"); 291fe6060f1SDimitry Andric forceLazy(l); 292fe6060f1SDimitry Andric } 293fe6060f1SDimitry Andric // If it's lazy or already defined, hook it up as weak alias. 294fe6060f1SDimitry Andric if (l->isLazy() || isa<Defined>(l)) { 295fe6060f1SDimitry Andric if (config->warnStdcallFixup) 296fe6060f1SDimitry Andric warn("Resolving " + origName + " by linking to " + newName); 297fe6060f1SDimitry Andric else 298fe6060f1SDimitry Andric log("Resolving " + origName + " by linking to " + newName); 299fe6060f1SDimitry Andric undef->weakAlias = l; 300fe6060f1SDimitry Andric continue; 301fe6060f1SDimitry Andric } 302fe6060f1SDimitry Andric } 303fe6060f1SDimitry Andric } 304fe6060f1SDimitry Andric 305fe6060f1SDimitry Andric if (config->autoImport) { 3060b57cec5SDimitry Andric if (name.startswith("__imp_")) 3070b57cec5SDimitry Andric continue; 30885868e8aSDimitry Andric // If we have an undefined symbol, but we have a lazy symbol we could 30985868e8aSDimitry Andric // load, load it. 31085868e8aSDimitry Andric Symbol *l = find(("__imp_" + name).str()); 31185868e8aSDimitry Andric if (!l || l->pendingArchiveLoad || !l->isLazy()) 3120b57cec5SDimitry Andric continue; 3130b57cec5SDimitry Andric 31485868e8aSDimitry Andric log("Loading lazy " + l->getName() + " from " + l->getFile()->getName() + 3150b57cec5SDimitry Andric " for automatic import"); 31685868e8aSDimitry Andric forceLazy(l); 3170b57cec5SDimitry Andric } 3180b57cec5SDimitry Andric } 319fe6060f1SDimitry Andric } 3200b57cec5SDimitry Andric 32185868e8aSDimitry Andric Defined *SymbolTable::impSymbol(StringRef name) { 32285868e8aSDimitry Andric if (name.startswith("__imp_")) 32385868e8aSDimitry Andric return nullptr; 32485868e8aSDimitry Andric return dyn_cast_or_null<Defined>(find(("__imp_" + name).str())); 32585868e8aSDimitry Andric } 32685868e8aSDimitry Andric 3270b57cec5SDimitry Andric bool SymbolTable::handleMinGWAutomaticImport(Symbol *sym, StringRef name) { 32885868e8aSDimitry Andric Defined *imp = impSymbol(name); 3290b57cec5SDimitry Andric if (!imp) 3300b57cec5SDimitry Andric return false; 3310b57cec5SDimitry Andric 3320b57cec5SDimitry Andric // Replace the reference directly to a variable with a reference 3330b57cec5SDimitry Andric // to the import address table instead. This obviously isn't right, 3340b57cec5SDimitry Andric // but we mark the symbol as isRuntimePseudoReloc, and a later pass 3350b57cec5SDimitry Andric // will add runtime pseudo relocations for every relocation against 3360b57cec5SDimitry Andric // this Symbol. The runtime pseudo relocation framework expects the 3370b57cec5SDimitry Andric // reference itself to point at the IAT entry. 3380b57cec5SDimitry Andric size_t impSize = 0; 3390b57cec5SDimitry Andric if (isa<DefinedImportData>(imp)) { 3400b57cec5SDimitry Andric log("Automatically importing " + name + " from " + 3410b57cec5SDimitry Andric cast<DefinedImportData>(imp)->getDLLName()); 3420b57cec5SDimitry Andric impSize = sizeof(DefinedImportData); 3430b57cec5SDimitry Andric } else if (isa<DefinedRegular>(imp)) { 3440b57cec5SDimitry Andric log("Automatically importing " + name + " from " + 3450b57cec5SDimitry Andric toString(cast<DefinedRegular>(imp)->file)); 3460b57cec5SDimitry Andric impSize = sizeof(DefinedRegular); 3470b57cec5SDimitry Andric } else { 3480b57cec5SDimitry Andric warn("unable to automatically import " + name + " from " + imp->getName() + 3490b57cec5SDimitry Andric " from " + toString(cast<DefinedRegular>(imp)->file) + 3500b57cec5SDimitry Andric "; unexpected symbol type"); 3510b57cec5SDimitry Andric return false; 3520b57cec5SDimitry Andric } 3530b57cec5SDimitry Andric sym->replaceKeepingName(imp, impSize); 3540b57cec5SDimitry Andric sym->isRuntimePseudoReloc = true; 3550b57cec5SDimitry Andric 3560b57cec5SDimitry Andric // There may exist symbols named .refptr.<name> which only consist 3570b57cec5SDimitry Andric // of a single pointer to <name>. If it turns out <name> is 3580b57cec5SDimitry Andric // automatically imported, we don't need to keep the .refptr.<name> 3590b57cec5SDimitry Andric // pointer at all, but redirect all accesses to it to the IAT entry 3600b57cec5SDimitry Andric // for __imp_<name> instead, and drop the whole .refptr.<name> chunk. 3610b57cec5SDimitry Andric DefinedRegular *refptr = 3620b57cec5SDimitry Andric dyn_cast_or_null<DefinedRegular>(find((".refptr." + name).str())); 3630b57cec5SDimitry Andric if (refptr && refptr->getChunk()->getSize() == config->wordsize) { 3640b57cec5SDimitry Andric SectionChunk *sc = dyn_cast_or_null<SectionChunk>(refptr->getChunk()); 3650b57cec5SDimitry Andric if (sc && sc->getRelocs().size() == 1 && *sc->symbols().begin() == sym) { 3660b57cec5SDimitry Andric log("Replacing .refptr." + name + " with " + imp->getName()); 3670b57cec5SDimitry Andric refptr->getChunk()->live = false; 3680b57cec5SDimitry Andric refptr->replaceKeepingName(imp, impSize); 3690b57cec5SDimitry Andric } 3700b57cec5SDimitry Andric } 3710b57cec5SDimitry Andric return true; 3720b57cec5SDimitry Andric } 3730b57cec5SDimitry Andric 37485868e8aSDimitry Andric /// Helper function for reportUnresolvable and resolveRemainingUndefines. 37585868e8aSDimitry Andric /// This function emits an "undefined symbol" diagnostic for each symbol in 37685868e8aSDimitry Andric /// undefs. If localImports is not nullptr, it also emits a "locally 37785868e8aSDimitry Andric /// defined symbol imported" diagnostic for symbols in localImports. 37885868e8aSDimitry Andric /// objFiles and bitcodeFiles (if not nullptr) are used to report where 37985868e8aSDimitry Andric /// undefined symbols are referenced. 380349cc55cSDimitry Andric static void reportProblemSymbols( 381349cc55cSDimitry Andric const COFFLinkerContext &ctx, const SmallPtrSetImpl<Symbol *> &undefs, 382349cc55cSDimitry Andric const DenseMap<Symbol *, Symbol *> *localImports, bool needBitcodeFiles) { 38385868e8aSDimitry Andric // Return early if there is nothing to report (which should be 38485868e8aSDimitry Andric // the common case). 38585868e8aSDimitry Andric if (undefs.empty() && (!localImports || localImports->empty())) 38685868e8aSDimitry Andric return; 38785868e8aSDimitry Andric 38885868e8aSDimitry Andric for (Symbol *b : config->gcroot) { 38985868e8aSDimitry Andric if (undefs.count(b)) 39085868e8aSDimitry Andric errorOrWarn("<root>: undefined symbol: " + toString(*b)); 39185868e8aSDimitry Andric if (localImports) 39285868e8aSDimitry Andric if (Symbol *imp = localImports->lookup(b)) 39385868e8aSDimitry Andric warn("<root>: locally defined symbol imported: " + toString(*imp) + 39485868e8aSDimitry Andric " (defined in " + toString(imp->getFile()) + ") [LNK4217]"); 39585868e8aSDimitry Andric } 39685868e8aSDimitry Andric 39785868e8aSDimitry Andric std::vector<UndefinedDiag> undefDiags; 39885868e8aSDimitry Andric DenseMap<Symbol *, int> firstDiag; 39985868e8aSDimitry Andric 40085868e8aSDimitry Andric auto processFile = [&](InputFile *file, ArrayRef<Symbol *> symbols) { 40185868e8aSDimitry Andric uint32_t symIndex = (uint32_t)-1; 40285868e8aSDimitry Andric for (Symbol *sym : symbols) { 40385868e8aSDimitry Andric ++symIndex; 40485868e8aSDimitry Andric if (!sym) 40585868e8aSDimitry Andric continue; 40685868e8aSDimitry Andric if (undefs.count(sym)) { 40785868e8aSDimitry Andric auto it = firstDiag.find(sym); 40885868e8aSDimitry Andric if (it == firstDiag.end()) { 40985868e8aSDimitry Andric firstDiag[sym] = undefDiags.size(); 41085868e8aSDimitry Andric undefDiags.push_back({sym, {{file, symIndex}}}); 41185868e8aSDimitry Andric } else { 41285868e8aSDimitry Andric undefDiags[it->second].files.push_back({file, symIndex}); 41385868e8aSDimitry Andric } 41485868e8aSDimitry Andric } 41585868e8aSDimitry Andric if (localImports) 41685868e8aSDimitry Andric if (Symbol *imp = localImports->lookup(sym)) 41785868e8aSDimitry Andric warn(toString(file) + 41885868e8aSDimitry Andric ": locally defined symbol imported: " + toString(*imp) + 41985868e8aSDimitry Andric " (defined in " + toString(imp->getFile()) + ") [LNK4217]"); 42085868e8aSDimitry Andric } 42185868e8aSDimitry Andric }; 42285868e8aSDimitry Andric 423349cc55cSDimitry Andric for (ObjFile *file : ctx.objFileInstances) 42485868e8aSDimitry Andric processFile(file, file->getSymbols()); 42585868e8aSDimitry Andric 426349cc55cSDimitry Andric if (needBitcodeFiles) 427349cc55cSDimitry Andric for (BitcodeFile *file : ctx.bitcodeFileInstances) 42885868e8aSDimitry Andric processFile(file, file->getSymbols()); 42985868e8aSDimitry Andric 43085868e8aSDimitry Andric for (const UndefinedDiag &undefDiag : undefDiags) 43185868e8aSDimitry Andric reportUndefinedSymbol(undefDiag); 43285868e8aSDimitry Andric } 43385868e8aSDimitry Andric 43485868e8aSDimitry Andric void SymbolTable::reportUnresolvable() { 43585868e8aSDimitry Andric SmallPtrSet<Symbol *, 8> undefs; 43685868e8aSDimitry Andric for (auto &i : symMap) { 43785868e8aSDimitry Andric Symbol *sym = i.second; 43885868e8aSDimitry Andric auto *undef = dyn_cast<Undefined>(sym); 439e8d8bef9SDimitry Andric if (!undef || sym->deferUndefined) 44085868e8aSDimitry Andric continue; 44185868e8aSDimitry Andric if (undef->getWeakAlias()) 44285868e8aSDimitry Andric continue; 44385868e8aSDimitry Andric StringRef name = undef->getName(); 44485868e8aSDimitry Andric if (name.startswith("__imp_")) { 44585868e8aSDimitry Andric Symbol *imp = find(name.substr(strlen("__imp_"))); 44685868e8aSDimitry Andric if (imp && isa<Defined>(imp)) 44785868e8aSDimitry Andric continue; 44885868e8aSDimitry Andric } 44985868e8aSDimitry Andric if (name.contains("_PchSym_")) 45085868e8aSDimitry Andric continue; 451e8d8bef9SDimitry Andric if (config->autoImport && impSymbol(name)) 45285868e8aSDimitry Andric continue; 45385868e8aSDimitry Andric undefs.insert(sym); 45485868e8aSDimitry Andric } 45585868e8aSDimitry Andric 456349cc55cSDimitry Andric reportProblemSymbols(ctx, undefs, 457349cc55cSDimitry Andric /* localImports */ nullptr, true); 45885868e8aSDimitry Andric } 45985868e8aSDimitry Andric 46085868e8aSDimitry Andric void SymbolTable::resolveRemainingUndefines() { 4610b57cec5SDimitry Andric SmallPtrSet<Symbol *, 8> undefs; 4620b57cec5SDimitry Andric DenseMap<Symbol *, Symbol *> localImports; 4630b57cec5SDimitry Andric 4640b57cec5SDimitry Andric for (auto &i : symMap) { 4650b57cec5SDimitry Andric Symbol *sym = i.second; 4660b57cec5SDimitry Andric auto *undef = dyn_cast<Undefined>(sym); 4670b57cec5SDimitry Andric if (!undef) 4680b57cec5SDimitry Andric continue; 4690b57cec5SDimitry Andric if (!sym->isUsedInRegularObj) 4700b57cec5SDimitry Andric continue; 4710b57cec5SDimitry Andric 4720b57cec5SDimitry Andric StringRef name = undef->getName(); 4730b57cec5SDimitry Andric 4740b57cec5SDimitry Andric // A weak alias may have been resolved, so check for that. 4750b57cec5SDimitry Andric if (Defined *d = undef->getWeakAlias()) { 4760b57cec5SDimitry Andric // We want to replace Sym with D. However, we can't just blindly 4770b57cec5SDimitry Andric // copy sizeof(SymbolUnion) bytes from D to Sym because D may be an 4780b57cec5SDimitry Andric // internal symbol, and internal symbols are stored as "unparented" 4790b57cec5SDimitry Andric // Symbols. For that reason we need to check which type of symbol we 4800b57cec5SDimitry Andric // are dealing with and copy the correct number of bytes. 4810b57cec5SDimitry Andric if (isa<DefinedRegular>(d)) 4820b57cec5SDimitry Andric memcpy(sym, d, sizeof(DefinedRegular)); 4830b57cec5SDimitry Andric else if (isa<DefinedAbsolute>(d)) 4840b57cec5SDimitry Andric memcpy(sym, d, sizeof(DefinedAbsolute)); 4850b57cec5SDimitry Andric else 4860b57cec5SDimitry Andric memcpy(sym, d, sizeof(SymbolUnion)); 4870b57cec5SDimitry Andric continue; 4880b57cec5SDimitry Andric } 4890b57cec5SDimitry Andric 4900b57cec5SDimitry Andric // If we can resolve a symbol by removing __imp_ prefix, do that. 4910b57cec5SDimitry Andric // This odd rule is for compatibility with MSVC linker. 4920b57cec5SDimitry Andric if (name.startswith("__imp_")) { 4930b57cec5SDimitry Andric Symbol *imp = find(name.substr(strlen("__imp_"))); 4940b57cec5SDimitry Andric if (imp && isa<Defined>(imp)) { 4950b57cec5SDimitry Andric auto *d = cast<Defined>(imp); 4960b57cec5SDimitry Andric replaceSymbol<DefinedLocalImport>(sym, name, d); 4970b57cec5SDimitry Andric localImportChunks.push_back(cast<DefinedLocalImport>(sym)->getChunk()); 4980b57cec5SDimitry Andric localImports[sym] = d; 4990b57cec5SDimitry Andric continue; 5000b57cec5SDimitry Andric } 5010b57cec5SDimitry Andric } 5020b57cec5SDimitry Andric 5030b57cec5SDimitry Andric // We don't want to report missing Microsoft precompiled headers symbols. 5040b57cec5SDimitry Andric // A proper message will be emitted instead in PDBLinker::aquirePrecompObj 5050b57cec5SDimitry Andric if (name.contains("_PchSym_")) 5060b57cec5SDimitry Andric continue; 5070b57cec5SDimitry Andric 5085ffd83dbSDimitry Andric if (config->autoImport && handleMinGWAutomaticImport(sym, name)) 5090b57cec5SDimitry Andric continue; 5100b57cec5SDimitry Andric 5110b57cec5SDimitry Andric // Remaining undefined symbols are not fatal if /force is specified. 5120b57cec5SDimitry Andric // They are replaced with dummy defined symbols. 5130b57cec5SDimitry Andric if (config->forceUnresolved) 5140b57cec5SDimitry Andric replaceSymbol<DefinedAbsolute>(sym, name, 0); 5150b57cec5SDimitry Andric undefs.insert(sym); 5160b57cec5SDimitry Andric } 5170b57cec5SDimitry Andric 51885868e8aSDimitry Andric reportProblemSymbols( 519349cc55cSDimitry Andric ctx, undefs, config->warnLocallyDefinedImported ? &localImports : nullptr, 520349cc55cSDimitry Andric false); 5210b57cec5SDimitry Andric } 5220b57cec5SDimitry Andric 5230b57cec5SDimitry Andric std::pair<Symbol *, bool> SymbolTable::insert(StringRef name) { 5240b57cec5SDimitry Andric bool inserted = false; 5250b57cec5SDimitry Andric Symbol *&sym = symMap[CachedHashStringRef(name)]; 5260b57cec5SDimitry Andric if (!sym) { 5270b57cec5SDimitry Andric sym = reinterpret_cast<Symbol *>(make<SymbolUnion>()); 5280b57cec5SDimitry Andric sym->isUsedInRegularObj = false; 5290b57cec5SDimitry Andric sym->pendingArchiveLoad = false; 530e8d8bef9SDimitry Andric sym->canInline = true; 5310b57cec5SDimitry Andric inserted = true; 5320b57cec5SDimitry Andric } 5330b57cec5SDimitry Andric return {sym, inserted}; 5340b57cec5SDimitry Andric } 5350b57cec5SDimitry Andric 5360b57cec5SDimitry Andric std::pair<Symbol *, bool> SymbolTable::insert(StringRef name, InputFile *file) { 5370b57cec5SDimitry Andric std::pair<Symbol *, bool> result = insert(name); 5380b57cec5SDimitry Andric if (!file || !isa<BitcodeFile>(file)) 5390b57cec5SDimitry Andric result.first->isUsedInRegularObj = true; 5400b57cec5SDimitry Andric return result; 5410b57cec5SDimitry Andric } 5420b57cec5SDimitry Andric 5430b57cec5SDimitry Andric Symbol *SymbolTable::addUndefined(StringRef name, InputFile *f, 5440b57cec5SDimitry Andric bool isWeakAlias) { 5450b57cec5SDimitry Andric Symbol *s; 5460b57cec5SDimitry Andric bool wasInserted; 5470b57cec5SDimitry Andric std::tie(s, wasInserted) = insert(name, f); 54885868e8aSDimitry Andric if (wasInserted || (s->isLazy() && isWeakAlias)) { 5490b57cec5SDimitry Andric replaceSymbol<Undefined>(s, name); 5500b57cec5SDimitry Andric return s; 5510b57cec5SDimitry Andric } 55285868e8aSDimitry Andric if (s->isLazy()) 55385868e8aSDimitry Andric forceLazy(s); 5540b57cec5SDimitry Andric return s; 5550b57cec5SDimitry Andric } 5560b57cec5SDimitry Andric 55785868e8aSDimitry Andric void SymbolTable::addLazyArchive(ArchiveFile *f, const Archive::Symbol &sym) { 5580b57cec5SDimitry Andric StringRef name = sym.getName(); 5590b57cec5SDimitry Andric Symbol *s; 5600b57cec5SDimitry Andric bool wasInserted; 5610b57cec5SDimitry Andric std::tie(s, wasInserted) = insert(name); 5620b57cec5SDimitry Andric if (wasInserted) { 56385868e8aSDimitry Andric replaceSymbol<LazyArchive>(s, f, sym); 5640b57cec5SDimitry Andric return; 5650b57cec5SDimitry Andric } 5660b57cec5SDimitry Andric auto *u = dyn_cast<Undefined>(s); 5670b57cec5SDimitry Andric if (!u || u->weakAlias || s->pendingArchiveLoad) 5680b57cec5SDimitry Andric return; 5690b57cec5SDimitry Andric s->pendingArchiveLoad = true; 5700b57cec5SDimitry Andric f->addMember(sym); 5710b57cec5SDimitry Andric } 5720b57cec5SDimitry Andric 573*04eeddc0SDimitry Andric void SymbolTable::addLazyObject(InputFile *f, StringRef n) { 574*04eeddc0SDimitry Andric assert(f->lazy); 57585868e8aSDimitry Andric Symbol *s; 57685868e8aSDimitry Andric bool wasInserted; 57785868e8aSDimitry Andric std::tie(s, wasInserted) = insert(n, f); 57885868e8aSDimitry Andric if (wasInserted) { 57985868e8aSDimitry Andric replaceSymbol<LazyObject>(s, f, n); 58085868e8aSDimitry Andric return; 58185868e8aSDimitry Andric } 58285868e8aSDimitry Andric auto *u = dyn_cast<Undefined>(s); 58385868e8aSDimitry Andric if (!u || u->weakAlias || s->pendingArchiveLoad) 58485868e8aSDimitry Andric return; 58585868e8aSDimitry Andric s->pendingArchiveLoad = true; 586*04eeddc0SDimitry Andric f->lazy = false; 587*04eeddc0SDimitry Andric addFile(f); 58885868e8aSDimitry Andric } 58985868e8aSDimitry Andric 590fe6060f1SDimitry Andric void SymbolTable::addLazyDLLSymbol(DLLFile *f, DLLFile::Symbol *sym, 591fe6060f1SDimitry Andric StringRef n) { 592fe6060f1SDimitry Andric Symbol *s; 593fe6060f1SDimitry Andric bool wasInserted; 594fe6060f1SDimitry Andric std::tie(s, wasInserted) = insert(n); 595fe6060f1SDimitry Andric if (wasInserted) { 596fe6060f1SDimitry Andric replaceSymbol<LazyDLLSymbol>(s, f, sym, n); 597fe6060f1SDimitry Andric return; 598fe6060f1SDimitry Andric } 599fe6060f1SDimitry Andric auto *u = dyn_cast<Undefined>(s); 600fe6060f1SDimitry Andric if (!u || u->weakAlias || s->pendingArchiveLoad) 601fe6060f1SDimitry Andric return; 602fe6060f1SDimitry Andric s->pendingArchiveLoad = true; 603fe6060f1SDimitry Andric f->makeImport(sym); 604fe6060f1SDimitry Andric } 605fe6060f1SDimitry Andric 60685868e8aSDimitry Andric static std::string getSourceLocationBitcode(BitcodeFile *file) { 60785868e8aSDimitry Andric std::string res("\n>>> defined at "); 60885868e8aSDimitry Andric StringRef source = file->obj->getSourceFileName(); 60985868e8aSDimitry Andric if (!source.empty()) 61085868e8aSDimitry Andric res += source.str() + "\n>>> "; 61185868e8aSDimitry Andric res += toString(file); 61285868e8aSDimitry Andric return res; 61385868e8aSDimitry Andric } 61485868e8aSDimitry Andric 61585868e8aSDimitry Andric static std::string getSourceLocationObj(ObjFile *file, SectionChunk *sc, 61685868e8aSDimitry Andric uint32_t offset, StringRef name) { 61785868e8aSDimitry Andric Optional<std::pair<StringRef, uint32_t>> fileLine; 61885868e8aSDimitry Andric if (sc) 61985868e8aSDimitry Andric fileLine = getFileLine(sc, offset); 62085868e8aSDimitry Andric if (!fileLine) 62185868e8aSDimitry Andric fileLine = file->getVariableLocation(name); 62285868e8aSDimitry Andric 62385868e8aSDimitry Andric std::string res; 62485868e8aSDimitry Andric llvm::raw_string_ostream os(res); 62585868e8aSDimitry Andric os << "\n>>> defined at "; 62685868e8aSDimitry Andric if (fileLine) 62785868e8aSDimitry Andric os << fileLine->first << ":" << fileLine->second << "\n>>> "; 62885868e8aSDimitry Andric os << toString(file); 62985868e8aSDimitry Andric return os.str(); 63085868e8aSDimitry Andric } 63185868e8aSDimitry Andric 63285868e8aSDimitry Andric static std::string getSourceLocation(InputFile *file, SectionChunk *sc, 63385868e8aSDimitry Andric uint32_t offset, StringRef name) { 634480093f4SDimitry Andric if (!file) 635480093f4SDimitry Andric return ""; 63685868e8aSDimitry Andric if (auto *o = dyn_cast<ObjFile>(file)) 63785868e8aSDimitry Andric return getSourceLocationObj(o, sc, offset, name); 63885868e8aSDimitry Andric if (auto *b = dyn_cast<BitcodeFile>(file)) 63985868e8aSDimitry Andric return getSourceLocationBitcode(b); 64085868e8aSDimitry Andric return "\n>>> defined at " + toString(file); 64185868e8aSDimitry Andric } 64285868e8aSDimitry Andric 64385868e8aSDimitry Andric // Construct and print an error message in the form of: 64485868e8aSDimitry Andric // 64585868e8aSDimitry Andric // lld-link: error: duplicate symbol: foo 64685868e8aSDimitry Andric // >>> defined at bar.c:30 64785868e8aSDimitry Andric // >>> bar.o 64885868e8aSDimitry Andric // >>> defined at baz.c:563 64985868e8aSDimitry Andric // >>> baz.o 65085868e8aSDimitry Andric void SymbolTable::reportDuplicate(Symbol *existing, InputFile *newFile, 65185868e8aSDimitry Andric SectionChunk *newSc, 65285868e8aSDimitry Andric uint32_t newSectionOffset) { 65385868e8aSDimitry Andric std::string msg; 65485868e8aSDimitry Andric llvm::raw_string_ostream os(msg); 65585868e8aSDimitry Andric os << "duplicate symbol: " << toString(*existing); 65685868e8aSDimitry Andric 657480093f4SDimitry Andric DefinedRegular *d = dyn_cast<DefinedRegular>(existing); 65885868e8aSDimitry Andric if (d && isa<ObjFile>(d->getFile())) { 65985868e8aSDimitry Andric os << getSourceLocation(d->getFile(), d->getChunk(), d->getValue(), 66085868e8aSDimitry Andric existing->getName()); 66185868e8aSDimitry Andric } else { 66285868e8aSDimitry Andric os << getSourceLocation(existing->getFile(), nullptr, 0, ""); 66385868e8aSDimitry Andric } 66485868e8aSDimitry Andric os << getSourceLocation(newFile, newSc, newSectionOffset, 66585868e8aSDimitry Andric existing->getName()); 6660b57cec5SDimitry Andric 6670b57cec5SDimitry Andric if (config->forceMultiple) 66885868e8aSDimitry Andric warn(os.str()); 6690b57cec5SDimitry Andric else 67085868e8aSDimitry Andric error(os.str()); 6710b57cec5SDimitry Andric } 6720b57cec5SDimitry Andric 6730b57cec5SDimitry Andric Symbol *SymbolTable::addAbsolute(StringRef n, COFFSymbolRef sym) { 6740b57cec5SDimitry Andric Symbol *s; 6750b57cec5SDimitry Andric bool wasInserted; 6760b57cec5SDimitry Andric std::tie(s, wasInserted) = insert(n, nullptr); 6770b57cec5SDimitry Andric s->isUsedInRegularObj = true; 67885868e8aSDimitry Andric if (wasInserted || isa<Undefined>(s) || s->isLazy()) 6790b57cec5SDimitry Andric replaceSymbol<DefinedAbsolute>(s, n, sym); 680480093f4SDimitry Andric else if (auto *da = dyn_cast<DefinedAbsolute>(s)) { 681480093f4SDimitry Andric if (da->getVA() != sym.getValue()) 682480093f4SDimitry Andric reportDuplicate(s, nullptr); 683480093f4SDimitry Andric } else if (!isa<DefinedCOFF>(s)) 6840b57cec5SDimitry Andric reportDuplicate(s, nullptr); 6850b57cec5SDimitry Andric return s; 6860b57cec5SDimitry Andric } 6870b57cec5SDimitry Andric 6880b57cec5SDimitry Andric Symbol *SymbolTable::addAbsolute(StringRef n, uint64_t va) { 6890b57cec5SDimitry Andric Symbol *s; 6900b57cec5SDimitry Andric bool wasInserted; 6910b57cec5SDimitry Andric std::tie(s, wasInserted) = insert(n, nullptr); 6920b57cec5SDimitry Andric s->isUsedInRegularObj = true; 69385868e8aSDimitry Andric if (wasInserted || isa<Undefined>(s) || s->isLazy()) 6940b57cec5SDimitry Andric replaceSymbol<DefinedAbsolute>(s, n, va); 695480093f4SDimitry Andric else if (auto *da = dyn_cast<DefinedAbsolute>(s)) { 696480093f4SDimitry Andric if (da->getVA() != va) 697480093f4SDimitry Andric reportDuplicate(s, nullptr); 698480093f4SDimitry Andric } else if (!isa<DefinedCOFF>(s)) 6990b57cec5SDimitry Andric reportDuplicate(s, nullptr); 7000b57cec5SDimitry Andric return s; 7010b57cec5SDimitry Andric } 7020b57cec5SDimitry Andric 7030b57cec5SDimitry Andric Symbol *SymbolTable::addSynthetic(StringRef n, Chunk *c) { 7040b57cec5SDimitry Andric Symbol *s; 7050b57cec5SDimitry Andric bool wasInserted; 7060b57cec5SDimitry Andric std::tie(s, wasInserted) = insert(n, nullptr); 7070b57cec5SDimitry Andric s->isUsedInRegularObj = true; 70885868e8aSDimitry Andric if (wasInserted || isa<Undefined>(s) || s->isLazy()) 7090b57cec5SDimitry Andric replaceSymbol<DefinedSynthetic>(s, n, c); 7100b57cec5SDimitry Andric else if (!isa<DefinedCOFF>(s)) 7110b57cec5SDimitry Andric reportDuplicate(s, nullptr); 7120b57cec5SDimitry Andric return s; 7130b57cec5SDimitry Andric } 7140b57cec5SDimitry Andric 7150b57cec5SDimitry Andric Symbol *SymbolTable::addRegular(InputFile *f, StringRef n, 71685868e8aSDimitry Andric const coff_symbol_generic *sym, SectionChunk *c, 71785868e8aSDimitry Andric uint32_t sectionOffset) { 7180b57cec5SDimitry Andric Symbol *s; 7190b57cec5SDimitry Andric bool wasInserted; 7200b57cec5SDimitry Andric std::tie(s, wasInserted) = insert(n, f); 7210b57cec5SDimitry Andric if (wasInserted || !isa<DefinedRegular>(s)) 7220b57cec5SDimitry Andric replaceSymbol<DefinedRegular>(s, f, n, /*IsCOMDAT*/ false, 7230b57cec5SDimitry Andric /*IsExternal*/ true, sym, c); 7240b57cec5SDimitry Andric else 72585868e8aSDimitry Andric reportDuplicate(s, f, c, sectionOffset); 7260b57cec5SDimitry Andric return s; 7270b57cec5SDimitry Andric } 7280b57cec5SDimitry Andric 7290b57cec5SDimitry Andric std::pair<DefinedRegular *, bool> 7300b57cec5SDimitry Andric SymbolTable::addComdat(InputFile *f, StringRef n, 7310b57cec5SDimitry Andric const coff_symbol_generic *sym) { 7320b57cec5SDimitry Andric Symbol *s; 7330b57cec5SDimitry Andric bool wasInserted; 7340b57cec5SDimitry Andric std::tie(s, wasInserted) = insert(n, f); 7350b57cec5SDimitry Andric if (wasInserted || !isa<DefinedRegular>(s)) { 7360b57cec5SDimitry Andric replaceSymbol<DefinedRegular>(s, f, n, /*IsCOMDAT*/ true, 7370b57cec5SDimitry Andric /*IsExternal*/ true, sym, nullptr); 7380b57cec5SDimitry Andric return {cast<DefinedRegular>(s), true}; 7390b57cec5SDimitry Andric } 7400b57cec5SDimitry Andric auto *existingSymbol = cast<DefinedRegular>(s); 7410b57cec5SDimitry Andric if (!existingSymbol->isCOMDAT) 7420b57cec5SDimitry Andric reportDuplicate(s, f); 7430b57cec5SDimitry Andric return {existingSymbol, false}; 7440b57cec5SDimitry Andric } 7450b57cec5SDimitry Andric 7460b57cec5SDimitry Andric Symbol *SymbolTable::addCommon(InputFile *f, StringRef n, uint64_t size, 7470b57cec5SDimitry Andric const coff_symbol_generic *sym, CommonChunk *c) { 7480b57cec5SDimitry Andric Symbol *s; 7490b57cec5SDimitry Andric bool wasInserted; 7500b57cec5SDimitry Andric std::tie(s, wasInserted) = insert(n, f); 7510b57cec5SDimitry Andric if (wasInserted || !isa<DefinedCOFF>(s)) 7520b57cec5SDimitry Andric replaceSymbol<DefinedCommon>(s, f, n, size, sym, c); 7530b57cec5SDimitry Andric else if (auto *dc = dyn_cast<DefinedCommon>(s)) 7540b57cec5SDimitry Andric if (size > dc->getSize()) 7550b57cec5SDimitry Andric replaceSymbol<DefinedCommon>(s, f, n, size, sym, c); 7560b57cec5SDimitry Andric return s; 7570b57cec5SDimitry Andric } 7580b57cec5SDimitry Andric 7590b57cec5SDimitry Andric Symbol *SymbolTable::addImportData(StringRef n, ImportFile *f) { 7600b57cec5SDimitry Andric Symbol *s; 7610b57cec5SDimitry Andric bool wasInserted; 7620b57cec5SDimitry Andric std::tie(s, wasInserted) = insert(n, nullptr); 7630b57cec5SDimitry Andric s->isUsedInRegularObj = true; 76485868e8aSDimitry Andric if (wasInserted || isa<Undefined>(s) || s->isLazy()) { 7650b57cec5SDimitry Andric replaceSymbol<DefinedImportData>(s, n, f); 7660b57cec5SDimitry Andric return s; 7670b57cec5SDimitry Andric } 7680b57cec5SDimitry Andric 7690b57cec5SDimitry Andric reportDuplicate(s, f); 7700b57cec5SDimitry Andric return nullptr; 7710b57cec5SDimitry Andric } 7720b57cec5SDimitry Andric 7730b57cec5SDimitry Andric Symbol *SymbolTable::addImportThunk(StringRef name, DefinedImportData *id, 7740b57cec5SDimitry Andric uint16_t machine) { 7750b57cec5SDimitry Andric Symbol *s; 7760b57cec5SDimitry Andric bool wasInserted; 7770b57cec5SDimitry Andric std::tie(s, wasInserted) = insert(name, nullptr); 7780b57cec5SDimitry Andric s->isUsedInRegularObj = true; 77985868e8aSDimitry Andric if (wasInserted || isa<Undefined>(s) || s->isLazy()) { 7800b57cec5SDimitry Andric replaceSymbol<DefinedImportThunk>(s, name, id, machine); 7810b57cec5SDimitry Andric return s; 7820b57cec5SDimitry Andric } 7830b57cec5SDimitry Andric 7840b57cec5SDimitry Andric reportDuplicate(s, id->file); 7850b57cec5SDimitry Andric return nullptr; 7860b57cec5SDimitry Andric } 7870b57cec5SDimitry Andric 7880b57cec5SDimitry Andric void SymbolTable::addLibcall(StringRef name) { 7890b57cec5SDimitry Andric Symbol *sym = findUnderscore(name); 7900b57cec5SDimitry Andric if (!sym) 7910b57cec5SDimitry Andric return; 7920b57cec5SDimitry Andric 79385868e8aSDimitry Andric if (auto *l = dyn_cast<LazyArchive>(sym)) { 7940b57cec5SDimitry Andric MemoryBufferRef mb = l->getMemberBuffer(); 79585868e8aSDimitry Andric if (isBitcode(mb)) 79685868e8aSDimitry Andric addUndefined(sym->getName()); 79785868e8aSDimitry Andric } else if (LazyObject *o = dyn_cast<LazyObject>(sym)) { 79885868e8aSDimitry Andric if (isBitcode(o->file->mb)) 7990b57cec5SDimitry Andric addUndefined(sym->getName()); 8000b57cec5SDimitry Andric } 8010b57cec5SDimitry Andric } 8020b57cec5SDimitry Andric 803349cc55cSDimitry Andric std::vector<Chunk *> SymbolTable::getChunks() const { 8040b57cec5SDimitry Andric std::vector<Chunk *> res; 805349cc55cSDimitry Andric for (ObjFile *file : ctx.objFileInstances) { 8060b57cec5SDimitry Andric ArrayRef<Chunk *> v = file->getChunks(); 8070b57cec5SDimitry Andric res.insert(res.end(), v.begin(), v.end()); 8080b57cec5SDimitry Andric } 8090b57cec5SDimitry Andric return res; 8100b57cec5SDimitry Andric } 8110b57cec5SDimitry Andric 812349cc55cSDimitry Andric Symbol *SymbolTable::find(StringRef name) const { 8130b57cec5SDimitry Andric return symMap.lookup(CachedHashStringRef(name)); 8140b57cec5SDimitry Andric } 8150b57cec5SDimitry Andric 816349cc55cSDimitry Andric Symbol *SymbolTable::findUnderscore(StringRef name) const { 8170b57cec5SDimitry Andric if (config->machine == I386) 8180b57cec5SDimitry Andric return find(("_" + name).str()); 8190b57cec5SDimitry Andric return find(name); 8200b57cec5SDimitry Andric } 8210b57cec5SDimitry Andric 8220b57cec5SDimitry Andric // Return all symbols that start with Prefix, possibly ignoring the first 8230b57cec5SDimitry Andric // character of Prefix or the first character symbol. 8240b57cec5SDimitry Andric std::vector<Symbol *> SymbolTable::getSymsWithPrefix(StringRef prefix) { 8250b57cec5SDimitry Andric std::vector<Symbol *> syms; 8260b57cec5SDimitry Andric for (auto pair : symMap) { 8270b57cec5SDimitry Andric StringRef name = pair.first.val(); 8280b57cec5SDimitry Andric if (name.startswith(prefix) || name.startswith(prefix.drop_front()) || 8290b57cec5SDimitry Andric name.drop_front().startswith(prefix) || 8300b57cec5SDimitry Andric name.drop_front().startswith(prefix.drop_front())) { 8310b57cec5SDimitry Andric syms.push_back(pair.second); 8320b57cec5SDimitry Andric } 8330b57cec5SDimitry Andric } 8340b57cec5SDimitry Andric return syms; 8350b57cec5SDimitry Andric } 8360b57cec5SDimitry Andric 8370b57cec5SDimitry Andric Symbol *SymbolTable::findMangle(StringRef name) { 8380b57cec5SDimitry Andric if (Symbol *sym = find(name)) 8390b57cec5SDimitry Andric if (!isa<Undefined>(sym)) 8400b57cec5SDimitry Andric return sym; 8410b57cec5SDimitry Andric 8420b57cec5SDimitry Andric // Efficient fuzzy string lookup is impossible with a hash table, so iterate 8430b57cec5SDimitry Andric // the symbol table once and collect all possibly matching symbols into this 8440b57cec5SDimitry Andric // vector. Then compare each possibly matching symbol with each possible 8450b57cec5SDimitry Andric // mangling. 8460b57cec5SDimitry Andric std::vector<Symbol *> syms = getSymsWithPrefix(name); 8470b57cec5SDimitry Andric auto findByPrefix = [&syms](const Twine &t) -> Symbol * { 8480b57cec5SDimitry Andric std::string prefix = t.str(); 8490b57cec5SDimitry Andric for (auto *s : syms) 8500b57cec5SDimitry Andric if (s->getName().startswith(prefix)) 8510b57cec5SDimitry Andric return s; 8520b57cec5SDimitry Andric return nullptr; 8530b57cec5SDimitry Andric }; 8540b57cec5SDimitry Andric 8550b57cec5SDimitry Andric // For non-x86, just look for C++ functions. 8560b57cec5SDimitry Andric if (config->machine != I386) 8570b57cec5SDimitry Andric return findByPrefix("?" + name + "@@Y"); 8580b57cec5SDimitry Andric 8590b57cec5SDimitry Andric if (!name.startswith("_")) 8600b57cec5SDimitry Andric return nullptr; 8610b57cec5SDimitry Andric // Search for x86 stdcall function. 8620b57cec5SDimitry Andric if (Symbol *s = findByPrefix(name + "@")) 8630b57cec5SDimitry Andric return s; 8640b57cec5SDimitry Andric // Search for x86 fastcall function. 8650b57cec5SDimitry Andric if (Symbol *s = findByPrefix("@" + name.substr(1) + "@")) 8660b57cec5SDimitry Andric return s; 8670b57cec5SDimitry Andric // Search for x86 vectorcall function. 8680b57cec5SDimitry Andric if (Symbol *s = findByPrefix(name.substr(1) + "@@")) 8690b57cec5SDimitry Andric return s; 8700b57cec5SDimitry Andric // Search for x86 C++ non-member function. 8710b57cec5SDimitry Andric return findByPrefix("?" + name.substr(1) + "@@Y"); 8720b57cec5SDimitry Andric } 8730b57cec5SDimitry Andric 8740b57cec5SDimitry Andric Symbol *SymbolTable::addUndefined(StringRef name) { 8750b57cec5SDimitry Andric return addUndefined(name, nullptr, false); 8760b57cec5SDimitry Andric } 8770b57cec5SDimitry Andric 878349cc55cSDimitry Andric void SymbolTable::compileBitcodeFiles() { 879349cc55cSDimitry Andric if (ctx.bitcodeFileInstances.empty()) 8800b57cec5SDimitry Andric return; 8810b57cec5SDimitry Andric 882349cc55cSDimitry Andric ScopedTimer t(ctx.ltoTimer); 883349cc55cSDimitry Andric lto.reset(new BitcodeCompiler()); 884349cc55cSDimitry Andric for (BitcodeFile *f : ctx.bitcodeFileInstances) 8855ffd83dbSDimitry Andric lto->add(*f); 886349cc55cSDimitry Andric for (InputFile *newObj : lto->compile(ctx)) { 8875ffd83dbSDimitry Andric ObjFile *obj = cast<ObjFile>(newObj); 8880b57cec5SDimitry Andric obj->parse(); 889349cc55cSDimitry Andric ctx.objFileInstances.push_back(obj); 8900b57cec5SDimitry Andric } 8910b57cec5SDimitry Andric } 8920b57cec5SDimitry Andric 8930b57cec5SDimitry Andric } // namespace coff 8940b57cec5SDimitry Andric } // namespace lld 895