1 //===- SymbolTable.cpp ----------------------------------------------------===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 9 #include "SymbolTable.h" 10 #include "Config.h" 11 #include "Driver.h" 12 #include "LTO.h" 13 #include "PDB.h" 14 #include "Symbols.h" 15 #include "lld/Common/ErrorHandler.h" 16 #include "lld/Common/Memory.h" 17 #include "lld/Common/Timer.h" 18 #include "llvm/DebugInfo/Symbolize/Symbolize.h" 19 #include "llvm/IR/LLVMContext.h" 20 #include "llvm/LTO/LTO.h" 21 #include "llvm/Object/WindowsMachineFlag.h" 22 #include "llvm/Support/Debug.h" 23 #include "llvm/Support/raw_ostream.h" 24 #include <utility> 25 26 using namespace llvm; 27 28 namespace lld { 29 namespace coff { 30 31 static Timer ltoTimer("LTO", Timer::root()); 32 33 SymbolTable *symtab; 34 35 void SymbolTable::addFile(InputFile *file) { 36 log("Reading " + toString(file)); 37 file->parse(); 38 39 MachineTypes mt = file->getMachineType(); 40 if (config->machine == IMAGE_FILE_MACHINE_UNKNOWN) { 41 config->machine = mt; 42 } else if (mt != IMAGE_FILE_MACHINE_UNKNOWN && config->machine != mt) { 43 error(toString(file) + ": machine type " + machineToStr(mt) + 44 " conflicts with " + machineToStr(config->machine)); 45 return; 46 } 47 48 if (auto *f = dyn_cast<ObjFile>(file)) { 49 ObjFile::instances.push_back(f); 50 } else if (auto *f = dyn_cast<BitcodeFile>(file)) { 51 BitcodeFile::instances.push_back(f); 52 } else if (auto *f = dyn_cast<ImportFile>(file)) { 53 ImportFile::instances.push_back(f); 54 } 55 56 driver->parseDirectives(file); 57 } 58 59 static void errorOrWarn(const Twine &s) { 60 if (config->forceUnresolved) 61 warn(s); 62 else 63 error(s); 64 } 65 66 // Causes the file associated with a lazy symbol to be linked in. 67 static void forceLazy(Symbol *s) { 68 s->pendingArchiveLoad = true; 69 switch (s->kind()) { 70 case Symbol::Kind::LazyArchiveKind: { 71 auto *l = cast<LazyArchive>(s); 72 l->file->addMember(l->sym); 73 break; 74 } 75 case Symbol::Kind::LazyObjectKind: 76 cast<LazyObject>(s)->file->fetch(); 77 break; 78 default: 79 llvm_unreachable( 80 "symbol passed to forceLazy is not a LazyArchive or LazyObject"); 81 } 82 } 83 84 // Returns the symbol in SC whose value is <= Addr that is closest to Addr. 85 // This is generally the global variable or function whose definition contains 86 // Addr. 87 static Symbol *getSymbol(SectionChunk *sc, uint32_t addr) { 88 DefinedRegular *candidate = nullptr; 89 90 for (Symbol *s : sc->file->getSymbols()) { 91 auto *d = dyn_cast_or_null<DefinedRegular>(s); 92 if (!d || !d->data || d->file != sc->file || d->getChunk() != sc || 93 d->getValue() > addr || 94 (candidate && d->getValue() < candidate->getValue())) 95 continue; 96 97 candidate = d; 98 } 99 100 return candidate; 101 } 102 103 static std::vector<std::string> getSymbolLocations(BitcodeFile *file) { 104 std::string res("\n>>> referenced by "); 105 StringRef source = file->obj->getSourceFileName(); 106 if (!source.empty()) 107 res += source.str() + "\n>>> "; 108 res += toString(file); 109 return {res}; 110 } 111 112 static Optional<std::pair<StringRef, uint32_t>> 113 getFileLineDwarf(const SectionChunk *c, uint32_t addr) { 114 Optional<DILineInfo> optionalLineInfo = 115 c->file->getDILineInfo(addr, c->getSectionNumber() - 1); 116 if (!optionalLineInfo) 117 return None; 118 const DILineInfo &lineInfo = *optionalLineInfo; 119 if (lineInfo.FileName == DILineInfo::BadString) 120 return None; 121 return std::make_pair(saver.save(lineInfo.FileName), lineInfo.Line); 122 } 123 124 static Optional<std::pair<StringRef, uint32_t>> 125 getFileLine(const SectionChunk *c, uint32_t addr) { 126 // MinGW can optionally use codeview, even if the default is dwarf. 127 Optional<std::pair<StringRef, uint32_t>> fileLine = 128 getFileLineCodeView(c, addr); 129 // If codeview didn't yield any result, check dwarf in MinGW mode. 130 if (!fileLine && config->mingw) 131 fileLine = getFileLineDwarf(c, addr); 132 return fileLine; 133 } 134 135 // Given a file and the index of a symbol in that file, returns a description 136 // of all references to that symbol from that file. If no debug information is 137 // available, returns just the name of the file, else one string per actual 138 // reference as described in the debug info. 139 // Returns up to maxStrings string descriptions, along with the total number of 140 // locations found. 141 static std::pair<std::vector<std::string>, size_t> 142 getSymbolLocations(ObjFile *file, uint32_t symIndex, size_t maxStrings) { 143 struct Location { 144 Symbol *sym; 145 std::pair<StringRef, uint32_t> fileLine; 146 }; 147 std::vector<Location> locations; 148 size_t numLocations = 0; 149 150 for (Chunk *c : file->getChunks()) { 151 auto *sc = dyn_cast<SectionChunk>(c); 152 if (!sc) 153 continue; 154 for (const coff_relocation &r : sc->getRelocs()) { 155 if (r.SymbolTableIndex != symIndex) 156 continue; 157 numLocations++; 158 if (locations.size() >= maxStrings) 159 continue; 160 161 Optional<std::pair<StringRef, uint32_t>> fileLine = 162 getFileLine(sc, r.VirtualAddress); 163 Symbol *sym = getSymbol(sc, r.VirtualAddress); 164 if (fileLine) 165 locations.push_back({sym, *fileLine}); 166 else if (sym) 167 locations.push_back({sym, {"", 0}}); 168 } 169 } 170 171 if (maxStrings == 0) 172 return std::make_pair(std::vector<std::string>(), numLocations); 173 174 if (numLocations == 0) 175 return std::make_pair( 176 std::vector<std::string>{"\n>>> referenced by " + toString(file)}, 1); 177 178 std::vector<std::string> symbolLocations(locations.size()); 179 size_t i = 0; 180 for (Location loc : locations) { 181 llvm::raw_string_ostream os(symbolLocations[i++]); 182 os << "\n>>> referenced by "; 183 if (!loc.fileLine.first.empty()) 184 os << loc.fileLine.first << ":" << loc.fileLine.second 185 << "\n>>> "; 186 os << toString(file); 187 if (loc.sym) 188 os << ":(" << toString(*loc.sym) << ')'; 189 } 190 return std::make_pair(symbolLocations, numLocations); 191 } 192 193 std::vector<std::string> getSymbolLocations(ObjFile *file, uint32_t symIndex) { 194 return getSymbolLocations(file, symIndex, SIZE_MAX).first; 195 } 196 197 static std::pair<std::vector<std::string>, size_t> 198 getSymbolLocations(InputFile *file, uint32_t symIndex, size_t maxStrings) { 199 if (auto *o = dyn_cast<ObjFile>(file)) 200 return getSymbolLocations(o, symIndex, maxStrings); 201 if (auto *b = dyn_cast<BitcodeFile>(file)) { 202 std::vector<std::string> symbolLocations = getSymbolLocations(b); 203 size_t numLocations = symbolLocations.size(); 204 if (symbolLocations.size() > maxStrings) 205 symbolLocations.resize(maxStrings); 206 return std::make_pair(symbolLocations, numLocations); 207 } 208 llvm_unreachable("unsupported file type passed to getSymbolLocations"); 209 return std::make_pair(std::vector<std::string>(), (size_t)0); 210 } 211 212 // For an undefined symbol, stores all files referencing it and the index of 213 // the undefined symbol in each file. 214 struct UndefinedDiag { 215 Symbol *sym; 216 struct File { 217 InputFile *file; 218 uint32_t symIndex; 219 }; 220 std::vector<File> files; 221 }; 222 223 static void reportUndefinedSymbol(const UndefinedDiag &undefDiag) { 224 std::string out; 225 llvm::raw_string_ostream os(out); 226 os << "undefined symbol: " << toString(*undefDiag.sym); 227 228 const size_t maxUndefReferences = 3; 229 size_t numDisplayedRefs = 0, numRefs = 0; 230 for (const UndefinedDiag::File &ref : undefDiag.files) { 231 std::vector<std::string> symbolLocations; 232 size_t totalLocations = 0; 233 std::tie(symbolLocations, totalLocations) = getSymbolLocations( 234 ref.file, ref.symIndex, maxUndefReferences - numDisplayedRefs); 235 236 numRefs += totalLocations; 237 numDisplayedRefs += symbolLocations.size(); 238 for (const std::string &s : symbolLocations) { 239 os << s; 240 } 241 } 242 if (numDisplayedRefs < numRefs) 243 os << "\n>>> referenced " << numRefs - numDisplayedRefs << " more times"; 244 errorOrWarn(os.str()); 245 } 246 247 void SymbolTable::loadMinGWAutomaticImports() { 248 for (auto &i : symMap) { 249 Symbol *sym = i.second; 250 auto *undef = dyn_cast<Undefined>(sym); 251 if (!undef) 252 continue; 253 if (undef->getWeakAlias()) 254 continue; 255 256 StringRef name = undef->getName(); 257 258 if (name.startswith("__imp_")) 259 continue; 260 // If we have an undefined symbol, but we have a lazy symbol we could 261 // load, load it. 262 Symbol *l = find(("__imp_" + name).str()); 263 if (!l || l->pendingArchiveLoad || !l->isLazy()) 264 continue; 265 266 log("Loading lazy " + l->getName() + " from " + l->getFile()->getName() + 267 " for automatic import"); 268 forceLazy(l); 269 } 270 } 271 272 Defined *SymbolTable::impSymbol(StringRef name) { 273 if (name.startswith("__imp_")) 274 return nullptr; 275 return dyn_cast_or_null<Defined>(find(("__imp_" + name).str())); 276 } 277 278 bool SymbolTable::handleMinGWAutomaticImport(Symbol *sym, StringRef name) { 279 Defined *imp = impSymbol(name); 280 if (!imp) 281 return false; 282 283 // Replace the reference directly to a variable with a reference 284 // to the import address table instead. This obviously isn't right, 285 // but we mark the symbol as isRuntimePseudoReloc, and a later pass 286 // will add runtime pseudo relocations for every relocation against 287 // this Symbol. The runtime pseudo relocation framework expects the 288 // reference itself to point at the IAT entry. 289 size_t impSize = 0; 290 if (isa<DefinedImportData>(imp)) { 291 log("Automatically importing " + name + " from " + 292 cast<DefinedImportData>(imp)->getDLLName()); 293 impSize = sizeof(DefinedImportData); 294 } else if (isa<DefinedRegular>(imp)) { 295 log("Automatically importing " + name + " from " + 296 toString(cast<DefinedRegular>(imp)->file)); 297 impSize = sizeof(DefinedRegular); 298 } else { 299 warn("unable to automatically import " + name + " from " + imp->getName() + 300 " from " + toString(cast<DefinedRegular>(imp)->file) + 301 "; unexpected symbol type"); 302 return false; 303 } 304 sym->replaceKeepingName(imp, impSize); 305 sym->isRuntimePseudoReloc = true; 306 307 // There may exist symbols named .refptr.<name> which only consist 308 // of a single pointer to <name>. If it turns out <name> is 309 // automatically imported, we don't need to keep the .refptr.<name> 310 // pointer at all, but redirect all accesses to it to the IAT entry 311 // for __imp_<name> instead, and drop the whole .refptr.<name> chunk. 312 DefinedRegular *refptr = 313 dyn_cast_or_null<DefinedRegular>(find((".refptr." + name).str())); 314 if (refptr && refptr->getChunk()->getSize() == config->wordsize) { 315 SectionChunk *sc = dyn_cast_or_null<SectionChunk>(refptr->getChunk()); 316 if (sc && sc->getRelocs().size() == 1 && *sc->symbols().begin() == sym) { 317 log("Replacing .refptr." + name + " with " + imp->getName()); 318 refptr->getChunk()->live = false; 319 refptr->replaceKeepingName(imp, impSize); 320 } 321 } 322 return true; 323 } 324 325 /// Helper function for reportUnresolvable and resolveRemainingUndefines. 326 /// This function emits an "undefined symbol" diagnostic for each symbol in 327 /// undefs. If localImports is not nullptr, it also emits a "locally 328 /// defined symbol imported" diagnostic for symbols in localImports. 329 /// objFiles and bitcodeFiles (if not nullptr) are used to report where 330 /// undefined symbols are referenced. 331 static void 332 reportProblemSymbols(const SmallPtrSetImpl<Symbol *> &undefs, 333 const DenseMap<Symbol *, Symbol *> *localImports, 334 const std::vector<ObjFile *> objFiles, 335 const std::vector<BitcodeFile *> *bitcodeFiles) { 336 337 // Return early if there is nothing to report (which should be 338 // the common case). 339 if (undefs.empty() && (!localImports || localImports->empty())) 340 return; 341 342 for (Symbol *b : config->gcroot) { 343 if (undefs.count(b)) 344 errorOrWarn("<root>: undefined symbol: " + toString(*b)); 345 if (localImports) 346 if (Symbol *imp = localImports->lookup(b)) 347 warn("<root>: locally defined symbol imported: " + toString(*imp) + 348 " (defined in " + toString(imp->getFile()) + ") [LNK4217]"); 349 } 350 351 std::vector<UndefinedDiag> undefDiags; 352 DenseMap<Symbol *, int> firstDiag; 353 354 auto processFile = [&](InputFile *file, ArrayRef<Symbol *> symbols) { 355 uint32_t symIndex = (uint32_t)-1; 356 for (Symbol *sym : symbols) { 357 ++symIndex; 358 if (!sym) 359 continue; 360 if (undefs.count(sym)) { 361 auto it = firstDiag.find(sym); 362 if (it == firstDiag.end()) { 363 firstDiag[sym] = undefDiags.size(); 364 undefDiags.push_back({sym, {{file, symIndex}}}); 365 } else { 366 undefDiags[it->second].files.push_back({file, symIndex}); 367 } 368 } 369 if (localImports) 370 if (Symbol *imp = localImports->lookup(sym)) 371 warn(toString(file) + 372 ": locally defined symbol imported: " + toString(*imp) + 373 " (defined in " + toString(imp->getFile()) + ") [LNK4217]"); 374 } 375 }; 376 377 for (ObjFile *file : objFiles) 378 processFile(file, file->getSymbols()); 379 380 if (bitcodeFiles) 381 for (BitcodeFile *file : *bitcodeFiles) 382 processFile(file, file->getSymbols()); 383 384 for (const UndefinedDiag &undefDiag : undefDiags) 385 reportUndefinedSymbol(undefDiag); 386 } 387 388 void SymbolTable::reportUnresolvable() { 389 SmallPtrSet<Symbol *, 8> undefs; 390 for (auto &i : symMap) { 391 Symbol *sym = i.second; 392 auto *undef = dyn_cast<Undefined>(sym); 393 if (!undef || sym->deferUndefined) 394 continue; 395 if (undef->getWeakAlias()) 396 continue; 397 StringRef name = undef->getName(); 398 if (name.startswith("__imp_")) { 399 Symbol *imp = find(name.substr(strlen("__imp_"))); 400 if (imp && isa<Defined>(imp)) 401 continue; 402 } 403 if (name.contains("_PchSym_")) 404 continue; 405 if (config->autoImport && impSymbol(name)) 406 continue; 407 undefs.insert(sym); 408 } 409 410 reportProblemSymbols(undefs, 411 /* localImports */ nullptr, ObjFile::instances, 412 &BitcodeFile::instances); 413 } 414 415 void SymbolTable::resolveRemainingUndefines() { 416 SmallPtrSet<Symbol *, 8> undefs; 417 DenseMap<Symbol *, Symbol *> localImports; 418 419 for (auto &i : symMap) { 420 Symbol *sym = i.second; 421 auto *undef = dyn_cast<Undefined>(sym); 422 if (!undef) 423 continue; 424 if (!sym->isUsedInRegularObj) 425 continue; 426 427 StringRef name = undef->getName(); 428 429 // A weak alias may have been resolved, so check for that. 430 if (Defined *d = undef->getWeakAlias()) { 431 // We want to replace Sym with D. However, we can't just blindly 432 // copy sizeof(SymbolUnion) bytes from D to Sym because D may be an 433 // internal symbol, and internal symbols are stored as "unparented" 434 // Symbols. For that reason we need to check which type of symbol we 435 // are dealing with and copy the correct number of bytes. 436 if (isa<DefinedRegular>(d)) 437 memcpy(sym, d, sizeof(DefinedRegular)); 438 else if (isa<DefinedAbsolute>(d)) 439 memcpy(sym, d, sizeof(DefinedAbsolute)); 440 else 441 memcpy(sym, d, sizeof(SymbolUnion)); 442 continue; 443 } 444 445 // If we can resolve a symbol by removing __imp_ prefix, do that. 446 // This odd rule is for compatibility with MSVC linker. 447 if (name.startswith("__imp_")) { 448 Symbol *imp = find(name.substr(strlen("__imp_"))); 449 if (imp && isa<Defined>(imp)) { 450 auto *d = cast<Defined>(imp); 451 replaceSymbol<DefinedLocalImport>(sym, name, d); 452 localImportChunks.push_back(cast<DefinedLocalImport>(sym)->getChunk()); 453 localImports[sym] = d; 454 continue; 455 } 456 } 457 458 // We don't want to report missing Microsoft precompiled headers symbols. 459 // A proper message will be emitted instead in PDBLinker::aquirePrecompObj 460 if (name.contains("_PchSym_")) 461 continue; 462 463 if (config->autoImport && handleMinGWAutomaticImport(sym, name)) 464 continue; 465 466 // Remaining undefined symbols are not fatal if /force is specified. 467 // They are replaced with dummy defined symbols. 468 if (config->forceUnresolved) 469 replaceSymbol<DefinedAbsolute>(sym, name, 0); 470 undefs.insert(sym); 471 } 472 473 reportProblemSymbols( 474 undefs, config->warnLocallyDefinedImported ? &localImports : nullptr, 475 ObjFile::instances, /* bitcode files no longer needed */ nullptr); 476 } 477 478 std::pair<Symbol *, bool> SymbolTable::insert(StringRef name) { 479 bool inserted = false; 480 Symbol *&sym = symMap[CachedHashStringRef(name)]; 481 if (!sym) { 482 sym = reinterpret_cast<Symbol *>(make<SymbolUnion>()); 483 sym->isUsedInRegularObj = false; 484 sym->pendingArchiveLoad = false; 485 sym->canInline = true; 486 inserted = true; 487 } 488 return {sym, inserted}; 489 } 490 491 std::pair<Symbol *, bool> SymbolTable::insert(StringRef name, InputFile *file) { 492 std::pair<Symbol *, bool> result = insert(name); 493 if (!file || !isa<BitcodeFile>(file)) 494 result.first->isUsedInRegularObj = true; 495 return result; 496 } 497 498 Symbol *SymbolTable::addUndefined(StringRef name, InputFile *f, 499 bool isWeakAlias) { 500 Symbol *s; 501 bool wasInserted; 502 std::tie(s, wasInserted) = insert(name, f); 503 if (wasInserted || (s->isLazy() && isWeakAlias)) { 504 replaceSymbol<Undefined>(s, name); 505 return s; 506 } 507 if (s->isLazy()) 508 forceLazy(s); 509 return s; 510 } 511 512 void SymbolTable::addLazyArchive(ArchiveFile *f, const Archive::Symbol &sym) { 513 StringRef name = sym.getName(); 514 Symbol *s; 515 bool wasInserted; 516 std::tie(s, wasInserted) = insert(name); 517 if (wasInserted) { 518 replaceSymbol<LazyArchive>(s, f, sym); 519 return; 520 } 521 auto *u = dyn_cast<Undefined>(s); 522 if (!u || u->weakAlias || s->pendingArchiveLoad) 523 return; 524 s->pendingArchiveLoad = true; 525 f->addMember(sym); 526 } 527 528 void SymbolTable::addLazyObject(LazyObjFile *f, StringRef n) { 529 Symbol *s; 530 bool wasInserted; 531 std::tie(s, wasInserted) = insert(n, f); 532 if (wasInserted) { 533 replaceSymbol<LazyObject>(s, f, n); 534 return; 535 } 536 auto *u = dyn_cast<Undefined>(s); 537 if (!u || u->weakAlias || s->pendingArchiveLoad) 538 return; 539 s->pendingArchiveLoad = true; 540 f->fetch(); 541 } 542 543 static std::string getSourceLocationBitcode(BitcodeFile *file) { 544 std::string res("\n>>> defined at "); 545 StringRef source = file->obj->getSourceFileName(); 546 if (!source.empty()) 547 res += source.str() + "\n>>> "; 548 res += toString(file); 549 return res; 550 } 551 552 static std::string getSourceLocationObj(ObjFile *file, SectionChunk *sc, 553 uint32_t offset, StringRef name) { 554 Optional<std::pair<StringRef, uint32_t>> fileLine; 555 if (sc) 556 fileLine = getFileLine(sc, offset); 557 if (!fileLine) 558 fileLine = file->getVariableLocation(name); 559 560 std::string res; 561 llvm::raw_string_ostream os(res); 562 os << "\n>>> defined at "; 563 if (fileLine) 564 os << fileLine->first << ":" << fileLine->second << "\n>>> "; 565 os << toString(file); 566 return os.str(); 567 } 568 569 static std::string getSourceLocation(InputFile *file, SectionChunk *sc, 570 uint32_t offset, StringRef name) { 571 if (!file) 572 return ""; 573 if (auto *o = dyn_cast<ObjFile>(file)) 574 return getSourceLocationObj(o, sc, offset, name); 575 if (auto *b = dyn_cast<BitcodeFile>(file)) 576 return getSourceLocationBitcode(b); 577 return "\n>>> defined at " + toString(file); 578 } 579 580 // Construct and print an error message in the form of: 581 // 582 // lld-link: error: duplicate symbol: foo 583 // >>> defined at bar.c:30 584 // >>> bar.o 585 // >>> defined at baz.c:563 586 // >>> baz.o 587 void SymbolTable::reportDuplicate(Symbol *existing, InputFile *newFile, 588 SectionChunk *newSc, 589 uint32_t newSectionOffset) { 590 std::string msg; 591 llvm::raw_string_ostream os(msg); 592 os << "duplicate symbol: " << toString(*existing); 593 594 DefinedRegular *d = dyn_cast<DefinedRegular>(existing); 595 if (d && isa<ObjFile>(d->getFile())) { 596 os << getSourceLocation(d->getFile(), d->getChunk(), d->getValue(), 597 existing->getName()); 598 } else { 599 os << getSourceLocation(existing->getFile(), nullptr, 0, ""); 600 } 601 os << getSourceLocation(newFile, newSc, newSectionOffset, 602 existing->getName()); 603 604 if (config->forceMultiple) 605 warn(os.str()); 606 else 607 error(os.str()); 608 } 609 610 Symbol *SymbolTable::addAbsolute(StringRef n, COFFSymbolRef sym) { 611 Symbol *s; 612 bool wasInserted; 613 std::tie(s, wasInserted) = insert(n, nullptr); 614 s->isUsedInRegularObj = true; 615 if (wasInserted || isa<Undefined>(s) || s->isLazy()) 616 replaceSymbol<DefinedAbsolute>(s, n, sym); 617 else if (auto *da = dyn_cast<DefinedAbsolute>(s)) { 618 if (da->getVA() != sym.getValue()) 619 reportDuplicate(s, nullptr); 620 } else if (!isa<DefinedCOFF>(s)) 621 reportDuplicate(s, nullptr); 622 return s; 623 } 624 625 Symbol *SymbolTable::addAbsolute(StringRef n, uint64_t va) { 626 Symbol *s; 627 bool wasInserted; 628 std::tie(s, wasInserted) = insert(n, nullptr); 629 s->isUsedInRegularObj = true; 630 if (wasInserted || isa<Undefined>(s) || s->isLazy()) 631 replaceSymbol<DefinedAbsolute>(s, n, va); 632 else if (auto *da = dyn_cast<DefinedAbsolute>(s)) { 633 if (da->getVA() != va) 634 reportDuplicate(s, nullptr); 635 } else if (!isa<DefinedCOFF>(s)) 636 reportDuplicate(s, nullptr); 637 return s; 638 } 639 640 Symbol *SymbolTable::addSynthetic(StringRef n, Chunk *c) { 641 Symbol *s; 642 bool wasInserted; 643 std::tie(s, wasInserted) = insert(n, nullptr); 644 s->isUsedInRegularObj = true; 645 if (wasInserted || isa<Undefined>(s) || s->isLazy()) 646 replaceSymbol<DefinedSynthetic>(s, n, c); 647 else if (!isa<DefinedCOFF>(s)) 648 reportDuplicate(s, nullptr); 649 return s; 650 } 651 652 Symbol *SymbolTable::addRegular(InputFile *f, StringRef n, 653 const coff_symbol_generic *sym, SectionChunk *c, 654 uint32_t sectionOffset) { 655 Symbol *s; 656 bool wasInserted; 657 std::tie(s, wasInserted) = insert(n, f); 658 if (wasInserted || !isa<DefinedRegular>(s)) 659 replaceSymbol<DefinedRegular>(s, f, n, /*IsCOMDAT*/ false, 660 /*IsExternal*/ true, sym, c); 661 else 662 reportDuplicate(s, f, c, sectionOffset); 663 return s; 664 } 665 666 std::pair<DefinedRegular *, bool> 667 SymbolTable::addComdat(InputFile *f, StringRef n, 668 const coff_symbol_generic *sym) { 669 Symbol *s; 670 bool wasInserted; 671 std::tie(s, wasInserted) = insert(n, f); 672 if (wasInserted || !isa<DefinedRegular>(s)) { 673 replaceSymbol<DefinedRegular>(s, f, n, /*IsCOMDAT*/ true, 674 /*IsExternal*/ true, sym, nullptr); 675 return {cast<DefinedRegular>(s), true}; 676 } 677 auto *existingSymbol = cast<DefinedRegular>(s); 678 if (!existingSymbol->isCOMDAT) 679 reportDuplicate(s, f); 680 return {existingSymbol, false}; 681 } 682 683 Symbol *SymbolTable::addCommon(InputFile *f, StringRef n, uint64_t size, 684 const coff_symbol_generic *sym, CommonChunk *c) { 685 Symbol *s; 686 bool wasInserted; 687 std::tie(s, wasInserted) = insert(n, f); 688 if (wasInserted || !isa<DefinedCOFF>(s)) 689 replaceSymbol<DefinedCommon>(s, f, n, size, sym, c); 690 else if (auto *dc = dyn_cast<DefinedCommon>(s)) 691 if (size > dc->getSize()) 692 replaceSymbol<DefinedCommon>(s, f, n, size, sym, c); 693 return s; 694 } 695 696 Symbol *SymbolTable::addImportData(StringRef n, ImportFile *f) { 697 Symbol *s; 698 bool wasInserted; 699 std::tie(s, wasInserted) = insert(n, nullptr); 700 s->isUsedInRegularObj = true; 701 if (wasInserted || isa<Undefined>(s) || s->isLazy()) { 702 replaceSymbol<DefinedImportData>(s, n, f); 703 return s; 704 } 705 706 reportDuplicate(s, f); 707 return nullptr; 708 } 709 710 Symbol *SymbolTable::addImportThunk(StringRef name, DefinedImportData *id, 711 uint16_t machine) { 712 Symbol *s; 713 bool wasInserted; 714 std::tie(s, wasInserted) = insert(name, nullptr); 715 s->isUsedInRegularObj = true; 716 if (wasInserted || isa<Undefined>(s) || s->isLazy()) { 717 replaceSymbol<DefinedImportThunk>(s, name, id, machine); 718 return s; 719 } 720 721 reportDuplicate(s, id->file); 722 return nullptr; 723 } 724 725 void SymbolTable::addLibcall(StringRef name) { 726 Symbol *sym = findUnderscore(name); 727 if (!sym) 728 return; 729 730 if (auto *l = dyn_cast<LazyArchive>(sym)) { 731 MemoryBufferRef mb = l->getMemberBuffer(); 732 if (isBitcode(mb)) 733 addUndefined(sym->getName()); 734 } else if (LazyObject *o = dyn_cast<LazyObject>(sym)) { 735 if (isBitcode(o->file->mb)) 736 addUndefined(sym->getName()); 737 } 738 } 739 740 std::vector<Chunk *> SymbolTable::getChunks() { 741 std::vector<Chunk *> res; 742 for (ObjFile *file : ObjFile::instances) { 743 ArrayRef<Chunk *> v = file->getChunks(); 744 res.insert(res.end(), v.begin(), v.end()); 745 } 746 return res; 747 } 748 749 Symbol *SymbolTable::find(StringRef name) { 750 return symMap.lookup(CachedHashStringRef(name)); 751 } 752 753 Symbol *SymbolTable::findUnderscore(StringRef name) { 754 if (config->machine == I386) 755 return find(("_" + name).str()); 756 return find(name); 757 } 758 759 // Return all symbols that start with Prefix, possibly ignoring the first 760 // character of Prefix or the first character symbol. 761 std::vector<Symbol *> SymbolTable::getSymsWithPrefix(StringRef prefix) { 762 std::vector<Symbol *> syms; 763 for (auto pair : symMap) { 764 StringRef name = pair.first.val(); 765 if (name.startswith(prefix) || name.startswith(prefix.drop_front()) || 766 name.drop_front().startswith(prefix) || 767 name.drop_front().startswith(prefix.drop_front())) { 768 syms.push_back(pair.second); 769 } 770 } 771 return syms; 772 } 773 774 Symbol *SymbolTable::findMangle(StringRef name) { 775 if (Symbol *sym = find(name)) 776 if (!isa<Undefined>(sym)) 777 return sym; 778 779 // Efficient fuzzy string lookup is impossible with a hash table, so iterate 780 // the symbol table once and collect all possibly matching symbols into this 781 // vector. Then compare each possibly matching symbol with each possible 782 // mangling. 783 std::vector<Symbol *> syms = getSymsWithPrefix(name); 784 auto findByPrefix = [&syms](const Twine &t) -> Symbol * { 785 std::string prefix = t.str(); 786 for (auto *s : syms) 787 if (s->getName().startswith(prefix)) 788 return s; 789 return nullptr; 790 }; 791 792 // For non-x86, just look for C++ functions. 793 if (config->machine != I386) 794 return findByPrefix("?" + name + "@@Y"); 795 796 if (!name.startswith("_")) 797 return nullptr; 798 // Search for x86 stdcall function. 799 if (Symbol *s = findByPrefix(name + "@")) 800 return s; 801 // Search for x86 fastcall function. 802 if (Symbol *s = findByPrefix("@" + name.substr(1) + "@")) 803 return s; 804 // Search for x86 vectorcall function. 805 if (Symbol *s = findByPrefix(name.substr(1) + "@@")) 806 return s; 807 // Search for x86 C++ non-member function. 808 return findByPrefix("?" + name.substr(1) + "@@Y"); 809 } 810 811 Symbol *SymbolTable::addUndefined(StringRef name) { 812 return addUndefined(name, nullptr, false); 813 } 814 815 void SymbolTable::addCombinedLTOObjects() { 816 if (BitcodeFile::instances.empty()) 817 return; 818 819 ScopedTimer t(ltoTimer); 820 lto.reset(new BitcodeCompiler); 821 for (BitcodeFile *f : BitcodeFile::instances) 822 lto->add(*f); 823 for (InputFile *newObj : lto->compile()) { 824 ObjFile *obj = cast<ObjFile>(newObj); 825 obj->parse(); 826 ObjFile::instances.push_back(obj); 827 } 828 } 829 830 } // namespace coff 831 } // namespace lld 832