1 //===- FunctionImport.cpp - ThinLTO Summary-based Function Import ---------===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 // 9 // This file implements Function import based on summaries. 10 // 11 //===----------------------------------------------------------------------===// 12 13 #include "llvm/Transforms/IPO/FunctionImport.h" 14 #include "llvm/ADT/ArrayRef.h" 15 #include "llvm/ADT/STLExtras.h" 16 #include "llvm/ADT/SetVector.h" 17 #include "llvm/ADT/SmallVector.h" 18 #include "llvm/ADT/Statistic.h" 19 #include "llvm/ADT/StringMap.h" 20 #include "llvm/ADT/StringRef.h" 21 #include "llvm/ADT/StringSet.h" 22 #include "llvm/Bitcode/BitcodeReader.h" 23 #include "llvm/IR/AutoUpgrade.h" 24 #include "llvm/IR/Constants.h" 25 #include "llvm/IR/Function.h" 26 #include "llvm/IR/GlobalAlias.h" 27 #include "llvm/IR/GlobalObject.h" 28 #include "llvm/IR/GlobalValue.h" 29 #include "llvm/IR/GlobalVariable.h" 30 #include "llvm/IR/Metadata.h" 31 #include "llvm/IR/Module.h" 32 #include "llvm/IR/ModuleSummaryIndex.h" 33 #include "llvm/IRReader/IRReader.h" 34 #include "llvm/InitializePasses.h" 35 #include "llvm/Linker/IRMover.h" 36 #include "llvm/Object/ModuleSymbolTable.h" 37 #include "llvm/Object/SymbolicFile.h" 38 #include "llvm/Pass.h" 39 #include "llvm/Support/Casting.h" 40 #include "llvm/Support/CommandLine.h" 41 #include "llvm/Support/Debug.h" 42 #include "llvm/Support/Error.h" 43 #include "llvm/Support/ErrorHandling.h" 44 #include "llvm/Support/FileSystem.h" 45 #include "llvm/Support/SourceMgr.h" 46 #include "llvm/Support/raw_ostream.h" 47 #include "llvm/Transforms/IPO/Internalize.h" 48 #include "llvm/Transforms/Utils/Cloning.h" 49 #include "llvm/Transforms/Utils/FunctionImportUtils.h" 50 #include "llvm/Transforms/Utils/ValueMapper.h" 51 #include <cassert> 52 #include <memory> 53 #include <set> 54 #include <string> 55 #include <system_error> 56 #include <tuple> 57 #include <utility> 58 59 using namespace llvm; 60 61 #define DEBUG_TYPE "function-import" 62 63 STATISTIC(NumImportedFunctionsThinLink, 64 "Number of functions thin link decided to import"); 65 STATISTIC(NumImportedHotFunctionsThinLink, 66 "Number of hot functions thin link decided to import"); 67 STATISTIC(NumImportedCriticalFunctionsThinLink, 68 "Number of critical functions thin link decided to import"); 69 STATISTIC(NumImportedGlobalVarsThinLink, 70 "Number of global variables thin link decided to import"); 71 STATISTIC(NumImportedFunctions, "Number of functions imported in backend"); 72 STATISTIC(NumImportedGlobalVars, 73 "Number of global variables imported in backend"); 74 STATISTIC(NumImportedModules, "Number of modules imported from"); 75 STATISTIC(NumDeadSymbols, "Number of dead stripped symbols in index"); 76 STATISTIC(NumLiveSymbols, "Number of live symbols in index"); 77 78 /// Limit on instruction count of imported functions. 79 static cl::opt<unsigned> ImportInstrLimit( 80 "import-instr-limit", cl::init(100), cl::Hidden, cl::value_desc("N"), 81 cl::desc("Only import functions with less than N instructions")); 82 83 static cl::opt<int> ImportCutoff( 84 "import-cutoff", cl::init(-1), cl::Hidden, cl::value_desc("N"), 85 cl::desc("Only import first N functions if N>=0 (default -1)")); 86 87 static cl::opt<bool> 88 ForceImportAll("force-import-all", cl::init(false), cl::Hidden, 89 cl::desc("Import functions with noinline attribute")); 90 91 static cl::opt<float> 92 ImportInstrFactor("import-instr-evolution-factor", cl::init(0.7), 93 cl::Hidden, cl::value_desc("x"), 94 cl::desc("As we import functions, multiply the " 95 "`import-instr-limit` threshold by this factor " 96 "before processing newly imported functions")); 97 98 static cl::opt<float> ImportHotInstrFactor( 99 "import-hot-evolution-factor", cl::init(1.0), cl::Hidden, 100 cl::value_desc("x"), 101 cl::desc("As we import functions called from hot callsite, multiply the " 102 "`import-instr-limit` threshold by this factor " 103 "before processing newly imported functions")); 104 105 static cl::opt<float> ImportHotMultiplier( 106 "import-hot-multiplier", cl::init(10.0), cl::Hidden, cl::value_desc("x"), 107 cl::desc("Multiply the `import-instr-limit` threshold for hot callsites")); 108 109 static cl::opt<float> ImportCriticalMultiplier( 110 "import-critical-multiplier", cl::init(100.0), cl::Hidden, 111 cl::value_desc("x"), 112 cl::desc( 113 "Multiply the `import-instr-limit` threshold for critical callsites")); 114 115 // FIXME: This multiplier was not really tuned up. 116 static cl::opt<float> ImportColdMultiplier( 117 "import-cold-multiplier", cl::init(0), cl::Hidden, cl::value_desc("N"), 118 cl::desc("Multiply the `import-instr-limit` threshold for cold callsites")); 119 120 static cl::opt<bool> PrintImports("print-imports", cl::init(false), cl::Hidden, 121 cl::desc("Print imported functions")); 122 123 static cl::opt<bool> PrintImportFailures( 124 "print-import-failures", cl::init(false), cl::Hidden, 125 cl::desc("Print information for functions rejected for importing")); 126 127 static cl::opt<bool> ComputeDead("compute-dead", cl::init(true), cl::Hidden, 128 cl::desc("Compute dead symbols")); 129 130 static cl::opt<bool> EnableImportMetadata( 131 "enable-import-metadata", cl::init(false), cl::Hidden, 132 cl::desc("Enable import metadata like 'thinlto_src_module'")); 133 134 /// Summary file to use for function importing when using -function-import from 135 /// the command line. 136 static cl::opt<std::string> 137 SummaryFile("summary-file", 138 cl::desc("The summary file to use for function importing.")); 139 140 /// Used when testing importing from distributed indexes via opt 141 // -function-import. 142 static cl::opt<bool> 143 ImportAllIndex("import-all-index", 144 cl::desc("Import all external functions in index.")); 145 146 // Load lazily a module from \p FileName in \p Context. 147 static std::unique_ptr<Module> loadFile(const std::string &FileName, 148 LLVMContext &Context) { 149 SMDiagnostic Err; 150 LLVM_DEBUG(dbgs() << "Loading '" << FileName << "'\n"); 151 // Metadata isn't loaded until functions are imported, to minimize 152 // the memory overhead. 153 std::unique_ptr<Module> Result = 154 getLazyIRFileModule(FileName, Err, Context, 155 /* ShouldLazyLoadMetadata = */ true); 156 if (!Result) { 157 Err.print("function-import", errs()); 158 report_fatal_error("Abort"); 159 } 160 161 return Result; 162 } 163 164 /// Given a list of possible callee implementation for a call site, select one 165 /// that fits the \p Threshold. 166 /// 167 /// FIXME: select "best" instead of first that fits. But what is "best"? 168 /// - The smallest: more likely to be inlined. 169 /// - The one with the least outgoing edges (already well optimized). 170 /// - One from a module already being imported from in order to reduce the 171 /// number of source modules parsed/linked. 172 /// - One that has PGO data attached. 173 /// - [insert you fancy metric here] 174 static const GlobalValueSummary * 175 selectCallee(const ModuleSummaryIndex &Index, 176 ArrayRef<std::unique_ptr<GlobalValueSummary>> CalleeSummaryList, 177 unsigned Threshold, StringRef CallerModulePath, 178 FunctionImporter::ImportFailureReason &Reason, 179 GlobalValue::GUID GUID) { 180 Reason = FunctionImporter::ImportFailureReason::None; 181 auto It = llvm::find_if( 182 CalleeSummaryList, 183 [&](const std::unique_ptr<GlobalValueSummary> &SummaryPtr) { 184 auto *GVSummary = SummaryPtr.get(); 185 if (!Index.isGlobalValueLive(GVSummary)) { 186 Reason = FunctionImporter::ImportFailureReason::NotLive; 187 return false; 188 } 189 190 // For SamplePGO, in computeImportForFunction the OriginalId 191 // may have been used to locate the callee summary list (See 192 // comment there). 193 // The mapping from OriginalId to GUID may return a GUID 194 // that corresponds to a static variable. Filter it out here. 195 // This can happen when 196 // 1) There is a call to a library function which is not defined 197 // in the index. 198 // 2) There is a static variable with the OriginalGUID identical 199 // to the GUID of the library function in 1); 200 // When this happens, the logic for SamplePGO kicks in and 201 // the static variable in 2) will be found, which needs to be 202 // filtered out. 203 if (GVSummary->getSummaryKind() == GlobalValueSummary::GlobalVarKind) { 204 Reason = FunctionImporter::ImportFailureReason::GlobalVar; 205 return false; 206 } 207 if (GlobalValue::isInterposableLinkage(GVSummary->linkage())) { 208 Reason = FunctionImporter::ImportFailureReason::InterposableLinkage; 209 // There is no point in importing these, we can't inline them 210 return false; 211 } 212 213 auto *Summary = cast<FunctionSummary>(GVSummary->getBaseObject()); 214 215 // If this is a local function, make sure we import the copy 216 // in the caller's module. The only time a local function can 217 // share an entry in the index is if there is a local with the same name 218 // in another module that had the same source file name (in a different 219 // directory), where each was compiled in their own directory so there 220 // was not distinguishing path. 221 // However, do the import from another module if there is only one 222 // entry in the list - in that case this must be a reference due 223 // to indirect call profile data, since a function pointer can point to 224 // a local in another module. 225 if (GlobalValue::isLocalLinkage(Summary->linkage()) && 226 CalleeSummaryList.size() > 1 && 227 Summary->modulePath() != CallerModulePath) { 228 Reason = 229 FunctionImporter::ImportFailureReason::LocalLinkageNotInModule; 230 return false; 231 } 232 233 if ((Summary->instCount() > Threshold) && 234 !Summary->fflags().AlwaysInline && !ForceImportAll) { 235 Reason = FunctionImporter::ImportFailureReason::TooLarge; 236 return false; 237 } 238 239 // Skip if it isn't legal to import (e.g. may reference unpromotable 240 // locals). 241 if (Summary->notEligibleToImport()) { 242 Reason = FunctionImporter::ImportFailureReason::NotEligible; 243 return false; 244 } 245 246 // Don't bother importing if we can't inline it anyway. 247 if (Summary->fflags().NoInline && !ForceImportAll) { 248 Reason = FunctionImporter::ImportFailureReason::NoInline; 249 return false; 250 } 251 252 return true; 253 }); 254 if (It == CalleeSummaryList.end()) 255 return nullptr; 256 257 return cast<GlobalValueSummary>(It->get()); 258 } 259 260 namespace { 261 262 using EdgeInfo = 263 std::tuple<const GlobalValueSummary *, unsigned /* Threshold */>; 264 265 } // anonymous namespace 266 267 static ValueInfo 268 updateValueInfoForIndirectCalls(const ModuleSummaryIndex &Index, ValueInfo VI) { 269 if (!VI.getSummaryList().empty()) 270 return VI; 271 // For SamplePGO, the indirect call targets for local functions will 272 // have its original name annotated in profile. We try to find the 273 // corresponding PGOFuncName as the GUID. 274 // FIXME: Consider updating the edges in the graph after building 275 // it, rather than needing to perform this mapping on each walk. 276 auto GUID = Index.getGUIDFromOriginalID(VI.getGUID()); 277 if (GUID == 0) 278 return ValueInfo(); 279 return Index.getValueInfo(GUID); 280 } 281 282 static bool shouldImportGlobal(const ValueInfo &VI, 283 const GVSummaryMapTy &DefinedGVSummaries) { 284 const auto &GVS = DefinedGVSummaries.find(VI.getGUID()); 285 if (GVS == DefinedGVSummaries.end()) 286 return true; 287 // We should not skip import if the module contains a definition with 288 // interposable linkage type. This is required for correctness in 289 // the situation with two following conditions: 290 // * the def with interposable linkage is non-prevailing, 291 // * there is a prevailing def available for import and marked read-only. 292 // In this case, the non-prevailing def will be converted to a declaration, 293 // while the prevailing one becomes internal, thus no definitions will be 294 // available for linking. In order to prevent undefined symbol link error, 295 // the prevailing definition must be imported. 296 // FIXME: Consider adding a check that the suitable prevailing definition 297 // exists and marked read-only. 298 if (VI.getSummaryList().size() > 1 && 299 GlobalValue::isInterposableLinkage(GVS->second->linkage())) 300 return true; 301 302 return false; 303 } 304 305 static void computeImportForReferencedGlobals( 306 const GlobalValueSummary &Summary, const ModuleSummaryIndex &Index, 307 const GVSummaryMapTy &DefinedGVSummaries, 308 SmallVectorImpl<EdgeInfo> &Worklist, 309 FunctionImporter::ImportMapTy &ImportList, 310 StringMap<FunctionImporter::ExportSetTy> *ExportLists) { 311 for (auto &VI : Summary.refs()) { 312 if (!shouldImportGlobal(VI, DefinedGVSummaries)) { 313 LLVM_DEBUG( 314 dbgs() << "Ref ignored! Target already in destination module.\n"); 315 continue; 316 } 317 318 LLVM_DEBUG(dbgs() << " ref -> " << VI << "\n"); 319 320 // If this is a local variable, make sure we import the copy 321 // in the caller's module. The only time a local variable can 322 // share an entry in the index is if there is a local with the same name 323 // in another module that had the same source file name (in a different 324 // directory), where each was compiled in their own directory so there 325 // was not distinguishing path. 326 auto LocalNotInModule = [&](const GlobalValueSummary *RefSummary) -> bool { 327 return GlobalValue::isLocalLinkage(RefSummary->linkage()) && 328 RefSummary->modulePath() != Summary.modulePath(); 329 }; 330 331 for (auto &RefSummary : VI.getSummaryList()) 332 if (isa<GlobalVarSummary>(RefSummary.get()) && 333 Index.canImportGlobalVar(RefSummary.get(), /* AnalyzeRefs */ true) && 334 !LocalNotInModule(RefSummary.get())) { 335 auto ILI = ImportList[RefSummary->modulePath()].insert(VI.getGUID()); 336 // Only update stat and exports if we haven't already imported this 337 // variable. 338 if (!ILI.second) 339 break; 340 NumImportedGlobalVarsThinLink++; 341 // Any references made by this variable will be marked exported later, 342 // in ComputeCrossModuleImport, after import decisions are complete, 343 // which is more efficient than adding them here. 344 if (ExportLists) 345 (*ExportLists)[RefSummary->modulePath()].insert(VI); 346 347 // If variable is not writeonly we attempt to recursively analyze 348 // its references in order to import referenced constants. 349 if (!Index.isWriteOnly(cast<GlobalVarSummary>(RefSummary.get()))) 350 Worklist.emplace_back(RefSummary.get(), 0); 351 break; 352 } 353 } 354 } 355 356 static const char * 357 getFailureName(FunctionImporter::ImportFailureReason Reason) { 358 switch (Reason) { 359 case FunctionImporter::ImportFailureReason::None: 360 return "None"; 361 case FunctionImporter::ImportFailureReason::GlobalVar: 362 return "GlobalVar"; 363 case FunctionImporter::ImportFailureReason::NotLive: 364 return "NotLive"; 365 case FunctionImporter::ImportFailureReason::TooLarge: 366 return "TooLarge"; 367 case FunctionImporter::ImportFailureReason::InterposableLinkage: 368 return "InterposableLinkage"; 369 case FunctionImporter::ImportFailureReason::LocalLinkageNotInModule: 370 return "LocalLinkageNotInModule"; 371 case FunctionImporter::ImportFailureReason::NotEligible: 372 return "NotEligible"; 373 case FunctionImporter::ImportFailureReason::NoInline: 374 return "NoInline"; 375 } 376 llvm_unreachable("invalid reason"); 377 } 378 379 /// Compute the list of functions to import for a given caller. Mark these 380 /// imported functions and the symbols they reference in their source module as 381 /// exported from their source module. 382 static void computeImportForFunction( 383 const FunctionSummary &Summary, const ModuleSummaryIndex &Index, 384 const unsigned Threshold, const GVSummaryMapTy &DefinedGVSummaries, 385 SmallVectorImpl<EdgeInfo> &Worklist, 386 FunctionImporter::ImportMapTy &ImportList, 387 StringMap<FunctionImporter::ExportSetTy> *ExportLists, 388 FunctionImporter::ImportThresholdsTy &ImportThresholds) { 389 computeImportForReferencedGlobals(Summary, Index, DefinedGVSummaries, 390 Worklist, ImportList, ExportLists); 391 static int ImportCount = 0; 392 for (auto &Edge : Summary.calls()) { 393 ValueInfo VI = Edge.first; 394 LLVM_DEBUG(dbgs() << " edge -> " << VI << " Threshold:" << Threshold 395 << "\n"); 396 397 if (ImportCutoff >= 0 && ImportCount >= ImportCutoff) { 398 LLVM_DEBUG(dbgs() << "ignored! import-cutoff value of " << ImportCutoff 399 << " reached.\n"); 400 continue; 401 } 402 403 VI = updateValueInfoForIndirectCalls(Index, VI); 404 if (!VI) 405 continue; 406 407 if (DefinedGVSummaries.count(VI.getGUID())) { 408 // FIXME: Consider not skipping import if the module contains 409 // a non-prevailing def with interposable linkage. The prevailing copy 410 // can safely be imported (see shouldImportGlobal()). 411 LLVM_DEBUG(dbgs() << "ignored! Target already in destination module.\n"); 412 continue; 413 } 414 415 auto GetBonusMultiplier = [](CalleeInfo::HotnessType Hotness) -> float { 416 if (Hotness == CalleeInfo::HotnessType::Hot) 417 return ImportHotMultiplier; 418 if (Hotness == CalleeInfo::HotnessType::Cold) 419 return ImportColdMultiplier; 420 if (Hotness == CalleeInfo::HotnessType::Critical) 421 return ImportCriticalMultiplier; 422 return 1.0; 423 }; 424 425 const auto NewThreshold = 426 Threshold * GetBonusMultiplier(Edge.second.getHotness()); 427 428 auto IT = ImportThresholds.insert(std::make_pair( 429 VI.getGUID(), std::make_tuple(NewThreshold, nullptr, nullptr))); 430 bool PreviouslyVisited = !IT.second; 431 auto &ProcessedThreshold = std::get<0>(IT.first->second); 432 auto &CalleeSummary = std::get<1>(IT.first->second); 433 auto &FailureInfo = std::get<2>(IT.first->second); 434 435 bool IsHotCallsite = 436 Edge.second.getHotness() == CalleeInfo::HotnessType::Hot; 437 bool IsCriticalCallsite = 438 Edge.second.getHotness() == CalleeInfo::HotnessType::Critical; 439 440 const FunctionSummary *ResolvedCalleeSummary = nullptr; 441 if (CalleeSummary) { 442 assert(PreviouslyVisited); 443 // Since the traversal of the call graph is DFS, we can revisit a function 444 // a second time with a higher threshold. In this case, it is added back 445 // to the worklist with the new threshold (so that its own callee chains 446 // can be considered with the higher threshold). 447 if (NewThreshold <= ProcessedThreshold) { 448 LLVM_DEBUG( 449 dbgs() << "ignored! Target was already imported with Threshold " 450 << ProcessedThreshold << "\n"); 451 continue; 452 } 453 // Update with new larger threshold. 454 ProcessedThreshold = NewThreshold; 455 ResolvedCalleeSummary = cast<FunctionSummary>(CalleeSummary); 456 } else { 457 // If we already rejected importing a callee at the same or higher 458 // threshold, don't waste time calling selectCallee. 459 if (PreviouslyVisited && NewThreshold <= ProcessedThreshold) { 460 LLVM_DEBUG( 461 dbgs() << "ignored! Target was already rejected with Threshold " 462 << ProcessedThreshold << "\n"); 463 if (PrintImportFailures) { 464 assert(FailureInfo && 465 "Expected FailureInfo for previously rejected candidate"); 466 FailureInfo->Attempts++; 467 } 468 continue; 469 } 470 471 FunctionImporter::ImportFailureReason Reason; 472 CalleeSummary = selectCallee(Index, VI.getSummaryList(), NewThreshold, 473 Summary.modulePath(), Reason, VI.getGUID()); 474 if (!CalleeSummary) { 475 // Update with new larger threshold if this was a retry (otherwise 476 // we would have already inserted with NewThreshold above). Also 477 // update failure info if requested. 478 if (PreviouslyVisited) { 479 ProcessedThreshold = NewThreshold; 480 if (PrintImportFailures) { 481 assert(FailureInfo && 482 "Expected FailureInfo for previously rejected candidate"); 483 FailureInfo->Reason = Reason; 484 FailureInfo->Attempts++; 485 FailureInfo->MaxHotness = 486 std::max(FailureInfo->MaxHotness, Edge.second.getHotness()); 487 } 488 } else if (PrintImportFailures) { 489 assert(!FailureInfo && 490 "Expected no FailureInfo for newly rejected candidate"); 491 FailureInfo = std::make_unique<FunctionImporter::ImportFailureInfo>( 492 VI, Edge.second.getHotness(), Reason, 1); 493 } 494 if (ForceImportAll) { 495 std::string Msg = std::string("Failed to import function ") + 496 VI.name().str() + " due to " + 497 getFailureName(Reason); 498 auto Error = make_error<StringError>( 499 Msg, std::make_error_code(std::errc::operation_not_supported)); 500 logAllUnhandledErrors(std::move(Error), errs(), 501 "Error importing module: "); 502 break; 503 } else { 504 LLVM_DEBUG(dbgs() 505 << "ignored! No qualifying callee with summary found.\n"); 506 continue; 507 } 508 } 509 510 // "Resolve" the summary 511 CalleeSummary = CalleeSummary->getBaseObject(); 512 ResolvedCalleeSummary = cast<FunctionSummary>(CalleeSummary); 513 514 assert((ResolvedCalleeSummary->fflags().AlwaysInline || ForceImportAll || 515 (ResolvedCalleeSummary->instCount() <= NewThreshold)) && 516 "selectCallee() didn't honor the threshold"); 517 518 auto ExportModulePath = ResolvedCalleeSummary->modulePath(); 519 auto ILI = ImportList[ExportModulePath].insert(VI.getGUID()); 520 // We previously decided to import this GUID definition if it was already 521 // inserted in the set of imports from the exporting module. 522 bool PreviouslyImported = !ILI.second; 523 if (!PreviouslyImported) { 524 NumImportedFunctionsThinLink++; 525 if (IsHotCallsite) 526 NumImportedHotFunctionsThinLink++; 527 if (IsCriticalCallsite) 528 NumImportedCriticalFunctionsThinLink++; 529 } 530 531 // Any calls/references made by this function will be marked exported 532 // later, in ComputeCrossModuleImport, after import decisions are 533 // complete, which is more efficient than adding them here. 534 if (ExportLists) 535 (*ExportLists)[ExportModulePath].insert(VI); 536 } 537 538 auto GetAdjustedThreshold = [](unsigned Threshold, bool IsHotCallsite) { 539 // Adjust the threshold for next level of imported functions. 540 // The threshold is different for hot callsites because we can then 541 // inline chains of hot calls. 542 if (IsHotCallsite) 543 return Threshold * ImportHotInstrFactor; 544 return Threshold * ImportInstrFactor; 545 }; 546 547 const auto AdjThreshold = GetAdjustedThreshold(Threshold, IsHotCallsite); 548 549 ImportCount++; 550 551 // Insert the newly imported function to the worklist. 552 Worklist.emplace_back(ResolvedCalleeSummary, AdjThreshold); 553 } 554 } 555 556 /// Given the list of globals defined in a module, compute the list of imports 557 /// as well as the list of "exports", i.e. the list of symbols referenced from 558 /// another module (that may require promotion). 559 static void ComputeImportForModule( 560 const GVSummaryMapTy &DefinedGVSummaries, const ModuleSummaryIndex &Index, 561 StringRef ModName, FunctionImporter::ImportMapTy &ImportList, 562 StringMap<FunctionImporter::ExportSetTy> *ExportLists = nullptr) { 563 // Worklist contains the list of function imported in this module, for which 564 // we will analyse the callees and may import further down the callgraph. 565 SmallVector<EdgeInfo, 128> Worklist; 566 FunctionImporter::ImportThresholdsTy ImportThresholds; 567 568 // Populate the worklist with the import for the functions in the current 569 // module 570 for (auto &GVSummary : DefinedGVSummaries) { 571 #ifndef NDEBUG 572 // FIXME: Change the GVSummaryMapTy to hold ValueInfo instead of GUID 573 // so this map look up (and possibly others) can be avoided. 574 auto VI = Index.getValueInfo(GVSummary.first); 575 #endif 576 if (!Index.isGlobalValueLive(GVSummary.second)) { 577 LLVM_DEBUG(dbgs() << "Ignores Dead GUID: " << VI << "\n"); 578 continue; 579 } 580 auto *FuncSummary = 581 dyn_cast<FunctionSummary>(GVSummary.second->getBaseObject()); 582 if (!FuncSummary) 583 // Skip import for global variables 584 continue; 585 LLVM_DEBUG(dbgs() << "Initialize import for " << VI << "\n"); 586 computeImportForFunction(*FuncSummary, Index, ImportInstrLimit, 587 DefinedGVSummaries, Worklist, ImportList, 588 ExportLists, ImportThresholds); 589 } 590 591 // Process the newly imported functions and add callees to the worklist. 592 while (!Worklist.empty()) { 593 auto GVInfo = Worklist.pop_back_val(); 594 auto *Summary = std::get<0>(GVInfo); 595 auto Threshold = std::get<1>(GVInfo); 596 597 if (auto *FS = dyn_cast<FunctionSummary>(Summary)) 598 computeImportForFunction(*FS, Index, Threshold, DefinedGVSummaries, 599 Worklist, ImportList, ExportLists, 600 ImportThresholds); 601 else 602 computeImportForReferencedGlobals(*Summary, Index, DefinedGVSummaries, 603 Worklist, ImportList, ExportLists); 604 } 605 606 // Print stats about functions considered but rejected for importing 607 // when requested. 608 if (PrintImportFailures) { 609 dbgs() << "Missed imports into module " << ModName << "\n"; 610 for (auto &I : ImportThresholds) { 611 auto &ProcessedThreshold = std::get<0>(I.second); 612 auto &CalleeSummary = std::get<1>(I.second); 613 auto &FailureInfo = std::get<2>(I.second); 614 if (CalleeSummary) 615 continue; // We are going to import. 616 assert(FailureInfo); 617 FunctionSummary *FS = nullptr; 618 if (!FailureInfo->VI.getSummaryList().empty()) 619 FS = dyn_cast<FunctionSummary>( 620 FailureInfo->VI.getSummaryList()[0]->getBaseObject()); 621 dbgs() << FailureInfo->VI 622 << ": Reason = " << getFailureName(FailureInfo->Reason) 623 << ", Threshold = " << ProcessedThreshold 624 << ", Size = " << (FS ? (int)FS->instCount() : -1) 625 << ", MaxHotness = " << getHotnessName(FailureInfo->MaxHotness) 626 << ", Attempts = " << FailureInfo->Attempts << "\n"; 627 } 628 } 629 } 630 631 #ifndef NDEBUG 632 static bool isGlobalVarSummary(const ModuleSummaryIndex &Index, ValueInfo VI) { 633 auto SL = VI.getSummaryList(); 634 return SL.empty() 635 ? false 636 : SL[0]->getSummaryKind() == GlobalValueSummary::GlobalVarKind; 637 } 638 639 static bool isGlobalVarSummary(const ModuleSummaryIndex &Index, 640 GlobalValue::GUID G) { 641 if (const auto &VI = Index.getValueInfo(G)) 642 return isGlobalVarSummary(Index, VI); 643 return false; 644 } 645 646 template <class T> 647 static unsigned numGlobalVarSummaries(const ModuleSummaryIndex &Index, 648 T &Cont) { 649 unsigned NumGVS = 0; 650 for (auto &V : Cont) 651 if (isGlobalVarSummary(Index, V)) 652 ++NumGVS; 653 return NumGVS; 654 } 655 #endif 656 657 #ifndef NDEBUG 658 static bool 659 checkVariableImport(const ModuleSummaryIndex &Index, 660 StringMap<FunctionImporter::ImportMapTy> &ImportLists, 661 StringMap<FunctionImporter::ExportSetTy> &ExportLists) { 662 663 DenseSet<GlobalValue::GUID> FlattenedImports; 664 665 for (auto &ImportPerModule : ImportLists) 666 for (auto &ExportPerModule : ImportPerModule.second) 667 FlattenedImports.insert(ExportPerModule.second.begin(), 668 ExportPerModule.second.end()); 669 670 // Checks that all GUIDs of read/writeonly vars we see in export lists 671 // are also in the import lists. Otherwise we my face linker undefs, 672 // because readonly and writeonly vars are internalized in their 673 // source modules. 674 auto IsReadOrWriteOnlyVar = [&](StringRef ModulePath, const ValueInfo &VI) { 675 auto *GVS = dyn_cast_or_null<GlobalVarSummary>( 676 Index.findSummaryInModule(VI, ModulePath)); 677 return GVS && (Index.isReadOnly(GVS) || Index.isWriteOnly(GVS)); 678 }; 679 680 for (auto &ExportPerModule : ExportLists) 681 for (auto &VI : ExportPerModule.second) 682 if (!FlattenedImports.count(VI.getGUID()) && 683 IsReadOrWriteOnlyVar(ExportPerModule.first(), VI)) 684 return false; 685 686 return true; 687 } 688 #endif 689 690 /// Compute all the import and export for every module using the Index. 691 void llvm::ComputeCrossModuleImport( 692 const ModuleSummaryIndex &Index, 693 const StringMap<GVSummaryMapTy> &ModuleToDefinedGVSummaries, 694 StringMap<FunctionImporter::ImportMapTy> &ImportLists, 695 StringMap<FunctionImporter::ExportSetTy> &ExportLists) { 696 // For each module that has function defined, compute the import/export lists. 697 for (auto &DefinedGVSummaries : ModuleToDefinedGVSummaries) { 698 auto &ImportList = ImportLists[DefinedGVSummaries.first()]; 699 LLVM_DEBUG(dbgs() << "Computing import for Module '" 700 << DefinedGVSummaries.first() << "'\n"); 701 ComputeImportForModule(DefinedGVSummaries.second, Index, 702 DefinedGVSummaries.first(), ImportList, 703 &ExportLists); 704 } 705 706 // When computing imports we only added the variables and functions being 707 // imported to the export list. We also need to mark any references and calls 708 // they make as exported as well. We do this here, as it is more efficient 709 // since we may import the same values multiple times into different modules 710 // during the import computation. 711 for (auto &ELI : ExportLists) { 712 FunctionImporter::ExportSetTy NewExports; 713 const auto &DefinedGVSummaries = 714 ModuleToDefinedGVSummaries.lookup(ELI.first()); 715 for (auto &EI : ELI.second) { 716 // Find the copy defined in the exporting module so that we can mark the 717 // values it references in that specific definition as exported. 718 // Below we will add all references and called values, without regard to 719 // whether they are also defined in this module. We subsequently prune the 720 // list to only include those defined in the exporting module, see comment 721 // there as to why. 722 auto DS = DefinedGVSummaries.find(EI.getGUID()); 723 // Anything marked exported during the import computation must have been 724 // defined in the exporting module. 725 assert(DS != DefinedGVSummaries.end()); 726 auto *S = DS->getSecond(); 727 S = S->getBaseObject(); 728 if (auto *GVS = dyn_cast<GlobalVarSummary>(S)) { 729 // Export referenced functions and variables. We don't export/promote 730 // objects referenced by writeonly variable initializer, because 731 // we convert such variables initializers to "zeroinitializer". 732 // See processGlobalForThinLTO. 733 if (!Index.isWriteOnly(GVS)) 734 for (const auto &VI : GVS->refs()) 735 NewExports.insert(VI); 736 } else { 737 auto *FS = cast<FunctionSummary>(S); 738 for (auto &Edge : FS->calls()) 739 NewExports.insert(Edge.first); 740 for (auto &Ref : FS->refs()) 741 NewExports.insert(Ref); 742 } 743 } 744 // Prune list computed above to only include values defined in the exporting 745 // module. We do this after the above insertion since we may hit the same 746 // ref/call target multiple times in above loop, and it is more efficient to 747 // avoid a set lookup each time. 748 for (auto EI = NewExports.begin(); EI != NewExports.end();) { 749 if (!DefinedGVSummaries.count(EI->getGUID())) 750 NewExports.erase(EI++); 751 else 752 ++EI; 753 } 754 ELI.second.insert(NewExports.begin(), NewExports.end()); 755 } 756 757 assert(checkVariableImport(Index, ImportLists, ExportLists)); 758 #ifndef NDEBUG 759 LLVM_DEBUG(dbgs() << "Import/Export lists for " << ImportLists.size() 760 << " modules:\n"); 761 for (auto &ModuleImports : ImportLists) { 762 auto ModName = ModuleImports.first(); 763 auto &Exports = ExportLists[ModName]; 764 unsigned NumGVS = numGlobalVarSummaries(Index, Exports); 765 LLVM_DEBUG(dbgs() << "* Module " << ModName << " exports " 766 << Exports.size() - NumGVS << " functions and " << NumGVS 767 << " vars. Imports from " << ModuleImports.second.size() 768 << " modules.\n"); 769 for (auto &Src : ModuleImports.second) { 770 auto SrcModName = Src.first(); 771 unsigned NumGVSPerMod = numGlobalVarSummaries(Index, Src.second); 772 LLVM_DEBUG(dbgs() << " - " << Src.second.size() - NumGVSPerMod 773 << " functions imported from " << SrcModName << "\n"); 774 LLVM_DEBUG(dbgs() << " - " << NumGVSPerMod 775 << " global vars imported from " << SrcModName << "\n"); 776 } 777 } 778 #endif 779 } 780 781 #ifndef NDEBUG 782 static void dumpImportListForModule(const ModuleSummaryIndex &Index, 783 StringRef ModulePath, 784 FunctionImporter::ImportMapTy &ImportList) { 785 LLVM_DEBUG(dbgs() << "* Module " << ModulePath << " imports from " 786 << ImportList.size() << " modules.\n"); 787 for (auto &Src : ImportList) { 788 auto SrcModName = Src.first(); 789 unsigned NumGVSPerMod = numGlobalVarSummaries(Index, Src.second); 790 LLVM_DEBUG(dbgs() << " - " << Src.second.size() - NumGVSPerMod 791 << " functions imported from " << SrcModName << "\n"); 792 LLVM_DEBUG(dbgs() << " - " << NumGVSPerMod << " vars imported from " 793 << SrcModName << "\n"); 794 } 795 } 796 #endif 797 798 /// Compute all the imports for the given module in the Index. 799 void llvm::ComputeCrossModuleImportForModule( 800 StringRef ModulePath, const ModuleSummaryIndex &Index, 801 FunctionImporter::ImportMapTy &ImportList) { 802 // Collect the list of functions this module defines. 803 // GUID -> Summary 804 GVSummaryMapTy FunctionSummaryMap; 805 Index.collectDefinedFunctionsForModule(ModulePath, FunctionSummaryMap); 806 807 // Compute the import list for this module. 808 LLVM_DEBUG(dbgs() << "Computing import for Module '" << ModulePath << "'\n"); 809 ComputeImportForModule(FunctionSummaryMap, Index, ModulePath, ImportList); 810 811 #ifndef NDEBUG 812 dumpImportListForModule(Index, ModulePath, ImportList); 813 #endif 814 } 815 816 // Mark all external summaries in Index for import into the given module. 817 // Used for distributed builds using a distributed index. 818 void llvm::ComputeCrossModuleImportForModuleFromIndex( 819 StringRef ModulePath, const ModuleSummaryIndex &Index, 820 FunctionImporter::ImportMapTy &ImportList) { 821 for (auto &GlobalList : Index) { 822 // Ignore entries for undefined references. 823 if (GlobalList.second.SummaryList.empty()) 824 continue; 825 826 auto GUID = GlobalList.first; 827 assert(GlobalList.second.SummaryList.size() == 1 && 828 "Expected individual combined index to have one summary per GUID"); 829 auto &Summary = GlobalList.second.SummaryList[0]; 830 // Skip the summaries for the importing module. These are included to 831 // e.g. record required linkage changes. 832 if (Summary->modulePath() == ModulePath) 833 continue; 834 // Add an entry to provoke importing by thinBackend. 835 ImportList[Summary->modulePath()].insert(GUID); 836 } 837 #ifndef NDEBUG 838 dumpImportListForModule(Index, ModulePath, ImportList); 839 #endif 840 } 841 842 void llvm::computeDeadSymbols( 843 ModuleSummaryIndex &Index, 844 const DenseSet<GlobalValue::GUID> &GUIDPreservedSymbols, 845 function_ref<PrevailingType(GlobalValue::GUID)> isPrevailing) { 846 assert(!Index.withGlobalValueDeadStripping()); 847 if (!ComputeDead) 848 return; 849 if (GUIDPreservedSymbols.empty()) 850 // Don't do anything when nothing is live, this is friendly with tests. 851 return; 852 unsigned LiveSymbols = 0; 853 SmallVector<ValueInfo, 128> Worklist; 854 Worklist.reserve(GUIDPreservedSymbols.size() * 2); 855 for (auto GUID : GUIDPreservedSymbols) { 856 ValueInfo VI = Index.getValueInfo(GUID); 857 if (!VI) 858 continue; 859 for (auto &S : VI.getSummaryList()) 860 S->setLive(true); 861 } 862 863 // Add values flagged in the index as live roots to the worklist. 864 for (const auto &Entry : Index) { 865 auto VI = Index.getValueInfo(Entry); 866 for (auto &S : Entry.second.SummaryList) 867 if (S->isLive()) { 868 LLVM_DEBUG(dbgs() << "Live root: " << VI << "\n"); 869 Worklist.push_back(VI); 870 ++LiveSymbols; 871 break; 872 } 873 } 874 875 // Make value live and add it to the worklist if it was not live before. 876 auto visit = [&](ValueInfo VI, bool IsAliasee) { 877 // FIXME: If we knew which edges were created for indirect call profiles, 878 // we could skip them here. Any that are live should be reached via 879 // other edges, e.g. reference edges. Otherwise, using a profile collected 880 // on a slightly different binary might provoke preserving, importing 881 // and ultimately promoting calls to functions not linked into this 882 // binary, which increases the binary size unnecessarily. Note that 883 // if this code changes, the importer needs to change so that edges 884 // to functions marked dead are skipped. 885 VI = updateValueInfoForIndirectCalls(Index, VI); 886 if (!VI) 887 return; 888 889 if (llvm::any_of(VI.getSummaryList(), 890 [](const std::unique_ptr<llvm::GlobalValueSummary> &S) { 891 return S->isLive(); 892 })) 893 return; 894 895 // We only keep live symbols that are known to be non-prevailing if any are 896 // available_externally, linkonceodr, weakodr. Those symbols are discarded 897 // later in the EliminateAvailableExternally pass and setting them to 898 // not-live could break downstreams users of liveness information (PR36483) 899 // or limit optimization opportunities. 900 if (isPrevailing(VI.getGUID()) == PrevailingType::No) { 901 bool KeepAliveLinkage = false; 902 bool Interposable = false; 903 for (auto &S : VI.getSummaryList()) { 904 if (S->linkage() == GlobalValue::AvailableExternallyLinkage || 905 S->linkage() == GlobalValue::WeakODRLinkage || 906 S->linkage() == GlobalValue::LinkOnceODRLinkage) 907 KeepAliveLinkage = true; 908 else if (GlobalValue::isInterposableLinkage(S->linkage())) 909 Interposable = true; 910 } 911 912 if (!IsAliasee) { 913 if (!KeepAliveLinkage) 914 return; 915 916 if (Interposable) 917 report_fatal_error( 918 "Interposable and available_externally/linkonce_odr/weak_odr " 919 "symbol"); 920 } 921 } 922 923 for (auto &S : VI.getSummaryList()) 924 S->setLive(true); 925 ++LiveSymbols; 926 Worklist.push_back(VI); 927 }; 928 929 while (!Worklist.empty()) { 930 auto VI = Worklist.pop_back_val(); 931 for (auto &Summary : VI.getSummaryList()) { 932 if (auto *AS = dyn_cast<AliasSummary>(Summary.get())) { 933 // If this is an alias, visit the aliasee VI to ensure that all copies 934 // are marked live and it is added to the worklist for further 935 // processing of its references. 936 visit(AS->getAliaseeVI(), true); 937 continue; 938 } 939 for (auto Ref : Summary->refs()) 940 visit(Ref, false); 941 if (auto *FS = dyn_cast<FunctionSummary>(Summary.get())) 942 for (auto Call : FS->calls()) 943 visit(Call.first, false); 944 } 945 } 946 Index.setWithGlobalValueDeadStripping(); 947 948 unsigned DeadSymbols = Index.size() - LiveSymbols; 949 LLVM_DEBUG(dbgs() << LiveSymbols << " symbols Live, and " << DeadSymbols 950 << " symbols Dead \n"); 951 NumDeadSymbols += DeadSymbols; 952 NumLiveSymbols += LiveSymbols; 953 } 954 955 // Compute dead symbols and propagate constants in combined index. 956 void llvm::computeDeadSymbolsWithConstProp( 957 ModuleSummaryIndex &Index, 958 const DenseSet<GlobalValue::GUID> &GUIDPreservedSymbols, 959 function_ref<PrevailingType(GlobalValue::GUID)> isPrevailing, 960 bool ImportEnabled) { 961 computeDeadSymbols(Index, GUIDPreservedSymbols, isPrevailing); 962 if (ImportEnabled) 963 Index.propagateAttributes(GUIDPreservedSymbols); 964 } 965 966 /// Compute the set of summaries needed for a ThinLTO backend compilation of 967 /// \p ModulePath. 968 void llvm::gatherImportedSummariesForModule( 969 StringRef ModulePath, 970 const StringMap<GVSummaryMapTy> &ModuleToDefinedGVSummaries, 971 const FunctionImporter::ImportMapTy &ImportList, 972 std::map<std::string, GVSummaryMapTy> &ModuleToSummariesForIndex) { 973 // Include all summaries from the importing module. 974 ModuleToSummariesForIndex[std::string(ModulePath)] = 975 ModuleToDefinedGVSummaries.lookup(ModulePath); 976 // Include summaries for imports. 977 for (auto &ILI : ImportList) { 978 auto &SummariesForIndex = 979 ModuleToSummariesForIndex[std::string(ILI.first())]; 980 const auto &DefinedGVSummaries = 981 ModuleToDefinedGVSummaries.lookup(ILI.first()); 982 for (auto &GI : ILI.second) { 983 const auto &DS = DefinedGVSummaries.find(GI); 984 assert(DS != DefinedGVSummaries.end() && 985 "Expected a defined summary for imported global value"); 986 SummariesForIndex[GI] = DS->second; 987 } 988 } 989 } 990 991 /// Emit the files \p ModulePath will import from into \p OutputFilename. 992 std::error_code llvm::EmitImportsFiles( 993 StringRef ModulePath, StringRef OutputFilename, 994 const std::map<std::string, GVSummaryMapTy> &ModuleToSummariesForIndex) { 995 std::error_code EC; 996 raw_fd_ostream ImportsOS(OutputFilename, EC, sys::fs::OpenFlags::OF_None); 997 if (EC) 998 return EC; 999 for (auto &ILI : ModuleToSummariesForIndex) 1000 // The ModuleToSummariesForIndex map includes an entry for the current 1001 // Module (needed for writing out the index files). We don't want to 1002 // include it in the imports file, however, so filter it out. 1003 if (ILI.first != ModulePath) 1004 ImportsOS << ILI.first << "\n"; 1005 return std::error_code(); 1006 } 1007 1008 bool llvm::convertToDeclaration(GlobalValue &GV) { 1009 LLVM_DEBUG(dbgs() << "Converting to a declaration: `" << GV.getName() 1010 << "\n"); 1011 if (Function *F = dyn_cast<Function>(&GV)) { 1012 F->deleteBody(); 1013 F->clearMetadata(); 1014 F->setComdat(nullptr); 1015 } else if (GlobalVariable *V = dyn_cast<GlobalVariable>(&GV)) { 1016 V->setInitializer(nullptr); 1017 V->setLinkage(GlobalValue::ExternalLinkage); 1018 V->clearMetadata(); 1019 V->setComdat(nullptr); 1020 } else { 1021 GlobalValue *NewGV; 1022 if (GV.getValueType()->isFunctionTy()) 1023 NewGV = 1024 Function::Create(cast<FunctionType>(GV.getValueType()), 1025 GlobalValue::ExternalLinkage, GV.getAddressSpace(), 1026 "", GV.getParent()); 1027 else 1028 NewGV = 1029 new GlobalVariable(*GV.getParent(), GV.getValueType(), 1030 /*isConstant*/ false, GlobalValue::ExternalLinkage, 1031 /*init*/ nullptr, "", 1032 /*insertbefore*/ nullptr, GV.getThreadLocalMode(), 1033 GV.getType()->getAddressSpace()); 1034 NewGV->takeName(&GV); 1035 GV.replaceAllUsesWith(NewGV); 1036 return false; 1037 } 1038 if (!GV.isImplicitDSOLocal()) 1039 GV.setDSOLocal(false); 1040 return true; 1041 } 1042 1043 void llvm::thinLTOResolvePrevailingInModule( 1044 Module &TheModule, const GVSummaryMapTy &DefinedGlobals) { 1045 auto updateLinkage = [&](GlobalValue &GV) { 1046 // See if the global summary analysis computed a new resolved linkage. 1047 const auto &GS = DefinedGlobals.find(GV.getGUID()); 1048 if (GS == DefinedGlobals.end()) 1049 return; 1050 auto NewLinkage = GS->second->linkage(); 1051 if (GlobalValue::isLocalLinkage(GV.getLinkage()) || 1052 // Don't internalize anything here, because the code below 1053 // lacks necessary correctness checks. Leave this job to 1054 // LLVM 'internalize' pass. 1055 GlobalValue::isLocalLinkage(NewLinkage) || 1056 // In case it was dead and already converted to declaration. 1057 GV.isDeclaration()) 1058 return; 1059 1060 // Set the potentially more constraining visibility computed from summaries. 1061 // The DefaultVisibility condition is because older GlobalValueSummary does 1062 // not record DefaultVisibility and we don't want to change protected/hidden 1063 // to default. 1064 if (GS->second->getVisibility() != GlobalValue::DefaultVisibility) 1065 GV.setVisibility(GS->second->getVisibility()); 1066 1067 if (NewLinkage == GV.getLinkage()) 1068 return; 1069 1070 // Check for a non-prevailing def that has interposable linkage 1071 // (e.g. non-odr weak or linkonce). In that case we can't simply 1072 // convert to available_externally, since it would lose the 1073 // interposable property and possibly get inlined. Simply drop 1074 // the definition in that case. 1075 if (GlobalValue::isAvailableExternallyLinkage(NewLinkage) && 1076 GlobalValue::isInterposableLinkage(GV.getLinkage())) { 1077 if (!convertToDeclaration(GV)) 1078 // FIXME: Change this to collect replaced GVs and later erase 1079 // them from the parent module once thinLTOResolvePrevailingGUID is 1080 // changed to enable this for aliases. 1081 llvm_unreachable("Expected GV to be converted"); 1082 } else { 1083 // If all copies of the original symbol had global unnamed addr and 1084 // linkonce_odr linkage, it should be an auto hide symbol. In that case 1085 // the thin link would have marked it as CanAutoHide. Add hidden visibility 1086 // to the symbol to preserve the property. 1087 if (NewLinkage == GlobalValue::WeakODRLinkage && 1088 GS->second->canAutoHide()) { 1089 assert(GV.hasLinkOnceODRLinkage() && GV.hasGlobalUnnamedAddr()); 1090 GV.setVisibility(GlobalValue::HiddenVisibility); 1091 } 1092 1093 LLVM_DEBUG(dbgs() << "ODR fixing up linkage for `" << GV.getName() 1094 << "` from " << GV.getLinkage() << " to " << NewLinkage 1095 << "\n"); 1096 GV.setLinkage(NewLinkage); 1097 } 1098 // Remove declarations from comdats, including available_externally 1099 // as this is a declaration for the linker, and will be dropped eventually. 1100 // It is illegal for comdats to contain declarations. 1101 auto *GO = dyn_cast_or_null<GlobalObject>(&GV); 1102 if (GO && GO->isDeclarationForLinker() && GO->hasComdat()) 1103 GO->setComdat(nullptr); 1104 }; 1105 1106 // Process functions and global now 1107 for (auto &GV : TheModule) 1108 updateLinkage(GV); 1109 for (auto &GV : TheModule.globals()) 1110 updateLinkage(GV); 1111 for (auto &GV : TheModule.aliases()) 1112 updateLinkage(GV); 1113 } 1114 1115 /// Run internalization on \p TheModule based on symmary analysis. 1116 void llvm::thinLTOInternalizeModule(Module &TheModule, 1117 const GVSummaryMapTy &DefinedGlobals) { 1118 // Declare a callback for the internalize pass that will ask for every 1119 // candidate GlobalValue if it can be internalized or not. 1120 auto MustPreserveGV = [&](const GlobalValue &GV) -> bool { 1121 // Lookup the linkage recorded in the summaries during global analysis. 1122 auto GS = DefinedGlobals.find(GV.getGUID()); 1123 if (GS == DefinedGlobals.end()) { 1124 // Must have been promoted (possibly conservatively). Find original 1125 // name so that we can access the correct summary and see if it can 1126 // be internalized again. 1127 // FIXME: Eventually we should control promotion instead of promoting 1128 // and internalizing again. 1129 StringRef OrigName = 1130 ModuleSummaryIndex::getOriginalNameBeforePromote(GV.getName()); 1131 std::string OrigId = GlobalValue::getGlobalIdentifier( 1132 OrigName, GlobalValue::InternalLinkage, 1133 TheModule.getSourceFileName()); 1134 GS = DefinedGlobals.find(GlobalValue::getGUID(OrigId)); 1135 if (GS == DefinedGlobals.end()) { 1136 // Also check the original non-promoted non-globalized name. In some 1137 // cases a preempted weak value is linked in as a local copy because 1138 // it is referenced by an alias (IRLinker::linkGlobalValueProto). 1139 // In that case, since it was originally not a local value, it was 1140 // recorded in the index using the original name. 1141 // FIXME: This may not be needed once PR27866 is fixed. 1142 GS = DefinedGlobals.find(GlobalValue::getGUID(OrigName)); 1143 assert(GS != DefinedGlobals.end()); 1144 } 1145 } 1146 return !GlobalValue::isLocalLinkage(GS->second->linkage()); 1147 }; 1148 1149 // FIXME: See if we can just internalize directly here via linkage changes 1150 // based on the index, rather than invoking internalizeModule. 1151 internalizeModule(TheModule, MustPreserveGV); 1152 } 1153 1154 /// Make alias a clone of its aliasee. 1155 static Function *replaceAliasWithAliasee(Module *SrcModule, GlobalAlias *GA) { 1156 Function *Fn = cast<Function>(GA->getBaseObject()); 1157 1158 ValueToValueMapTy VMap; 1159 Function *NewFn = CloneFunction(Fn, VMap); 1160 // Clone should use the original alias's linkage, visibility and name, and we 1161 // ensure all uses of alias instead use the new clone (casted if necessary). 1162 NewFn->setLinkage(GA->getLinkage()); 1163 NewFn->setVisibility(GA->getVisibility()); 1164 GA->replaceAllUsesWith(ConstantExpr::getBitCast(NewFn, GA->getType())); 1165 NewFn->takeName(GA); 1166 return NewFn; 1167 } 1168 1169 // Internalize values that we marked with specific attribute 1170 // in processGlobalForThinLTO. 1171 static void internalizeGVsAfterImport(Module &M) { 1172 for (auto &GV : M.globals()) 1173 // Skip GVs which have been converted to declarations 1174 // by dropDeadSymbols. 1175 if (!GV.isDeclaration() && GV.hasAttribute("thinlto-internalize")) { 1176 GV.setLinkage(GlobalValue::InternalLinkage); 1177 GV.setVisibility(GlobalValue::DefaultVisibility); 1178 } 1179 } 1180 1181 // Automatically import functions in Module \p DestModule based on the summaries 1182 // index. 1183 Expected<bool> FunctionImporter::importFunctions( 1184 Module &DestModule, const FunctionImporter::ImportMapTy &ImportList) { 1185 LLVM_DEBUG(dbgs() << "Starting import for Module " 1186 << DestModule.getModuleIdentifier() << "\n"); 1187 unsigned ImportedCount = 0, ImportedGVCount = 0; 1188 1189 IRMover Mover(DestModule); 1190 // Do the actual import of functions now, one Module at a time 1191 std::set<StringRef> ModuleNameOrderedList; 1192 for (auto &FunctionsToImportPerModule : ImportList) { 1193 ModuleNameOrderedList.insert(FunctionsToImportPerModule.first()); 1194 } 1195 for (auto &Name : ModuleNameOrderedList) { 1196 // Get the module for the import 1197 const auto &FunctionsToImportPerModule = ImportList.find(Name); 1198 assert(FunctionsToImportPerModule != ImportList.end()); 1199 Expected<std::unique_ptr<Module>> SrcModuleOrErr = ModuleLoader(Name); 1200 if (!SrcModuleOrErr) 1201 return SrcModuleOrErr.takeError(); 1202 std::unique_ptr<Module> SrcModule = std::move(*SrcModuleOrErr); 1203 assert(&DestModule.getContext() == &SrcModule->getContext() && 1204 "Context mismatch"); 1205 1206 // If modules were created with lazy metadata loading, materialize it 1207 // now, before linking it (otherwise this will be a noop). 1208 if (Error Err = SrcModule->materializeMetadata()) 1209 return std::move(Err); 1210 1211 auto &ImportGUIDs = FunctionsToImportPerModule->second; 1212 // Find the globals to import 1213 SetVector<GlobalValue *> GlobalsToImport; 1214 for (Function &F : *SrcModule) { 1215 if (!F.hasName()) 1216 continue; 1217 auto GUID = F.getGUID(); 1218 auto Import = ImportGUIDs.count(GUID); 1219 LLVM_DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing function " 1220 << GUID << " " << F.getName() << " from " 1221 << SrcModule->getSourceFileName() << "\n"); 1222 if (Import) { 1223 if (Error Err = F.materialize()) 1224 return std::move(Err); 1225 if (EnableImportMetadata) { 1226 // Add 'thinlto_src_module' metadata for statistics and debugging. 1227 F.setMetadata( 1228 "thinlto_src_module", 1229 MDNode::get(DestModule.getContext(), 1230 {MDString::get(DestModule.getContext(), 1231 SrcModule->getSourceFileName())})); 1232 } 1233 GlobalsToImport.insert(&F); 1234 } 1235 } 1236 for (GlobalVariable &GV : SrcModule->globals()) { 1237 if (!GV.hasName()) 1238 continue; 1239 auto GUID = GV.getGUID(); 1240 auto Import = ImportGUIDs.count(GUID); 1241 LLVM_DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing global " 1242 << GUID << " " << GV.getName() << " from " 1243 << SrcModule->getSourceFileName() << "\n"); 1244 if (Import) { 1245 if (Error Err = GV.materialize()) 1246 return std::move(Err); 1247 ImportedGVCount += GlobalsToImport.insert(&GV); 1248 } 1249 } 1250 for (GlobalAlias &GA : SrcModule->aliases()) { 1251 if (!GA.hasName()) 1252 continue; 1253 auto GUID = GA.getGUID(); 1254 auto Import = ImportGUIDs.count(GUID); 1255 LLVM_DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing alias " 1256 << GUID << " " << GA.getName() << " from " 1257 << SrcModule->getSourceFileName() << "\n"); 1258 if (Import) { 1259 if (Error Err = GA.materialize()) 1260 return std::move(Err); 1261 // Import alias as a copy of its aliasee. 1262 GlobalObject *Base = GA.getBaseObject(); 1263 if (Error Err = Base->materialize()) 1264 return std::move(Err); 1265 auto *Fn = replaceAliasWithAliasee(SrcModule.get(), &GA); 1266 LLVM_DEBUG(dbgs() << "Is importing aliasee fn " << Base->getGUID() 1267 << " " << Base->getName() << " from " 1268 << SrcModule->getSourceFileName() << "\n"); 1269 if (EnableImportMetadata) { 1270 // Add 'thinlto_src_module' metadata for statistics and debugging. 1271 Fn->setMetadata( 1272 "thinlto_src_module", 1273 MDNode::get(DestModule.getContext(), 1274 {MDString::get(DestModule.getContext(), 1275 SrcModule->getSourceFileName())})); 1276 } 1277 GlobalsToImport.insert(Fn); 1278 } 1279 } 1280 1281 // Upgrade debug info after we're done materializing all the globals and we 1282 // have loaded all the required metadata! 1283 UpgradeDebugInfo(*SrcModule); 1284 1285 // Set the partial sample profile ratio in the profile summary module flag 1286 // of the imported source module, if applicable, so that the profile summary 1287 // module flag will match with that of the destination module when it's 1288 // imported. 1289 SrcModule->setPartialSampleProfileRatio(Index); 1290 1291 // Link in the specified functions. 1292 if (renameModuleForThinLTO(*SrcModule, Index, ClearDSOLocalOnDeclarations, 1293 &GlobalsToImport)) 1294 return true; 1295 1296 if (PrintImports) { 1297 for (const auto *GV : GlobalsToImport) 1298 dbgs() << DestModule.getSourceFileName() << ": Import " << GV->getName() 1299 << " from " << SrcModule->getSourceFileName() << "\n"; 1300 } 1301 1302 if (Error Err = Mover.move( 1303 std::move(SrcModule), GlobalsToImport.getArrayRef(), 1304 [](GlobalValue &, IRMover::ValueAdder) {}, 1305 /*IsPerformingImport=*/true)) 1306 report_fatal_error("Function Import: link error: " + 1307 toString(std::move(Err))); 1308 1309 ImportedCount += GlobalsToImport.size(); 1310 NumImportedModules++; 1311 } 1312 1313 internalizeGVsAfterImport(DestModule); 1314 1315 NumImportedFunctions += (ImportedCount - ImportedGVCount); 1316 NumImportedGlobalVars += ImportedGVCount; 1317 1318 LLVM_DEBUG(dbgs() << "Imported " << ImportedCount - ImportedGVCount 1319 << " functions for Module " 1320 << DestModule.getModuleIdentifier() << "\n"); 1321 LLVM_DEBUG(dbgs() << "Imported " << ImportedGVCount 1322 << " global variables for Module " 1323 << DestModule.getModuleIdentifier() << "\n"); 1324 return ImportedCount; 1325 } 1326 1327 static bool doImportingForModule(Module &M) { 1328 if (SummaryFile.empty()) 1329 report_fatal_error("error: -function-import requires -summary-file\n"); 1330 Expected<std::unique_ptr<ModuleSummaryIndex>> IndexPtrOrErr = 1331 getModuleSummaryIndexForFile(SummaryFile); 1332 if (!IndexPtrOrErr) { 1333 logAllUnhandledErrors(IndexPtrOrErr.takeError(), errs(), 1334 "Error loading file '" + SummaryFile + "': "); 1335 return false; 1336 } 1337 std::unique_ptr<ModuleSummaryIndex> Index = std::move(*IndexPtrOrErr); 1338 1339 // First step is collecting the import list. 1340 FunctionImporter::ImportMapTy ImportList; 1341 // If requested, simply import all functions in the index. This is used 1342 // when testing distributed backend handling via the opt tool, when 1343 // we have distributed indexes containing exactly the summaries to import. 1344 if (ImportAllIndex) 1345 ComputeCrossModuleImportForModuleFromIndex(M.getModuleIdentifier(), *Index, 1346 ImportList); 1347 else 1348 ComputeCrossModuleImportForModule(M.getModuleIdentifier(), *Index, 1349 ImportList); 1350 1351 // Conservatively mark all internal values as promoted. This interface is 1352 // only used when doing importing via the function importing pass. The pass 1353 // is only enabled when testing importing via the 'opt' tool, which does 1354 // not do the ThinLink that would normally determine what values to promote. 1355 for (auto &I : *Index) { 1356 for (auto &S : I.second.SummaryList) { 1357 if (GlobalValue::isLocalLinkage(S->linkage())) 1358 S->setLinkage(GlobalValue::ExternalLinkage); 1359 } 1360 } 1361 1362 // Next we need to promote to global scope and rename any local values that 1363 // are potentially exported to other modules. 1364 if (renameModuleForThinLTO(M, *Index, /*ClearDSOLocalOnDeclarations=*/false, 1365 /*GlobalsToImport=*/nullptr)) { 1366 errs() << "Error renaming module\n"; 1367 return false; 1368 } 1369 1370 // Perform the import now. 1371 auto ModuleLoader = [&M](StringRef Identifier) { 1372 return loadFile(std::string(Identifier), M.getContext()); 1373 }; 1374 FunctionImporter Importer(*Index, ModuleLoader, 1375 /*ClearDSOLocalOnDeclarations=*/false); 1376 Expected<bool> Result = Importer.importFunctions(M, ImportList); 1377 1378 // FIXME: Probably need to propagate Errors through the pass manager. 1379 if (!Result) { 1380 logAllUnhandledErrors(Result.takeError(), errs(), 1381 "Error importing module: "); 1382 return false; 1383 } 1384 1385 return *Result; 1386 } 1387 1388 namespace { 1389 1390 /// Pass that performs cross-module function import provided a summary file. 1391 class FunctionImportLegacyPass : public ModulePass { 1392 public: 1393 /// Pass identification, replacement for typeid 1394 static char ID; 1395 1396 explicit FunctionImportLegacyPass() : ModulePass(ID) {} 1397 1398 /// Specify pass name for debug output 1399 StringRef getPassName() const override { return "Function Importing"; } 1400 1401 bool runOnModule(Module &M) override { 1402 if (skipModule(M)) 1403 return false; 1404 1405 return doImportingForModule(M); 1406 } 1407 }; 1408 1409 } // end anonymous namespace 1410 1411 PreservedAnalyses FunctionImportPass::run(Module &M, 1412 ModuleAnalysisManager &AM) { 1413 if (!doImportingForModule(M)) 1414 return PreservedAnalyses::all(); 1415 1416 return PreservedAnalyses::none(); 1417 } 1418 1419 char FunctionImportLegacyPass::ID = 0; 1420 INITIALIZE_PASS(FunctionImportLegacyPass, "function-import", 1421 "Summary Based Function Import", false, false) 1422 1423 namespace llvm { 1424 1425 Pass *createFunctionImportPass() { 1426 return new FunctionImportLegacyPass(); 1427 } 1428 1429 } // end namespace llvm 1430