1 //===- FunctionImport.cpp - ThinLTO Summary-based Function Import ---------===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 // 9 // This file implements Function import based on summaries. 10 // 11 //===----------------------------------------------------------------------===// 12 13 #include "llvm/Transforms/IPO/FunctionImport.h" 14 #include "llvm/ADT/ArrayRef.h" 15 #include "llvm/ADT/STLExtras.h" 16 #include "llvm/ADT/SetVector.h" 17 #include "llvm/ADT/SmallVector.h" 18 #include "llvm/ADT/Statistic.h" 19 #include "llvm/ADT/StringMap.h" 20 #include "llvm/ADT/StringRef.h" 21 #include "llvm/Bitcode/BitcodeReader.h" 22 #include "llvm/IR/AutoUpgrade.h" 23 #include "llvm/IR/Constants.h" 24 #include "llvm/IR/Function.h" 25 #include "llvm/IR/GlobalAlias.h" 26 #include "llvm/IR/GlobalObject.h" 27 #include "llvm/IR/GlobalValue.h" 28 #include "llvm/IR/GlobalVariable.h" 29 #include "llvm/IR/Metadata.h" 30 #include "llvm/IR/Module.h" 31 #include "llvm/IR/ModuleSummaryIndex.h" 32 #include "llvm/IRReader/IRReader.h" 33 #include "llvm/Linker/IRMover.h" 34 #include "llvm/Support/Casting.h" 35 #include "llvm/Support/CommandLine.h" 36 #include "llvm/Support/Debug.h" 37 #include "llvm/Support/Errc.h" 38 #include "llvm/Support/Error.h" 39 #include "llvm/Support/ErrorHandling.h" 40 #include "llvm/Support/FileSystem.h" 41 #include "llvm/Support/SourceMgr.h" 42 #include "llvm/Support/raw_ostream.h" 43 #include "llvm/Transforms/IPO/Internalize.h" 44 #include "llvm/Transforms/Utils/Cloning.h" 45 #include "llvm/Transforms/Utils/FunctionImportUtils.h" 46 #include "llvm/Transforms/Utils/ValueMapper.h" 47 #include <cassert> 48 #include <memory> 49 #include <set> 50 #include <string> 51 #include <system_error> 52 #include <tuple> 53 #include <utility> 54 55 using namespace llvm; 56 57 #define DEBUG_TYPE "function-import" 58 59 STATISTIC(NumImportedFunctionsThinLink, 60 "Number of functions thin link decided to import"); 61 STATISTIC(NumImportedHotFunctionsThinLink, 62 "Number of hot functions thin link decided to import"); 63 STATISTIC(NumImportedCriticalFunctionsThinLink, 64 "Number of critical functions thin link decided to import"); 65 STATISTIC(NumImportedGlobalVarsThinLink, 66 "Number of global variables thin link decided to import"); 67 STATISTIC(NumImportedFunctions, "Number of functions imported in backend"); 68 STATISTIC(NumImportedGlobalVars, 69 "Number of global variables imported in backend"); 70 STATISTIC(NumImportedModules, "Number of modules imported from"); 71 STATISTIC(NumDeadSymbols, "Number of dead stripped symbols in index"); 72 STATISTIC(NumLiveSymbols, "Number of live symbols in index"); 73 74 /// Limit on instruction count of imported functions. 75 static cl::opt<unsigned> ImportInstrLimit( 76 "import-instr-limit", cl::init(100), cl::Hidden, cl::value_desc("N"), 77 cl::desc("Only import functions with less than N instructions")); 78 79 static cl::opt<int> ImportCutoff( 80 "import-cutoff", cl::init(-1), cl::Hidden, cl::value_desc("N"), 81 cl::desc("Only import first N functions if N>=0 (default -1)")); 82 83 static cl::opt<bool> 84 ForceImportAll("force-import-all", cl::init(false), cl::Hidden, 85 cl::desc("Import functions with noinline attribute")); 86 87 static cl::opt<float> 88 ImportInstrFactor("import-instr-evolution-factor", cl::init(0.7), 89 cl::Hidden, cl::value_desc("x"), 90 cl::desc("As we import functions, multiply the " 91 "`import-instr-limit` threshold by this factor " 92 "before processing newly imported functions")); 93 94 static cl::opt<float> ImportHotInstrFactor( 95 "import-hot-evolution-factor", cl::init(1.0), cl::Hidden, 96 cl::value_desc("x"), 97 cl::desc("As we import functions called from hot callsite, multiply the " 98 "`import-instr-limit` threshold by this factor " 99 "before processing newly imported functions")); 100 101 static cl::opt<float> ImportHotMultiplier( 102 "import-hot-multiplier", cl::init(10.0), cl::Hidden, cl::value_desc("x"), 103 cl::desc("Multiply the `import-instr-limit` threshold for hot callsites")); 104 105 static cl::opt<float> ImportCriticalMultiplier( 106 "import-critical-multiplier", cl::init(100.0), cl::Hidden, 107 cl::value_desc("x"), 108 cl::desc( 109 "Multiply the `import-instr-limit` threshold for critical callsites")); 110 111 // FIXME: This multiplier was not really tuned up. 112 static cl::opt<float> ImportColdMultiplier( 113 "import-cold-multiplier", cl::init(0), cl::Hidden, cl::value_desc("N"), 114 cl::desc("Multiply the `import-instr-limit` threshold for cold callsites")); 115 116 static cl::opt<bool> PrintImports("print-imports", cl::init(false), cl::Hidden, 117 cl::desc("Print imported functions")); 118 119 static cl::opt<bool> PrintImportFailures( 120 "print-import-failures", cl::init(false), cl::Hidden, 121 cl::desc("Print information for functions rejected for importing")); 122 123 static cl::opt<bool> ComputeDead("compute-dead", cl::init(true), cl::Hidden, 124 cl::desc("Compute dead symbols")); 125 126 static cl::opt<bool> EnableImportMetadata( 127 "enable-import-metadata", cl::init(false), cl::Hidden, 128 cl::desc("Enable import metadata like 'thinlto_src_module'")); 129 130 /// Summary file to use for function importing when using -function-import from 131 /// the command line. 132 static cl::opt<std::string> 133 SummaryFile("summary-file", 134 cl::desc("The summary file to use for function importing.")); 135 136 /// Used when testing importing from distributed indexes via opt 137 // -function-import. 138 static cl::opt<bool> 139 ImportAllIndex("import-all-index", 140 cl::desc("Import all external functions in index.")); 141 142 // Load lazily a module from \p FileName in \p Context. 143 static std::unique_ptr<Module> loadFile(const std::string &FileName, 144 LLVMContext &Context) { 145 SMDiagnostic Err; 146 LLVM_DEBUG(dbgs() << "Loading '" << FileName << "'\n"); 147 // Metadata isn't loaded until functions are imported, to minimize 148 // the memory overhead. 149 std::unique_ptr<Module> Result = 150 getLazyIRFileModule(FileName, Err, Context, 151 /* ShouldLazyLoadMetadata = */ true); 152 if (!Result) { 153 Err.print("function-import", errs()); 154 report_fatal_error("Abort"); 155 } 156 157 return Result; 158 } 159 160 /// Given a list of possible callee implementation for a call site, qualify the 161 /// legality of importing each. The return is a range of pairs. Each pair 162 /// corresponds to a candidate. The first value is the ImportFailureReason for 163 /// that candidate, the second is the candidate. 164 static auto qualifyCalleeCandidates( 165 const ModuleSummaryIndex &Index, 166 ArrayRef<std::unique_ptr<GlobalValueSummary>> CalleeSummaryList, 167 StringRef CallerModulePath) { 168 return llvm::map_range( 169 CalleeSummaryList, 170 [&Index, CalleeSummaryList, 171 CallerModulePath](const std::unique_ptr<GlobalValueSummary> &SummaryPtr) 172 -> std::pair<FunctionImporter::ImportFailureReason, 173 const GlobalValueSummary *> { 174 auto *GVSummary = SummaryPtr.get(); 175 if (!Index.isGlobalValueLive(GVSummary)) 176 return {FunctionImporter::ImportFailureReason::NotLive, GVSummary}; 177 178 if (GlobalValue::isInterposableLinkage(GVSummary->linkage())) 179 return {FunctionImporter::ImportFailureReason::InterposableLinkage, 180 GVSummary}; 181 182 auto *Summary = dyn_cast<FunctionSummary>(GVSummary->getBaseObject()); 183 184 // Ignore any callees that aren't actually functions. This could happen 185 // in the case of GUID hash collisions. It could also happen in theory 186 // for SamplePGO profiles collected on old versions of the code after 187 // renaming, since we synthesize edges to any inlined callees appearing 188 // in the profile. 189 if (!Summary) 190 return {FunctionImporter::ImportFailureReason::GlobalVar, GVSummary}; 191 192 // If this is a local function, make sure we import the copy 193 // in the caller's module. The only time a local function can 194 // share an entry in the index is if there is a local with the same name 195 // in another module that had the same source file name (in a different 196 // directory), where each was compiled in their own directory so there 197 // was not distinguishing path. 198 // However, do the import from another module if there is only one 199 // entry in the list - in that case this must be a reference due 200 // to indirect call profile data, since a function pointer can point to 201 // a local in another module. 202 if (GlobalValue::isLocalLinkage(Summary->linkage()) && 203 CalleeSummaryList.size() > 1 && 204 Summary->modulePath() != CallerModulePath) 205 return { 206 FunctionImporter::ImportFailureReason::LocalLinkageNotInModule, 207 GVSummary}; 208 209 // Skip if it isn't legal to import (e.g. may reference unpromotable 210 // locals). 211 if (Summary->notEligibleToImport()) 212 return {FunctionImporter::ImportFailureReason::NotEligible, 213 GVSummary}; 214 215 return {FunctionImporter::ImportFailureReason::None, GVSummary}; 216 }); 217 } 218 219 /// Given a list of possible callee implementation for a call site, select one 220 /// that fits the \p Threshold. If none are found, the Reason will give the last 221 /// reason for the failure (last, in the order of CalleeSummaryList entries). 222 /// 223 /// FIXME: select "best" instead of first that fits. But what is "best"? 224 /// - The smallest: more likely to be inlined. 225 /// - The one with the least outgoing edges (already well optimized). 226 /// - One from a module already being imported from in order to reduce the 227 /// number of source modules parsed/linked. 228 /// - One that has PGO data attached. 229 /// - [insert you fancy metric here] 230 static const GlobalValueSummary * 231 selectCallee(const ModuleSummaryIndex &Index, 232 ArrayRef<std::unique_ptr<GlobalValueSummary>> CalleeSummaryList, 233 unsigned Threshold, StringRef CallerModulePath, 234 FunctionImporter::ImportFailureReason &Reason) { 235 auto QualifiedCandidates = 236 qualifyCalleeCandidates(Index, CalleeSummaryList, CallerModulePath); 237 for (auto QualifiedValue : QualifiedCandidates) { 238 Reason = QualifiedValue.first; 239 if (Reason != FunctionImporter::ImportFailureReason::None) 240 continue; 241 auto *Summary = 242 cast<FunctionSummary>(QualifiedValue.second->getBaseObject()); 243 244 if ((Summary->instCount() > Threshold) && !Summary->fflags().AlwaysInline && 245 !ForceImportAll) { 246 Reason = FunctionImporter::ImportFailureReason::TooLarge; 247 continue; 248 } 249 250 // Don't bother importing if we can't inline it anyway. 251 if (Summary->fflags().NoInline && !ForceImportAll) { 252 Reason = FunctionImporter::ImportFailureReason::NoInline; 253 continue; 254 } 255 256 return Summary; 257 } 258 return nullptr; 259 } 260 261 namespace { 262 263 using EdgeInfo = std::tuple<const FunctionSummary *, unsigned /* Threshold */>; 264 265 } // anonymous namespace 266 267 /// Import globals referenced by a function or other globals that are being 268 /// imported, if importing such global is possible. 269 class GlobalsImporter final { 270 const ModuleSummaryIndex &Index; 271 const GVSummaryMapTy &DefinedGVSummaries; 272 function_ref<bool(GlobalValue::GUID, const GlobalValueSummary *)> 273 IsPrevailing; 274 FunctionImporter::ImportMapTy &ImportList; 275 StringMap<FunctionImporter::ExportSetTy> *const ExportLists; 276 277 bool shouldImportGlobal(const ValueInfo &VI) { 278 const auto &GVS = DefinedGVSummaries.find(VI.getGUID()); 279 if (GVS == DefinedGVSummaries.end()) 280 return true; 281 // We should not skip import if the module contains a non-prevailing 282 // definition with interposable linkage type. This is required for 283 // correctness in the situation where there is a prevailing def available 284 // for import and marked read-only. In this case, the non-prevailing def 285 // will be converted to a declaration, while the prevailing one becomes 286 // internal, thus no definitions will be available for linking. In order to 287 // prevent undefined symbol link error, the prevailing definition must be 288 // imported. 289 // FIXME: Consider adding a check that the suitable prevailing definition 290 // exists and marked read-only. 291 if (VI.getSummaryList().size() > 1 && 292 GlobalValue::isInterposableLinkage(GVS->second->linkage()) && 293 !IsPrevailing(VI.getGUID(), GVS->second)) 294 return true; 295 296 return false; 297 } 298 299 void 300 onImportingSummaryImpl(const GlobalValueSummary &Summary, 301 SmallVectorImpl<const GlobalVarSummary *> &Worklist) { 302 for (const auto &VI : Summary.refs()) { 303 if (!shouldImportGlobal(VI)) { 304 LLVM_DEBUG( 305 dbgs() << "Ref ignored! Target already in destination module.\n"); 306 continue; 307 } 308 309 LLVM_DEBUG(dbgs() << " ref -> " << VI << "\n"); 310 311 // If this is a local variable, make sure we import the copy 312 // in the caller's module. The only time a local variable can 313 // share an entry in the index is if there is a local with the same name 314 // in another module that had the same source file name (in a different 315 // directory), where each was compiled in their own directory so there 316 // was not distinguishing path. 317 auto LocalNotInModule = 318 [&](const GlobalValueSummary *RefSummary) -> bool { 319 return GlobalValue::isLocalLinkage(RefSummary->linkage()) && 320 RefSummary->modulePath() != Summary.modulePath(); 321 }; 322 323 for (const auto &RefSummary : VI.getSummaryList()) { 324 const auto *GVS = dyn_cast<GlobalVarSummary>(RefSummary.get()); 325 // Functions could be referenced by global vars - e.g. a vtable; but we 326 // don't currently imagine a reason those would be imported here, rather 327 // than as part of the logic deciding which functions to import (i.e. 328 // based on profile information). Should we decide to handle them here, 329 // we can refactor accordingly at that time. 330 if (!GVS || !Index.canImportGlobalVar(GVS, /* AnalyzeRefs */ true) || 331 LocalNotInModule(GVS)) 332 continue; 333 auto ILI = ImportList[RefSummary->modulePath()].insert(VI.getGUID()); 334 // Only update stat and exports if we haven't already imported this 335 // variable. 336 if (!ILI.second) 337 break; 338 NumImportedGlobalVarsThinLink++; 339 // Any references made by this variable will be marked exported 340 // later, in ComputeCrossModuleImport, after import decisions are 341 // complete, which is more efficient than adding them here. 342 if (ExportLists) 343 (*ExportLists)[RefSummary->modulePath()].insert(VI); 344 345 // If variable is not writeonly we attempt to recursively analyze 346 // its references in order to import referenced constants. 347 if (!Index.isWriteOnly(GVS)) 348 Worklist.emplace_back(GVS); 349 break; 350 } 351 } 352 } 353 354 public: 355 GlobalsImporter( 356 const ModuleSummaryIndex &Index, const GVSummaryMapTy &DefinedGVSummaries, 357 function_ref<bool(GlobalValue::GUID, const GlobalValueSummary *)> 358 IsPrevailing, 359 FunctionImporter::ImportMapTy &ImportList, 360 StringMap<FunctionImporter::ExportSetTy> *ExportLists) 361 : Index(Index), DefinedGVSummaries(DefinedGVSummaries), 362 IsPrevailing(IsPrevailing), ImportList(ImportList), 363 ExportLists(ExportLists) {} 364 365 void onImportingSummary(const GlobalValueSummary &Summary) { 366 SmallVector<const GlobalVarSummary *, 128> Worklist; 367 onImportingSummaryImpl(Summary, Worklist); 368 while (!Worklist.empty()) 369 onImportingSummaryImpl(*Worklist.pop_back_val(), Worklist); 370 } 371 }; 372 373 static const char * 374 getFailureName(FunctionImporter::ImportFailureReason Reason) { 375 switch (Reason) { 376 case FunctionImporter::ImportFailureReason::None: 377 return "None"; 378 case FunctionImporter::ImportFailureReason::GlobalVar: 379 return "GlobalVar"; 380 case FunctionImporter::ImportFailureReason::NotLive: 381 return "NotLive"; 382 case FunctionImporter::ImportFailureReason::TooLarge: 383 return "TooLarge"; 384 case FunctionImporter::ImportFailureReason::InterposableLinkage: 385 return "InterposableLinkage"; 386 case FunctionImporter::ImportFailureReason::LocalLinkageNotInModule: 387 return "LocalLinkageNotInModule"; 388 case FunctionImporter::ImportFailureReason::NotEligible: 389 return "NotEligible"; 390 case FunctionImporter::ImportFailureReason::NoInline: 391 return "NoInline"; 392 } 393 llvm_unreachable("invalid reason"); 394 } 395 396 /// Compute the list of functions to import for a given caller. Mark these 397 /// imported functions and the symbols they reference in their source module as 398 /// exported from their source module. 399 static void computeImportForFunction( 400 const FunctionSummary &Summary, const ModuleSummaryIndex &Index, 401 const unsigned Threshold, const GVSummaryMapTy &DefinedGVSummaries, 402 function_ref<bool(GlobalValue::GUID, const GlobalValueSummary *)> 403 isPrevailing, 404 SmallVectorImpl<EdgeInfo> &Worklist, GlobalsImporter &GVImporter, 405 FunctionImporter::ImportMapTy &ImportList, 406 StringMap<FunctionImporter::ExportSetTy> *ExportLists, 407 FunctionImporter::ImportThresholdsTy &ImportThresholds) { 408 GVImporter.onImportingSummary(Summary); 409 static int ImportCount = 0; 410 for (const auto &Edge : Summary.calls()) { 411 ValueInfo VI = Edge.first; 412 LLVM_DEBUG(dbgs() << " edge -> " << VI << " Threshold:" << Threshold 413 << "\n"); 414 415 if (ImportCutoff >= 0 && ImportCount >= ImportCutoff) { 416 LLVM_DEBUG(dbgs() << "ignored! import-cutoff value of " << ImportCutoff 417 << " reached.\n"); 418 continue; 419 } 420 421 if (DefinedGVSummaries.count(VI.getGUID())) { 422 // FIXME: Consider not skipping import if the module contains 423 // a non-prevailing def with interposable linkage. The prevailing copy 424 // can safely be imported (see shouldImportGlobal()). 425 LLVM_DEBUG(dbgs() << "ignored! Target already in destination module.\n"); 426 continue; 427 } 428 429 auto GetBonusMultiplier = [](CalleeInfo::HotnessType Hotness) -> float { 430 if (Hotness == CalleeInfo::HotnessType::Hot) 431 return ImportHotMultiplier; 432 if (Hotness == CalleeInfo::HotnessType::Cold) 433 return ImportColdMultiplier; 434 if (Hotness == CalleeInfo::HotnessType::Critical) 435 return ImportCriticalMultiplier; 436 return 1.0; 437 }; 438 439 const auto NewThreshold = 440 Threshold * GetBonusMultiplier(Edge.second.getHotness()); 441 442 auto IT = ImportThresholds.insert(std::make_pair( 443 VI.getGUID(), std::make_tuple(NewThreshold, nullptr, nullptr))); 444 bool PreviouslyVisited = !IT.second; 445 auto &ProcessedThreshold = std::get<0>(IT.first->second); 446 auto &CalleeSummary = std::get<1>(IT.first->second); 447 auto &FailureInfo = std::get<2>(IT.first->second); 448 449 bool IsHotCallsite = 450 Edge.second.getHotness() == CalleeInfo::HotnessType::Hot; 451 bool IsCriticalCallsite = 452 Edge.second.getHotness() == CalleeInfo::HotnessType::Critical; 453 454 const FunctionSummary *ResolvedCalleeSummary = nullptr; 455 if (CalleeSummary) { 456 assert(PreviouslyVisited); 457 // Since the traversal of the call graph is DFS, we can revisit a function 458 // a second time with a higher threshold. In this case, it is added back 459 // to the worklist with the new threshold (so that its own callee chains 460 // can be considered with the higher threshold). 461 if (NewThreshold <= ProcessedThreshold) { 462 LLVM_DEBUG( 463 dbgs() << "ignored! Target was already imported with Threshold " 464 << ProcessedThreshold << "\n"); 465 continue; 466 } 467 // Update with new larger threshold. 468 ProcessedThreshold = NewThreshold; 469 ResolvedCalleeSummary = cast<FunctionSummary>(CalleeSummary); 470 } else { 471 // If we already rejected importing a callee at the same or higher 472 // threshold, don't waste time calling selectCallee. 473 if (PreviouslyVisited && NewThreshold <= ProcessedThreshold) { 474 LLVM_DEBUG( 475 dbgs() << "ignored! Target was already rejected with Threshold " 476 << ProcessedThreshold << "\n"); 477 if (PrintImportFailures) { 478 assert(FailureInfo && 479 "Expected FailureInfo for previously rejected candidate"); 480 FailureInfo->Attempts++; 481 } 482 continue; 483 } 484 485 FunctionImporter::ImportFailureReason Reason; 486 CalleeSummary = selectCallee(Index, VI.getSummaryList(), NewThreshold, 487 Summary.modulePath(), Reason); 488 if (!CalleeSummary) { 489 // Update with new larger threshold if this was a retry (otherwise 490 // we would have already inserted with NewThreshold above). Also 491 // update failure info if requested. 492 if (PreviouslyVisited) { 493 ProcessedThreshold = NewThreshold; 494 if (PrintImportFailures) { 495 assert(FailureInfo && 496 "Expected FailureInfo for previously rejected candidate"); 497 FailureInfo->Reason = Reason; 498 FailureInfo->Attempts++; 499 FailureInfo->MaxHotness = 500 std::max(FailureInfo->MaxHotness, Edge.second.getHotness()); 501 } 502 } else if (PrintImportFailures) { 503 assert(!FailureInfo && 504 "Expected no FailureInfo for newly rejected candidate"); 505 FailureInfo = std::make_unique<FunctionImporter::ImportFailureInfo>( 506 VI, Edge.second.getHotness(), Reason, 1); 507 } 508 if (ForceImportAll) { 509 std::string Msg = std::string("Failed to import function ") + 510 VI.name().str() + " due to " + 511 getFailureName(Reason); 512 auto Error = make_error<StringError>( 513 Msg, make_error_code(errc::not_supported)); 514 logAllUnhandledErrors(std::move(Error), errs(), 515 "Error importing module: "); 516 break; 517 } else { 518 LLVM_DEBUG(dbgs() 519 << "ignored! No qualifying callee with summary found.\n"); 520 continue; 521 } 522 } 523 524 // "Resolve" the summary 525 CalleeSummary = CalleeSummary->getBaseObject(); 526 ResolvedCalleeSummary = cast<FunctionSummary>(CalleeSummary); 527 528 assert((ResolvedCalleeSummary->fflags().AlwaysInline || ForceImportAll || 529 (ResolvedCalleeSummary->instCount() <= NewThreshold)) && 530 "selectCallee() didn't honor the threshold"); 531 532 auto ExportModulePath = ResolvedCalleeSummary->modulePath(); 533 auto ILI = ImportList[ExportModulePath].insert(VI.getGUID()); 534 // We previously decided to import this GUID definition if it was already 535 // inserted in the set of imports from the exporting module. 536 bool PreviouslyImported = !ILI.second; 537 if (!PreviouslyImported) { 538 NumImportedFunctionsThinLink++; 539 if (IsHotCallsite) 540 NumImportedHotFunctionsThinLink++; 541 if (IsCriticalCallsite) 542 NumImportedCriticalFunctionsThinLink++; 543 } 544 545 // Any calls/references made by this function will be marked exported 546 // later, in ComputeCrossModuleImport, after import decisions are 547 // complete, which is more efficient than adding them here. 548 if (ExportLists) 549 (*ExportLists)[ExportModulePath].insert(VI); 550 } 551 552 auto GetAdjustedThreshold = [](unsigned Threshold, bool IsHotCallsite) { 553 // Adjust the threshold for next level of imported functions. 554 // The threshold is different for hot callsites because we can then 555 // inline chains of hot calls. 556 if (IsHotCallsite) 557 return Threshold * ImportHotInstrFactor; 558 return Threshold * ImportInstrFactor; 559 }; 560 561 const auto AdjThreshold = GetAdjustedThreshold(Threshold, IsHotCallsite); 562 563 ImportCount++; 564 565 // Insert the newly imported function to the worklist. 566 Worklist.emplace_back(ResolvedCalleeSummary, AdjThreshold); 567 } 568 } 569 570 /// Given the list of globals defined in a module, compute the list of imports 571 /// as well as the list of "exports", i.e. the list of symbols referenced from 572 /// another module (that may require promotion). 573 static void ComputeImportForModule( 574 const GVSummaryMapTy &DefinedGVSummaries, 575 function_ref<bool(GlobalValue::GUID, const GlobalValueSummary *)> 576 isPrevailing, 577 const ModuleSummaryIndex &Index, StringRef ModName, 578 FunctionImporter::ImportMapTy &ImportList, 579 StringMap<FunctionImporter::ExportSetTy> *ExportLists = nullptr) { 580 // Worklist contains the list of function imported in this module, for which 581 // we will analyse the callees and may import further down the callgraph. 582 SmallVector<EdgeInfo, 128> Worklist; 583 GlobalsImporter GVI(Index, DefinedGVSummaries, isPrevailing, ImportList, 584 ExportLists); 585 FunctionImporter::ImportThresholdsTy ImportThresholds; 586 587 // Populate the worklist with the import for the functions in the current 588 // module 589 for (const auto &GVSummary : DefinedGVSummaries) { 590 #ifndef NDEBUG 591 // FIXME: Change the GVSummaryMapTy to hold ValueInfo instead of GUID 592 // so this map look up (and possibly others) can be avoided. 593 auto VI = Index.getValueInfo(GVSummary.first); 594 #endif 595 if (!Index.isGlobalValueLive(GVSummary.second)) { 596 LLVM_DEBUG(dbgs() << "Ignores Dead GUID: " << VI << "\n"); 597 continue; 598 } 599 auto *FuncSummary = 600 dyn_cast<FunctionSummary>(GVSummary.second->getBaseObject()); 601 if (!FuncSummary) 602 // Skip import for global variables 603 continue; 604 LLVM_DEBUG(dbgs() << "Initialize import for " << VI << "\n"); 605 computeImportForFunction(*FuncSummary, Index, ImportInstrLimit, 606 DefinedGVSummaries, isPrevailing, Worklist, GVI, 607 ImportList, ExportLists, ImportThresholds); 608 } 609 610 // Process the newly imported functions and add callees to the worklist. 611 while (!Worklist.empty()) { 612 auto GVInfo = Worklist.pop_back_val(); 613 auto *Summary = std::get<0>(GVInfo); 614 auto Threshold = std::get<1>(GVInfo); 615 616 if (auto *FS = dyn_cast<FunctionSummary>(Summary)) 617 computeImportForFunction(*FS, Index, Threshold, DefinedGVSummaries, 618 isPrevailing, Worklist, GVI, ImportList, 619 ExportLists, ImportThresholds); 620 } 621 622 // Print stats about functions considered but rejected for importing 623 // when requested. 624 if (PrintImportFailures) { 625 dbgs() << "Missed imports into module " << ModName << "\n"; 626 for (auto &I : ImportThresholds) { 627 auto &ProcessedThreshold = std::get<0>(I.second); 628 auto &CalleeSummary = std::get<1>(I.second); 629 auto &FailureInfo = std::get<2>(I.second); 630 if (CalleeSummary) 631 continue; // We are going to import. 632 assert(FailureInfo); 633 FunctionSummary *FS = nullptr; 634 if (!FailureInfo->VI.getSummaryList().empty()) 635 FS = dyn_cast<FunctionSummary>( 636 FailureInfo->VI.getSummaryList()[0]->getBaseObject()); 637 dbgs() << FailureInfo->VI 638 << ": Reason = " << getFailureName(FailureInfo->Reason) 639 << ", Threshold = " << ProcessedThreshold 640 << ", Size = " << (FS ? (int)FS->instCount() : -1) 641 << ", MaxHotness = " << getHotnessName(FailureInfo->MaxHotness) 642 << ", Attempts = " << FailureInfo->Attempts << "\n"; 643 } 644 } 645 } 646 647 #ifndef NDEBUG 648 static bool isGlobalVarSummary(const ModuleSummaryIndex &Index, ValueInfo VI) { 649 auto SL = VI.getSummaryList(); 650 return SL.empty() 651 ? false 652 : SL[0]->getSummaryKind() == GlobalValueSummary::GlobalVarKind; 653 } 654 655 static bool isGlobalVarSummary(const ModuleSummaryIndex &Index, 656 GlobalValue::GUID G) { 657 if (const auto &VI = Index.getValueInfo(G)) 658 return isGlobalVarSummary(Index, VI); 659 return false; 660 } 661 662 template <class T> 663 static unsigned numGlobalVarSummaries(const ModuleSummaryIndex &Index, 664 T &Cont) { 665 unsigned NumGVS = 0; 666 for (auto &V : Cont) 667 if (isGlobalVarSummary(Index, V)) 668 ++NumGVS; 669 return NumGVS; 670 } 671 #endif 672 673 #ifndef NDEBUG 674 static bool 675 checkVariableImport(const ModuleSummaryIndex &Index, 676 StringMap<FunctionImporter::ImportMapTy> &ImportLists, 677 StringMap<FunctionImporter::ExportSetTy> &ExportLists) { 678 679 DenseSet<GlobalValue::GUID> FlattenedImports; 680 681 for (auto &ImportPerModule : ImportLists) 682 for (auto &ExportPerModule : ImportPerModule.second) 683 FlattenedImports.insert(ExportPerModule.second.begin(), 684 ExportPerModule.second.end()); 685 686 // Checks that all GUIDs of read/writeonly vars we see in export lists 687 // are also in the import lists. Otherwise we my face linker undefs, 688 // because readonly and writeonly vars are internalized in their 689 // source modules. The exception would be if it has a linkage type indicating 690 // that there may have been a copy existing in the importing module (e.g. 691 // linkonce_odr). In that case we cannot accurately do this checking. 692 auto IsReadOrWriteOnlyVarNeedingImporting = [&](StringRef ModulePath, 693 const ValueInfo &VI) { 694 auto *GVS = dyn_cast_or_null<GlobalVarSummary>( 695 Index.findSummaryInModule(VI, ModulePath)); 696 return GVS && (Index.isReadOnly(GVS) || Index.isWriteOnly(GVS)) && 697 !(GVS->linkage() == GlobalValue::AvailableExternallyLinkage || 698 GVS->linkage() == GlobalValue::WeakODRLinkage || 699 GVS->linkage() == GlobalValue::LinkOnceODRLinkage); 700 }; 701 702 for (auto &ExportPerModule : ExportLists) 703 for (auto &VI : ExportPerModule.second) 704 if (!FlattenedImports.count(VI.getGUID()) && 705 IsReadOrWriteOnlyVarNeedingImporting(ExportPerModule.first(), VI)) 706 return false; 707 708 return true; 709 } 710 #endif 711 712 /// Compute all the import and export for every module using the Index. 713 void llvm::ComputeCrossModuleImport( 714 const ModuleSummaryIndex &Index, 715 const StringMap<GVSummaryMapTy> &ModuleToDefinedGVSummaries, 716 function_ref<bool(GlobalValue::GUID, const GlobalValueSummary *)> 717 isPrevailing, 718 StringMap<FunctionImporter::ImportMapTy> &ImportLists, 719 StringMap<FunctionImporter::ExportSetTy> &ExportLists) { 720 // For each module that has function defined, compute the import/export lists. 721 for (const auto &DefinedGVSummaries : ModuleToDefinedGVSummaries) { 722 auto &ImportList = ImportLists[DefinedGVSummaries.first()]; 723 LLVM_DEBUG(dbgs() << "Computing import for Module '" 724 << DefinedGVSummaries.first() << "'\n"); 725 ComputeImportForModule(DefinedGVSummaries.second, isPrevailing, Index, 726 DefinedGVSummaries.first(), ImportList, 727 &ExportLists); 728 } 729 730 // When computing imports we only added the variables and functions being 731 // imported to the export list. We also need to mark any references and calls 732 // they make as exported as well. We do this here, as it is more efficient 733 // since we may import the same values multiple times into different modules 734 // during the import computation. 735 for (auto &ELI : ExportLists) { 736 FunctionImporter::ExportSetTy NewExports; 737 const auto &DefinedGVSummaries = 738 ModuleToDefinedGVSummaries.lookup(ELI.first()); 739 for (auto &EI : ELI.second) { 740 // Find the copy defined in the exporting module so that we can mark the 741 // values it references in that specific definition as exported. 742 // Below we will add all references and called values, without regard to 743 // whether they are also defined in this module. We subsequently prune the 744 // list to only include those defined in the exporting module, see comment 745 // there as to why. 746 auto DS = DefinedGVSummaries.find(EI.getGUID()); 747 // Anything marked exported during the import computation must have been 748 // defined in the exporting module. 749 assert(DS != DefinedGVSummaries.end()); 750 auto *S = DS->getSecond(); 751 S = S->getBaseObject(); 752 if (auto *GVS = dyn_cast<GlobalVarSummary>(S)) { 753 // Export referenced functions and variables. We don't export/promote 754 // objects referenced by writeonly variable initializer, because 755 // we convert such variables initializers to "zeroinitializer". 756 // See processGlobalForThinLTO. 757 if (!Index.isWriteOnly(GVS)) 758 for (const auto &VI : GVS->refs()) 759 NewExports.insert(VI); 760 } else { 761 auto *FS = cast<FunctionSummary>(S); 762 for (const auto &Edge : FS->calls()) 763 NewExports.insert(Edge.first); 764 for (const auto &Ref : FS->refs()) 765 NewExports.insert(Ref); 766 } 767 } 768 // Prune list computed above to only include values defined in the exporting 769 // module. We do this after the above insertion since we may hit the same 770 // ref/call target multiple times in above loop, and it is more efficient to 771 // avoid a set lookup each time. 772 for (auto EI = NewExports.begin(); EI != NewExports.end();) { 773 if (!DefinedGVSummaries.count(EI->getGUID())) 774 NewExports.erase(EI++); 775 else 776 ++EI; 777 } 778 ELI.second.insert(NewExports.begin(), NewExports.end()); 779 } 780 781 assert(checkVariableImport(Index, ImportLists, ExportLists)); 782 #ifndef NDEBUG 783 LLVM_DEBUG(dbgs() << "Import/Export lists for " << ImportLists.size() 784 << " modules:\n"); 785 for (auto &ModuleImports : ImportLists) { 786 auto ModName = ModuleImports.first(); 787 auto &Exports = ExportLists[ModName]; 788 unsigned NumGVS = numGlobalVarSummaries(Index, Exports); 789 LLVM_DEBUG(dbgs() << "* Module " << ModName << " exports " 790 << Exports.size() - NumGVS << " functions and " << NumGVS 791 << " vars. Imports from " << ModuleImports.second.size() 792 << " modules.\n"); 793 for (auto &Src : ModuleImports.second) { 794 auto SrcModName = Src.first(); 795 unsigned NumGVSPerMod = numGlobalVarSummaries(Index, Src.second); 796 LLVM_DEBUG(dbgs() << " - " << Src.second.size() - NumGVSPerMod 797 << " functions imported from " << SrcModName << "\n"); 798 LLVM_DEBUG(dbgs() << " - " << NumGVSPerMod 799 << " global vars imported from " << SrcModName << "\n"); 800 } 801 } 802 #endif 803 } 804 805 #ifndef NDEBUG 806 static void dumpImportListForModule(const ModuleSummaryIndex &Index, 807 StringRef ModulePath, 808 FunctionImporter::ImportMapTy &ImportList) { 809 LLVM_DEBUG(dbgs() << "* Module " << ModulePath << " imports from " 810 << ImportList.size() << " modules.\n"); 811 for (auto &Src : ImportList) { 812 auto SrcModName = Src.first(); 813 unsigned NumGVSPerMod = numGlobalVarSummaries(Index, Src.second); 814 LLVM_DEBUG(dbgs() << " - " << Src.second.size() - NumGVSPerMod 815 << " functions imported from " << SrcModName << "\n"); 816 LLVM_DEBUG(dbgs() << " - " << NumGVSPerMod << " vars imported from " 817 << SrcModName << "\n"); 818 } 819 } 820 #endif 821 822 /// Compute all the imports for the given module in the Index. 823 void llvm::ComputeCrossModuleImportForModule( 824 StringRef ModulePath, 825 function_ref<bool(GlobalValue::GUID, const GlobalValueSummary *)> 826 isPrevailing, 827 const ModuleSummaryIndex &Index, 828 FunctionImporter::ImportMapTy &ImportList) { 829 // Collect the list of functions this module defines. 830 // GUID -> Summary 831 GVSummaryMapTy FunctionSummaryMap; 832 Index.collectDefinedFunctionsForModule(ModulePath, FunctionSummaryMap); 833 834 // Compute the import list for this module. 835 LLVM_DEBUG(dbgs() << "Computing import for Module '" << ModulePath << "'\n"); 836 ComputeImportForModule(FunctionSummaryMap, isPrevailing, Index, ModulePath, 837 ImportList); 838 839 #ifndef NDEBUG 840 dumpImportListForModule(Index, ModulePath, ImportList); 841 #endif 842 } 843 844 // Mark all external summaries in Index for import into the given module. 845 // Used for distributed builds using a distributed index. 846 void llvm::ComputeCrossModuleImportForModuleFromIndex( 847 StringRef ModulePath, const ModuleSummaryIndex &Index, 848 FunctionImporter::ImportMapTy &ImportList) { 849 for (const auto &GlobalList : Index) { 850 // Ignore entries for undefined references. 851 if (GlobalList.second.SummaryList.empty()) 852 continue; 853 854 auto GUID = GlobalList.first; 855 assert(GlobalList.second.SummaryList.size() == 1 && 856 "Expected individual combined index to have one summary per GUID"); 857 auto &Summary = GlobalList.second.SummaryList[0]; 858 // Skip the summaries for the importing module. These are included to 859 // e.g. record required linkage changes. 860 if (Summary->modulePath() == ModulePath) 861 continue; 862 // Add an entry to provoke importing by thinBackend. 863 ImportList[Summary->modulePath()].insert(GUID); 864 } 865 #ifndef NDEBUG 866 dumpImportListForModule(Index, ModulePath, ImportList); 867 #endif 868 } 869 870 // For SamplePGO, the indirect call targets for local functions will 871 // have its original name annotated in profile. We try to find the 872 // corresponding PGOFuncName as the GUID, and fix up the edges 873 // accordingly. 874 void updateValueInfoForIndirectCalls(ModuleSummaryIndex &Index, 875 FunctionSummary *FS) { 876 for (auto &EI : FS->mutableCalls()) { 877 if (!EI.first.getSummaryList().empty()) 878 continue; 879 auto GUID = Index.getGUIDFromOriginalID(EI.first.getGUID()); 880 if (GUID == 0) 881 continue; 882 // Update the edge to point directly to the correct GUID. 883 auto VI = Index.getValueInfo(GUID); 884 if (llvm::any_of( 885 VI.getSummaryList(), 886 [&](const std::unique_ptr<GlobalValueSummary> &SummaryPtr) { 887 // The mapping from OriginalId to GUID may return a GUID 888 // that corresponds to a static variable. Filter it out here. 889 // This can happen when 890 // 1) There is a call to a library function which is not defined 891 // in the index. 892 // 2) There is a static variable with the OriginalGUID identical 893 // to the GUID of the library function in 1); 894 // When this happens the static variable in 2) will be found, 895 // which needs to be filtered out. 896 return SummaryPtr->getSummaryKind() == 897 GlobalValueSummary::GlobalVarKind; 898 })) 899 continue; 900 EI.first = VI; 901 } 902 } 903 904 void llvm::updateIndirectCalls(ModuleSummaryIndex &Index) { 905 for (const auto &Entry : Index) { 906 for (const auto &S : Entry.second.SummaryList) { 907 if (auto *FS = dyn_cast<FunctionSummary>(S.get())) 908 updateValueInfoForIndirectCalls(Index, FS); 909 } 910 } 911 } 912 913 void llvm::computeDeadSymbolsAndUpdateIndirectCalls( 914 ModuleSummaryIndex &Index, 915 const DenseSet<GlobalValue::GUID> &GUIDPreservedSymbols, 916 function_ref<PrevailingType(GlobalValue::GUID)> isPrevailing) { 917 assert(!Index.withGlobalValueDeadStripping()); 918 if (!ComputeDead || 919 // Don't do anything when nothing is live, this is friendly with tests. 920 GUIDPreservedSymbols.empty()) { 921 // Still need to update indirect calls. 922 updateIndirectCalls(Index); 923 return; 924 } 925 unsigned LiveSymbols = 0; 926 SmallVector<ValueInfo, 128> Worklist; 927 Worklist.reserve(GUIDPreservedSymbols.size() * 2); 928 for (auto GUID : GUIDPreservedSymbols) { 929 ValueInfo VI = Index.getValueInfo(GUID); 930 if (!VI) 931 continue; 932 for (const auto &S : VI.getSummaryList()) 933 S->setLive(true); 934 } 935 936 // Add values flagged in the index as live roots to the worklist. 937 for (const auto &Entry : Index) { 938 auto VI = Index.getValueInfo(Entry); 939 for (const auto &S : Entry.second.SummaryList) { 940 if (auto *FS = dyn_cast<FunctionSummary>(S.get())) 941 updateValueInfoForIndirectCalls(Index, FS); 942 if (S->isLive()) { 943 LLVM_DEBUG(dbgs() << "Live root: " << VI << "\n"); 944 Worklist.push_back(VI); 945 ++LiveSymbols; 946 break; 947 } 948 } 949 } 950 951 // Make value live and add it to the worklist if it was not live before. 952 auto visit = [&](ValueInfo VI, bool IsAliasee) { 953 // FIXME: If we knew which edges were created for indirect call profiles, 954 // we could skip them here. Any that are live should be reached via 955 // other edges, e.g. reference edges. Otherwise, using a profile collected 956 // on a slightly different binary might provoke preserving, importing 957 // and ultimately promoting calls to functions not linked into this 958 // binary, which increases the binary size unnecessarily. Note that 959 // if this code changes, the importer needs to change so that edges 960 // to functions marked dead are skipped. 961 962 if (llvm::any_of(VI.getSummaryList(), 963 [](const std::unique_ptr<llvm::GlobalValueSummary> &S) { 964 return S->isLive(); 965 })) 966 return; 967 968 // We only keep live symbols that are known to be non-prevailing if any are 969 // available_externally, linkonceodr, weakodr. Those symbols are discarded 970 // later in the EliminateAvailableExternally pass and setting them to 971 // not-live could break downstreams users of liveness information (PR36483) 972 // or limit optimization opportunities. 973 if (isPrevailing(VI.getGUID()) == PrevailingType::No) { 974 bool KeepAliveLinkage = false; 975 bool Interposable = false; 976 for (const auto &S : VI.getSummaryList()) { 977 if (S->linkage() == GlobalValue::AvailableExternallyLinkage || 978 S->linkage() == GlobalValue::WeakODRLinkage || 979 S->linkage() == GlobalValue::LinkOnceODRLinkage) 980 KeepAliveLinkage = true; 981 else if (GlobalValue::isInterposableLinkage(S->linkage())) 982 Interposable = true; 983 } 984 985 if (!IsAliasee) { 986 if (!KeepAliveLinkage) 987 return; 988 989 if (Interposable) 990 report_fatal_error( 991 "Interposable and available_externally/linkonce_odr/weak_odr " 992 "symbol"); 993 } 994 } 995 996 for (const auto &S : VI.getSummaryList()) 997 S->setLive(true); 998 ++LiveSymbols; 999 Worklist.push_back(VI); 1000 }; 1001 1002 while (!Worklist.empty()) { 1003 auto VI = Worklist.pop_back_val(); 1004 for (const auto &Summary : VI.getSummaryList()) { 1005 if (auto *AS = dyn_cast<AliasSummary>(Summary.get())) { 1006 // If this is an alias, visit the aliasee VI to ensure that all copies 1007 // are marked live and it is added to the worklist for further 1008 // processing of its references. 1009 visit(AS->getAliaseeVI(), true); 1010 continue; 1011 } 1012 for (auto Ref : Summary->refs()) 1013 visit(Ref, false); 1014 if (auto *FS = dyn_cast<FunctionSummary>(Summary.get())) 1015 for (auto Call : FS->calls()) 1016 visit(Call.first, false); 1017 } 1018 } 1019 Index.setWithGlobalValueDeadStripping(); 1020 1021 unsigned DeadSymbols = Index.size() - LiveSymbols; 1022 LLVM_DEBUG(dbgs() << LiveSymbols << " symbols Live, and " << DeadSymbols 1023 << " symbols Dead \n"); 1024 NumDeadSymbols += DeadSymbols; 1025 NumLiveSymbols += LiveSymbols; 1026 } 1027 1028 // Compute dead symbols and propagate constants in combined index. 1029 void llvm::computeDeadSymbolsWithConstProp( 1030 ModuleSummaryIndex &Index, 1031 const DenseSet<GlobalValue::GUID> &GUIDPreservedSymbols, 1032 function_ref<PrevailingType(GlobalValue::GUID)> isPrevailing, 1033 bool ImportEnabled) { 1034 computeDeadSymbolsAndUpdateIndirectCalls(Index, GUIDPreservedSymbols, 1035 isPrevailing); 1036 if (ImportEnabled) 1037 Index.propagateAttributes(GUIDPreservedSymbols); 1038 } 1039 1040 /// Compute the set of summaries needed for a ThinLTO backend compilation of 1041 /// \p ModulePath. 1042 void llvm::gatherImportedSummariesForModule( 1043 StringRef ModulePath, 1044 const StringMap<GVSummaryMapTy> &ModuleToDefinedGVSummaries, 1045 const FunctionImporter::ImportMapTy &ImportList, 1046 std::map<std::string, GVSummaryMapTy> &ModuleToSummariesForIndex) { 1047 // Include all summaries from the importing module. 1048 ModuleToSummariesForIndex[std::string(ModulePath)] = 1049 ModuleToDefinedGVSummaries.lookup(ModulePath); 1050 // Include summaries for imports. 1051 for (const auto &ILI : ImportList) { 1052 auto &SummariesForIndex = 1053 ModuleToSummariesForIndex[std::string(ILI.first())]; 1054 const auto &DefinedGVSummaries = 1055 ModuleToDefinedGVSummaries.lookup(ILI.first()); 1056 for (const auto &GI : ILI.second) { 1057 const auto &DS = DefinedGVSummaries.find(GI); 1058 assert(DS != DefinedGVSummaries.end() && 1059 "Expected a defined summary for imported global value"); 1060 SummariesForIndex[GI] = DS->second; 1061 } 1062 } 1063 } 1064 1065 /// Emit the files \p ModulePath will import from into \p OutputFilename. 1066 std::error_code llvm::EmitImportsFiles( 1067 StringRef ModulePath, StringRef OutputFilename, 1068 const std::map<std::string, GVSummaryMapTy> &ModuleToSummariesForIndex) { 1069 std::error_code EC; 1070 raw_fd_ostream ImportsOS(OutputFilename, EC, sys::fs::OpenFlags::OF_None); 1071 if (EC) 1072 return EC; 1073 for (const auto &ILI : ModuleToSummariesForIndex) 1074 // The ModuleToSummariesForIndex map includes an entry for the current 1075 // Module (needed for writing out the index files). We don't want to 1076 // include it in the imports file, however, so filter it out. 1077 if (ILI.first != ModulePath) 1078 ImportsOS << ILI.first << "\n"; 1079 return std::error_code(); 1080 } 1081 1082 bool llvm::convertToDeclaration(GlobalValue &GV) { 1083 LLVM_DEBUG(dbgs() << "Converting to a declaration: `" << GV.getName() 1084 << "\n"); 1085 if (Function *F = dyn_cast<Function>(&GV)) { 1086 F->deleteBody(); 1087 F->clearMetadata(); 1088 F->setComdat(nullptr); 1089 } else if (GlobalVariable *V = dyn_cast<GlobalVariable>(&GV)) { 1090 V->setInitializer(nullptr); 1091 V->setLinkage(GlobalValue::ExternalLinkage); 1092 V->clearMetadata(); 1093 V->setComdat(nullptr); 1094 } else { 1095 GlobalValue *NewGV; 1096 if (GV.getValueType()->isFunctionTy()) 1097 NewGV = 1098 Function::Create(cast<FunctionType>(GV.getValueType()), 1099 GlobalValue::ExternalLinkage, GV.getAddressSpace(), 1100 "", GV.getParent()); 1101 else 1102 NewGV = 1103 new GlobalVariable(*GV.getParent(), GV.getValueType(), 1104 /*isConstant*/ false, GlobalValue::ExternalLinkage, 1105 /*init*/ nullptr, "", 1106 /*insertbefore*/ nullptr, GV.getThreadLocalMode(), 1107 GV.getType()->getAddressSpace()); 1108 NewGV->takeName(&GV); 1109 GV.replaceAllUsesWith(NewGV); 1110 return false; 1111 } 1112 if (!GV.isImplicitDSOLocal()) 1113 GV.setDSOLocal(false); 1114 return true; 1115 } 1116 1117 void llvm::thinLTOFinalizeInModule(Module &TheModule, 1118 const GVSummaryMapTy &DefinedGlobals, 1119 bool PropagateAttrs) { 1120 DenseSet<Comdat *> NonPrevailingComdats; 1121 auto FinalizeInModule = [&](GlobalValue &GV, bool Propagate = false) { 1122 // See if the global summary analysis computed a new resolved linkage. 1123 const auto &GS = DefinedGlobals.find(GV.getGUID()); 1124 if (GS == DefinedGlobals.end()) 1125 return; 1126 1127 if (Propagate) 1128 if (FunctionSummary *FS = dyn_cast<FunctionSummary>(GS->second)) { 1129 if (Function *F = dyn_cast<Function>(&GV)) { 1130 // TODO: propagate ReadNone and ReadOnly. 1131 if (FS->fflags().ReadNone && !F->doesNotAccessMemory()) 1132 F->setDoesNotAccessMemory(); 1133 1134 if (FS->fflags().ReadOnly && !F->onlyReadsMemory()) 1135 F->setOnlyReadsMemory(); 1136 1137 if (FS->fflags().NoRecurse && !F->doesNotRecurse()) 1138 F->setDoesNotRecurse(); 1139 1140 if (FS->fflags().NoUnwind && !F->doesNotThrow()) 1141 F->setDoesNotThrow(); 1142 } 1143 } 1144 1145 auto NewLinkage = GS->second->linkage(); 1146 if (GlobalValue::isLocalLinkage(GV.getLinkage()) || 1147 // Don't internalize anything here, because the code below 1148 // lacks necessary correctness checks. Leave this job to 1149 // LLVM 'internalize' pass. 1150 GlobalValue::isLocalLinkage(NewLinkage) || 1151 // In case it was dead and already converted to declaration. 1152 GV.isDeclaration()) 1153 return; 1154 1155 // Set the potentially more constraining visibility computed from summaries. 1156 // The DefaultVisibility condition is because older GlobalValueSummary does 1157 // not record DefaultVisibility and we don't want to change protected/hidden 1158 // to default. 1159 if (GS->second->getVisibility() != GlobalValue::DefaultVisibility) 1160 GV.setVisibility(GS->second->getVisibility()); 1161 1162 if (NewLinkage == GV.getLinkage()) 1163 return; 1164 1165 // Check for a non-prevailing def that has interposable linkage 1166 // (e.g. non-odr weak or linkonce). In that case we can't simply 1167 // convert to available_externally, since it would lose the 1168 // interposable property and possibly get inlined. Simply drop 1169 // the definition in that case. 1170 if (GlobalValue::isAvailableExternallyLinkage(NewLinkage) && 1171 GlobalValue::isInterposableLinkage(GV.getLinkage())) { 1172 if (!convertToDeclaration(GV)) 1173 // FIXME: Change this to collect replaced GVs and later erase 1174 // them from the parent module once thinLTOResolvePrevailingGUID is 1175 // changed to enable this for aliases. 1176 llvm_unreachable("Expected GV to be converted"); 1177 } else { 1178 // If all copies of the original symbol had global unnamed addr and 1179 // linkonce_odr linkage, or if all of them had local unnamed addr linkage 1180 // and are constants, then it should be an auto hide symbol. In that case 1181 // the thin link would have marked it as CanAutoHide. Add hidden 1182 // visibility to the symbol to preserve the property. 1183 if (NewLinkage == GlobalValue::WeakODRLinkage && 1184 GS->second->canAutoHide()) { 1185 assert(GV.canBeOmittedFromSymbolTable()); 1186 GV.setVisibility(GlobalValue::HiddenVisibility); 1187 } 1188 1189 LLVM_DEBUG(dbgs() << "ODR fixing up linkage for `" << GV.getName() 1190 << "` from " << GV.getLinkage() << " to " << NewLinkage 1191 << "\n"); 1192 GV.setLinkage(NewLinkage); 1193 } 1194 // Remove declarations from comdats, including available_externally 1195 // as this is a declaration for the linker, and will be dropped eventually. 1196 // It is illegal for comdats to contain declarations. 1197 auto *GO = dyn_cast_or_null<GlobalObject>(&GV); 1198 if (GO && GO->isDeclarationForLinker() && GO->hasComdat()) { 1199 if (GO->getComdat()->getName() == GO->getName()) 1200 NonPrevailingComdats.insert(GO->getComdat()); 1201 GO->setComdat(nullptr); 1202 } 1203 }; 1204 1205 // Process functions and global now 1206 for (auto &GV : TheModule) 1207 FinalizeInModule(GV, PropagateAttrs); 1208 for (auto &GV : TheModule.globals()) 1209 FinalizeInModule(GV); 1210 for (auto &GV : TheModule.aliases()) 1211 FinalizeInModule(GV); 1212 1213 // For a non-prevailing comdat, all its members must be available_externally. 1214 // FinalizeInModule has handled non-local-linkage GlobalValues. Here we handle 1215 // local linkage GlobalValues. 1216 if (NonPrevailingComdats.empty()) 1217 return; 1218 for (auto &GO : TheModule.global_objects()) { 1219 if (auto *C = GO.getComdat(); C && NonPrevailingComdats.count(C)) { 1220 GO.setComdat(nullptr); 1221 GO.setLinkage(GlobalValue::AvailableExternallyLinkage); 1222 } 1223 } 1224 bool Changed; 1225 do { 1226 Changed = false; 1227 // If an alias references a GlobalValue in a non-prevailing comdat, change 1228 // it to available_externally. For simplicity we only handle GlobalValue and 1229 // ConstantExpr with a base object. ConstantExpr without a base object is 1230 // unlikely used in a COMDAT. 1231 for (auto &GA : TheModule.aliases()) { 1232 if (GA.hasAvailableExternallyLinkage()) 1233 continue; 1234 GlobalObject *Obj = GA.getAliaseeObject(); 1235 assert(Obj && "aliasee without an base object is unimplemented"); 1236 if (Obj->hasAvailableExternallyLinkage()) { 1237 GA.setLinkage(GlobalValue::AvailableExternallyLinkage); 1238 Changed = true; 1239 } 1240 } 1241 } while (Changed); 1242 } 1243 1244 /// Run internalization on \p TheModule based on symmary analysis. 1245 void llvm::thinLTOInternalizeModule(Module &TheModule, 1246 const GVSummaryMapTy &DefinedGlobals) { 1247 // Declare a callback for the internalize pass that will ask for every 1248 // candidate GlobalValue if it can be internalized or not. 1249 auto MustPreserveGV = [&](const GlobalValue &GV) -> bool { 1250 // It may be the case that GV is on a chain of an ifunc, its alias and 1251 // subsequent aliases. In this case, the summary for the value is not 1252 // available. 1253 if (isa<GlobalIFunc>(&GV) || 1254 (isa<GlobalAlias>(&GV) && 1255 isa<GlobalIFunc>(cast<GlobalAlias>(&GV)->getAliaseeObject()))) 1256 return true; 1257 1258 // Lookup the linkage recorded in the summaries during global analysis. 1259 auto GS = DefinedGlobals.find(GV.getGUID()); 1260 if (GS == DefinedGlobals.end()) { 1261 // Must have been promoted (possibly conservatively). Find original 1262 // name so that we can access the correct summary and see if it can 1263 // be internalized again. 1264 // FIXME: Eventually we should control promotion instead of promoting 1265 // and internalizing again. 1266 StringRef OrigName = 1267 ModuleSummaryIndex::getOriginalNameBeforePromote(GV.getName()); 1268 std::string OrigId = GlobalValue::getGlobalIdentifier( 1269 OrigName, GlobalValue::InternalLinkage, 1270 TheModule.getSourceFileName()); 1271 GS = DefinedGlobals.find(GlobalValue::getGUID(OrigId)); 1272 if (GS == DefinedGlobals.end()) { 1273 // Also check the original non-promoted non-globalized name. In some 1274 // cases a preempted weak value is linked in as a local copy because 1275 // it is referenced by an alias (IRLinker::linkGlobalValueProto). 1276 // In that case, since it was originally not a local value, it was 1277 // recorded in the index using the original name. 1278 // FIXME: This may not be needed once PR27866 is fixed. 1279 GS = DefinedGlobals.find(GlobalValue::getGUID(OrigName)); 1280 assert(GS != DefinedGlobals.end()); 1281 } 1282 } 1283 return !GlobalValue::isLocalLinkage(GS->second->linkage()); 1284 }; 1285 1286 // FIXME: See if we can just internalize directly here via linkage changes 1287 // based on the index, rather than invoking internalizeModule. 1288 internalizeModule(TheModule, MustPreserveGV); 1289 } 1290 1291 /// Make alias a clone of its aliasee. 1292 static Function *replaceAliasWithAliasee(Module *SrcModule, GlobalAlias *GA) { 1293 Function *Fn = cast<Function>(GA->getAliaseeObject()); 1294 1295 ValueToValueMapTy VMap; 1296 Function *NewFn = CloneFunction(Fn, VMap); 1297 // Clone should use the original alias's linkage, visibility and name, and we 1298 // ensure all uses of alias instead use the new clone (casted if necessary). 1299 NewFn->setLinkage(GA->getLinkage()); 1300 NewFn->setVisibility(GA->getVisibility()); 1301 GA->replaceAllUsesWith(ConstantExpr::getBitCast(NewFn, GA->getType())); 1302 NewFn->takeName(GA); 1303 return NewFn; 1304 } 1305 1306 // Internalize values that we marked with specific attribute 1307 // in processGlobalForThinLTO. 1308 static void internalizeGVsAfterImport(Module &M) { 1309 for (auto &GV : M.globals()) 1310 // Skip GVs which have been converted to declarations 1311 // by dropDeadSymbols. 1312 if (!GV.isDeclaration() && GV.hasAttribute("thinlto-internalize")) { 1313 GV.setLinkage(GlobalValue::InternalLinkage); 1314 GV.setVisibility(GlobalValue::DefaultVisibility); 1315 } 1316 } 1317 1318 // Automatically import functions in Module \p DestModule based on the summaries 1319 // index. 1320 Expected<bool> FunctionImporter::importFunctions( 1321 Module &DestModule, const FunctionImporter::ImportMapTy &ImportList) { 1322 LLVM_DEBUG(dbgs() << "Starting import for Module " 1323 << DestModule.getModuleIdentifier() << "\n"); 1324 unsigned ImportedCount = 0, ImportedGVCount = 0; 1325 1326 IRMover Mover(DestModule); 1327 // Do the actual import of functions now, one Module at a time 1328 std::set<StringRef> ModuleNameOrderedList; 1329 for (const auto &FunctionsToImportPerModule : ImportList) { 1330 ModuleNameOrderedList.insert(FunctionsToImportPerModule.first()); 1331 } 1332 for (const auto &Name : ModuleNameOrderedList) { 1333 // Get the module for the import 1334 const auto &FunctionsToImportPerModule = ImportList.find(Name); 1335 assert(FunctionsToImportPerModule != ImportList.end()); 1336 Expected<std::unique_ptr<Module>> SrcModuleOrErr = ModuleLoader(Name); 1337 if (!SrcModuleOrErr) 1338 return SrcModuleOrErr.takeError(); 1339 std::unique_ptr<Module> SrcModule = std::move(*SrcModuleOrErr); 1340 assert(&DestModule.getContext() == &SrcModule->getContext() && 1341 "Context mismatch"); 1342 1343 // If modules were created with lazy metadata loading, materialize it 1344 // now, before linking it (otherwise this will be a noop). 1345 if (Error Err = SrcModule->materializeMetadata()) 1346 return std::move(Err); 1347 1348 auto &ImportGUIDs = FunctionsToImportPerModule->second; 1349 // Find the globals to import 1350 SetVector<GlobalValue *> GlobalsToImport; 1351 for (Function &F : *SrcModule) { 1352 if (!F.hasName()) 1353 continue; 1354 auto GUID = F.getGUID(); 1355 auto Import = ImportGUIDs.count(GUID); 1356 LLVM_DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing function " 1357 << GUID << " " << F.getName() << " from " 1358 << SrcModule->getSourceFileName() << "\n"); 1359 if (Import) { 1360 if (Error Err = F.materialize()) 1361 return std::move(Err); 1362 if (EnableImportMetadata) { 1363 // Add 'thinlto_src_module' metadata for statistics and debugging. 1364 F.setMetadata( 1365 "thinlto_src_module", 1366 MDNode::get(DestModule.getContext(), 1367 {MDString::get(DestModule.getContext(), 1368 SrcModule->getSourceFileName())})); 1369 } 1370 GlobalsToImport.insert(&F); 1371 } 1372 } 1373 for (GlobalVariable &GV : SrcModule->globals()) { 1374 if (!GV.hasName()) 1375 continue; 1376 auto GUID = GV.getGUID(); 1377 auto Import = ImportGUIDs.count(GUID); 1378 LLVM_DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing global " 1379 << GUID << " " << GV.getName() << " from " 1380 << SrcModule->getSourceFileName() << "\n"); 1381 if (Import) { 1382 if (Error Err = GV.materialize()) 1383 return std::move(Err); 1384 ImportedGVCount += GlobalsToImport.insert(&GV); 1385 } 1386 } 1387 for (GlobalAlias &GA : SrcModule->aliases()) { 1388 if (!GA.hasName() || isa<GlobalIFunc>(GA.getAliaseeObject())) 1389 continue; 1390 auto GUID = GA.getGUID(); 1391 auto Import = ImportGUIDs.count(GUID); 1392 LLVM_DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing alias " 1393 << GUID << " " << GA.getName() << " from " 1394 << SrcModule->getSourceFileName() << "\n"); 1395 if (Import) { 1396 if (Error Err = GA.materialize()) 1397 return std::move(Err); 1398 // Import alias as a copy of its aliasee. 1399 GlobalObject *GO = GA.getAliaseeObject(); 1400 if (Error Err = GO->materialize()) 1401 return std::move(Err); 1402 auto *Fn = replaceAliasWithAliasee(SrcModule.get(), &GA); 1403 LLVM_DEBUG(dbgs() << "Is importing aliasee fn " << GO->getGUID() << " " 1404 << GO->getName() << " from " 1405 << SrcModule->getSourceFileName() << "\n"); 1406 if (EnableImportMetadata) { 1407 // Add 'thinlto_src_module' metadata for statistics and debugging. 1408 Fn->setMetadata( 1409 "thinlto_src_module", 1410 MDNode::get(DestModule.getContext(), 1411 {MDString::get(DestModule.getContext(), 1412 SrcModule->getSourceFileName())})); 1413 } 1414 GlobalsToImport.insert(Fn); 1415 } 1416 } 1417 1418 // Upgrade debug info after we're done materializing all the globals and we 1419 // have loaded all the required metadata! 1420 UpgradeDebugInfo(*SrcModule); 1421 1422 // Set the partial sample profile ratio in the profile summary module flag 1423 // of the imported source module, if applicable, so that the profile summary 1424 // module flag will match with that of the destination module when it's 1425 // imported. 1426 SrcModule->setPartialSampleProfileRatio(Index); 1427 1428 // Link in the specified functions. 1429 if (renameModuleForThinLTO(*SrcModule, Index, ClearDSOLocalOnDeclarations, 1430 &GlobalsToImport)) 1431 return true; 1432 1433 if (PrintImports) { 1434 for (const auto *GV : GlobalsToImport) 1435 dbgs() << DestModule.getSourceFileName() << ": Import " << GV->getName() 1436 << " from " << SrcModule->getSourceFileName() << "\n"; 1437 } 1438 1439 if (Error Err = Mover.move(std::move(SrcModule), 1440 GlobalsToImport.getArrayRef(), nullptr, 1441 /*IsPerformingImport=*/true)) 1442 return createStringError(errc::invalid_argument, 1443 Twine("Function Import: link error: ") + 1444 toString(std::move(Err))); 1445 1446 ImportedCount += GlobalsToImport.size(); 1447 NumImportedModules++; 1448 } 1449 1450 internalizeGVsAfterImport(DestModule); 1451 1452 NumImportedFunctions += (ImportedCount - ImportedGVCount); 1453 NumImportedGlobalVars += ImportedGVCount; 1454 1455 LLVM_DEBUG(dbgs() << "Imported " << ImportedCount - ImportedGVCount 1456 << " functions for Module " 1457 << DestModule.getModuleIdentifier() << "\n"); 1458 LLVM_DEBUG(dbgs() << "Imported " << ImportedGVCount 1459 << " global variables for Module " 1460 << DestModule.getModuleIdentifier() << "\n"); 1461 return ImportedCount; 1462 } 1463 1464 static bool doImportingForModule( 1465 Module &M, function_ref<bool(GlobalValue::GUID, const GlobalValueSummary *)> 1466 isPrevailing) { 1467 if (SummaryFile.empty()) 1468 report_fatal_error("error: -function-import requires -summary-file\n"); 1469 Expected<std::unique_ptr<ModuleSummaryIndex>> IndexPtrOrErr = 1470 getModuleSummaryIndexForFile(SummaryFile); 1471 if (!IndexPtrOrErr) { 1472 logAllUnhandledErrors(IndexPtrOrErr.takeError(), errs(), 1473 "Error loading file '" + SummaryFile + "': "); 1474 return false; 1475 } 1476 std::unique_ptr<ModuleSummaryIndex> Index = std::move(*IndexPtrOrErr); 1477 1478 // First step is collecting the import list. 1479 FunctionImporter::ImportMapTy ImportList; 1480 // If requested, simply import all functions in the index. This is used 1481 // when testing distributed backend handling via the opt tool, when 1482 // we have distributed indexes containing exactly the summaries to import. 1483 if (ImportAllIndex) 1484 ComputeCrossModuleImportForModuleFromIndex(M.getModuleIdentifier(), *Index, 1485 ImportList); 1486 else 1487 ComputeCrossModuleImportForModule(M.getModuleIdentifier(), isPrevailing, 1488 *Index, ImportList); 1489 1490 // Conservatively mark all internal values as promoted. This interface is 1491 // only used when doing importing via the function importing pass. The pass 1492 // is only enabled when testing importing via the 'opt' tool, which does 1493 // not do the ThinLink that would normally determine what values to promote. 1494 for (auto &I : *Index) { 1495 for (auto &S : I.second.SummaryList) { 1496 if (GlobalValue::isLocalLinkage(S->linkage())) 1497 S->setLinkage(GlobalValue::ExternalLinkage); 1498 } 1499 } 1500 1501 // Next we need to promote to global scope and rename any local values that 1502 // are potentially exported to other modules. 1503 if (renameModuleForThinLTO(M, *Index, /*ClearDSOLocalOnDeclarations=*/false, 1504 /*GlobalsToImport=*/nullptr)) { 1505 errs() << "Error renaming module\n"; 1506 return true; 1507 } 1508 1509 // Perform the import now. 1510 auto ModuleLoader = [&M](StringRef Identifier) { 1511 return loadFile(std::string(Identifier), M.getContext()); 1512 }; 1513 FunctionImporter Importer(*Index, ModuleLoader, 1514 /*ClearDSOLocalOnDeclarations=*/false); 1515 Expected<bool> Result = Importer.importFunctions(M, ImportList); 1516 1517 // FIXME: Probably need to propagate Errors through the pass manager. 1518 if (!Result) { 1519 logAllUnhandledErrors(Result.takeError(), errs(), 1520 "Error importing module: "); 1521 return true; 1522 } 1523 1524 return true; 1525 } 1526 1527 PreservedAnalyses FunctionImportPass::run(Module &M, 1528 ModuleAnalysisManager &AM) { 1529 // This is only used for testing the function import pass via opt, where we 1530 // don't have prevailing information from the LTO context available, so just 1531 // conservatively assume everything is prevailing (which is fine for the very 1532 // limited use of prevailing checking in this pass). 1533 auto isPrevailing = [](GlobalValue::GUID, const GlobalValueSummary *) { 1534 return true; 1535 }; 1536 if (!doImportingForModule(M, isPrevailing)) 1537 return PreservedAnalyses::all(); 1538 1539 return PreservedAnalyses::none(); 1540 } 1541