1 //===- ModuleManager.cpp - Module Manager ---------------------------------===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 // 9 // This file defines the ModuleManager class, which manages a set of loaded 10 // modules for the ASTReader. 11 // 12 //===----------------------------------------------------------------------===// 13 14 #include "clang/Serialization/ModuleManager.h" 15 #include "clang/Basic/FileManager.h" 16 #include "clang/Basic/LLVM.h" 17 #include "clang/Lex/HeaderSearch.h" 18 #include "clang/Lex/ModuleMap.h" 19 #include "clang/Serialization/GlobalModuleIndex.h" 20 #include "clang/Serialization/InMemoryModuleCache.h" 21 #include "clang/Serialization/ModuleFile.h" 22 #include "clang/Serialization/PCHContainerOperations.h" 23 #include "llvm/ADT/STLExtras.h" 24 #include "llvm/ADT/SetVector.h" 25 #include "llvm/ADT/SmallPtrSet.h" 26 #include "llvm/ADT/SmallVector.h" 27 #include "llvm/ADT/StringRef.h" 28 #include "llvm/ADT/iterator.h" 29 #include "llvm/Support/Chrono.h" 30 #include "llvm/Support/DOTGraphTraits.h" 31 #include "llvm/Support/ErrorOr.h" 32 #include "llvm/Support/GraphWriter.h" 33 #include "llvm/Support/MemoryBuffer.h" 34 #include "llvm/Support/VirtualFileSystem.h" 35 #include <algorithm> 36 #include <cassert> 37 #include <memory> 38 #include <string> 39 #include <system_error> 40 41 using namespace clang; 42 using namespace serialization; 43 44 ModuleFile *ModuleManager::lookupByFileName(StringRef Name) const { 45 auto Entry = FileMgr.getFile(Name, /*OpenFile=*/false, 46 /*CacheFailure=*/false); 47 if (Entry) 48 return lookup(*Entry); 49 50 return nullptr; 51 } 52 53 ModuleFile *ModuleManager::lookupByModuleName(StringRef Name) const { 54 if (const Module *Mod = HeaderSearchInfo.getModuleMap().findModule(Name)) 55 if (const FileEntry *File = Mod->getASTFile()) 56 return lookup(File); 57 58 return nullptr; 59 } 60 61 ModuleFile *ModuleManager::lookup(const FileEntry *File) const { 62 auto Known = Modules.find(File); 63 if (Known == Modules.end()) 64 return nullptr; 65 66 return Known->second; 67 } 68 69 std::unique_ptr<llvm::MemoryBuffer> 70 ModuleManager::lookupBuffer(StringRef Name) { 71 auto Entry = FileMgr.getFile(Name, /*OpenFile=*/false, 72 /*CacheFailure=*/false); 73 if (!Entry) 74 return nullptr; 75 return std::move(InMemoryBuffers[*Entry]); 76 } 77 78 static bool checkSignature(ASTFileSignature Signature, 79 ASTFileSignature ExpectedSignature, 80 std::string &ErrorStr) { 81 if (!ExpectedSignature || Signature == ExpectedSignature) 82 return false; 83 84 ErrorStr = 85 Signature ? "signature mismatch" : "could not read module signature"; 86 return true; 87 } 88 89 static void updateModuleImports(ModuleFile &MF, ModuleFile *ImportedBy, 90 SourceLocation ImportLoc) { 91 if (ImportedBy) { 92 MF.ImportedBy.insert(ImportedBy); 93 ImportedBy->Imports.insert(&MF); 94 } else { 95 if (!MF.DirectlyImported) 96 MF.ImportLoc = ImportLoc; 97 98 MF.DirectlyImported = true; 99 } 100 } 101 102 ModuleManager::AddModuleResult 103 ModuleManager::addModule(StringRef FileName, ModuleKind Type, 104 SourceLocation ImportLoc, ModuleFile *ImportedBy, 105 unsigned Generation, 106 off_t ExpectedSize, time_t ExpectedModTime, 107 ASTFileSignature ExpectedSignature, 108 ASTFileSignatureReader ReadSignature, 109 ModuleFile *&Module, 110 std::string &ErrorStr) { 111 Module = nullptr; 112 113 // Look for the file entry. This only fails if the expected size or 114 // modification time differ. 115 OptionalFileEntryRefDegradesToFileEntryPtr Entry; 116 if (Type == MK_ExplicitModule || Type == MK_PrebuiltModule) { 117 // If we're not expecting to pull this file out of the module cache, it 118 // might have a different mtime due to being moved across filesystems in 119 // a distributed build. The size must still match, though. (As must the 120 // contents, but we can't check that.) 121 ExpectedModTime = 0; 122 } 123 // Note: ExpectedSize and ExpectedModTime will be 0 for MK_ImplicitModule 124 // when using an ASTFileSignature. 125 if (lookupModuleFile(FileName, ExpectedSize, ExpectedModTime, Entry)) { 126 ErrorStr = "module file out of date"; 127 return OutOfDate; 128 } 129 130 if (!Entry && FileName != "-") { 131 ErrorStr = "module file not found"; 132 return Missing; 133 } 134 135 // The ModuleManager's use of FileEntry nodes as the keys for its map of 136 // loaded modules is less than ideal. Uniqueness for FileEntry nodes is 137 // maintained by FileManager, which in turn uses inode numbers on hosts 138 // that support that. When coupled with the module cache's proclivity for 139 // turning over and deleting stale PCMs, this means entries for different 140 // module files can wind up reusing the same underlying inode. When this 141 // happens, subsequent accesses to the Modules map will disagree on the 142 // ModuleFile associated with a given file. In general, it is not sufficient 143 // to resolve this conundrum with a type like FileEntryRef that stores the 144 // name of the FileEntry node on first access because of path canonicalization 145 // issues. However, the paths constructed for implicit module builds are 146 // fully under Clang's control. We *can*, therefore, rely on their structure 147 // being consistent across operating systems and across subsequent accesses 148 // to the Modules map. 149 auto implicitModuleNamesMatch = [](ModuleKind Kind, const ModuleFile *MF, 150 const FileEntry *Entry) -> bool { 151 if (Kind != MK_ImplicitModule) 152 return true; 153 return Entry->getName() == MF->FileName; 154 }; 155 156 // Check whether we already loaded this module, before 157 if (ModuleFile *ModuleEntry = Modules.lookup(Entry)) { 158 if (implicitModuleNamesMatch(Type, ModuleEntry, Entry)) { 159 // Check the stored signature. 160 if (checkSignature(ModuleEntry->Signature, ExpectedSignature, ErrorStr)) 161 return OutOfDate; 162 163 Module = ModuleEntry; 164 updateModuleImports(*ModuleEntry, ImportedBy, ImportLoc); 165 return AlreadyLoaded; 166 } 167 } 168 169 // Allocate a new module. 170 auto NewModule = std::make_unique<ModuleFile>(Type, Generation); 171 NewModule->Index = Chain.size(); 172 NewModule->FileName = FileName.str(); 173 NewModule->File = Entry; 174 NewModule->ImportLoc = ImportLoc; 175 NewModule->InputFilesValidationTimestamp = 0; 176 177 if (NewModule->Kind == MK_ImplicitModule) { 178 std::string TimestampFilename = NewModule->getTimestampFilename(); 179 llvm::vfs::Status Status; 180 // A cached stat value would be fine as well. 181 if (!FileMgr.getNoncachedStatValue(TimestampFilename, Status)) 182 NewModule->InputFilesValidationTimestamp = 183 llvm::sys::toTimeT(Status.getLastModificationTime()); 184 } 185 186 // Load the contents of the module 187 if (std::unique_ptr<llvm::MemoryBuffer> Buffer = lookupBuffer(FileName)) { 188 // The buffer was already provided for us. 189 NewModule->Buffer = &ModuleCache->addBuiltPCM(FileName, std::move(Buffer)); 190 // Since the cached buffer is reused, it is safe to close the file 191 // descriptor that was opened while stat()ing the PCM in 192 // lookupModuleFile() above, it won't be needed any longer. 193 Entry->closeFile(); 194 } else if (llvm::MemoryBuffer *Buffer = 195 getModuleCache().lookupPCM(FileName)) { 196 NewModule->Buffer = Buffer; 197 // As above, the file descriptor is no longer needed. 198 Entry->closeFile(); 199 } else if (getModuleCache().shouldBuildPCM(FileName)) { 200 // Report that the module is out of date, since we tried (and failed) to 201 // import it earlier. 202 Entry->closeFile(); 203 return OutOfDate; 204 } else { 205 // Open the AST file. 206 llvm::ErrorOr<std::unique_ptr<llvm::MemoryBuffer>> Buf((std::error_code())); 207 if (FileName == "-") { 208 Buf = llvm::MemoryBuffer::getSTDIN(); 209 } else { 210 // Get a buffer of the file and close the file descriptor when done. 211 // The file is volatile because in a parallel build we expect multiple 212 // compiler processes to use the same module file rebuilding it if needed. 213 // 214 // RequiresNullTerminator is false because module files don't need it, and 215 // this allows the file to still be mmapped. 216 Buf = FileMgr.getBufferForFile(NewModule->File, 217 /*IsVolatile=*/true, 218 /*RequiresNullTerminator=*/false); 219 } 220 221 if (!Buf) { 222 ErrorStr = Buf.getError().message(); 223 return Missing; 224 } 225 226 NewModule->Buffer = &getModuleCache().addPCM(FileName, std::move(*Buf)); 227 } 228 229 // Initialize the stream. 230 NewModule->Data = PCHContainerRdr.ExtractPCH(*NewModule->Buffer); 231 232 // Read the signature eagerly now so that we can check it. Avoid calling 233 // ReadSignature unless there's something to check though. 234 if (ExpectedSignature && checkSignature(ReadSignature(NewModule->Data), 235 ExpectedSignature, ErrorStr)) 236 return OutOfDate; 237 238 // We're keeping this module. Store it everywhere. 239 Module = Modules[Entry] = NewModule.get(); 240 241 updateModuleImports(*NewModule, ImportedBy, ImportLoc); 242 243 if (!NewModule->isModule()) 244 PCHChain.push_back(NewModule.get()); 245 if (!ImportedBy) 246 Roots.push_back(NewModule.get()); 247 248 Chain.push_back(std::move(NewModule)); 249 return NewlyLoaded; 250 } 251 252 void ModuleManager::removeModules(ModuleIterator First, ModuleMap *modMap) { 253 auto Last = end(); 254 if (First == Last) 255 return; 256 257 // Explicitly clear VisitOrder since we might not notice it is stale. 258 VisitOrder.clear(); 259 260 // Collect the set of module file pointers that we'll be removing. 261 llvm::SmallPtrSet<ModuleFile *, 4> victimSet( 262 (llvm::pointer_iterator<ModuleIterator>(First)), 263 (llvm::pointer_iterator<ModuleIterator>(Last))); 264 265 auto IsVictim = [&](ModuleFile *MF) { 266 return victimSet.count(MF); 267 }; 268 // Remove any references to the now-destroyed modules. 269 for (auto I = begin(); I != First; ++I) { 270 I->Imports.remove_if(IsVictim); 271 I->ImportedBy.remove_if(IsVictim); 272 } 273 Roots.erase(std::remove_if(Roots.begin(), Roots.end(), IsVictim), 274 Roots.end()); 275 276 // Remove the modules from the PCH chain. 277 for (auto I = First; I != Last; ++I) { 278 if (!I->isModule()) { 279 PCHChain.erase(llvm::find(PCHChain, &*I), PCHChain.end()); 280 break; 281 } 282 } 283 284 // Delete the modules and erase them from the various structures. 285 for (ModuleIterator victim = First; victim != Last; ++victim) { 286 Modules.erase(victim->File); 287 288 if (modMap) { 289 StringRef ModuleName = victim->ModuleName; 290 if (Module *mod = modMap->findModule(ModuleName)) { 291 mod->setASTFile(None); 292 } 293 } 294 } 295 296 // Delete the modules. 297 Chain.erase(Chain.begin() + (First - begin()), Chain.end()); 298 } 299 300 void 301 ModuleManager::addInMemoryBuffer(StringRef FileName, 302 std::unique_ptr<llvm::MemoryBuffer> Buffer) { 303 const FileEntry *Entry = 304 FileMgr.getVirtualFile(FileName, Buffer->getBufferSize(), 0); 305 InMemoryBuffers[Entry] = std::move(Buffer); 306 } 307 308 ModuleManager::VisitState *ModuleManager::allocateVisitState() { 309 // Fast path: if we have a cached state, use it. 310 if (FirstVisitState) { 311 VisitState *Result = FirstVisitState; 312 FirstVisitState = FirstVisitState->NextState; 313 Result->NextState = nullptr; 314 return Result; 315 } 316 317 // Allocate and return a new state. 318 return new VisitState(size()); 319 } 320 321 void ModuleManager::returnVisitState(VisitState *State) { 322 assert(State->NextState == nullptr && "Visited state is in list?"); 323 State->NextState = FirstVisitState; 324 FirstVisitState = State; 325 } 326 327 void ModuleManager::setGlobalIndex(GlobalModuleIndex *Index) { 328 GlobalIndex = Index; 329 if (!GlobalIndex) { 330 ModulesInCommonWithGlobalIndex.clear(); 331 return; 332 } 333 334 // Notify the global module index about all of the modules we've already 335 // loaded. 336 for (ModuleFile &M : *this) 337 if (!GlobalIndex->loadedModuleFile(&M)) 338 ModulesInCommonWithGlobalIndex.push_back(&M); 339 } 340 341 void ModuleManager::moduleFileAccepted(ModuleFile *MF) { 342 if (!GlobalIndex || GlobalIndex->loadedModuleFile(MF)) 343 return; 344 345 ModulesInCommonWithGlobalIndex.push_back(MF); 346 } 347 348 ModuleManager::ModuleManager(FileManager &FileMgr, 349 InMemoryModuleCache &ModuleCache, 350 const PCHContainerReader &PCHContainerRdr, 351 const HeaderSearch &HeaderSearchInfo) 352 : FileMgr(FileMgr), ModuleCache(&ModuleCache), 353 PCHContainerRdr(PCHContainerRdr), HeaderSearchInfo(HeaderSearchInfo) {} 354 355 ModuleManager::~ModuleManager() { delete FirstVisitState; } 356 357 void ModuleManager::visit(llvm::function_ref<bool(ModuleFile &M)> Visitor, 358 llvm::SmallPtrSetImpl<ModuleFile *> *ModuleFilesHit) { 359 // If the visitation order vector is the wrong size, recompute the order. 360 if (VisitOrder.size() != Chain.size()) { 361 unsigned N = size(); 362 VisitOrder.clear(); 363 VisitOrder.reserve(N); 364 365 // Record the number of incoming edges for each module. When we 366 // encounter a module with no incoming edges, push it into the queue 367 // to seed the queue. 368 SmallVector<ModuleFile *, 4> Queue; 369 Queue.reserve(N); 370 llvm::SmallVector<unsigned, 4> UnusedIncomingEdges; 371 UnusedIncomingEdges.resize(size()); 372 for (ModuleFile &M : llvm::reverse(*this)) { 373 unsigned Size = M.ImportedBy.size(); 374 UnusedIncomingEdges[M.Index] = Size; 375 if (!Size) 376 Queue.push_back(&M); 377 } 378 379 // Traverse the graph, making sure to visit a module before visiting any 380 // of its dependencies. 381 while (!Queue.empty()) { 382 ModuleFile *CurrentModule = Queue.pop_back_val(); 383 VisitOrder.push_back(CurrentModule); 384 385 // For any module that this module depends on, push it on the 386 // stack (if it hasn't already been marked as visited). 387 for (auto M = CurrentModule->Imports.rbegin(), 388 MEnd = CurrentModule->Imports.rend(); 389 M != MEnd; ++M) { 390 // Remove our current module as an impediment to visiting the 391 // module we depend on. If we were the last unvisited module 392 // that depends on this particular module, push it into the 393 // queue to be visited. 394 unsigned &NumUnusedEdges = UnusedIncomingEdges[(*M)->Index]; 395 if (NumUnusedEdges && (--NumUnusedEdges == 0)) 396 Queue.push_back(*M); 397 } 398 } 399 400 assert(VisitOrder.size() == N && "Visitation order is wrong?"); 401 402 delete FirstVisitState; 403 FirstVisitState = nullptr; 404 } 405 406 VisitState *State = allocateVisitState(); 407 unsigned VisitNumber = State->NextVisitNumber++; 408 409 // If the caller has provided us with a hit-set that came from the global 410 // module index, mark every module file in common with the global module 411 // index that is *not* in that set as 'visited'. 412 if (ModuleFilesHit && !ModulesInCommonWithGlobalIndex.empty()) { 413 for (unsigned I = 0, N = ModulesInCommonWithGlobalIndex.size(); I != N; ++I) 414 { 415 ModuleFile *M = ModulesInCommonWithGlobalIndex[I]; 416 if (!ModuleFilesHit->count(M)) 417 State->VisitNumber[M->Index] = VisitNumber; 418 } 419 } 420 421 for (unsigned I = 0, N = VisitOrder.size(); I != N; ++I) { 422 ModuleFile *CurrentModule = VisitOrder[I]; 423 // Should we skip this module file? 424 if (State->VisitNumber[CurrentModule->Index] == VisitNumber) 425 continue; 426 427 // Visit the module. 428 assert(State->VisitNumber[CurrentModule->Index] == VisitNumber - 1); 429 State->VisitNumber[CurrentModule->Index] = VisitNumber; 430 if (!Visitor(*CurrentModule)) 431 continue; 432 433 // The visitor has requested that cut off visitation of any 434 // module that the current module depends on. To indicate this 435 // behavior, we mark all of the reachable modules as having been visited. 436 ModuleFile *NextModule = CurrentModule; 437 do { 438 // For any module that this module depends on, push it on the 439 // stack (if it hasn't already been marked as visited). 440 for (llvm::SetVector<ModuleFile *>::iterator 441 M = NextModule->Imports.begin(), 442 MEnd = NextModule->Imports.end(); 443 M != MEnd; ++M) { 444 if (State->VisitNumber[(*M)->Index] != VisitNumber) { 445 State->Stack.push_back(*M); 446 State->VisitNumber[(*M)->Index] = VisitNumber; 447 } 448 } 449 450 if (State->Stack.empty()) 451 break; 452 453 // Pop the next module off the stack. 454 NextModule = State->Stack.pop_back_val(); 455 } while (true); 456 } 457 458 returnVisitState(State); 459 } 460 461 bool ModuleManager::lookupModuleFile(StringRef FileName, off_t ExpectedSize, 462 time_t ExpectedModTime, 463 Optional<FileEntryRef> &File) { 464 File = None; 465 if (FileName == "-") 466 return false; 467 468 // Open the file immediately to ensure there is no race between stat'ing and 469 // opening the file. 470 Optional<FileEntryRef> FileOrErr = 471 expectedToOptional(FileMgr.getFileRef(FileName, /*OpenFile=*/true, 472 /*CacheFailure=*/false)); 473 if (!FileOrErr) 474 return false; 475 476 File = *FileOrErr; 477 478 if ((ExpectedSize && ExpectedSize != File->getSize()) || 479 (ExpectedModTime && ExpectedModTime != File->getModificationTime())) 480 // Do not destroy File, as it may be referenced. If we need to rebuild it, 481 // it will be destroyed by removeModules. 482 return true; 483 484 return false; 485 } 486 487 #ifndef NDEBUG 488 namespace llvm { 489 490 template<> 491 struct GraphTraits<ModuleManager> { 492 using NodeRef = ModuleFile *; 493 using ChildIteratorType = llvm::SetVector<ModuleFile *>::const_iterator; 494 using nodes_iterator = pointer_iterator<ModuleManager::ModuleConstIterator>; 495 496 static ChildIteratorType child_begin(NodeRef Node) { 497 return Node->Imports.begin(); 498 } 499 500 static ChildIteratorType child_end(NodeRef Node) { 501 return Node->Imports.end(); 502 } 503 504 static nodes_iterator nodes_begin(const ModuleManager &Manager) { 505 return nodes_iterator(Manager.begin()); 506 } 507 508 static nodes_iterator nodes_end(const ModuleManager &Manager) { 509 return nodes_iterator(Manager.end()); 510 } 511 }; 512 513 template<> 514 struct DOTGraphTraits<ModuleManager> : public DefaultDOTGraphTraits { 515 explicit DOTGraphTraits(bool IsSimple = false) 516 : DefaultDOTGraphTraits(IsSimple) {} 517 518 static bool renderGraphFromBottomUp() { return true; } 519 520 std::string getNodeLabel(ModuleFile *M, const ModuleManager&) { 521 return M->ModuleName; 522 } 523 }; 524 525 } // namespace llvm 526 527 void ModuleManager::viewGraph() { 528 llvm::ViewGraph(*this, "Modules"); 529 } 530 #endif 531