1 //===- ModuleDepCollector.cpp - Callbacks to collect deps -------*- C++ -*-===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 9 #include "clang/Tooling/DependencyScanning/ModuleDepCollector.h" 10 11 #include "clang/Frontend/CompilerInstance.h" 12 #include "clang/Lex/Preprocessor.h" 13 #include "clang/Tooling/DependencyScanning/DependencyScanningWorker.h" 14 #include "llvm/Support/StringSaver.h" 15 16 using namespace clang; 17 using namespace tooling; 18 using namespace dependencies; 19 20 static void optimizeHeaderSearchOpts(HeaderSearchOptions &Opts, 21 ASTReader &Reader, 22 const serialization::ModuleFile &MF) { 23 // Only preserve search paths that were used during the dependency scan. 24 std::vector<HeaderSearchOptions::Entry> Entries = Opts.UserEntries; 25 Opts.UserEntries.clear(); 26 for (unsigned I = 0; I < Entries.size(); ++I) 27 if (MF.SearchPathUsage[I]) 28 Opts.UserEntries.push_back(Entries[I]); 29 } 30 31 CompilerInvocation ModuleDepCollector::makeInvocationForModuleBuildWithoutPaths( 32 const ModuleDeps &Deps, 33 llvm::function_ref<void(CompilerInvocation &)> Optimize) const { 34 // Make a deep copy of the original Clang invocation. 35 CompilerInvocation CI(OriginalInvocation); 36 37 CI.getLangOpts()->resetNonModularOptions(); 38 CI.getPreprocessorOpts().resetNonModularOptions(); 39 40 // Remove options incompatible with explicit module build or are likely to 41 // differ between identical modules discovered from different translation 42 // units. 43 CI.getFrontendOpts().Inputs.clear(); 44 CI.getFrontendOpts().OutputFile.clear(); 45 CI.getCodeGenOpts().MainFileName.clear(); 46 CI.getCodeGenOpts().DwarfDebugFlags.clear(); 47 48 CI.getFrontendOpts().ProgramAction = frontend::GenerateModule; 49 CI.getLangOpts()->ModuleName = Deps.ID.ModuleName; 50 CI.getFrontendOpts().IsSystemModule = Deps.IsSystem; 51 52 CI.getLangOpts()->ImplicitModules = false; 53 54 // Report the prebuilt modules this module uses. 55 for (const auto &PrebuiltModule : Deps.PrebuiltModuleDeps) 56 CI.getFrontendOpts().ModuleFiles.push_back(PrebuiltModule.PCMFile); 57 58 Optimize(CI); 59 60 // The original invocation probably didn't have strict context hash enabled. 61 // We will use the context hash of this invocation to distinguish between 62 // multiple incompatible versions of the same module and will use it when 63 // reporting dependencies to the clients. Let's make sure we're using 64 // **strict** context hash in order to prevent accidental sharing of 65 // incompatible modules (e.g. with differences in search paths). 66 CI.getHeaderSearchOpts().ModulesStrictContextHash = true; 67 68 return CI; 69 } 70 71 static std::vector<std::string> 72 serializeCompilerInvocation(const CompilerInvocation &CI) { 73 // Set up string allocator. 74 llvm::BumpPtrAllocator Alloc; 75 llvm::StringSaver Strings(Alloc); 76 auto SA = [&Strings](const Twine &Arg) { return Strings.save(Arg).data(); }; 77 78 // Synthesize full command line from the CompilerInvocation, including "-cc1". 79 SmallVector<const char *, 32> Args{"-cc1"}; 80 CI.generateCC1CommandLine(Args, SA); 81 82 // Convert arguments to the return type. 83 return std::vector<std::string>{Args.begin(), Args.end()}; 84 } 85 86 std::vector<std::string> ModuleDeps::getCanonicalCommandLine( 87 std::function<StringRef(ModuleID)> LookupPCMPath, 88 std::function<const ModuleDeps &(ModuleID)> LookupModuleDeps) const { 89 CompilerInvocation CI(BuildInvocation); 90 FrontendOptions &FrontendOpts = CI.getFrontendOpts(); 91 92 InputKind ModuleMapInputKind(FrontendOpts.DashX.getLanguage(), 93 InputKind::Format::ModuleMap); 94 FrontendOpts.Inputs.emplace_back(ClangModuleMapFile, ModuleMapInputKind); 95 FrontendOpts.OutputFile = std::string(LookupPCMPath(ID)); 96 97 dependencies::detail::collectPCMAndModuleMapPaths( 98 ClangModuleDeps, LookupPCMPath, LookupModuleDeps, 99 FrontendOpts.ModuleFiles, FrontendOpts.ModuleMapFiles); 100 101 return serializeCompilerInvocation(CI); 102 } 103 104 std::vector<std::string> 105 ModuleDeps::getCanonicalCommandLineWithoutModulePaths() const { 106 return serializeCompilerInvocation(BuildInvocation); 107 } 108 109 void dependencies::detail::collectPCMAndModuleMapPaths( 110 llvm::ArrayRef<ModuleID> Modules, 111 std::function<StringRef(ModuleID)> LookupPCMPath, 112 std::function<const ModuleDeps &(ModuleID)> LookupModuleDeps, 113 std::vector<std::string> &PCMPaths, std::vector<std::string> &ModMapPaths) { 114 llvm::StringSet<> AlreadyAdded; 115 116 std::function<void(llvm::ArrayRef<ModuleID>)> AddArgs = 117 [&](llvm::ArrayRef<ModuleID> Modules) { 118 for (const ModuleID &MID : Modules) { 119 if (!AlreadyAdded.insert(MID.ModuleName + MID.ContextHash).second) 120 continue; 121 const ModuleDeps &M = LookupModuleDeps(MID); 122 // Depth first traversal. 123 AddArgs(M.ClangModuleDeps); 124 PCMPaths.push_back(LookupPCMPath(MID).str()); 125 if (!M.ClangModuleMapFile.empty()) 126 ModMapPaths.push_back(M.ClangModuleMapFile); 127 } 128 }; 129 130 AddArgs(Modules); 131 } 132 133 void ModuleDepCollectorPP::FileChanged(SourceLocation Loc, 134 FileChangeReason Reason, 135 SrcMgr::CharacteristicKind FileType, 136 FileID PrevFID) { 137 if (Reason != PPCallbacks::EnterFile) 138 return; 139 140 // This has to be delayed as the context hash can change at the start of 141 // `CompilerInstance::ExecuteAction`. 142 if (MDC.ContextHash.empty()) { 143 MDC.ContextHash = MDC.ScanInstance.getInvocation().getModuleHash(); 144 MDC.Consumer.handleContextHash(MDC.ContextHash); 145 } 146 147 SourceManager &SM = MDC.ScanInstance.getSourceManager(); 148 149 // Dependency generation really does want to go all the way to the 150 // file entry for a source location to find out what is depended on. 151 // We do not want #line markers to affect dependency generation! 152 if (Optional<StringRef> Filename = 153 SM.getNonBuiltinFilenameForID(SM.getFileID(SM.getExpansionLoc(Loc)))) 154 MDC.FileDeps.push_back( 155 std::string(llvm::sys::path::remove_leading_dotslash(*Filename))); 156 } 157 158 void ModuleDepCollectorPP::InclusionDirective( 159 SourceLocation HashLoc, const Token &IncludeTok, StringRef FileName, 160 bool IsAngled, CharSourceRange FilenameRange, const FileEntry *File, 161 StringRef SearchPath, StringRef RelativePath, const Module *Imported, 162 SrcMgr::CharacteristicKind FileType) { 163 if (!File && !Imported) { 164 // This is a non-modular include that HeaderSearch failed to find. Add it 165 // here as `FileChanged` will never see it. 166 MDC.FileDeps.push_back(std::string(FileName)); 167 } 168 handleImport(Imported); 169 } 170 171 void ModuleDepCollectorPP::moduleImport(SourceLocation ImportLoc, 172 ModuleIdPath Path, 173 const Module *Imported) { 174 handleImport(Imported); 175 } 176 177 void ModuleDepCollectorPP::handleImport(const Module *Imported) { 178 if (!Imported) 179 return; 180 181 const Module *TopLevelModule = Imported->getTopLevelModule(); 182 183 if (MDC.isPrebuiltModule(TopLevelModule)) 184 DirectPrebuiltModularDeps.insert(TopLevelModule); 185 else 186 DirectModularDeps.insert(TopLevelModule); 187 } 188 189 void ModuleDepCollectorPP::EndOfMainFile() { 190 FileID MainFileID = MDC.ScanInstance.getSourceManager().getMainFileID(); 191 MDC.MainFile = std::string(MDC.ScanInstance.getSourceManager() 192 .getFileEntryForID(MainFileID) 193 ->getName()); 194 195 if (!MDC.ScanInstance.getPreprocessorOpts().ImplicitPCHInclude.empty()) 196 MDC.FileDeps.push_back( 197 MDC.ScanInstance.getPreprocessorOpts().ImplicitPCHInclude); 198 199 for (const Module *M : DirectModularDeps) { 200 // A top-level module might not be actually imported as a module when 201 // -fmodule-name is used to compile a translation unit that imports this 202 // module. In that case it can be skipped. The appropriate header 203 // dependencies will still be reported as expected. 204 if (!M->getASTFile()) 205 continue; 206 handleTopLevelModule(M); 207 } 208 209 MDC.Consumer.handleDependencyOutputOpts(*MDC.Opts); 210 211 for (auto &&I : MDC.ModularDeps) 212 MDC.Consumer.handleModuleDependency(I.second); 213 214 for (auto &&I : MDC.FileDeps) 215 MDC.Consumer.handleFileDependency(I); 216 217 for (auto &&I : DirectPrebuiltModularDeps) 218 MDC.Consumer.handlePrebuiltModuleDependency(PrebuiltModuleDep{I}); 219 } 220 221 ModuleID ModuleDepCollectorPP::handleTopLevelModule(const Module *M) { 222 assert(M == M->getTopLevelModule() && "Expected top level module!"); 223 224 // If this module has been handled already, just return its ID. 225 auto ModI = MDC.ModularDeps.insert({M, ModuleDeps{}}); 226 if (!ModI.second) 227 return ModI.first->second.ID; 228 229 ModuleDeps &MD = ModI.first->second; 230 231 MD.ID.ModuleName = M->getFullModuleName(); 232 MD.ImportedByMainFile = DirectModularDeps.contains(M); 233 MD.ImplicitModulePCMPath = std::string(M->getASTFile()->getName()); 234 MD.IsSystem = M->IsSystem; 235 236 const FileEntry *ModuleMap = MDC.ScanInstance.getPreprocessor() 237 .getHeaderSearchInfo() 238 .getModuleMap() 239 .getModuleMapFileForUniquing(M); 240 241 if (ModuleMap) { 242 StringRef Path = ModuleMap->tryGetRealPathName(); 243 if (Path.empty()) 244 Path = ModuleMap->getName(); 245 MD.ClangModuleMapFile = std::string(Path); 246 } 247 248 serialization::ModuleFile *MF = 249 MDC.ScanInstance.getASTReader()->getModuleManager().lookup( 250 M->getASTFile()); 251 MDC.ScanInstance.getASTReader()->visitInputFiles( 252 *MF, true, true, [&](const serialization::InputFile &IF, bool isSystem) { 253 // __inferred_module.map is the result of the way in which an implicit 254 // module build handles inferred modules. It adds an overlay VFS with 255 // this file in the proper directory and relies on the rest of Clang to 256 // handle it like normal. With explicitly built modules we don't need 257 // to play VFS tricks, so replace it with the correct module map. 258 if (IF.getFile()->getName().endswith("__inferred_module.map")) { 259 MD.FileDeps.insert(ModuleMap->getName()); 260 return; 261 } 262 MD.FileDeps.insert(IF.getFile()->getName()); 263 }); 264 265 // Add direct prebuilt module dependencies now, so that we can use them when 266 // creating a CompilerInvocation and computing context hash for this 267 // ModuleDeps instance. 268 llvm::DenseSet<const Module *> SeenModules; 269 addAllSubmodulePrebuiltDeps(M, MD, SeenModules); 270 271 MD.BuildInvocation = MDC.makeInvocationForModuleBuildWithoutPaths( 272 MD, [&](CompilerInvocation &BuildInvocation) { 273 if (MDC.OptimizeArgs) 274 optimizeHeaderSearchOpts(BuildInvocation.getHeaderSearchOpts(), 275 *MDC.ScanInstance.getASTReader(), *MF); 276 }); 277 MD.ID.ContextHash = MD.BuildInvocation.getModuleHash(); 278 279 llvm::DenseSet<const Module *> AddedModules; 280 addAllSubmoduleDeps(M, MD, AddedModules); 281 282 return MD.ID; 283 } 284 285 void ModuleDepCollectorPP::addAllSubmodulePrebuiltDeps( 286 const Module *M, ModuleDeps &MD, 287 llvm::DenseSet<const Module *> &SeenSubmodules) { 288 addModulePrebuiltDeps(M, MD, SeenSubmodules); 289 290 for (const Module *SubM : M->submodules()) 291 addAllSubmodulePrebuiltDeps(SubM, MD, SeenSubmodules); 292 } 293 294 void ModuleDepCollectorPP::addModulePrebuiltDeps( 295 const Module *M, ModuleDeps &MD, 296 llvm::DenseSet<const Module *> &SeenSubmodules) { 297 for (const Module *Import : M->Imports) 298 if (Import->getTopLevelModule() != M->getTopLevelModule()) 299 if (MDC.isPrebuiltModule(Import->getTopLevelModule())) 300 if (SeenSubmodules.insert(Import->getTopLevelModule()).second) 301 MD.PrebuiltModuleDeps.emplace_back(Import->getTopLevelModule()); 302 } 303 304 void ModuleDepCollectorPP::addAllSubmoduleDeps( 305 const Module *M, ModuleDeps &MD, 306 llvm::DenseSet<const Module *> &AddedModules) { 307 addModuleDep(M, MD, AddedModules); 308 309 for (const Module *SubM : M->submodules()) 310 addAllSubmoduleDeps(SubM, MD, AddedModules); 311 } 312 313 void ModuleDepCollectorPP::addModuleDep( 314 const Module *M, ModuleDeps &MD, 315 llvm::DenseSet<const Module *> &AddedModules) { 316 for (const Module *Import : M->Imports) { 317 if (Import->getTopLevelModule() != M->getTopLevelModule() && 318 !MDC.isPrebuiltModule(Import)) { 319 ModuleID ImportID = handleTopLevelModule(Import->getTopLevelModule()); 320 if (AddedModules.insert(Import->getTopLevelModule()).second) 321 MD.ClangModuleDeps.push_back(ImportID); 322 } 323 } 324 } 325 326 ModuleDepCollector::ModuleDepCollector( 327 std::unique_ptr<DependencyOutputOptions> Opts, 328 CompilerInstance &ScanInstance, DependencyConsumer &C, 329 CompilerInvocation &&OriginalCI, bool OptimizeArgs) 330 : ScanInstance(ScanInstance), Consumer(C), Opts(std::move(Opts)), 331 OriginalInvocation(std::move(OriginalCI)), OptimizeArgs(OptimizeArgs) {} 332 333 void ModuleDepCollector::attachToPreprocessor(Preprocessor &PP) { 334 PP.addPPCallbacks(std::make_unique<ModuleDepCollectorPP>(*this)); 335 } 336 337 void ModuleDepCollector::attachToASTReader(ASTReader &R) {} 338 339 bool ModuleDepCollector::isPrebuiltModule(const Module *M) { 340 std::string Name(M->getTopLevelModuleName()); 341 const auto &PrebuiltModuleFiles = 342 ScanInstance.getHeaderSearchOpts().PrebuiltModuleFiles; 343 auto PrebuiltModuleFileIt = PrebuiltModuleFiles.find(Name); 344 if (PrebuiltModuleFileIt == PrebuiltModuleFiles.end()) 345 return false; 346 assert("Prebuilt module came from the expected AST file" && 347 PrebuiltModuleFileIt->second == M->getASTFile()->getName()); 348 return true; 349 } 350