//===- ExtractAPI/ExtractAPIConsumer.cpp ------------------------*- C++ -*-===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// /// /// \file /// This file implements the ExtractAPIAction, and ASTConsumer to collect API /// information. /// //===----------------------------------------------------------------------===// #include "clang/AST/ASTConcept.h" #include "clang/AST/ASTConsumer.h" #include "clang/AST/ASTContext.h" #include "clang/AST/DeclObjC.h" #include "clang/Basic/DiagnosticFrontend.h" #include "clang/Basic/SourceLocation.h" #include "clang/Basic/SourceManager.h" #include "clang/Basic/TargetInfo.h" #include "clang/ExtractAPI/API.h" #include "clang/ExtractAPI/APIIgnoresList.h" #include "clang/ExtractAPI/ExtractAPIVisitor.h" #include "clang/ExtractAPI/FrontendActions.h" #include "clang/ExtractAPI/Serialization/SymbolGraphSerializer.h" #include "clang/Frontend/ASTConsumers.h" #include "clang/Frontend/CompilerInstance.h" #include "clang/Frontend/FrontendOptions.h" #include "clang/Frontend/MultiplexConsumer.h" #include "clang/Lex/MacroInfo.h" #include "clang/Lex/PPCallbacks.h" #include "clang/Lex/Preprocessor.h" #include "clang/Lex/PreprocessorOptions.h" #include "llvm/ADT/DenseSet.h" #include "llvm/ADT/STLExtras.h" #include "llvm/ADT/SmallString.h" #include "llvm/ADT/SmallVector.h" #include "llvm/Support/Casting.h" #include "llvm/Support/Error.h" #include "llvm/Support/FileSystem.h" #include "llvm/Support/MemoryBuffer.h" #include "llvm/Support/Path.h" #include "llvm/Support/Regex.h" #include "llvm/Support/raw_ostream.h" #include #include #include using namespace clang; using namespace extractapi; namespace { std::optional getRelativeIncludeName(const CompilerInstance &CI, StringRef File, bool *IsQuoted = nullptr) { assert(CI.hasFileManager() && "CompilerInstance does not have a FileNamager!"); using namespace llvm::sys; // Matches framework include patterns const llvm::Regex Rule("/(.+)\\.framework/(.+)?Headers/(.+)"); const auto &FS = CI.getVirtualFileSystem(); SmallString<128> FilePath(File.begin(), File.end()); FS.makeAbsolute(FilePath); path::remove_dots(FilePath, true); FilePath = path::convert_to_slash(FilePath); File = FilePath; // Checks whether `Dir` is a strict path prefix of `File`. If so returns // the prefix length. Otherwise return 0. auto CheckDir = [&](llvm::StringRef Dir) -> unsigned { llvm::SmallString<32> DirPath(Dir.begin(), Dir.end()); FS.makeAbsolute(DirPath); path::remove_dots(DirPath, true); Dir = DirPath; for (auto NI = path::begin(File), NE = path::end(File), DI = path::begin(Dir), DE = path::end(Dir); /*termination condition in loop*/; ++NI, ++DI) { // '.' components in File are ignored. while (NI != NE && *NI == ".") ++NI; if (NI == NE) break; // '.' components in Dir are ignored. while (DI != DE && *DI == ".") ++DI; // Dir is a prefix of File, up to '.' components and choice of path // separators. if (DI == DE) return NI - path::begin(File); // Consider all path separators equal. if (NI->size() == 1 && DI->size() == 1 && path::is_separator(NI->front()) && path::is_separator(DI->front())) continue; // Special case Apple .sdk folders since the search path is typically a // symlink like `iPhoneSimulator14.5.sdk` while the file is instead // located in `iPhoneSimulator.sdk` (the real folder). if (NI->endswith(".sdk") && DI->endswith(".sdk")) { StringRef NBasename = path::stem(*NI); StringRef DBasename = path::stem(*DI); if (DBasename.startswith(NBasename)) continue; } if (*NI != *DI) break; } return 0; }; unsigned PrefixLength = 0; // Go through the search paths and find the first one that is a prefix of // the header. for (const auto &Entry : CI.getHeaderSearchOpts().UserEntries) { // Note whether the match is found in a quoted entry. if (IsQuoted) *IsQuoted = Entry.Group == frontend::Quoted; if (auto EntryFile = CI.getFileManager().getOptionalFileRef(Entry.Path)) { if (auto HMap = HeaderMap::Create(*EntryFile, CI.getFileManager())) { // If this is a headermap entry, try to reverse lookup the full path // for a spelled name before mapping. StringRef SpelledFilename = HMap->reverseLookupFilename(File); if (!SpelledFilename.empty()) return SpelledFilename.str(); // No matching mapping in this headermap, try next search entry. continue; } } // Entry is a directory search entry, try to check if it's a prefix of File. PrefixLength = CheckDir(Entry.Path); if (PrefixLength > 0) { // The header is found in a framework path, construct the framework-style // include name `` if (Entry.IsFramework) { SmallVector Matches; Rule.match(File, &Matches); // Returned matches are always in stable order. if (Matches.size() != 4) return std::nullopt; return path::convert_to_slash( (Matches[1].drop_front(Matches[1].rfind('/') + 1) + "/" + Matches[3]) .str()); } // The header is found in a normal search path, strip the search path // prefix to get an include name. return path::convert_to_slash(File.drop_front(PrefixLength)); } } // Couldn't determine a include name, use full path instead. return std::nullopt; } struct LocationFileChecker { bool operator()(SourceLocation Loc) { // If the loc refers to a macro expansion we need to first get the file // location of the expansion. auto &SM = CI.getSourceManager(); auto FileLoc = SM.getFileLoc(Loc); FileID FID = SM.getFileID(FileLoc); if (FID.isInvalid()) return false; const auto *File = SM.getFileEntryForID(FID); if (!File) return false; if (KnownFileEntries.count(File)) return true; if (ExternalFileEntries.count(File)) return false; StringRef FileName = File->tryGetRealPathName().empty() ? File->getName() : File->tryGetRealPathName(); // Try to reduce the include name the same way we tried to include it. bool IsQuoted = false; if (auto IncludeName = getRelativeIncludeName(CI, FileName, &IsQuoted)) if (llvm::any_of(KnownFiles, [&IsQuoted, &IncludeName](const auto &KnownFile) { return KnownFile.first.equals(*IncludeName) && KnownFile.second == IsQuoted; })) { KnownFileEntries.insert(File); return true; } // Record that the file was not found to avoid future reverse lookup for // the same file. ExternalFileEntries.insert(File); return false; } LocationFileChecker(const CompilerInstance &CI, SmallVector, bool>> &KnownFiles) : CI(CI), KnownFiles(KnownFiles), ExternalFileEntries() { for (const auto &KnownFile : KnownFiles) if (auto FileEntry = CI.getFileManager().getFile(KnownFile.first)) KnownFileEntries.insert(*FileEntry); } private: const CompilerInstance &CI; SmallVector, bool>> &KnownFiles; llvm::DenseSet KnownFileEntries; llvm::DenseSet ExternalFileEntries; }; struct BatchExtractAPIVisitor : ExtractAPIVisitor { bool shouldDeclBeIncluded(const Decl *D) const { bool ShouldBeIncluded = true; // Check that we have the definition for redeclarable types. if (auto *TD = llvm::dyn_cast(D)) ShouldBeIncluded = TD->isThisDeclarationADefinition(); else if (auto *Interface = llvm::dyn_cast(D)) ShouldBeIncluded = Interface->isThisDeclarationADefinition(); else if (auto *Protocol = llvm::dyn_cast(D)) ShouldBeIncluded = Protocol->isThisDeclarationADefinition(); ShouldBeIncluded = ShouldBeIncluded && LCF(D->getLocation()); return ShouldBeIncluded; } BatchExtractAPIVisitor(LocationFileChecker &LCF, ASTContext &Context, APISet &API) : ExtractAPIVisitor(Context, API), LCF(LCF) {} private: LocationFileChecker &LCF; }; class WrappingExtractAPIConsumer : public ASTConsumer { public: WrappingExtractAPIConsumer(ASTContext &Context, APISet &API) : Visitor(Context, API) {} void HandleTranslationUnit(ASTContext &Context) override { // Use ExtractAPIVisitor to traverse symbol declarations in the context. Visitor.TraverseDecl(Context.getTranslationUnitDecl()); } private: ExtractAPIVisitor<> Visitor; }; class ExtractAPIConsumer : public ASTConsumer { public: ExtractAPIConsumer(ASTContext &Context, std::unique_ptr LCF, APISet &API) : Visitor(*LCF, Context, API), LCF(std::move(LCF)) {} void HandleTranslationUnit(ASTContext &Context) override { // Use ExtractAPIVisitor to traverse symbol declarations in the context. Visitor.TraverseDecl(Context.getTranslationUnitDecl()); } private: BatchExtractAPIVisitor Visitor; std::unique_ptr LCF; }; class MacroCallback : public PPCallbacks { public: MacroCallback(const SourceManager &SM, APISet &API, Preprocessor &PP) : SM(SM), API(API), PP(PP) {} void MacroDefined(const Token &MacroNameToken, const MacroDirective *MD) override { auto *MacroInfo = MD->getMacroInfo(); if (MacroInfo->isBuiltinMacro()) return; auto SourceLoc = MacroNameToken.getLocation(); if (SM.isWrittenInBuiltinFile(SourceLoc) || SM.isWrittenInCommandLineFile(SourceLoc)) return; PendingMacros.emplace_back(MacroNameToken, MD); } // If a macro gets undefined at some point during preprocessing of the inputs // it means that it isn't an exposed API and we should therefore not add a // macro definition for it. void MacroUndefined(const Token &MacroNameToken, const MacroDefinition &MD, const MacroDirective *Undef) override { // If this macro wasn't previously defined we don't need to do anything // here. if (!Undef) return; llvm::erase_if(PendingMacros, [&MD, this](const PendingMacro &PM) { return MD.getMacroInfo()->isIdenticalTo(*PM.MD->getMacroInfo(), PP, /*Syntactically*/ false); }); } void EndOfMainFile() override { for (auto &PM : PendingMacros) { // `isUsedForHeaderGuard` is only set when the preprocessor leaves the // file so check for it here. if (PM.MD->getMacroInfo()->isUsedForHeaderGuard()) continue; if (!shouldMacroBeIncluded(PM)) continue; StringRef Name = PM.MacroNameToken.getIdentifierInfo()->getName(); PresumedLoc Loc = SM.getPresumedLoc(PM.MacroNameToken.getLocation()); StringRef USR = API.recordUSRForMacro(Name, PM.MacroNameToken.getLocation(), SM); API.addMacroDefinition( Name, USR, Loc, DeclarationFragmentsBuilder::getFragmentsForMacro(Name, PM.MD), DeclarationFragmentsBuilder::getSubHeadingForMacro(Name), SM.isInSystemHeader(PM.MacroNameToken.getLocation())); } PendingMacros.clear(); } protected: struct PendingMacro { Token MacroNameToken; const MacroDirective *MD; PendingMacro(const Token &MacroNameToken, const MacroDirective *MD) : MacroNameToken(MacroNameToken), MD(MD) {} }; virtual bool shouldMacroBeIncluded(const PendingMacro &PM) { return true; } const SourceManager &SM; APISet &API; Preprocessor &PP; llvm::SmallVector PendingMacros; }; class APIMacroCallback : public MacroCallback { public: APIMacroCallback(const SourceManager &SM, APISet &API, Preprocessor &PP, LocationFileChecker &LCF) : MacroCallback(SM, API, PP), LCF(LCF) {} bool shouldMacroBeIncluded(const PendingMacro &PM) override { // Do not include macros from external files return LCF(PM.MacroNameToken.getLocation()); } private: LocationFileChecker &LCF; }; } // namespace void ExtractAPIActionBase::ImplEndSourceFileAction() { if (!OS) return; // Setup a SymbolGraphSerializer to write out collected API information in // the Symbol Graph format. // FIXME: Make the kind of APISerializer configurable. SymbolGraphSerializer SGSerializer(*API, IgnoresList); SGSerializer.serialize(*OS); OS.reset(); } std::unique_ptr ExtractAPIAction::CreateOutputFile(CompilerInstance &CI, StringRef InFile) { std::unique_ptr OS; OS = CI.createDefaultOutputFile(/*Binary=*/false, InFile, /*Extension=*/"json", /*RemoveFileOnSignal=*/false); if (!OS) return nullptr; return OS; } std::unique_ptr ExtractAPIAction::CreateASTConsumer(CompilerInstance &CI, StringRef InFile) { OS = CreateOutputFile(CI, InFile); if (!OS) return nullptr; auto ProductName = CI.getFrontendOpts().ProductName; // Now that we have enough information about the language options and the // target triple, let's create the APISet before anyone uses it. API = std::make_unique( CI.getTarget().getTriple(), CI.getFrontendOpts().Inputs.back().getKind().getLanguage(), ProductName); auto LCF = std::make_unique(CI, KnownInputFiles); CI.getPreprocessor().addPPCallbacks(std::make_unique( CI.getSourceManager(), *API, CI.getPreprocessor(), *LCF)); // Do not include location in anonymous decls. PrintingPolicy Policy = CI.getASTContext().getPrintingPolicy(); Policy.AnonymousTagLocations = false; CI.getASTContext().setPrintingPolicy(Policy); if (!CI.getFrontendOpts().ExtractAPIIgnoresFileList.empty()) { llvm::handleAllErrors( APIIgnoresList::create(CI.getFrontendOpts().ExtractAPIIgnoresFileList, CI.getFileManager()) .moveInto(IgnoresList), [&CI](const IgnoresFileNotFound &Err) { CI.getDiagnostics().Report( diag::err_extract_api_ignores_file_not_found) << Err.Path; }); } return std::make_unique(CI.getASTContext(), std::move(LCF), *API); } bool ExtractAPIAction::PrepareToExecuteAction(CompilerInstance &CI) { auto &Inputs = CI.getFrontendOpts().Inputs; if (Inputs.empty()) return true; if (!CI.hasFileManager()) if (!CI.createFileManager()) return false; auto Kind = Inputs[0].getKind(); // Convert the header file inputs into a single input buffer. SmallString<256> HeaderContents; bool IsQuoted = false; for (const FrontendInputFile &FIF : Inputs) { if (Kind.isObjectiveC()) HeaderContents += "#import"; else HeaderContents += "#include"; StringRef FilePath = FIF.getFile(); if (auto RelativeName = getRelativeIncludeName(CI, FilePath, &IsQuoted)) { if (IsQuoted) HeaderContents += " \""; else HeaderContents += " <"; HeaderContents += *RelativeName; if (IsQuoted) HeaderContents += "\"\n"; else HeaderContents += ">\n"; KnownInputFiles.emplace_back(static_cast>(*RelativeName), IsQuoted); } else { HeaderContents += " \""; HeaderContents += FilePath; HeaderContents += "\"\n"; KnownInputFiles.emplace_back(FilePath, true); } } if (CI.getHeaderSearchOpts().Verbose) CI.getVerboseOutputStream() << getInputBufferName() << ":\n" << HeaderContents << "\n"; Buffer = llvm::MemoryBuffer::getMemBufferCopy(HeaderContents, getInputBufferName()); // Set that buffer up as our "real" input in the CompilerInstance. Inputs.clear(); Inputs.emplace_back(Buffer->getMemBufferRef(), Kind, /*IsSystem*/ false); return true; } void ExtractAPIAction::EndSourceFileAction() { ImplEndSourceFileAction(); } std::unique_ptr WrappingExtractAPIAction::CreateASTConsumer(CompilerInstance &CI, StringRef InFile) { auto OtherConsumer = WrapperFrontendAction::CreateASTConsumer(CI, InFile); if (!OtherConsumer) return nullptr; CreatedASTConsumer = true; OS = CreateOutputFile(CI, InFile); if (!OS) return nullptr; auto ProductName = CI.getFrontendOpts().ProductName; // Now that we have enough information about the language options and the // target triple, let's create the APISet before anyone uses it. API = std::make_unique( CI.getTarget().getTriple(), CI.getFrontendOpts().Inputs.back().getKind().getLanguage(), ProductName); CI.getPreprocessor().addPPCallbacks(std::make_unique( CI.getSourceManager(), *API, CI.getPreprocessor())); // Do not include location in anonymous decls. PrintingPolicy Policy = CI.getASTContext().getPrintingPolicy(); Policy.AnonymousTagLocations = false; CI.getASTContext().setPrintingPolicy(Policy); if (!CI.getFrontendOpts().ExtractAPIIgnoresFileList.empty()) { llvm::handleAllErrors( APIIgnoresList::create(CI.getFrontendOpts().ExtractAPIIgnoresFileList, CI.getFileManager()) .moveInto(IgnoresList), [&CI](const IgnoresFileNotFound &Err) { CI.getDiagnostics().Report( diag::err_extract_api_ignores_file_not_found) << Err.Path; }); } auto WrappingConsumer = std::make_unique(CI.getASTContext(), *API); std::vector> Consumers; Consumers.push_back(std::move(OtherConsumer)); Consumers.push_back(std::move(WrappingConsumer)); return std::make_unique(std::move(Consumers)); } void WrappingExtractAPIAction::EndSourceFileAction() { // Invoke wrapped action's method. WrapperFrontendAction::EndSourceFileAction(); if (CreatedASTConsumer) { ImplEndSourceFileAction(); } } std::unique_ptr WrappingExtractAPIAction::CreateOutputFile(CompilerInstance &CI, StringRef InFile) { std::unique_ptr OS; std::string OutputDir = CI.getFrontendOpts().SymbolGraphOutputDir; // The symbol graphs need to be generated as a side effect of regular // compilation so the output should be dumped in the directory provided with // the command line option. llvm::SmallString<128> OutFilePath(OutputDir); auto Seperator = llvm::sys::path::get_separator(); auto Infilename = llvm::sys::path::filename(InFile); OutFilePath.append({Seperator, Infilename}); llvm::sys::path::replace_extension(OutFilePath, "json"); // StringRef outputFilePathref = *OutFilePath; // don't use the default output file OS = CI.createOutputFile(/*OutputPath=*/OutFilePath, /*Binary=*/false, /*RemoveFileOnSignal=*/true, /*UseTemporary=*/true, /*CreateMissingDirectories=*/true); if (!OS) return nullptr; return OS; }