1a7dea167SDimitry Andric //===- DependencyScanningFilesystem.cpp - clang-scan-deps fs --------------===//
2a7dea167SDimitry Andric //
3a7dea167SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4a7dea167SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
5a7dea167SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6a7dea167SDimitry Andric //
7a7dea167SDimitry Andric //===----------------------------------------------------------------------===//
8a7dea167SDimitry Andric
9a7dea167SDimitry Andric #include "clang/Tooling/DependencyScanning/DependencyScanningFilesystem.h"
10a7dea167SDimitry Andric #include "llvm/Support/MemoryBuffer.h"
110eae32dcSDimitry Andric #include "llvm/Support/SmallVectorMemoryBuffer.h"
12a7dea167SDimitry Andric #include "llvm/Support/Threading.h"
13bdd1243dSDimitry Andric #include <optional>
14a7dea167SDimitry Andric
15a7dea167SDimitry Andric using namespace clang;
16a7dea167SDimitry Andric using namespace tooling;
17a7dea167SDimitry Andric using namespace dependencies;
18a7dea167SDimitry Andric
1904eeddc0SDimitry Andric llvm::ErrorOr<DependencyScanningWorkerFilesystem::TentativeEntry>
readFile(StringRef Filename)2004eeddc0SDimitry Andric DependencyScanningWorkerFilesystem::readFile(StringRef Filename) {
21a7dea167SDimitry Andric // Load the file and its content from the file system.
2204eeddc0SDimitry Andric auto MaybeFile = getUnderlyingFS().openFileForRead(Filename);
23a7dea167SDimitry Andric if (!MaybeFile)
24a7dea167SDimitry Andric return MaybeFile.getError();
250eae32dcSDimitry Andric auto File = std::move(*MaybeFile);
26a7dea167SDimitry Andric
270eae32dcSDimitry Andric auto MaybeStat = File->status();
280eae32dcSDimitry Andric if (!MaybeStat)
290eae32dcSDimitry Andric return MaybeStat.getError();
300eae32dcSDimitry Andric auto Stat = std::move(*MaybeStat);
310eae32dcSDimitry Andric
320eae32dcSDimitry Andric auto MaybeBuffer = File->getBuffer(Stat.getName());
33a7dea167SDimitry Andric if (!MaybeBuffer)
34a7dea167SDimitry Andric return MaybeBuffer.getError();
350eae32dcSDimitry Andric auto Buffer = std::move(*MaybeBuffer);
360eae32dcSDimitry Andric
3704eeddc0SDimitry Andric // If the file size changed between read and stat, pretend it didn't.
3804eeddc0SDimitry Andric if (Stat.getSize() != Buffer->getBufferSize())
3904eeddc0SDimitry Andric Stat = llvm::vfs::Status::copyWithNewSize(Stat, Buffer->getBufferSize());
4004eeddc0SDimitry Andric
4104eeddc0SDimitry Andric return TentativeEntry(Stat, std::move(Buffer));
420eae32dcSDimitry Andric }
430eae32dcSDimitry Andric
ensureDirectiveTokensArePopulated(EntryRef Ref)44*0fca6ea1SDimitry Andric bool DependencyScanningWorkerFilesystem::ensureDirectiveTokensArePopulated(
45*0fca6ea1SDimitry Andric EntryRef Ref) {
46*0fca6ea1SDimitry Andric auto &Entry = Ref.Entry;
47*0fca6ea1SDimitry Andric
48*0fca6ea1SDimitry Andric if (Entry.isError() || Entry.isDirectory())
49*0fca6ea1SDimitry Andric return false;
5004eeddc0SDimitry Andric
5181ad6265SDimitry Andric CachedFileContents *Contents = Entry.getCachedContents();
5204eeddc0SDimitry Andric assert(Contents && "contents not initialized");
5304eeddc0SDimitry Andric
5404eeddc0SDimitry Andric // Double-checked locking.
5581ad6265SDimitry Andric if (Contents->DepDirectives.load())
56*0fca6ea1SDimitry Andric return true;
5704eeddc0SDimitry Andric
5804eeddc0SDimitry Andric std::lock_guard<std::mutex> GuardLock(Contents->ValueLock);
5904eeddc0SDimitry Andric
6004eeddc0SDimitry Andric // Double-checked locking.
6181ad6265SDimitry Andric if (Contents->DepDirectives.load())
62*0fca6ea1SDimitry Andric return true;
63a7dea167SDimitry Andric
6481ad6265SDimitry Andric SmallVector<dependency_directives_scan::Directive, 64> Directives;
6581ad6265SDimitry Andric // Scan the file for preprocessor directives that might affect the
6681ad6265SDimitry Andric // dependencies.
6781ad6265SDimitry Andric if (scanSourceForDependencyDirectives(Contents->Original->getBuffer(),
6881ad6265SDimitry Andric Contents->DepDirectiveTokens,
6981ad6265SDimitry Andric Directives)) {
7081ad6265SDimitry Andric Contents->DepDirectiveTokens.clear();
710eae32dcSDimitry Andric // FIXME: Propagate the diagnostic if desired by the client.
72bdd1243dSDimitry Andric Contents->DepDirectives.store(new std::optional<DependencyDirectivesTy>());
73*0fca6ea1SDimitry Andric return false;
74a7dea167SDimitry Andric }
75a7dea167SDimitry Andric
7681ad6265SDimitry Andric // This function performed double-checked locking using `DepDirectives`.
7781ad6265SDimitry Andric // Assigning it must be the last thing this function does, otherwise other
78*0fca6ea1SDimitry Andric // threads may skip the critical section (`DepDirectives != nullptr`), leading
79*0fca6ea1SDimitry Andric // to a data race.
8081ad6265SDimitry Andric Contents->DepDirectives.store(
81bdd1243dSDimitry Andric new std::optional<DependencyDirectivesTy>(std::move(Directives)));
82*0fca6ea1SDimitry Andric return true;
83a7dea167SDimitry Andric }
84a7dea167SDimitry Andric
850eae32dcSDimitry Andric DependencyScanningFilesystemSharedCache::
DependencyScanningFilesystemSharedCache()860eae32dcSDimitry Andric DependencyScanningFilesystemSharedCache() {
87a7dea167SDimitry Andric // This heuristic was chosen using a empirical testing on a
88a7dea167SDimitry Andric // reasonably high core machine (iMacPro 18 cores / 36 threads). The cache
89a7dea167SDimitry Andric // sharding gives a performance edge by reducing the lock contention.
90a7dea167SDimitry Andric // FIXME: A better heuristic might also consider the OS to account for
91a7dea167SDimitry Andric // the different cost of lock contention on different OSes.
925ffd83dbSDimitry Andric NumShards =
935ffd83dbSDimitry Andric std::max(2u, llvm::hardware_concurrency().compute_thread_count() / 4);
94a7dea167SDimitry Andric CacheShards = std::make_unique<CacheShard[]>(NumShards);
95a7dea167SDimitry Andric }
96a7dea167SDimitry Andric
9704eeddc0SDimitry Andric DependencyScanningFilesystemSharedCache::CacheShard &
getShardForFilename(StringRef Filename) const9804eeddc0SDimitry Andric DependencyScanningFilesystemSharedCache::getShardForFilename(
9904eeddc0SDimitry Andric StringRef Filename) const {
1004542f901SDimitry Andric assert(llvm::sys::path::is_absolute_gnu(Filename));
10104eeddc0SDimitry Andric return CacheShards[llvm::hash_value(Filename) % NumShards];
10204eeddc0SDimitry Andric }
10304eeddc0SDimitry Andric
10404eeddc0SDimitry Andric DependencyScanningFilesystemSharedCache::CacheShard &
getShardForUID(llvm::sys::fs::UniqueID UID) const10504eeddc0SDimitry Andric DependencyScanningFilesystemSharedCache::getShardForUID(
10604eeddc0SDimitry Andric llvm::sys::fs::UniqueID UID) const {
10704eeddc0SDimitry Andric auto Hash = llvm::hash_combine(UID.getDevice(), UID.getFile());
10804eeddc0SDimitry Andric return CacheShards[Hash % NumShards];
10904eeddc0SDimitry Andric }
11004eeddc0SDimitry Andric
11104eeddc0SDimitry Andric const CachedFileSystemEntry *
findEntryByFilename(StringRef Filename) const11204eeddc0SDimitry Andric DependencyScanningFilesystemSharedCache::CacheShard::findEntryByFilename(
11304eeddc0SDimitry Andric StringRef Filename) const {
1144542f901SDimitry Andric assert(llvm::sys::path::is_absolute_gnu(Filename));
11504eeddc0SDimitry Andric std::lock_guard<std::mutex> LockGuard(CacheLock);
116*0fca6ea1SDimitry Andric auto It = CacheByFilename.find(Filename);
117*0fca6ea1SDimitry Andric return It == CacheByFilename.end() ? nullptr : It->getValue().first;
11804eeddc0SDimitry Andric }
11904eeddc0SDimitry Andric
12004eeddc0SDimitry Andric const CachedFileSystemEntry *
findEntryByUID(llvm::sys::fs::UniqueID UID) const12104eeddc0SDimitry Andric DependencyScanningFilesystemSharedCache::CacheShard::findEntryByUID(
12204eeddc0SDimitry Andric llvm::sys::fs::UniqueID UID) const {
12304eeddc0SDimitry Andric std::lock_guard<std::mutex> LockGuard(CacheLock);
12404eeddc0SDimitry Andric auto It = EntriesByUID.find(UID);
12504eeddc0SDimitry Andric return It == EntriesByUID.end() ? nullptr : It->getSecond();
12604eeddc0SDimitry Andric }
12704eeddc0SDimitry Andric
12804eeddc0SDimitry Andric const CachedFileSystemEntry &
12904eeddc0SDimitry Andric DependencyScanningFilesystemSharedCache::CacheShard::
getOrEmplaceEntryForFilename(StringRef Filename,llvm::ErrorOr<llvm::vfs::Status> Stat)13004eeddc0SDimitry Andric getOrEmplaceEntryForFilename(StringRef Filename,
13104eeddc0SDimitry Andric llvm::ErrorOr<llvm::vfs::Status> Stat) {
13204eeddc0SDimitry Andric std::lock_guard<std::mutex> LockGuard(CacheLock);
133*0fca6ea1SDimitry Andric auto [It, Inserted] = CacheByFilename.insert({Filename, {nullptr, nullptr}});
134*0fca6ea1SDimitry Andric auto &[CachedEntry, CachedRealPath] = It->getValue();
135*0fca6ea1SDimitry Andric if (!CachedEntry) {
136*0fca6ea1SDimitry Andric // The entry is not present in the shared cache. Either the cache doesn't
137*0fca6ea1SDimitry Andric // know about the file at all, or it only knows about its real path.
138*0fca6ea1SDimitry Andric assert((Inserted || CachedRealPath) && "existing file with empty pair");
139*0fca6ea1SDimitry Andric CachedEntry =
14004eeddc0SDimitry Andric new (EntryStorage.Allocate()) CachedFileSystemEntry(std::move(Stat));
141*0fca6ea1SDimitry Andric }
142*0fca6ea1SDimitry Andric return *CachedEntry;
14304eeddc0SDimitry Andric }
14404eeddc0SDimitry Andric
14504eeddc0SDimitry Andric const CachedFileSystemEntry &
getOrEmplaceEntryForUID(llvm::sys::fs::UniqueID UID,llvm::vfs::Status Stat,std::unique_ptr<llvm::MemoryBuffer> Contents)14604eeddc0SDimitry Andric DependencyScanningFilesystemSharedCache::CacheShard::getOrEmplaceEntryForUID(
14704eeddc0SDimitry Andric llvm::sys::fs::UniqueID UID, llvm::vfs::Status Stat,
14804eeddc0SDimitry Andric std::unique_ptr<llvm::MemoryBuffer> Contents) {
14904eeddc0SDimitry Andric std::lock_guard<std::mutex> LockGuard(CacheLock);
150*0fca6ea1SDimitry Andric auto [It, Inserted] = EntriesByUID.insert({UID, nullptr});
151*0fca6ea1SDimitry Andric auto &CachedEntry = It->getSecond();
152*0fca6ea1SDimitry Andric if (Inserted) {
15304eeddc0SDimitry Andric CachedFileContents *StoredContents = nullptr;
15404eeddc0SDimitry Andric if (Contents)
15504eeddc0SDimitry Andric StoredContents = new (ContentsStorage.Allocate())
15604eeddc0SDimitry Andric CachedFileContents(std::move(Contents));
157*0fca6ea1SDimitry Andric CachedEntry = new (EntryStorage.Allocate())
15804eeddc0SDimitry Andric CachedFileSystemEntry(std::move(Stat), StoredContents);
15904eeddc0SDimitry Andric }
160*0fca6ea1SDimitry Andric return *CachedEntry;
16104eeddc0SDimitry Andric }
16204eeddc0SDimitry Andric
16304eeddc0SDimitry Andric const CachedFileSystemEntry &
16404eeddc0SDimitry Andric DependencyScanningFilesystemSharedCache::CacheShard::
getOrInsertEntryForFilename(StringRef Filename,const CachedFileSystemEntry & Entry)16504eeddc0SDimitry Andric getOrInsertEntryForFilename(StringRef Filename,
16604eeddc0SDimitry Andric const CachedFileSystemEntry &Entry) {
16704eeddc0SDimitry Andric std::lock_guard<std::mutex> LockGuard(CacheLock);
168*0fca6ea1SDimitry Andric auto [It, Inserted] = CacheByFilename.insert({Filename, {&Entry, nullptr}});
169*0fca6ea1SDimitry Andric auto &[CachedEntry, CachedRealPath] = It->getValue();
170*0fca6ea1SDimitry Andric if (!Inserted || !CachedEntry)
171*0fca6ea1SDimitry Andric CachedEntry = &Entry;
172*0fca6ea1SDimitry Andric return *CachedEntry;
173a7dea167SDimitry Andric }
174a7dea167SDimitry Andric
175*0fca6ea1SDimitry Andric const CachedRealPath *
findRealPathByFilename(StringRef Filename) const176*0fca6ea1SDimitry Andric DependencyScanningFilesystemSharedCache::CacheShard::findRealPathByFilename(
177*0fca6ea1SDimitry Andric StringRef Filename) const {
178*0fca6ea1SDimitry Andric assert(llvm::sys::path::is_absolute_gnu(Filename));
179*0fca6ea1SDimitry Andric std::lock_guard<std::mutex> LockGuard(CacheLock);
180*0fca6ea1SDimitry Andric auto It = CacheByFilename.find(Filename);
181*0fca6ea1SDimitry Andric return It == CacheByFilename.end() ? nullptr : It->getValue().second;
182*0fca6ea1SDimitry Andric }
183*0fca6ea1SDimitry Andric
184*0fca6ea1SDimitry Andric const CachedRealPath &DependencyScanningFilesystemSharedCache::CacheShard::
getOrEmplaceRealPathForFilename(StringRef Filename,llvm::ErrorOr<llvm::StringRef> RealPath)185*0fca6ea1SDimitry Andric getOrEmplaceRealPathForFilename(StringRef Filename,
186*0fca6ea1SDimitry Andric llvm::ErrorOr<llvm::StringRef> RealPath) {
187*0fca6ea1SDimitry Andric std::lock_guard<std::mutex> LockGuard(CacheLock);
188*0fca6ea1SDimitry Andric
189*0fca6ea1SDimitry Andric const CachedRealPath *&StoredRealPath = CacheByFilename[Filename].second;
190*0fca6ea1SDimitry Andric if (!StoredRealPath) {
191*0fca6ea1SDimitry Andric auto OwnedRealPath = [&]() -> CachedRealPath {
192*0fca6ea1SDimitry Andric if (!RealPath)
193*0fca6ea1SDimitry Andric return RealPath.getError();
194*0fca6ea1SDimitry Andric return RealPath->str();
195*0fca6ea1SDimitry Andric }();
196*0fca6ea1SDimitry Andric
197*0fca6ea1SDimitry Andric StoredRealPath = new (RealPathStorage.Allocate())
198*0fca6ea1SDimitry Andric CachedRealPath(std::move(OwnedRealPath));
199*0fca6ea1SDimitry Andric }
200*0fca6ea1SDimitry Andric
201*0fca6ea1SDimitry Andric return *StoredRealPath;
202480093f4SDimitry Andric }
203480093f4SDimitry Andric
shouldCacheStatFailures(StringRef Filename)204480093f4SDimitry Andric static bool shouldCacheStatFailures(StringRef Filename) {
205480093f4SDimitry Andric StringRef Ext = llvm::sys::path::extension(Filename);
206480093f4SDimitry Andric if (Ext.empty())
207480093f4SDimitry Andric return false; // This may be the module cache directory.
20806c3fb27SDimitry Andric return true;
209480093f4SDimitry Andric }
210480093f4SDimitry Andric
DependencyScanningWorkerFilesystem(DependencyScanningFilesystemSharedCache & SharedCache,IntrusiveRefCntPtr<llvm::vfs::FileSystem> FS)2114542f901SDimitry Andric DependencyScanningWorkerFilesystem::DependencyScanningWorkerFilesystem(
2124542f901SDimitry Andric DependencyScanningFilesystemSharedCache &SharedCache,
2134542f901SDimitry Andric IntrusiveRefCntPtr<llvm::vfs::FileSystem> FS)
214*0fca6ea1SDimitry Andric : llvm::RTTIExtends<DependencyScanningWorkerFilesystem,
215*0fca6ea1SDimitry Andric llvm::vfs::ProxyFileSystem>(std::move(FS)),
216*0fca6ea1SDimitry Andric SharedCache(SharedCache),
2174542f901SDimitry Andric WorkingDirForCacheLookup(llvm::errc::invalid_argument) {
2184542f901SDimitry Andric updateWorkingDirForCacheLookup();
2194542f901SDimitry Andric }
2204542f901SDimitry Andric
22104eeddc0SDimitry Andric const CachedFileSystemEntry &
getOrEmplaceSharedEntryForUID(TentativeEntry TEntry)22204eeddc0SDimitry Andric DependencyScanningWorkerFilesystem::getOrEmplaceSharedEntryForUID(
22304eeddc0SDimitry Andric TentativeEntry TEntry) {
22404eeddc0SDimitry Andric auto &Shard = SharedCache.getShardForUID(TEntry.Status.getUniqueID());
22504eeddc0SDimitry Andric return Shard.getOrEmplaceEntryForUID(TEntry.Status.getUniqueID(),
22604eeddc0SDimitry Andric std::move(TEntry.Status),
22704eeddc0SDimitry Andric std::move(TEntry.Contents));
22804eeddc0SDimitry Andric }
22904eeddc0SDimitry Andric
23004eeddc0SDimitry Andric const CachedFileSystemEntry *
findEntryByFilenameWithWriteThrough(StringRef Filename)23104eeddc0SDimitry Andric DependencyScanningWorkerFilesystem::findEntryByFilenameWithWriteThrough(
23204eeddc0SDimitry Andric StringRef Filename) {
23304eeddc0SDimitry Andric if (const auto *Entry = LocalCache.findEntryByFilename(Filename))
23404eeddc0SDimitry Andric return Entry;
23504eeddc0SDimitry Andric auto &Shard = SharedCache.getShardForFilename(Filename);
23604eeddc0SDimitry Andric if (const auto *Entry = Shard.findEntryByFilename(Filename))
23704eeddc0SDimitry Andric return &LocalCache.insertEntryForFilename(Filename, *Entry);
23804eeddc0SDimitry Andric return nullptr;
23904eeddc0SDimitry Andric }
24004eeddc0SDimitry Andric
24104eeddc0SDimitry Andric llvm::ErrorOr<const CachedFileSystemEntry &>
computeAndStoreResult(StringRef OriginalFilename,StringRef FilenameForLookup)2424542f901SDimitry Andric DependencyScanningWorkerFilesystem::computeAndStoreResult(
2434542f901SDimitry Andric StringRef OriginalFilename, StringRef FilenameForLookup) {
2444542f901SDimitry Andric llvm::ErrorOr<llvm::vfs::Status> Stat =
2454542f901SDimitry Andric getUnderlyingFS().status(OriginalFilename);
24604eeddc0SDimitry Andric if (!Stat) {
2474542f901SDimitry Andric if (!shouldCacheStatFailures(OriginalFilename))
24804eeddc0SDimitry Andric return Stat.getError();
24904eeddc0SDimitry Andric const auto &Entry =
2504542f901SDimitry Andric getOrEmplaceSharedEntryForFilename(FilenameForLookup, Stat.getError());
2514542f901SDimitry Andric return insertLocalEntryForFilename(FilenameForLookup, Entry);
25204eeddc0SDimitry Andric }
25304eeddc0SDimitry Andric
25404eeddc0SDimitry Andric if (const auto *Entry = findSharedEntryByUID(*Stat))
2554542f901SDimitry Andric return insertLocalEntryForFilename(FilenameForLookup, *Entry);
25604eeddc0SDimitry Andric
25704eeddc0SDimitry Andric auto TEntry =
2584542f901SDimitry Andric Stat->isDirectory() ? TentativeEntry(*Stat) : readFile(OriginalFilename);
25904eeddc0SDimitry Andric
26004eeddc0SDimitry Andric const CachedFileSystemEntry *SharedEntry = [&]() {
26104eeddc0SDimitry Andric if (TEntry) {
26204eeddc0SDimitry Andric const auto &UIDEntry = getOrEmplaceSharedEntryForUID(std::move(*TEntry));
2634542f901SDimitry Andric return &getOrInsertSharedEntryForFilename(FilenameForLookup, UIDEntry);
26404eeddc0SDimitry Andric }
2654542f901SDimitry Andric return &getOrEmplaceSharedEntryForFilename(FilenameForLookup,
2664542f901SDimitry Andric TEntry.getError());
26704eeddc0SDimitry Andric }();
26804eeddc0SDimitry Andric
2694542f901SDimitry Andric return insertLocalEntryForFilename(FilenameForLookup, *SharedEntry);
270fe6060f1SDimitry Andric }
271fe6060f1SDimitry Andric
2720eae32dcSDimitry Andric llvm::ErrorOr<EntryRef>
getOrCreateFileSystemEntry(StringRef OriginalFilename)273a7dea167SDimitry Andric DependencyScanningWorkerFilesystem::getOrCreateFileSystemEntry(
274*0fca6ea1SDimitry Andric StringRef OriginalFilename) {
2754542f901SDimitry Andric SmallString<256> PathBuf;
276*0fca6ea1SDimitry Andric auto FilenameForLookup = tryGetFilenameForLookup(OriginalFilename, PathBuf);
277*0fca6ea1SDimitry Andric if (!FilenameForLookup)
278*0fca6ea1SDimitry Andric return FilenameForLookup.getError();
279*0fca6ea1SDimitry Andric
2804542f901SDimitry Andric if (const auto *Entry =
281*0fca6ea1SDimitry Andric findEntryByFilenameWithWriteThrough(*FilenameForLookup))
282*0fca6ea1SDimitry Andric return EntryRef(OriginalFilename, *Entry).unwrapError();
283*0fca6ea1SDimitry Andric auto MaybeEntry = computeAndStoreResult(OriginalFilename, *FilenameForLookup);
28404eeddc0SDimitry Andric if (!MaybeEntry)
28504eeddc0SDimitry Andric return MaybeEntry.getError();
286*0fca6ea1SDimitry Andric return EntryRef(OriginalFilename, *MaybeEntry).unwrapError();
287a7dea167SDimitry Andric }
288a7dea167SDimitry Andric
289a7dea167SDimitry Andric llvm::ErrorOr<llvm::vfs::Status>
status(const Twine & Path)290a7dea167SDimitry Andric DependencyScanningWorkerFilesystem::status(const Twine &Path) {
291a7dea167SDimitry Andric SmallString<256> OwnedFilename;
292a7dea167SDimitry Andric StringRef Filename = Path.toStringRef(OwnedFilename);
2930eae32dcSDimitry Andric
2945f757f3fSDimitry Andric if (Filename.ends_with(".pcm"))
29506c3fb27SDimitry Andric return getUnderlyingFS().status(Path);
29606c3fb27SDimitry Andric
2970eae32dcSDimitry Andric llvm::ErrorOr<EntryRef> Result = getOrCreateFileSystemEntry(Filename);
298a7dea167SDimitry Andric if (!Result)
299a7dea167SDimitry Andric return Result.getError();
3000eae32dcSDimitry Andric return Result->getStatus();
301a7dea167SDimitry Andric }
302a7dea167SDimitry Andric
exists(const Twine & Path)303*0fca6ea1SDimitry Andric bool DependencyScanningWorkerFilesystem::exists(const Twine &Path) {
304*0fca6ea1SDimitry Andric // While some VFS overlay filesystems may implement more-efficient
305*0fca6ea1SDimitry Andric // mechanisms for `exists` queries, `DependencyScanningWorkerFilesystem`
306*0fca6ea1SDimitry Andric // typically wraps `RealFileSystem` which does not specialize `exists`,
307*0fca6ea1SDimitry Andric // so it is not likely to benefit from such optimizations. Instead,
308*0fca6ea1SDimitry Andric // it is more-valuable to have this query go through the
309*0fca6ea1SDimitry Andric // cached-`status` code-path of the `DependencyScanningWorkerFilesystem`.
310*0fca6ea1SDimitry Andric llvm::ErrorOr<llvm::vfs::Status> Status = status(Path);
311*0fca6ea1SDimitry Andric return Status && Status->exists();
312*0fca6ea1SDimitry Andric }
313*0fca6ea1SDimitry Andric
314a7dea167SDimitry Andric namespace {
315a7dea167SDimitry Andric
316a7dea167SDimitry Andric /// The VFS that is used by clang consumes the \c CachedFileSystemEntry using
317a7dea167SDimitry Andric /// this subclass.
31881ad6265SDimitry Andric class DepScanFile final : public llvm::vfs::File {
319a7dea167SDimitry Andric public:
DepScanFile(std::unique_ptr<llvm::MemoryBuffer> Buffer,llvm::vfs::Status Stat)32081ad6265SDimitry Andric DepScanFile(std::unique_ptr<llvm::MemoryBuffer> Buffer,
321a7dea167SDimitry Andric llvm::vfs::Status Stat)
322a7dea167SDimitry Andric : Buffer(std::move(Buffer)), Stat(std::move(Stat)) {}
323a7dea167SDimitry Andric
32481ad6265SDimitry Andric static llvm::ErrorOr<std::unique_ptr<llvm::vfs::File>> create(EntryRef Entry);
325a7dea167SDimitry Andric
status()326e8d8bef9SDimitry Andric llvm::ErrorOr<llvm::vfs::Status> status() override { return Stat; }
327a7dea167SDimitry Andric
328a7dea167SDimitry Andric llvm::ErrorOr<std::unique_ptr<llvm::MemoryBuffer>>
getBuffer(const Twine & Name,int64_t FileSize,bool RequiresNullTerminator,bool IsVolatile)329a7dea167SDimitry Andric getBuffer(const Twine &Name, int64_t FileSize, bool RequiresNullTerminator,
330a7dea167SDimitry Andric bool IsVolatile) override {
331a7dea167SDimitry Andric return std::move(Buffer);
332a7dea167SDimitry Andric }
333a7dea167SDimitry Andric
close()334a7dea167SDimitry Andric std::error_code close() override { return {}; }
335a7dea167SDimitry Andric
336a7dea167SDimitry Andric private:
337a7dea167SDimitry Andric std::unique_ptr<llvm::MemoryBuffer> Buffer;
338a7dea167SDimitry Andric llvm::vfs::Status Stat;
339a7dea167SDimitry Andric };
340a7dea167SDimitry Andric
341e8d8bef9SDimitry Andric } // end anonymous namespace
342e8d8bef9SDimitry Andric
34381ad6265SDimitry Andric llvm::ErrorOr<std::unique_ptr<llvm::vfs::File>>
create(EntryRef Entry)34481ad6265SDimitry Andric DepScanFile::create(EntryRef Entry) {
34504eeddc0SDimitry Andric assert(!Entry.isError() && "error");
34604eeddc0SDimitry Andric
3470eae32dcSDimitry Andric if (Entry.isDirectory())
3480eae32dcSDimitry Andric return std::make_error_code(std::errc::is_a_directory);
3490eae32dcSDimitry Andric
35081ad6265SDimitry Andric auto Result = std::make_unique<DepScanFile>(
35104eeddc0SDimitry Andric llvm::MemoryBuffer::getMemBuffer(Entry.getContents(),
35204eeddc0SDimitry Andric Entry.getStatus().getName(),
353a7dea167SDimitry Andric /*RequiresNullTerminator=*/false),
35404eeddc0SDimitry Andric Entry.getStatus());
3550eae32dcSDimitry Andric
356a7dea167SDimitry Andric return llvm::ErrorOr<std::unique_ptr<llvm::vfs::File>>(
357a7dea167SDimitry Andric std::unique_ptr<llvm::vfs::File>(std::move(Result)));
358a7dea167SDimitry Andric }
359a7dea167SDimitry Andric
360a7dea167SDimitry Andric llvm::ErrorOr<std::unique_ptr<llvm::vfs::File>>
openFileForRead(const Twine & Path)361a7dea167SDimitry Andric DependencyScanningWorkerFilesystem::openFileForRead(const Twine &Path) {
362a7dea167SDimitry Andric SmallString<256> OwnedFilename;
363a7dea167SDimitry Andric StringRef Filename = Path.toStringRef(OwnedFilename);
364a7dea167SDimitry Andric
3655f757f3fSDimitry Andric if (Filename.ends_with(".pcm"))
36606c3fb27SDimitry Andric return getUnderlyingFS().openFileForRead(Path);
36706c3fb27SDimitry Andric
3680eae32dcSDimitry Andric llvm::ErrorOr<EntryRef> Result = getOrCreateFileSystemEntry(Filename);
369a7dea167SDimitry Andric if (!Result)
370a7dea167SDimitry Andric return Result.getError();
37181ad6265SDimitry Andric return DepScanFile::create(Result.get());
372a7dea167SDimitry Andric }
3734542f901SDimitry Andric
374*0fca6ea1SDimitry Andric std::error_code
getRealPath(const Twine & Path,SmallVectorImpl<char> & Output)375*0fca6ea1SDimitry Andric DependencyScanningWorkerFilesystem::getRealPath(const Twine &Path,
376*0fca6ea1SDimitry Andric SmallVectorImpl<char> &Output) {
377*0fca6ea1SDimitry Andric SmallString<256> OwnedFilename;
378*0fca6ea1SDimitry Andric StringRef OriginalFilename = Path.toStringRef(OwnedFilename);
379*0fca6ea1SDimitry Andric
380*0fca6ea1SDimitry Andric SmallString<256> PathBuf;
381*0fca6ea1SDimitry Andric auto FilenameForLookup = tryGetFilenameForLookup(OriginalFilename, PathBuf);
382*0fca6ea1SDimitry Andric if (!FilenameForLookup)
383*0fca6ea1SDimitry Andric return FilenameForLookup.getError();
384*0fca6ea1SDimitry Andric
385*0fca6ea1SDimitry Andric auto HandleCachedRealPath =
386*0fca6ea1SDimitry Andric [&Output](const CachedRealPath &RealPath) -> std::error_code {
387*0fca6ea1SDimitry Andric if (!RealPath)
388*0fca6ea1SDimitry Andric return RealPath.getError();
389*0fca6ea1SDimitry Andric Output.assign(RealPath->begin(), RealPath->end());
390*0fca6ea1SDimitry Andric return {};
391*0fca6ea1SDimitry Andric };
392*0fca6ea1SDimitry Andric
393*0fca6ea1SDimitry Andric // If we already have the result in local cache, no work required.
394*0fca6ea1SDimitry Andric if (const auto *RealPath =
395*0fca6ea1SDimitry Andric LocalCache.findRealPathByFilename(*FilenameForLookup))
396*0fca6ea1SDimitry Andric return HandleCachedRealPath(*RealPath);
397*0fca6ea1SDimitry Andric
398*0fca6ea1SDimitry Andric // If we have the result in the shared cache, cache it locally.
399*0fca6ea1SDimitry Andric auto &Shard = SharedCache.getShardForFilename(*FilenameForLookup);
400*0fca6ea1SDimitry Andric if (const auto *ShardRealPath =
401*0fca6ea1SDimitry Andric Shard.findRealPathByFilename(*FilenameForLookup)) {
402*0fca6ea1SDimitry Andric const auto &RealPath = LocalCache.insertRealPathForFilename(
403*0fca6ea1SDimitry Andric *FilenameForLookup, *ShardRealPath);
404*0fca6ea1SDimitry Andric return HandleCachedRealPath(RealPath);
405*0fca6ea1SDimitry Andric }
406*0fca6ea1SDimitry Andric
407*0fca6ea1SDimitry Andric // If we don't know the real path, compute it...
408*0fca6ea1SDimitry Andric std::error_code EC = getUnderlyingFS().getRealPath(OriginalFilename, Output);
409*0fca6ea1SDimitry Andric llvm::ErrorOr<llvm::StringRef> ComputedRealPath = EC;
410*0fca6ea1SDimitry Andric if (!EC)
411*0fca6ea1SDimitry Andric ComputedRealPath = StringRef{Output.data(), Output.size()};
412*0fca6ea1SDimitry Andric
413*0fca6ea1SDimitry Andric // ...and try to write it into the shared cache. In case some other thread won
414*0fca6ea1SDimitry Andric // this race and already wrote its own result there, just adopt it. Write
415*0fca6ea1SDimitry Andric // whatever is in the shared cache into the local one.
416*0fca6ea1SDimitry Andric const auto &RealPath = Shard.getOrEmplaceRealPathForFilename(
417*0fca6ea1SDimitry Andric *FilenameForLookup, ComputedRealPath);
418*0fca6ea1SDimitry Andric return HandleCachedRealPath(
419*0fca6ea1SDimitry Andric LocalCache.insertRealPathForFilename(*FilenameForLookup, RealPath));
420*0fca6ea1SDimitry Andric }
421*0fca6ea1SDimitry Andric
setCurrentWorkingDirectory(const Twine & Path)4224542f901SDimitry Andric std::error_code DependencyScanningWorkerFilesystem::setCurrentWorkingDirectory(
4234542f901SDimitry Andric const Twine &Path) {
4244542f901SDimitry Andric std::error_code EC = ProxyFileSystem::setCurrentWorkingDirectory(Path);
4254542f901SDimitry Andric updateWorkingDirForCacheLookup();
4264542f901SDimitry Andric return EC;
4274542f901SDimitry Andric }
4284542f901SDimitry Andric
updateWorkingDirForCacheLookup()4294542f901SDimitry Andric void DependencyScanningWorkerFilesystem::updateWorkingDirForCacheLookup() {
4304542f901SDimitry Andric llvm::ErrorOr<std::string> CWD =
4314542f901SDimitry Andric getUnderlyingFS().getCurrentWorkingDirectory();
4324542f901SDimitry Andric if (!CWD) {
4334542f901SDimitry Andric WorkingDirForCacheLookup = CWD.getError();
4344542f901SDimitry Andric } else if (!llvm::sys::path::is_absolute_gnu(*CWD)) {
4354542f901SDimitry Andric WorkingDirForCacheLookup = llvm::errc::invalid_argument;
4364542f901SDimitry Andric } else {
4374542f901SDimitry Andric WorkingDirForCacheLookup = *CWD;
4384542f901SDimitry Andric }
4394542f901SDimitry Andric assert(!WorkingDirForCacheLookup ||
4404542f901SDimitry Andric llvm::sys::path::is_absolute_gnu(*WorkingDirForCacheLookup));
4414542f901SDimitry Andric }
442*0fca6ea1SDimitry Andric
443*0fca6ea1SDimitry Andric llvm::ErrorOr<StringRef>
tryGetFilenameForLookup(StringRef OriginalFilename,llvm::SmallVectorImpl<char> & PathBuf) const444*0fca6ea1SDimitry Andric DependencyScanningWorkerFilesystem::tryGetFilenameForLookup(
445*0fca6ea1SDimitry Andric StringRef OriginalFilename, llvm::SmallVectorImpl<char> &PathBuf) const {
446*0fca6ea1SDimitry Andric StringRef FilenameForLookup;
447*0fca6ea1SDimitry Andric if (llvm::sys::path::is_absolute_gnu(OriginalFilename)) {
448*0fca6ea1SDimitry Andric FilenameForLookup = OriginalFilename;
449*0fca6ea1SDimitry Andric } else if (!WorkingDirForCacheLookup) {
450*0fca6ea1SDimitry Andric return WorkingDirForCacheLookup.getError();
451*0fca6ea1SDimitry Andric } else {
452*0fca6ea1SDimitry Andric StringRef RelFilename = OriginalFilename;
453*0fca6ea1SDimitry Andric RelFilename.consume_front("./");
454*0fca6ea1SDimitry Andric PathBuf.assign(WorkingDirForCacheLookup->begin(),
455*0fca6ea1SDimitry Andric WorkingDirForCacheLookup->end());
456*0fca6ea1SDimitry Andric llvm::sys::path::append(PathBuf, RelFilename);
457*0fca6ea1SDimitry Andric FilenameForLookup = StringRef{PathBuf.begin(), PathBuf.size()};
458*0fca6ea1SDimitry Andric }
459*0fca6ea1SDimitry Andric assert(llvm::sys::path::is_absolute_gnu(FilenameForLookup));
460*0fca6ea1SDimitry Andric return FilenameForLookup;
461*0fca6ea1SDimitry Andric }
462*0fca6ea1SDimitry Andric
463*0fca6ea1SDimitry Andric const char DependencyScanningWorkerFilesystem::ID = 0;
464