xref: /freebsd/contrib/llvm-project/llvm/lib/Support/VirtualFileSystem.cpp (revision 833a452e9f082a7982a31c21f0da437dbbe0a39d)
1 //===- VirtualFileSystem.cpp - Virtual File System Layer ------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file implements the VirtualFileSystem interface.
10 //
11 //===----------------------------------------------------------------------===//
12 
13 #include "llvm/Support/VirtualFileSystem.h"
14 #include "llvm/ADT/ArrayRef.h"
15 #include "llvm/ADT/DenseMap.h"
16 #include "llvm/ADT/IntrusiveRefCntPtr.h"
17 #include "llvm/ADT/None.h"
18 #include "llvm/ADT/Optional.h"
19 #include "llvm/ADT/STLExtras.h"
20 #include "llvm/ADT/SmallString.h"
21 #include "llvm/ADT/SmallVector.h"
22 #include "llvm/ADT/StringRef.h"
23 #include "llvm/ADT/StringSet.h"
24 #include "llvm/ADT/Twine.h"
25 #include "llvm/ADT/iterator_range.h"
26 #include "llvm/Config/llvm-config.h"
27 #include "llvm/Support/Casting.h"
28 #include "llvm/Support/Chrono.h"
29 #include "llvm/Support/Compiler.h"
30 #include "llvm/Support/Debug.h"
31 #include "llvm/Support/Errc.h"
32 #include "llvm/Support/ErrorHandling.h"
33 #include "llvm/Support/ErrorOr.h"
34 #include "llvm/Support/FileSystem.h"
35 #include "llvm/Support/MemoryBuffer.h"
36 #include "llvm/Support/Path.h"
37 #include "llvm/Support/Process.h"
38 #include "llvm/Support/SMLoc.h"
39 #include "llvm/Support/SourceMgr.h"
40 #include "llvm/Support/YAMLParser.h"
41 #include "llvm/Support/raw_ostream.h"
42 #include <algorithm>
43 #include <atomic>
44 #include <cassert>
45 #include <cstdint>
46 #include <iterator>
47 #include <limits>
48 #include <map>
49 #include <memory>
50 #include <mutex>
51 #include <string>
52 #include <system_error>
53 #include <utility>
54 #include <vector>
55 
56 using namespace llvm;
57 using namespace llvm::vfs;
58 
59 using llvm::sys::fs::file_t;
60 using llvm::sys::fs::file_status;
61 using llvm::sys::fs::file_type;
62 using llvm::sys::fs::kInvalidFile;
63 using llvm::sys::fs::perms;
64 using llvm::sys::fs::UniqueID;
65 
66 Status::Status(const file_status &Status)
67     : UID(Status.getUniqueID()), MTime(Status.getLastModificationTime()),
68       User(Status.getUser()), Group(Status.getGroup()), Size(Status.getSize()),
69       Type(Status.type()), Perms(Status.permissions()) {}
70 
71 Status::Status(const Twine &Name, UniqueID UID, sys::TimePoint<> MTime,
72                uint32_t User, uint32_t Group, uint64_t Size, file_type Type,
73                perms Perms)
74     : Name(Name.str()), UID(UID), MTime(MTime), User(User), Group(Group),
75       Size(Size), Type(Type), Perms(Perms) {}
76 
77 Status Status::copyWithNewName(const Status &In, const Twine &NewName) {
78   return Status(NewName, In.getUniqueID(), In.getLastModificationTime(),
79                 In.getUser(), In.getGroup(), In.getSize(), In.getType(),
80                 In.getPermissions());
81 }
82 
83 Status Status::copyWithNewName(const file_status &In, const Twine &NewName) {
84   return Status(NewName, In.getUniqueID(), In.getLastModificationTime(),
85                 In.getUser(), In.getGroup(), In.getSize(), In.type(),
86                 In.permissions());
87 }
88 
89 bool Status::equivalent(const Status &Other) const {
90   assert(isStatusKnown() && Other.isStatusKnown());
91   return getUniqueID() == Other.getUniqueID();
92 }
93 
94 bool Status::isDirectory() const { return Type == file_type::directory_file; }
95 
96 bool Status::isRegularFile() const { return Type == file_type::regular_file; }
97 
98 bool Status::isOther() const {
99   return exists() && !isRegularFile() && !isDirectory() && !isSymlink();
100 }
101 
102 bool Status::isSymlink() const { return Type == file_type::symlink_file; }
103 
104 bool Status::isStatusKnown() const { return Type != file_type::status_error; }
105 
106 bool Status::exists() const {
107   return isStatusKnown() && Type != file_type::file_not_found;
108 }
109 
110 File::~File() = default;
111 
112 FileSystem::~FileSystem() = default;
113 
114 ErrorOr<std::unique_ptr<MemoryBuffer>>
115 FileSystem::getBufferForFile(const llvm::Twine &Name, int64_t FileSize,
116                              bool RequiresNullTerminator, bool IsVolatile) {
117   auto F = openFileForRead(Name);
118   if (!F)
119     return F.getError();
120 
121   return (*F)->getBuffer(Name, FileSize, RequiresNullTerminator, IsVolatile);
122 }
123 
124 std::error_code FileSystem::makeAbsolute(SmallVectorImpl<char> &Path) const {
125   if (llvm::sys::path::is_absolute(Path))
126     return {};
127 
128   auto WorkingDir = getCurrentWorkingDirectory();
129   if (!WorkingDir)
130     return WorkingDir.getError();
131 
132   llvm::sys::fs::make_absolute(WorkingDir.get(), Path);
133   return {};
134 }
135 
136 std::error_code FileSystem::getRealPath(const Twine &Path,
137                                         SmallVectorImpl<char> &Output) const {
138   return errc::operation_not_permitted;
139 }
140 
141 std::error_code FileSystem::isLocal(const Twine &Path, bool &Result) {
142   return errc::operation_not_permitted;
143 }
144 
145 bool FileSystem::exists(const Twine &Path) {
146   auto Status = status(Path);
147   return Status && Status->exists();
148 }
149 
150 #ifndef NDEBUG
151 static bool isTraversalComponent(StringRef Component) {
152   return Component.equals("..") || Component.equals(".");
153 }
154 
155 static bool pathHasTraversal(StringRef Path) {
156   using namespace llvm::sys;
157 
158   for (StringRef Comp : llvm::make_range(path::begin(Path), path::end(Path)))
159     if (isTraversalComponent(Comp))
160       return true;
161   return false;
162 }
163 #endif
164 
165 //===-----------------------------------------------------------------------===/
166 // RealFileSystem implementation
167 //===-----------------------------------------------------------------------===/
168 
169 namespace {
170 
171 /// Wrapper around a raw file descriptor.
172 class RealFile : public File {
173   friend class RealFileSystem;
174 
175   file_t FD;
176   Status S;
177   std::string RealName;
178 
179   RealFile(file_t RawFD, StringRef NewName, StringRef NewRealPathName)
180       : FD(RawFD), S(NewName, {}, {}, {}, {}, {},
181                      llvm::sys::fs::file_type::status_error, {}),
182         RealName(NewRealPathName.str()) {
183     assert(FD != kInvalidFile && "Invalid or inactive file descriptor");
184   }
185 
186 public:
187   ~RealFile() override;
188 
189   ErrorOr<Status> status() override;
190   ErrorOr<std::string> getName() override;
191   ErrorOr<std::unique_ptr<MemoryBuffer>> getBuffer(const Twine &Name,
192                                                    int64_t FileSize,
193                                                    bool RequiresNullTerminator,
194                                                    bool IsVolatile) override;
195   std::error_code close() override;
196 };
197 
198 } // namespace
199 
200 RealFile::~RealFile() { close(); }
201 
202 ErrorOr<Status> RealFile::status() {
203   assert(FD != kInvalidFile && "cannot stat closed file");
204   if (!S.isStatusKnown()) {
205     file_status RealStatus;
206     if (std::error_code EC = sys::fs::status(FD, RealStatus))
207       return EC;
208     S = Status::copyWithNewName(RealStatus, S.getName());
209   }
210   return S;
211 }
212 
213 ErrorOr<std::string> RealFile::getName() {
214   return RealName.empty() ? S.getName().str() : RealName;
215 }
216 
217 ErrorOr<std::unique_ptr<MemoryBuffer>>
218 RealFile::getBuffer(const Twine &Name, int64_t FileSize,
219                     bool RequiresNullTerminator, bool IsVolatile) {
220   assert(FD != kInvalidFile && "cannot get buffer for closed file");
221   return MemoryBuffer::getOpenFile(FD, Name, FileSize, RequiresNullTerminator,
222                                    IsVolatile);
223 }
224 
225 std::error_code RealFile::close() {
226   std::error_code EC = sys::fs::closeFile(FD);
227   FD = kInvalidFile;
228   return EC;
229 }
230 
231 namespace {
232 
233 /// A file system according to your operating system.
234 /// This may be linked to the process's working directory, or maintain its own.
235 ///
236 /// Currently, its own working directory is emulated by storing the path and
237 /// sending absolute paths to llvm::sys::fs:: functions.
238 /// A more principled approach would be to push this down a level, modelling
239 /// the working dir as an llvm::sys::fs::WorkingDir or similar.
240 /// This would enable the use of openat()-style functions on some platforms.
241 class RealFileSystem : public FileSystem {
242 public:
243   explicit RealFileSystem(bool LinkCWDToProcess) {
244     if (!LinkCWDToProcess) {
245       SmallString<128> PWD, RealPWD;
246       if (llvm::sys::fs::current_path(PWD))
247         return; // Awful, but nothing to do here.
248       if (llvm::sys::fs::real_path(PWD, RealPWD))
249         WD = {PWD, PWD};
250       else
251         WD = {PWD, RealPWD};
252     }
253   }
254 
255   ErrorOr<Status> status(const Twine &Path) override;
256   ErrorOr<std::unique_ptr<File>> openFileForRead(const Twine &Path) override;
257   directory_iterator dir_begin(const Twine &Dir, std::error_code &EC) override;
258 
259   llvm::ErrorOr<std::string> getCurrentWorkingDirectory() const override;
260   std::error_code setCurrentWorkingDirectory(const Twine &Path) override;
261   std::error_code isLocal(const Twine &Path, bool &Result) override;
262   std::error_code getRealPath(const Twine &Path,
263                               SmallVectorImpl<char> &Output) const override;
264 
265 private:
266   // If this FS has its own working dir, use it to make Path absolute.
267   // The returned twine is safe to use as long as both Storage and Path live.
268   Twine adjustPath(const Twine &Path, SmallVectorImpl<char> &Storage) const {
269     if (!WD)
270       return Path;
271     Path.toVector(Storage);
272     sys::fs::make_absolute(WD->Resolved, Storage);
273     return Storage;
274   }
275 
276   struct WorkingDirectory {
277     // The current working directory, without symlinks resolved. (echo $PWD).
278     SmallString<128> Specified;
279     // The current working directory, with links resolved. (readlink .).
280     SmallString<128> Resolved;
281   };
282   Optional<WorkingDirectory> WD;
283 };
284 
285 } // namespace
286 
287 ErrorOr<Status> RealFileSystem::status(const Twine &Path) {
288   SmallString<256> Storage;
289   sys::fs::file_status RealStatus;
290   if (std::error_code EC =
291           sys::fs::status(adjustPath(Path, Storage), RealStatus))
292     return EC;
293   return Status::copyWithNewName(RealStatus, Path);
294 }
295 
296 ErrorOr<std::unique_ptr<File>>
297 RealFileSystem::openFileForRead(const Twine &Name) {
298   SmallString<256> RealName, Storage;
299   Expected<file_t> FDOrErr = sys::fs::openNativeFileForRead(
300       adjustPath(Name, Storage), sys::fs::OF_None, &RealName);
301   if (!FDOrErr)
302     return errorToErrorCode(FDOrErr.takeError());
303   return std::unique_ptr<File>(
304       new RealFile(*FDOrErr, Name.str(), RealName.str()));
305 }
306 
307 llvm::ErrorOr<std::string> RealFileSystem::getCurrentWorkingDirectory() const {
308   if (WD)
309     return std::string(WD->Specified.str());
310 
311   SmallString<128> Dir;
312   if (std::error_code EC = llvm::sys::fs::current_path(Dir))
313     return EC;
314   return std::string(Dir.str());
315 }
316 
317 std::error_code RealFileSystem::setCurrentWorkingDirectory(const Twine &Path) {
318   if (!WD)
319     return llvm::sys::fs::set_current_path(Path);
320 
321   SmallString<128> Absolute, Resolved, Storage;
322   adjustPath(Path, Storage).toVector(Absolute);
323   bool IsDir;
324   if (auto Err = llvm::sys::fs::is_directory(Absolute, IsDir))
325     return Err;
326   if (!IsDir)
327     return std::make_error_code(std::errc::not_a_directory);
328   if (auto Err = llvm::sys::fs::real_path(Absolute, Resolved))
329     return Err;
330   WD = {Absolute, Resolved};
331   return std::error_code();
332 }
333 
334 std::error_code RealFileSystem::isLocal(const Twine &Path, bool &Result) {
335   SmallString<256> Storage;
336   return llvm::sys::fs::is_local(adjustPath(Path, Storage), Result);
337 }
338 
339 std::error_code
340 RealFileSystem::getRealPath(const Twine &Path,
341                             SmallVectorImpl<char> &Output) const {
342   SmallString<256> Storage;
343   return llvm::sys::fs::real_path(adjustPath(Path, Storage), Output);
344 }
345 
346 IntrusiveRefCntPtr<FileSystem> vfs::getRealFileSystem() {
347   static IntrusiveRefCntPtr<FileSystem> FS(new RealFileSystem(true));
348   return FS;
349 }
350 
351 std::unique_ptr<FileSystem> vfs::createPhysicalFileSystem() {
352   return std::make_unique<RealFileSystem>(false);
353 }
354 
355 namespace {
356 
357 class RealFSDirIter : public llvm::vfs::detail::DirIterImpl {
358   llvm::sys::fs::directory_iterator Iter;
359 
360 public:
361   RealFSDirIter(const Twine &Path, std::error_code &EC) : Iter(Path, EC) {
362     if (Iter != llvm::sys::fs::directory_iterator())
363       CurrentEntry = directory_entry(Iter->path(), Iter->type());
364   }
365 
366   std::error_code increment() override {
367     std::error_code EC;
368     Iter.increment(EC);
369     CurrentEntry = (Iter == llvm::sys::fs::directory_iterator())
370                        ? directory_entry()
371                        : directory_entry(Iter->path(), Iter->type());
372     return EC;
373   }
374 };
375 
376 } // namespace
377 
378 directory_iterator RealFileSystem::dir_begin(const Twine &Dir,
379                                              std::error_code &EC) {
380   SmallString<128> Storage;
381   return directory_iterator(
382       std::make_shared<RealFSDirIter>(adjustPath(Dir, Storage), EC));
383 }
384 
385 //===-----------------------------------------------------------------------===/
386 // OverlayFileSystem implementation
387 //===-----------------------------------------------------------------------===/
388 
389 OverlayFileSystem::OverlayFileSystem(IntrusiveRefCntPtr<FileSystem> BaseFS) {
390   FSList.push_back(std::move(BaseFS));
391 }
392 
393 void OverlayFileSystem::pushOverlay(IntrusiveRefCntPtr<FileSystem> FS) {
394   FSList.push_back(FS);
395   // Synchronize added file systems by duplicating the working directory from
396   // the first one in the list.
397   FS->setCurrentWorkingDirectory(getCurrentWorkingDirectory().get());
398 }
399 
400 ErrorOr<Status> OverlayFileSystem::status(const Twine &Path) {
401   // FIXME: handle symlinks that cross file systems
402   for (iterator I = overlays_begin(), E = overlays_end(); I != E; ++I) {
403     ErrorOr<Status> Status = (*I)->status(Path);
404     if (Status || Status.getError() != llvm::errc::no_such_file_or_directory)
405       return Status;
406   }
407   return make_error_code(llvm::errc::no_such_file_or_directory);
408 }
409 
410 ErrorOr<std::unique_ptr<File>>
411 OverlayFileSystem::openFileForRead(const llvm::Twine &Path) {
412   // FIXME: handle symlinks that cross file systems
413   for (iterator I = overlays_begin(), E = overlays_end(); I != E; ++I) {
414     auto Result = (*I)->openFileForRead(Path);
415     if (Result || Result.getError() != llvm::errc::no_such_file_or_directory)
416       return Result;
417   }
418   return make_error_code(llvm::errc::no_such_file_or_directory);
419 }
420 
421 llvm::ErrorOr<std::string>
422 OverlayFileSystem::getCurrentWorkingDirectory() const {
423   // All file systems are synchronized, just take the first working directory.
424   return FSList.front()->getCurrentWorkingDirectory();
425 }
426 
427 std::error_code
428 OverlayFileSystem::setCurrentWorkingDirectory(const Twine &Path) {
429   for (auto &FS : FSList)
430     if (std::error_code EC = FS->setCurrentWorkingDirectory(Path))
431       return EC;
432   return {};
433 }
434 
435 std::error_code OverlayFileSystem::isLocal(const Twine &Path, bool &Result) {
436   for (auto &FS : FSList)
437     if (FS->exists(Path))
438       return FS->isLocal(Path, Result);
439   return errc::no_such_file_or_directory;
440 }
441 
442 std::error_code
443 OverlayFileSystem::getRealPath(const Twine &Path,
444                                SmallVectorImpl<char> &Output) const {
445   for (auto &FS : FSList)
446     if (FS->exists(Path))
447       return FS->getRealPath(Path, Output);
448   return errc::no_such_file_or_directory;
449 }
450 
451 llvm::vfs::detail::DirIterImpl::~DirIterImpl() = default;
452 
453 namespace {
454 
455 /// Combines and deduplicates directory entries across multiple file systems.
456 class CombiningDirIterImpl : public llvm::vfs::detail::DirIterImpl {
457   using FileSystemPtr = llvm::IntrusiveRefCntPtr<llvm::vfs::FileSystem>;
458 
459   /// File systems to check for entries in. Processed in reverse order.
460   SmallVector<FileSystemPtr, 8> FSList;
461   /// The directory iterator for the current filesystem.
462   directory_iterator CurrentDirIter;
463   /// The path of the directory to iterate the entries of.
464   std::string DirPath;
465   /// The set of names already returned as entries.
466   llvm::StringSet<> SeenNames;
467 
468   /// Sets \c CurrentDirIter to an iterator of \c DirPath in the next file
469   /// system in the list, or leaves it as is (at its end position) if we've
470   /// already gone through them all.
471   std::error_code incrementFS() {
472     while (!FSList.empty()) {
473       std::error_code EC;
474       CurrentDirIter = FSList.back()->dir_begin(DirPath, EC);
475       FSList.pop_back();
476       if (EC && EC != errc::no_such_file_or_directory)
477         return EC;
478       if (CurrentDirIter != directory_iterator())
479         break; // found
480     }
481     return {};
482   }
483 
484   std::error_code incrementDirIter(bool IsFirstTime) {
485     assert((IsFirstTime || CurrentDirIter != directory_iterator()) &&
486            "incrementing past end");
487     std::error_code EC;
488     if (!IsFirstTime)
489       CurrentDirIter.increment(EC);
490     if (!EC && CurrentDirIter == directory_iterator())
491       EC = incrementFS();
492     return EC;
493   }
494 
495   std::error_code incrementImpl(bool IsFirstTime) {
496     while (true) {
497       std::error_code EC = incrementDirIter(IsFirstTime);
498       if (EC || CurrentDirIter == directory_iterator()) {
499         CurrentEntry = directory_entry();
500         return EC;
501       }
502       CurrentEntry = *CurrentDirIter;
503       StringRef Name = llvm::sys::path::filename(CurrentEntry.path());
504       if (SeenNames.insert(Name).second)
505         return EC; // name not seen before
506     }
507     llvm_unreachable("returned above");
508   }
509 
510 public:
511   CombiningDirIterImpl(ArrayRef<FileSystemPtr> FileSystems, std::string Dir,
512                        std::error_code &EC)
513       : FSList(FileSystems.begin(), FileSystems.end()),
514         DirPath(std::move(Dir)) {
515     if (!FSList.empty()) {
516       CurrentDirIter = FSList.back()->dir_begin(DirPath, EC);
517       FSList.pop_back();
518       if (!EC || EC == errc::no_such_file_or_directory)
519         EC = incrementImpl(true);
520     }
521   }
522 
523   CombiningDirIterImpl(directory_iterator FirstIter, FileSystemPtr Fallback,
524                        std::string FallbackDir, std::error_code &EC)
525       : FSList({Fallback}), CurrentDirIter(FirstIter),
526         DirPath(std::move(FallbackDir)) {
527     if (!EC || EC == errc::no_such_file_or_directory)
528       EC = incrementImpl(true);
529   }
530 
531   std::error_code increment() override { return incrementImpl(false); }
532 };
533 
534 } // namespace
535 
536 directory_iterator OverlayFileSystem::dir_begin(const Twine &Dir,
537                                                 std::error_code &EC) {
538   return directory_iterator(
539       std::make_shared<CombiningDirIterImpl>(FSList, Dir.str(), EC));
540 }
541 
542 void ProxyFileSystem::anchor() {}
543 
544 namespace llvm {
545 namespace vfs {
546 
547 namespace detail {
548 
549 enum InMemoryNodeKind { IME_File, IME_Directory, IME_HardLink };
550 
551 /// The in memory file system is a tree of Nodes. Every node can either be a
552 /// file , hardlink or a directory.
553 class InMemoryNode {
554   InMemoryNodeKind Kind;
555   std::string FileName;
556 
557 public:
558   InMemoryNode(llvm::StringRef FileName, InMemoryNodeKind Kind)
559       : Kind(Kind), FileName(std::string(llvm::sys::path::filename(FileName))) {
560   }
561   virtual ~InMemoryNode() = default;
562 
563   /// Get the filename of this node (the name without the directory part).
564   StringRef getFileName() const { return FileName; }
565   InMemoryNodeKind getKind() const { return Kind; }
566   virtual std::string toString(unsigned Indent) const = 0;
567 };
568 
569 class InMemoryFile : public InMemoryNode {
570   Status Stat;
571   std::unique_ptr<llvm::MemoryBuffer> Buffer;
572 
573 public:
574   InMemoryFile(Status Stat, std::unique_ptr<llvm::MemoryBuffer> Buffer)
575       : InMemoryNode(Stat.getName(), IME_File), Stat(std::move(Stat)),
576         Buffer(std::move(Buffer)) {}
577 
578   /// Return the \p Status for this node. \p RequestedName should be the name
579   /// through which the caller referred to this node. It will override
580   /// \p Status::Name in the return value, to mimic the behavior of \p RealFile.
581   Status getStatus(const Twine &RequestedName) const {
582     return Status::copyWithNewName(Stat, RequestedName);
583   }
584   llvm::MemoryBuffer *getBuffer() const { return Buffer.get(); }
585 
586   std::string toString(unsigned Indent) const override {
587     return (std::string(Indent, ' ') + Stat.getName() + "\n").str();
588   }
589 
590   static bool classof(const InMemoryNode *N) {
591     return N->getKind() == IME_File;
592   }
593 };
594 
595 namespace {
596 
597 class InMemoryHardLink : public InMemoryNode {
598   const InMemoryFile &ResolvedFile;
599 
600 public:
601   InMemoryHardLink(StringRef Path, const InMemoryFile &ResolvedFile)
602       : InMemoryNode(Path, IME_HardLink), ResolvedFile(ResolvedFile) {}
603   const InMemoryFile &getResolvedFile() const { return ResolvedFile; }
604 
605   std::string toString(unsigned Indent) const override {
606     return std::string(Indent, ' ') + "HardLink to -> " +
607            ResolvedFile.toString(0);
608   }
609 
610   static bool classof(const InMemoryNode *N) {
611     return N->getKind() == IME_HardLink;
612   }
613 };
614 
615 /// Adapt a InMemoryFile for VFS' File interface.  The goal is to make
616 /// \p InMemoryFileAdaptor mimic as much as possible the behavior of
617 /// \p RealFile.
618 class InMemoryFileAdaptor : public File {
619   const InMemoryFile &Node;
620   /// The name to use when returning a Status for this file.
621   std::string RequestedName;
622 
623 public:
624   explicit InMemoryFileAdaptor(const InMemoryFile &Node,
625                                std::string RequestedName)
626       : Node(Node), RequestedName(std::move(RequestedName)) {}
627 
628   llvm::ErrorOr<Status> status() override {
629     return Node.getStatus(RequestedName);
630   }
631 
632   llvm::ErrorOr<std::unique_ptr<llvm::MemoryBuffer>>
633   getBuffer(const Twine &Name, int64_t FileSize, bool RequiresNullTerminator,
634             bool IsVolatile) override {
635     llvm::MemoryBuffer *Buf = Node.getBuffer();
636     return llvm::MemoryBuffer::getMemBuffer(
637         Buf->getBuffer(), Buf->getBufferIdentifier(), RequiresNullTerminator);
638   }
639 
640   std::error_code close() override { return {}; }
641 };
642 } // namespace
643 
644 class InMemoryDirectory : public InMemoryNode {
645   Status Stat;
646   llvm::StringMap<std::unique_ptr<InMemoryNode>> Entries;
647 
648 public:
649   InMemoryDirectory(Status Stat)
650       : InMemoryNode(Stat.getName(), IME_Directory), Stat(std::move(Stat)) {}
651 
652   /// Return the \p Status for this node. \p RequestedName should be the name
653   /// through which the caller referred to this node. It will override
654   /// \p Status::Name in the return value, to mimic the behavior of \p RealFile.
655   Status getStatus(const Twine &RequestedName) const {
656     return Status::copyWithNewName(Stat, RequestedName);
657   }
658   InMemoryNode *getChild(StringRef Name) {
659     auto I = Entries.find(Name);
660     if (I != Entries.end())
661       return I->second.get();
662     return nullptr;
663   }
664 
665   InMemoryNode *addChild(StringRef Name, std::unique_ptr<InMemoryNode> Child) {
666     return Entries.insert(make_pair(Name, std::move(Child)))
667         .first->second.get();
668   }
669 
670   using const_iterator = decltype(Entries)::const_iterator;
671 
672   const_iterator begin() const { return Entries.begin(); }
673   const_iterator end() const { return Entries.end(); }
674 
675   std::string toString(unsigned Indent) const override {
676     std::string Result =
677         (std::string(Indent, ' ') + Stat.getName() + "\n").str();
678     for (const auto &Entry : Entries)
679       Result += Entry.second->toString(Indent + 2);
680     return Result;
681   }
682 
683   static bool classof(const InMemoryNode *N) {
684     return N->getKind() == IME_Directory;
685   }
686 };
687 
688 namespace {
689 Status getNodeStatus(const InMemoryNode *Node, const Twine &RequestedName) {
690   if (auto Dir = dyn_cast<detail::InMemoryDirectory>(Node))
691     return Dir->getStatus(RequestedName);
692   if (auto File = dyn_cast<detail::InMemoryFile>(Node))
693     return File->getStatus(RequestedName);
694   if (auto Link = dyn_cast<detail::InMemoryHardLink>(Node))
695     return Link->getResolvedFile().getStatus(RequestedName);
696   llvm_unreachable("Unknown node type");
697 }
698 } // namespace
699 } // namespace detail
700 
701 InMemoryFileSystem::InMemoryFileSystem(bool UseNormalizedPaths)
702     : Root(new detail::InMemoryDirectory(
703           Status("", getNextVirtualUniqueID(), llvm::sys::TimePoint<>(), 0, 0,
704                  0, llvm::sys::fs::file_type::directory_file,
705                  llvm::sys::fs::perms::all_all))),
706       UseNormalizedPaths(UseNormalizedPaths) {}
707 
708 InMemoryFileSystem::~InMemoryFileSystem() = default;
709 
710 std::string InMemoryFileSystem::toString() const {
711   return Root->toString(/*Indent=*/0);
712 }
713 
714 bool InMemoryFileSystem::addFile(const Twine &P, time_t ModificationTime,
715                                  std::unique_ptr<llvm::MemoryBuffer> Buffer,
716                                  Optional<uint32_t> User,
717                                  Optional<uint32_t> Group,
718                                  Optional<llvm::sys::fs::file_type> Type,
719                                  Optional<llvm::sys::fs::perms> Perms,
720                                  const detail::InMemoryFile *HardLinkTarget) {
721   SmallString<128> Path;
722   P.toVector(Path);
723 
724   // Fix up relative paths. This just prepends the current working directory.
725   std::error_code EC = makeAbsolute(Path);
726   assert(!EC);
727   (void)EC;
728 
729   if (useNormalizedPaths())
730     llvm::sys::path::remove_dots(Path, /*remove_dot_dot=*/true);
731 
732   if (Path.empty())
733     return false;
734 
735   detail::InMemoryDirectory *Dir = Root.get();
736   auto I = llvm::sys::path::begin(Path), E = sys::path::end(Path);
737   const auto ResolvedUser = User.getValueOr(0);
738   const auto ResolvedGroup = Group.getValueOr(0);
739   const auto ResolvedType = Type.getValueOr(sys::fs::file_type::regular_file);
740   const auto ResolvedPerms = Perms.getValueOr(sys::fs::all_all);
741   assert(!(HardLinkTarget && Buffer) && "HardLink cannot have a buffer");
742   // Any intermediate directories we create should be accessible by
743   // the owner, even if Perms says otherwise for the final path.
744   const auto NewDirectoryPerms = ResolvedPerms | sys::fs::owner_all;
745   while (true) {
746     StringRef Name = *I;
747     detail::InMemoryNode *Node = Dir->getChild(Name);
748     ++I;
749     if (!Node) {
750       if (I == E) {
751         // End of the path.
752         std::unique_ptr<detail::InMemoryNode> Child;
753         if (HardLinkTarget)
754           Child.reset(new detail::InMemoryHardLink(P.str(), *HardLinkTarget));
755         else {
756           // Create a new file or directory.
757           Status Stat(P.str(), getNextVirtualUniqueID(),
758                       llvm::sys::toTimePoint(ModificationTime), ResolvedUser,
759                       ResolvedGroup, Buffer->getBufferSize(), ResolvedType,
760                       ResolvedPerms);
761           if (ResolvedType == sys::fs::file_type::directory_file) {
762             Child.reset(new detail::InMemoryDirectory(std::move(Stat)));
763           } else {
764             Child.reset(
765                 new detail::InMemoryFile(std::move(Stat), std::move(Buffer)));
766           }
767         }
768         Dir->addChild(Name, std::move(Child));
769         return true;
770       }
771 
772       // Create a new directory. Use the path up to here.
773       Status Stat(
774           StringRef(Path.str().begin(), Name.end() - Path.str().begin()),
775           getNextVirtualUniqueID(), llvm::sys::toTimePoint(ModificationTime),
776           ResolvedUser, ResolvedGroup, 0, sys::fs::file_type::directory_file,
777           NewDirectoryPerms);
778       Dir = cast<detail::InMemoryDirectory>(Dir->addChild(
779           Name, std::make_unique<detail::InMemoryDirectory>(std::move(Stat))));
780       continue;
781     }
782 
783     if (auto *NewDir = dyn_cast<detail::InMemoryDirectory>(Node)) {
784       Dir = NewDir;
785     } else {
786       assert((isa<detail::InMemoryFile>(Node) ||
787               isa<detail::InMemoryHardLink>(Node)) &&
788              "Must be either file, hardlink or directory!");
789 
790       // Trying to insert a directory in place of a file.
791       if (I != E)
792         return false;
793 
794       // Return false only if the new file is different from the existing one.
795       if (auto Link = dyn_cast<detail::InMemoryHardLink>(Node)) {
796         return Link->getResolvedFile().getBuffer()->getBuffer() ==
797                Buffer->getBuffer();
798       }
799       return cast<detail::InMemoryFile>(Node)->getBuffer()->getBuffer() ==
800              Buffer->getBuffer();
801     }
802   }
803 }
804 
805 bool InMemoryFileSystem::addFile(const Twine &P, time_t ModificationTime,
806                                  std::unique_ptr<llvm::MemoryBuffer> Buffer,
807                                  Optional<uint32_t> User,
808                                  Optional<uint32_t> Group,
809                                  Optional<llvm::sys::fs::file_type> Type,
810                                  Optional<llvm::sys::fs::perms> Perms) {
811   return addFile(P, ModificationTime, std::move(Buffer), User, Group, Type,
812                  Perms, /*HardLinkTarget=*/nullptr);
813 }
814 
815 bool InMemoryFileSystem::addFileNoOwn(const Twine &P, time_t ModificationTime,
816                                       const llvm::MemoryBufferRef &Buffer,
817                                       Optional<uint32_t> User,
818                                       Optional<uint32_t> Group,
819                                       Optional<llvm::sys::fs::file_type> Type,
820                                       Optional<llvm::sys::fs::perms> Perms) {
821   return addFile(P, ModificationTime, llvm::MemoryBuffer::getMemBuffer(Buffer),
822                  std::move(User), std::move(Group), std::move(Type),
823                  std::move(Perms));
824 }
825 
826 static ErrorOr<const detail::InMemoryNode *>
827 lookupInMemoryNode(const InMemoryFileSystem &FS, detail::InMemoryDirectory *Dir,
828                    const Twine &P) {
829   SmallString<128> Path;
830   P.toVector(Path);
831 
832   // Fix up relative paths. This just prepends the current working directory.
833   std::error_code EC = FS.makeAbsolute(Path);
834   assert(!EC);
835   (void)EC;
836 
837   if (FS.useNormalizedPaths())
838     llvm::sys::path::remove_dots(Path, /*remove_dot_dot=*/true);
839 
840   if (Path.empty())
841     return Dir;
842 
843   auto I = llvm::sys::path::begin(Path), E = llvm::sys::path::end(Path);
844   while (true) {
845     detail::InMemoryNode *Node = Dir->getChild(*I);
846     ++I;
847     if (!Node)
848       return errc::no_such_file_or_directory;
849 
850     // Return the file if it's at the end of the path.
851     if (auto File = dyn_cast<detail::InMemoryFile>(Node)) {
852       if (I == E)
853         return File;
854       return errc::no_such_file_or_directory;
855     }
856 
857     // If Node is HardLink then return the resolved file.
858     if (auto File = dyn_cast<detail::InMemoryHardLink>(Node)) {
859       if (I == E)
860         return &File->getResolvedFile();
861       return errc::no_such_file_or_directory;
862     }
863     // Traverse directories.
864     Dir = cast<detail::InMemoryDirectory>(Node);
865     if (I == E)
866       return Dir;
867   }
868 }
869 
870 bool InMemoryFileSystem::addHardLink(const Twine &FromPath,
871                                      const Twine &ToPath) {
872   auto FromNode = lookupInMemoryNode(*this, Root.get(), FromPath);
873   auto ToNode = lookupInMemoryNode(*this, Root.get(), ToPath);
874   // FromPath must not have been added before. ToPath must have been added
875   // before. Resolved ToPath must be a File.
876   if (!ToNode || FromNode || !isa<detail::InMemoryFile>(*ToNode))
877     return false;
878   return this->addFile(FromPath, 0, nullptr, None, None, None, None,
879                        cast<detail::InMemoryFile>(*ToNode));
880 }
881 
882 llvm::ErrorOr<Status> InMemoryFileSystem::status(const Twine &Path) {
883   auto Node = lookupInMemoryNode(*this, Root.get(), Path);
884   if (Node)
885     return detail::getNodeStatus(*Node, Path);
886   return Node.getError();
887 }
888 
889 llvm::ErrorOr<std::unique_ptr<File>>
890 InMemoryFileSystem::openFileForRead(const Twine &Path) {
891   auto Node = lookupInMemoryNode(*this, Root.get(), Path);
892   if (!Node)
893     return Node.getError();
894 
895   // When we have a file provide a heap-allocated wrapper for the memory buffer
896   // to match the ownership semantics for File.
897   if (auto *F = dyn_cast<detail::InMemoryFile>(*Node))
898     return std::unique_ptr<File>(
899         new detail::InMemoryFileAdaptor(*F, Path.str()));
900 
901   // FIXME: errc::not_a_file?
902   return make_error_code(llvm::errc::invalid_argument);
903 }
904 
905 namespace {
906 
907 /// Adaptor from InMemoryDir::iterator to directory_iterator.
908 class InMemoryDirIterator : public llvm::vfs::detail::DirIterImpl {
909   detail::InMemoryDirectory::const_iterator I;
910   detail::InMemoryDirectory::const_iterator E;
911   std::string RequestedDirName;
912 
913   void setCurrentEntry() {
914     if (I != E) {
915       SmallString<256> Path(RequestedDirName);
916       llvm::sys::path::append(Path, I->second->getFileName());
917       sys::fs::file_type Type = sys::fs::file_type::type_unknown;
918       switch (I->second->getKind()) {
919       case detail::IME_File:
920       case detail::IME_HardLink:
921         Type = sys::fs::file_type::regular_file;
922         break;
923       case detail::IME_Directory:
924         Type = sys::fs::file_type::directory_file;
925         break;
926       }
927       CurrentEntry = directory_entry(std::string(Path.str()), Type);
928     } else {
929       // When we're at the end, make CurrentEntry invalid and DirIterImpl will
930       // do the rest.
931       CurrentEntry = directory_entry();
932     }
933   }
934 
935 public:
936   InMemoryDirIterator() = default;
937 
938   explicit InMemoryDirIterator(const detail::InMemoryDirectory &Dir,
939                                std::string RequestedDirName)
940       : I(Dir.begin()), E(Dir.end()),
941         RequestedDirName(std::move(RequestedDirName)) {
942     setCurrentEntry();
943   }
944 
945   std::error_code increment() override {
946     ++I;
947     setCurrentEntry();
948     return {};
949   }
950 };
951 
952 } // namespace
953 
954 directory_iterator InMemoryFileSystem::dir_begin(const Twine &Dir,
955                                                  std::error_code &EC) {
956   auto Node = lookupInMemoryNode(*this, Root.get(), Dir);
957   if (!Node) {
958     EC = Node.getError();
959     return directory_iterator(std::make_shared<InMemoryDirIterator>());
960   }
961 
962   if (auto *DirNode = dyn_cast<detail::InMemoryDirectory>(*Node))
963     return directory_iterator(
964         std::make_shared<InMemoryDirIterator>(*DirNode, Dir.str()));
965 
966   EC = make_error_code(llvm::errc::not_a_directory);
967   return directory_iterator(std::make_shared<InMemoryDirIterator>());
968 }
969 
970 std::error_code InMemoryFileSystem::setCurrentWorkingDirectory(const Twine &P) {
971   SmallString<128> Path;
972   P.toVector(Path);
973 
974   // Fix up relative paths. This just prepends the current working directory.
975   std::error_code EC = makeAbsolute(Path);
976   assert(!EC);
977   (void)EC;
978 
979   if (useNormalizedPaths())
980     llvm::sys::path::remove_dots(Path, /*remove_dot_dot=*/true);
981 
982   if (!Path.empty())
983     WorkingDirectory = std::string(Path.str());
984   return {};
985 }
986 
987 std::error_code
988 InMemoryFileSystem::getRealPath(const Twine &Path,
989                                 SmallVectorImpl<char> &Output) const {
990   auto CWD = getCurrentWorkingDirectory();
991   if (!CWD || CWD->empty())
992     return errc::operation_not_permitted;
993   Path.toVector(Output);
994   if (auto EC = makeAbsolute(Output))
995     return EC;
996   llvm::sys::path::remove_dots(Output, /*remove_dot_dot=*/true);
997   return {};
998 }
999 
1000 std::error_code InMemoryFileSystem::isLocal(const Twine &Path, bool &Result) {
1001   Result = false;
1002   return {};
1003 }
1004 
1005 } // namespace vfs
1006 } // namespace llvm
1007 
1008 //===-----------------------------------------------------------------------===/
1009 // RedirectingFileSystem implementation
1010 //===-----------------------------------------------------------------------===/
1011 
1012 namespace {
1013 
1014 static llvm::sys::path::Style getExistingStyle(llvm::StringRef Path) {
1015   // Detect the path style in use by checking the first separator.
1016   llvm::sys::path::Style style = llvm::sys::path::Style::native;
1017   const size_t n = Path.find_first_of("/\\");
1018   if (n != static_cast<size_t>(-1))
1019     style = (Path[n] == '/') ? llvm::sys::path::Style::posix
1020                              : llvm::sys::path::Style::windows;
1021   return style;
1022 }
1023 
1024 /// Removes leading "./" as well as path components like ".." and ".".
1025 static llvm::SmallString<256> canonicalize(llvm::StringRef Path) {
1026   // First detect the path style in use by checking the first separator.
1027   llvm::sys::path::Style style = getExistingStyle(Path);
1028 
1029   // Now remove the dots.  Explicitly specifying the path style prevents the
1030   // direction of the slashes from changing.
1031   llvm::SmallString<256> result =
1032       llvm::sys::path::remove_leading_dotslash(Path, style);
1033   llvm::sys::path::remove_dots(result, /*remove_dot_dot=*/true, style);
1034   return result;
1035 }
1036 
1037 } // anonymous namespace
1038 
1039 
1040 RedirectingFileSystem::RedirectingFileSystem(IntrusiveRefCntPtr<FileSystem> FS)
1041     : ExternalFS(std::move(FS)) {
1042   if (ExternalFS)
1043     if (auto ExternalWorkingDirectory =
1044             ExternalFS->getCurrentWorkingDirectory()) {
1045       WorkingDirectory = *ExternalWorkingDirectory;
1046     }
1047 }
1048 
1049 /// Directory iterator implementation for \c RedirectingFileSystem's
1050 /// directory entries.
1051 class llvm::vfs::RedirectingFSDirIterImpl
1052     : public llvm::vfs::detail::DirIterImpl {
1053   std::string Dir;
1054   RedirectingFileSystem::DirectoryEntry::iterator Current, End;
1055 
1056   std::error_code incrementImpl(bool IsFirstTime) {
1057     assert((IsFirstTime || Current != End) && "cannot iterate past end");
1058     if (!IsFirstTime)
1059       ++Current;
1060     if (Current != End) {
1061       SmallString<128> PathStr(Dir);
1062       llvm::sys::path::append(PathStr, (*Current)->getName());
1063       sys::fs::file_type Type = sys::fs::file_type::type_unknown;
1064       switch ((*Current)->getKind()) {
1065       case RedirectingFileSystem::EK_Directory:
1066         LLVM_FALLTHROUGH;
1067       case RedirectingFileSystem::EK_DirectoryRemap:
1068         Type = sys::fs::file_type::directory_file;
1069         break;
1070       case RedirectingFileSystem::EK_File:
1071         Type = sys::fs::file_type::regular_file;
1072         break;
1073       }
1074       CurrentEntry = directory_entry(std::string(PathStr.str()), Type);
1075     } else {
1076       CurrentEntry = directory_entry();
1077     }
1078     return {};
1079   };
1080 
1081 public:
1082   RedirectingFSDirIterImpl(
1083       const Twine &Path, RedirectingFileSystem::DirectoryEntry::iterator Begin,
1084       RedirectingFileSystem::DirectoryEntry::iterator End, std::error_code &EC)
1085       : Dir(Path.str()), Current(Begin), End(End) {
1086     EC = incrementImpl(/*IsFirstTime=*/true);
1087   }
1088 
1089   std::error_code increment() override {
1090     return incrementImpl(/*IsFirstTime=*/false);
1091   }
1092 };
1093 
1094 /// Directory iterator implementation for \c RedirectingFileSystem's
1095 /// directory remap entries that maps the paths reported by the external
1096 /// file system's directory iterator back to the virtual directory's path.
1097 class RedirectingFSDirRemapIterImpl : public llvm::vfs::detail::DirIterImpl {
1098   std::string Dir;
1099   llvm::sys::path::Style DirStyle;
1100   llvm::vfs::directory_iterator ExternalIter;
1101 
1102 public:
1103   RedirectingFSDirRemapIterImpl(std::string DirPath,
1104                                 llvm::vfs::directory_iterator ExtIter)
1105       : Dir(std::move(DirPath)), DirStyle(getExistingStyle(Dir)),
1106         ExternalIter(ExtIter) {
1107     if (ExternalIter != llvm::vfs::directory_iterator())
1108       setCurrentEntry();
1109   }
1110 
1111   void setCurrentEntry() {
1112     StringRef ExternalPath = ExternalIter->path();
1113     llvm::sys::path::Style ExternalStyle = getExistingStyle(ExternalPath);
1114     StringRef File = llvm::sys::path::filename(ExternalPath, ExternalStyle);
1115 
1116     SmallString<128> NewPath(Dir);
1117     llvm::sys::path::append(NewPath, DirStyle, File);
1118 
1119     CurrentEntry = directory_entry(std::string(NewPath), ExternalIter->type());
1120   }
1121 
1122   std::error_code increment() override {
1123     std::error_code EC;
1124     ExternalIter.increment(EC);
1125     if (!EC && ExternalIter != llvm::vfs::directory_iterator())
1126       setCurrentEntry();
1127     else
1128       CurrentEntry = directory_entry();
1129     return EC;
1130   }
1131 };
1132 
1133 llvm::ErrorOr<std::string>
1134 RedirectingFileSystem::getCurrentWorkingDirectory() const {
1135   return WorkingDirectory;
1136 }
1137 
1138 std::error_code
1139 RedirectingFileSystem::setCurrentWorkingDirectory(const Twine &Path) {
1140   // Don't change the working directory if the path doesn't exist.
1141   if (!exists(Path))
1142     return errc::no_such_file_or_directory;
1143 
1144   SmallString<128> AbsolutePath;
1145   Path.toVector(AbsolutePath);
1146   if (std::error_code EC = makeAbsolute(AbsolutePath))
1147     return EC;
1148   WorkingDirectory = std::string(AbsolutePath.str());
1149   return {};
1150 }
1151 
1152 std::error_code RedirectingFileSystem::isLocal(const Twine &Path_,
1153                                                bool &Result) {
1154   SmallString<256> Path;
1155   Path_.toVector(Path);
1156 
1157   if (std::error_code EC = makeCanonical(Path))
1158     return {};
1159 
1160   return ExternalFS->isLocal(Path, Result);
1161 }
1162 
1163 std::error_code RedirectingFileSystem::makeAbsolute(SmallVectorImpl<char> &Path) const {
1164   if (llvm::sys::path::is_absolute(Path, llvm::sys::path::Style::posix) ||
1165       llvm::sys::path::is_absolute(Path, llvm::sys::path::Style::windows))
1166     return {};
1167 
1168   auto WorkingDir = getCurrentWorkingDirectory();
1169   if (!WorkingDir)
1170     return WorkingDir.getError();
1171 
1172   // We can't use sys::fs::make_absolute because that assumes the path style
1173   // is native and there is no way to override that.  Since we know WorkingDir
1174   // is absolute, we can use it to determine which style we actually have and
1175   // append Path ourselves.
1176   sys::path::Style style = sys::path::Style::windows;
1177   if (sys::path::is_absolute(WorkingDir.get(), sys::path::Style::posix)) {
1178     style = sys::path::Style::posix;
1179   }
1180 
1181   std::string Result = WorkingDir.get();
1182   StringRef Dir(Result);
1183   if (!Dir.endswith(sys::path::get_separator(style))) {
1184     Result += sys::path::get_separator(style);
1185   }
1186   Result.append(Path.data(), Path.size());
1187   Path.assign(Result.begin(), Result.end());
1188 
1189   return {};
1190 }
1191 
1192 directory_iterator RedirectingFileSystem::dir_begin(const Twine &Dir,
1193                                                     std::error_code &EC) {
1194   SmallString<256> Path;
1195   Dir.toVector(Path);
1196 
1197   EC = makeCanonical(Path);
1198   if (EC)
1199     return {};
1200 
1201   ErrorOr<RedirectingFileSystem::LookupResult> Result = lookupPath(Path);
1202   if (!Result) {
1203     EC = Result.getError();
1204     if (shouldFallBackToExternalFS(EC))
1205       return ExternalFS->dir_begin(Path, EC);
1206     return {};
1207   }
1208 
1209   // Use status to make sure the path exists and refers to a directory.
1210   ErrorOr<Status> S = status(Path, *Result);
1211   if (!S) {
1212     if (shouldFallBackToExternalFS(S.getError(), Result->E))
1213       return ExternalFS->dir_begin(Dir, EC);
1214     EC = S.getError();
1215     return {};
1216   }
1217   if (!S->isDirectory()) {
1218     EC = std::error_code(static_cast<int>(errc::not_a_directory),
1219                          std::system_category());
1220     return {};
1221   }
1222 
1223   // Create the appropriate directory iterator based on whether we found a
1224   // DirectoryRemapEntry or DirectoryEntry.
1225   directory_iterator DirIter;
1226   if (auto ExtRedirect = Result->getExternalRedirect()) {
1227     auto RE = cast<RedirectingFileSystem::RemapEntry>(Result->E);
1228     DirIter = ExternalFS->dir_begin(*ExtRedirect, EC);
1229 
1230     if (!RE->useExternalName(UseExternalNames)) {
1231       // Update the paths in the results to use the virtual directory's path.
1232       DirIter =
1233           directory_iterator(std::make_shared<RedirectingFSDirRemapIterImpl>(
1234               std::string(Path), DirIter));
1235     }
1236   } else {
1237     auto DE = cast<DirectoryEntry>(Result->E);
1238     DirIter = directory_iterator(std::make_shared<RedirectingFSDirIterImpl>(
1239         Path, DE->contents_begin(), DE->contents_end(), EC));
1240   }
1241 
1242   if (!shouldUseExternalFS())
1243     return DirIter;
1244   return directory_iterator(std::make_shared<CombiningDirIterImpl>(
1245       DirIter, ExternalFS, std::string(Path), EC));
1246 }
1247 
1248 void RedirectingFileSystem::setExternalContentsPrefixDir(StringRef PrefixDir) {
1249   ExternalContentsPrefixDir = PrefixDir.str();
1250 }
1251 
1252 StringRef RedirectingFileSystem::getExternalContentsPrefixDir() const {
1253   return ExternalContentsPrefixDir;
1254 }
1255 
1256 void RedirectingFileSystem::setFallthrough(bool Fallthrough) {
1257   IsFallthrough = Fallthrough;
1258 }
1259 
1260 std::vector<StringRef> RedirectingFileSystem::getRoots() const {
1261   std::vector<StringRef> R;
1262   for (const auto &Root : Roots)
1263     R.push_back(Root->getName());
1264   return R;
1265 }
1266 
1267 void RedirectingFileSystem::dump(raw_ostream &OS) const {
1268   for (const auto &Root : Roots)
1269     dumpEntry(OS, Root.get());
1270 }
1271 
1272 void RedirectingFileSystem::dumpEntry(raw_ostream &OS,
1273                                       RedirectingFileSystem::Entry *E,
1274                                       int NumSpaces) const {
1275   StringRef Name = E->getName();
1276   for (int i = 0, e = NumSpaces; i < e; ++i)
1277     OS << " ";
1278   OS << "'" << Name.str().c_str() << "'"
1279      << "\n";
1280 
1281   if (E->getKind() == RedirectingFileSystem::EK_Directory) {
1282     auto *DE = dyn_cast<RedirectingFileSystem::DirectoryEntry>(E);
1283     assert(DE && "Should be a directory");
1284 
1285     for (std::unique_ptr<Entry> &SubEntry :
1286          llvm::make_range(DE->contents_begin(), DE->contents_end()))
1287       dumpEntry(OS, SubEntry.get(), NumSpaces + 2);
1288   }
1289 }
1290 
1291 #if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
1292 LLVM_DUMP_METHOD void RedirectingFileSystem::dump() const { dump(dbgs()); }
1293 #endif
1294 
1295 /// A helper class to hold the common YAML parsing state.
1296 class llvm::vfs::RedirectingFileSystemParser {
1297   yaml::Stream &Stream;
1298 
1299   void error(yaml::Node *N, const Twine &Msg) { Stream.printError(N, Msg); }
1300 
1301   // false on error
1302   bool parseScalarString(yaml::Node *N, StringRef &Result,
1303                          SmallVectorImpl<char> &Storage) {
1304     const auto *S = dyn_cast<yaml::ScalarNode>(N);
1305 
1306     if (!S) {
1307       error(N, "expected string");
1308       return false;
1309     }
1310     Result = S->getValue(Storage);
1311     return true;
1312   }
1313 
1314   // false on error
1315   bool parseScalarBool(yaml::Node *N, bool &Result) {
1316     SmallString<5> Storage;
1317     StringRef Value;
1318     if (!parseScalarString(N, Value, Storage))
1319       return false;
1320 
1321     if (Value.equals_insensitive("true") || Value.equals_insensitive("on") ||
1322         Value.equals_insensitive("yes") || Value == "1") {
1323       Result = true;
1324       return true;
1325     } else if (Value.equals_insensitive("false") ||
1326                Value.equals_insensitive("off") ||
1327                Value.equals_insensitive("no") || Value == "0") {
1328       Result = false;
1329       return true;
1330     }
1331 
1332     error(N, "expected boolean value");
1333     return false;
1334   }
1335 
1336   struct KeyStatus {
1337     bool Required;
1338     bool Seen = false;
1339 
1340     KeyStatus(bool Required = false) : Required(Required) {}
1341   };
1342 
1343   using KeyStatusPair = std::pair<StringRef, KeyStatus>;
1344 
1345   // false on error
1346   bool checkDuplicateOrUnknownKey(yaml::Node *KeyNode, StringRef Key,
1347                                   DenseMap<StringRef, KeyStatus> &Keys) {
1348     if (!Keys.count(Key)) {
1349       error(KeyNode, "unknown key");
1350       return false;
1351     }
1352     KeyStatus &S = Keys[Key];
1353     if (S.Seen) {
1354       error(KeyNode, Twine("duplicate key '") + Key + "'");
1355       return false;
1356     }
1357     S.Seen = true;
1358     return true;
1359   }
1360 
1361   // false on error
1362   bool checkMissingKeys(yaml::Node *Obj, DenseMap<StringRef, KeyStatus> &Keys) {
1363     for (const auto &I : Keys) {
1364       if (I.second.Required && !I.second.Seen) {
1365         error(Obj, Twine("missing key '") + I.first + "'");
1366         return false;
1367       }
1368     }
1369     return true;
1370   }
1371 
1372 public:
1373   static RedirectingFileSystem::Entry *
1374   lookupOrCreateEntry(RedirectingFileSystem *FS, StringRef Name,
1375                       RedirectingFileSystem::Entry *ParentEntry = nullptr) {
1376     if (!ParentEntry) { // Look for a existent root
1377       for (const auto &Root : FS->Roots) {
1378         if (Name.equals(Root->getName())) {
1379           ParentEntry = Root.get();
1380           return ParentEntry;
1381         }
1382       }
1383     } else { // Advance to the next component
1384       auto *DE = dyn_cast<RedirectingFileSystem::DirectoryEntry>(ParentEntry);
1385       for (std::unique_ptr<RedirectingFileSystem::Entry> &Content :
1386            llvm::make_range(DE->contents_begin(), DE->contents_end())) {
1387         auto *DirContent =
1388             dyn_cast<RedirectingFileSystem::DirectoryEntry>(Content.get());
1389         if (DirContent && Name.equals(Content->getName()))
1390           return DirContent;
1391       }
1392     }
1393 
1394     // ... or create a new one
1395     std::unique_ptr<RedirectingFileSystem::Entry> E =
1396         std::make_unique<RedirectingFileSystem::DirectoryEntry>(
1397             Name, Status("", getNextVirtualUniqueID(),
1398                          std::chrono::system_clock::now(), 0, 0, 0,
1399                          file_type::directory_file, sys::fs::all_all));
1400 
1401     if (!ParentEntry) { // Add a new root to the overlay
1402       FS->Roots.push_back(std::move(E));
1403       ParentEntry = FS->Roots.back().get();
1404       return ParentEntry;
1405     }
1406 
1407     auto *DE = cast<RedirectingFileSystem::DirectoryEntry>(ParentEntry);
1408     DE->addContent(std::move(E));
1409     return DE->getLastContent();
1410   }
1411 
1412 private:
1413   void uniqueOverlayTree(RedirectingFileSystem *FS,
1414                          RedirectingFileSystem::Entry *SrcE,
1415                          RedirectingFileSystem::Entry *NewParentE = nullptr) {
1416     StringRef Name = SrcE->getName();
1417     switch (SrcE->getKind()) {
1418     case RedirectingFileSystem::EK_Directory: {
1419       auto *DE = cast<RedirectingFileSystem::DirectoryEntry>(SrcE);
1420       // Empty directories could be present in the YAML as a way to
1421       // describe a file for a current directory after some of its subdir
1422       // is parsed. This only leads to redundant walks, ignore it.
1423       if (!Name.empty())
1424         NewParentE = lookupOrCreateEntry(FS, Name, NewParentE);
1425       for (std::unique_ptr<RedirectingFileSystem::Entry> &SubEntry :
1426            llvm::make_range(DE->contents_begin(), DE->contents_end()))
1427         uniqueOverlayTree(FS, SubEntry.get(), NewParentE);
1428       break;
1429     }
1430     case RedirectingFileSystem::EK_DirectoryRemap: {
1431       assert(NewParentE && "Parent entry must exist");
1432       auto *DR = cast<RedirectingFileSystem::DirectoryRemapEntry>(SrcE);
1433       auto *DE = cast<RedirectingFileSystem::DirectoryEntry>(NewParentE);
1434       DE->addContent(
1435           std::make_unique<RedirectingFileSystem::DirectoryRemapEntry>(
1436               Name, DR->getExternalContentsPath(), DR->getUseName()));
1437       break;
1438     }
1439     case RedirectingFileSystem::EK_File: {
1440       assert(NewParentE && "Parent entry must exist");
1441       auto *FE = cast<RedirectingFileSystem::FileEntry>(SrcE);
1442       auto *DE = cast<RedirectingFileSystem::DirectoryEntry>(NewParentE);
1443       DE->addContent(std::make_unique<RedirectingFileSystem::FileEntry>(
1444           Name, FE->getExternalContentsPath(), FE->getUseName()));
1445       break;
1446     }
1447     }
1448   }
1449 
1450   std::unique_ptr<RedirectingFileSystem::Entry>
1451   parseEntry(yaml::Node *N, RedirectingFileSystem *FS, bool IsRootEntry) {
1452     auto *M = dyn_cast<yaml::MappingNode>(N);
1453     if (!M) {
1454       error(N, "expected mapping node for file or directory entry");
1455       return nullptr;
1456     }
1457 
1458     KeyStatusPair Fields[] = {
1459         KeyStatusPair("name", true),
1460         KeyStatusPair("type", true),
1461         KeyStatusPair("contents", false),
1462         KeyStatusPair("external-contents", false),
1463         KeyStatusPair("use-external-name", false),
1464     };
1465 
1466     DenseMap<StringRef, KeyStatus> Keys(std::begin(Fields), std::end(Fields));
1467 
1468     enum { CF_NotSet, CF_List, CF_External } ContentsField = CF_NotSet;
1469     std::vector<std::unique_ptr<RedirectingFileSystem::Entry>>
1470         EntryArrayContents;
1471     SmallString<256> ExternalContentsPath;
1472     SmallString<256> Name;
1473     yaml::Node *NameValueNode = nullptr;
1474     auto UseExternalName = RedirectingFileSystem::NK_NotSet;
1475     RedirectingFileSystem::EntryKind Kind;
1476 
1477     for (auto &I : *M) {
1478       StringRef Key;
1479       // Reuse the buffer for key and value, since we don't look at key after
1480       // parsing value.
1481       SmallString<256> Buffer;
1482       if (!parseScalarString(I.getKey(), Key, Buffer))
1483         return nullptr;
1484 
1485       if (!checkDuplicateOrUnknownKey(I.getKey(), Key, Keys))
1486         return nullptr;
1487 
1488       StringRef Value;
1489       if (Key == "name") {
1490         if (!parseScalarString(I.getValue(), Value, Buffer))
1491           return nullptr;
1492 
1493         NameValueNode = I.getValue();
1494         // Guarantee that old YAML files containing paths with ".." and "."
1495         // are properly canonicalized before read into the VFS.
1496         Name = canonicalize(Value).str();
1497       } else if (Key == "type") {
1498         if (!parseScalarString(I.getValue(), Value, Buffer))
1499           return nullptr;
1500         if (Value == "file")
1501           Kind = RedirectingFileSystem::EK_File;
1502         else if (Value == "directory")
1503           Kind = RedirectingFileSystem::EK_Directory;
1504         else if (Value == "directory-remap")
1505           Kind = RedirectingFileSystem::EK_DirectoryRemap;
1506         else {
1507           error(I.getValue(), "unknown value for 'type'");
1508           return nullptr;
1509         }
1510       } else if (Key == "contents") {
1511         if (ContentsField != CF_NotSet) {
1512           error(I.getKey(),
1513                 "entry already has 'contents' or 'external-contents'");
1514           return nullptr;
1515         }
1516         ContentsField = CF_List;
1517         auto *Contents = dyn_cast<yaml::SequenceNode>(I.getValue());
1518         if (!Contents) {
1519           // FIXME: this is only for directories, what about files?
1520           error(I.getValue(), "expected array");
1521           return nullptr;
1522         }
1523 
1524         for (auto &I : *Contents) {
1525           if (std::unique_ptr<RedirectingFileSystem::Entry> E =
1526                   parseEntry(&I, FS, /*IsRootEntry*/ false))
1527             EntryArrayContents.push_back(std::move(E));
1528           else
1529             return nullptr;
1530         }
1531       } else if (Key == "external-contents") {
1532         if (ContentsField != CF_NotSet) {
1533           error(I.getKey(),
1534                 "entry already has 'contents' or 'external-contents'");
1535           return nullptr;
1536         }
1537         ContentsField = CF_External;
1538         if (!parseScalarString(I.getValue(), Value, Buffer))
1539           return nullptr;
1540 
1541         SmallString<256> FullPath;
1542         if (FS->IsRelativeOverlay) {
1543           FullPath = FS->getExternalContentsPrefixDir();
1544           assert(!FullPath.empty() &&
1545                  "External contents prefix directory must exist");
1546           llvm::sys::path::append(FullPath, Value);
1547         } else {
1548           FullPath = Value;
1549         }
1550 
1551         // Guarantee that old YAML files containing paths with ".." and "."
1552         // are properly canonicalized before read into the VFS.
1553         FullPath = canonicalize(FullPath);
1554         ExternalContentsPath = FullPath.str();
1555       } else if (Key == "use-external-name") {
1556         bool Val;
1557         if (!parseScalarBool(I.getValue(), Val))
1558           return nullptr;
1559         UseExternalName = Val ? RedirectingFileSystem::NK_External
1560                               : RedirectingFileSystem::NK_Virtual;
1561       } else {
1562         llvm_unreachable("key missing from Keys");
1563       }
1564     }
1565 
1566     if (Stream.failed())
1567       return nullptr;
1568 
1569     // check for missing keys
1570     if (ContentsField == CF_NotSet) {
1571       error(N, "missing key 'contents' or 'external-contents'");
1572       return nullptr;
1573     }
1574     if (!checkMissingKeys(N, Keys))
1575       return nullptr;
1576 
1577     // check invalid configuration
1578     if (Kind == RedirectingFileSystem::EK_Directory &&
1579         UseExternalName != RedirectingFileSystem::NK_NotSet) {
1580       error(N, "'use-external-name' is not supported for 'directory' entries");
1581       return nullptr;
1582     }
1583 
1584     if (Kind == RedirectingFileSystem::EK_DirectoryRemap &&
1585         ContentsField == CF_List) {
1586       error(N, "'contents' is not supported for 'directory-remap' entries");
1587       return nullptr;
1588     }
1589 
1590     sys::path::Style path_style = sys::path::Style::native;
1591     if (IsRootEntry) {
1592       // VFS root entries may be in either Posix or Windows style.  Figure out
1593       // which style we have, and use it consistently.
1594       if (sys::path::is_absolute(Name, sys::path::Style::posix)) {
1595         path_style = sys::path::Style::posix;
1596       } else if (sys::path::is_absolute(Name, sys::path::Style::windows)) {
1597         path_style = sys::path::Style::windows;
1598       } else {
1599         assert(NameValueNode && "Name presence should be checked earlier");
1600         error(NameValueNode,
1601               "entry with relative path at the root level is not discoverable");
1602         return nullptr;
1603       }
1604     }
1605 
1606     // Remove trailing slash(es), being careful not to remove the root path
1607     StringRef Trimmed = Name;
1608     size_t RootPathLen = sys::path::root_path(Trimmed, path_style).size();
1609     while (Trimmed.size() > RootPathLen &&
1610            sys::path::is_separator(Trimmed.back(), path_style))
1611       Trimmed = Trimmed.slice(0, Trimmed.size() - 1);
1612 
1613     // Get the last component
1614     StringRef LastComponent = sys::path::filename(Trimmed, path_style);
1615 
1616     std::unique_ptr<RedirectingFileSystem::Entry> Result;
1617     switch (Kind) {
1618     case RedirectingFileSystem::EK_File:
1619       Result = std::make_unique<RedirectingFileSystem::FileEntry>(
1620           LastComponent, std::move(ExternalContentsPath), UseExternalName);
1621       break;
1622     case RedirectingFileSystem::EK_DirectoryRemap:
1623       Result = std::make_unique<RedirectingFileSystem::DirectoryRemapEntry>(
1624           LastComponent, std::move(ExternalContentsPath), UseExternalName);
1625       break;
1626     case RedirectingFileSystem::EK_Directory:
1627       Result = std::make_unique<RedirectingFileSystem::DirectoryEntry>(
1628           LastComponent, std::move(EntryArrayContents),
1629           Status("", getNextVirtualUniqueID(), std::chrono::system_clock::now(),
1630                  0, 0, 0, file_type::directory_file, sys::fs::all_all));
1631       break;
1632     }
1633 
1634     StringRef Parent = sys::path::parent_path(Trimmed, path_style);
1635     if (Parent.empty())
1636       return Result;
1637 
1638     // if 'name' contains multiple components, create implicit directory entries
1639     for (sys::path::reverse_iterator I = sys::path::rbegin(Parent, path_style),
1640                                      E = sys::path::rend(Parent);
1641          I != E; ++I) {
1642       std::vector<std::unique_ptr<RedirectingFileSystem::Entry>> Entries;
1643       Entries.push_back(std::move(Result));
1644       Result = std::make_unique<RedirectingFileSystem::DirectoryEntry>(
1645           *I, std::move(Entries),
1646           Status("", getNextVirtualUniqueID(), std::chrono::system_clock::now(),
1647                  0, 0, 0, file_type::directory_file, sys::fs::all_all));
1648     }
1649     return Result;
1650   }
1651 
1652 public:
1653   RedirectingFileSystemParser(yaml::Stream &S) : Stream(S) {}
1654 
1655   // false on error
1656   bool parse(yaml::Node *Root, RedirectingFileSystem *FS) {
1657     auto *Top = dyn_cast<yaml::MappingNode>(Root);
1658     if (!Top) {
1659       error(Root, "expected mapping node");
1660       return false;
1661     }
1662 
1663     KeyStatusPair Fields[] = {
1664         KeyStatusPair("version", true),
1665         KeyStatusPair("case-sensitive", false),
1666         KeyStatusPair("use-external-names", false),
1667         KeyStatusPair("overlay-relative", false),
1668         KeyStatusPair("fallthrough", false),
1669         KeyStatusPair("roots", true),
1670     };
1671 
1672     DenseMap<StringRef, KeyStatus> Keys(std::begin(Fields), std::end(Fields));
1673     std::vector<std::unique_ptr<RedirectingFileSystem::Entry>> RootEntries;
1674 
1675     // Parse configuration and 'roots'
1676     for (auto &I : *Top) {
1677       SmallString<10> KeyBuffer;
1678       StringRef Key;
1679       if (!parseScalarString(I.getKey(), Key, KeyBuffer))
1680         return false;
1681 
1682       if (!checkDuplicateOrUnknownKey(I.getKey(), Key, Keys))
1683         return false;
1684 
1685       if (Key == "roots") {
1686         auto *Roots = dyn_cast<yaml::SequenceNode>(I.getValue());
1687         if (!Roots) {
1688           error(I.getValue(), "expected array");
1689           return false;
1690         }
1691 
1692         for (auto &I : *Roots) {
1693           if (std::unique_ptr<RedirectingFileSystem::Entry> E =
1694                   parseEntry(&I, FS, /*IsRootEntry*/ true))
1695             RootEntries.push_back(std::move(E));
1696           else
1697             return false;
1698         }
1699       } else if (Key == "version") {
1700         StringRef VersionString;
1701         SmallString<4> Storage;
1702         if (!parseScalarString(I.getValue(), VersionString, Storage))
1703           return false;
1704         int Version;
1705         if (VersionString.getAsInteger<int>(10, Version)) {
1706           error(I.getValue(), "expected integer");
1707           return false;
1708         }
1709         if (Version < 0) {
1710           error(I.getValue(), "invalid version number");
1711           return false;
1712         }
1713         if (Version != 0) {
1714           error(I.getValue(), "version mismatch, expected 0");
1715           return false;
1716         }
1717       } else if (Key == "case-sensitive") {
1718         if (!parseScalarBool(I.getValue(), FS->CaseSensitive))
1719           return false;
1720       } else if (Key == "overlay-relative") {
1721         if (!parseScalarBool(I.getValue(), FS->IsRelativeOverlay))
1722           return false;
1723       } else if (Key == "use-external-names") {
1724         if (!parseScalarBool(I.getValue(), FS->UseExternalNames))
1725           return false;
1726       } else if (Key == "fallthrough") {
1727         if (!parseScalarBool(I.getValue(), FS->IsFallthrough))
1728           return false;
1729       } else {
1730         llvm_unreachable("key missing from Keys");
1731       }
1732     }
1733 
1734     if (Stream.failed())
1735       return false;
1736 
1737     if (!checkMissingKeys(Top, Keys))
1738       return false;
1739 
1740     // Now that we sucessefully parsed the YAML file, canonicalize the internal
1741     // representation to a proper directory tree so that we can search faster
1742     // inside the VFS.
1743     for (auto &E : RootEntries)
1744       uniqueOverlayTree(FS, E.get());
1745 
1746     return true;
1747   }
1748 };
1749 
1750 std::unique_ptr<RedirectingFileSystem>
1751 RedirectingFileSystem::create(std::unique_ptr<MemoryBuffer> Buffer,
1752                               SourceMgr::DiagHandlerTy DiagHandler,
1753                               StringRef YAMLFilePath, void *DiagContext,
1754                               IntrusiveRefCntPtr<FileSystem> ExternalFS) {
1755   SourceMgr SM;
1756   yaml::Stream Stream(Buffer->getMemBufferRef(), SM);
1757 
1758   SM.setDiagHandler(DiagHandler, DiagContext);
1759   yaml::document_iterator DI = Stream.begin();
1760   yaml::Node *Root = DI->getRoot();
1761   if (DI == Stream.end() || !Root) {
1762     SM.PrintMessage(SMLoc(), SourceMgr::DK_Error, "expected root node");
1763     return nullptr;
1764   }
1765 
1766   RedirectingFileSystemParser P(Stream);
1767 
1768   std::unique_ptr<RedirectingFileSystem> FS(
1769       new RedirectingFileSystem(ExternalFS));
1770 
1771   if (!YAMLFilePath.empty()) {
1772     // Use the YAML path from -ivfsoverlay to compute the dir to be prefixed
1773     // to each 'external-contents' path.
1774     //
1775     // Example:
1776     //    -ivfsoverlay dummy.cache/vfs/vfs.yaml
1777     // yields:
1778     //  FS->ExternalContentsPrefixDir => /<absolute_path_to>/dummy.cache/vfs
1779     //
1780     SmallString<256> OverlayAbsDir = sys::path::parent_path(YAMLFilePath);
1781     std::error_code EC = llvm::sys::fs::make_absolute(OverlayAbsDir);
1782     assert(!EC && "Overlay dir final path must be absolute");
1783     (void)EC;
1784     FS->setExternalContentsPrefixDir(OverlayAbsDir);
1785   }
1786 
1787   if (!P.parse(Root, FS.get()))
1788     return nullptr;
1789 
1790   return FS;
1791 }
1792 
1793 std::unique_ptr<RedirectingFileSystem> RedirectingFileSystem::create(
1794     ArrayRef<std::pair<std::string, std::string>> RemappedFiles,
1795     bool UseExternalNames, FileSystem &ExternalFS) {
1796   std::unique_ptr<RedirectingFileSystem> FS(
1797       new RedirectingFileSystem(&ExternalFS));
1798   FS->UseExternalNames = UseExternalNames;
1799 
1800   StringMap<RedirectingFileSystem::Entry *> Entries;
1801 
1802   for (auto &Mapping : llvm::reverse(RemappedFiles)) {
1803     SmallString<128> From = StringRef(Mapping.first);
1804     SmallString<128> To = StringRef(Mapping.second);
1805     {
1806       auto EC = ExternalFS.makeAbsolute(From);
1807       (void)EC;
1808       assert(!EC && "Could not make absolute path");
1809     }
1810 
1811     // Check if we've already mapped this file. The first one we see (in the
1812     // reverse iteration) wins.
1813     RedirectingFileSystem::Entry *&ToEntry = Entries[From];
1814     if (ToEntry)
1815       continue;
1816 
1817     // Add parent directories.
1818     RedirectingFileSystem::Entry *Parent = nullptr;
1819     StringRef FromDirectory = llvm::sys::path::parent_path(From);
1820     for (auto I = llvm::sys::path::begin(FromDirectory),
1821               E = llvm::sys::path::end(FromDirectory);
1822          I != E; ++I) {
1823       Parent = RedirectingFileSystemParser::lookupOrCreateEntry(FS.get(), *I,
1824                                                                 Parent);
1825     }
1826     assert(Parent && "File without a directory?");
1827     {
1828       auto EC = ExternalFS.makeAbsolute(To);
1829       (void)EC;
1830       assert(!EC && "Could not make absolute path");
1831     }
1832 
1833     // Add the file.
1834     auto NewFile = std::make_unique<RedirectingFileSystem::FileEntry>(
1835         llvm::sys::path::filename(From), To,
1836         UseExternalNames ? RedirectingFileSystem::NK_External
1837                          : RedirectingFileSystem::NK_Virtual);
1838     ToEntry = NewFile.get();
1839     cast<RedirectingFileSystem::DirectoryEntry>(Parent)->addContent(
1840         std::move(NewFile));
1841   }
1842 
1843   return FS;
1844 }
1845 
1846 RedirectingFileSystem::LookupResult::LookupResult(
1847     Entry *E, sys::path::const_iterator Start, sys::path::const_iterator End)
1848     : E(E) {
1849   assert(E != nullptr);
1850   // If the matched entry is a DirectoryRemapEntry, set ExternalRedirect to the
1851   // path of the directory it maps to in the external file system plus any
1852   // remaining path components in the provided iterator.
1853   if (auto *DRE = dyn_cast<RedirectingFileSystem::DirectoryRemapEntry>(E)) {
1854     SmallString<256> Redirect(DRE->getExternalContentsPath());
1855     sys::path::append(Redirect, Start, End,
1856                       getExistingStyle(DRE->getExternalContentsPath()));
1857     ExternalRedirect = std::string(Redirect);
1858   }
1859 }
1860 
1861 bool RedirectingFileSystem::shouldFallBackToExternalFS(
1862     std::error_code EC, RedirectingFileSystem::Entry *E) const {
1863   if (E && !isa<RedirectingFileSystem::DirectoryRemapEntry>(E))
1864     return false;
1865   return shouldUseExternalFS() && EC == llvm::errc::no_such_file_or_directory;
1866 }
1867 
1868 std::error_code
1869 RedirectingFileSystem::makeCanonical(SmallVectorImpl<char> &Path) const {
1870   if (std::error_code EC = makeAbsolute(Path))
1871     return EC;
1872 
1873   llvm::SmallString<256> CanonicalPath =
1874       canonicalize(StringRef(Path.data(), Path.size()));
1875   if (CanonicalPath.empty())
1876     return make_error_code(llvm::errc::invalid_argument);
1877 
1878   Path.assign(CanonicalPath.begin(), CanonicalPath.end());
1879   return {};
1880 }
1881 
1882 ErrorOr<RedirectingFileSystem::LookupResult>
1883 RedirectingFileSystem::lookupPath(StringRef Path) const {
1884   sys::path::const_iterator Start = sys::path::begin(Path);
1885   sys::path::const_iterator End = sys::path::end(Path);
1886   for (const auto &Root : Roots) {
1887     ErrorOr<RedirectingFileSystem::LookupResult> Result =
1888         lookupPathImpl(Start, End, Root.get());
1889     if (Result || Result.getError() != llvm::errc::no_such_file_or_directory)
1890       return Result;
1891   }
1892   return make_error_code(llvm::errc::no_such_file_or_directory);
1893 }
1894 
1895 ErrorOr<RedirectingFileSystem::LookupResult>
1896 RedirectingFileSystem::lookupPathImpl(
1897     sys::path::const_iterator Start, sys::path::const_iterator End,
1898     RedirectingFileSystem::Entry *From) const {
1899   assert(!isTraversalComponent(*Start) &&
1900          !isTraversalComponent(From->getName()) &&
1901          "Paths should not contain traversal components");
1902 
1903   StringRef FromName = From->getName();
1904 
1905   // Forward the search to the next component in case this is an empty one.
1906   if (!FromName.empty()) {
1907     if (!pathComponentMatches(*Start, FromName))
1908       return make_error_code(llvm::errc::no_such_file_or_directory);
1909 
1910     ++Start;
1911 
1912     if (Start == End) {
1913       // Match!
1914       return LookupResult(From, Start, End);
1915     }
1916   }
1917 
1918   if (isa<RedirectingFileSystem::FileEntry>(From))
1919     return make_error_code(llvm::errc::not_a_directory);
1920 
1921   if (isa<RedirectingFileSystem::DirectoryRemapEntry>(From))
1922     return LookupResult(From, Start, End);
1923 
1924   auto *DE = cast<RedirectingFileSystem::DirectoryEntry>(From);
1925   for (const std::unique_ptr<RedirectingFileSystem::Entry> &DirEntry :
1926        llvm::make_range(DE->contents_begin(), DE->contents_end())) {
1927     ErrorOr<RedirectingFileSystem::LookupResult> Result =
1928         lookupPathImpl(Start, End, DirEntry.get());
1929     if (Result || Result.getError() != llvm::errc::no_such_file_or_directory)
1930       return Result;
1931   }
1932 
1933   return make_error_code(llvm::errc::no_such_file_or_directory);
1934 }
1935 
1936 static Status getRedirectedFileStatus(const Twine &Path, bool UseExternalNames,
1937                                       Status ExternalStatus) {
1938   Status S = ExternalStatus;
1939   if (!UseExternalNames)
1940     S = Status::copyWithNewName(S, Path);
1941   S.IsVFSMapped = true;
1942   return S;
1943 }
1944 
1945 ErrorOr<Status> RedirectingFileSystem::status(
1946     const Twine &Path, const RedirectingFileSystem::LookupResult &Result) {
1947   if (Optional<StringRef> ExtRedirect = Result.getExternalRedirect()) {
1948     ErrorOr<Status> S = ExternalFS->status(*ExtRedirect);
1949     if (!S)
1950       return S;
1951     auto *RE = cast<RedirectingFileSystem::RemapEntry>(Result.E);
1952     return getRedirectedFileStatus(Path, RE->useExternalName(UseExternalNames),
1953                                    *S);
1954   }
1955 
1956   auto *DE = cast<RedirectingFileSystem::DirectoryEntry>(Result.E);
1957   return Status::copyWithNewName(DE->getStatus(), Path);
1958 }
1959 
1960 ErrorOr<Status> RedirectingFileSystem::status(const Twine &Path_) {
1961   SmallString<256> Path;
1962   Path_.toVector(Path);
1963 
1964   if (std::error_code EC = makeCanonical(Path))
1965     return EC;
1966 
1967   ErrorOr<RedirectingFileSystem::LookupResult> Result = lookupPath(Path);
1968   if (!Result) {
1969     if (shouldFallBackToExternalFS(Result.getError()))
1970       return ExternalFS->status(Path);
1971     return Result.getError();
1972   }
1973 
1974   ErrorOr<Status> S = status(Path, *Result);
1975   if (!S && shouldFallBackToExternalFS(S.getError(), Result->E))
1976     S = ExternalFS->status(Path);
1977   return S;
1978 }
1979 
1980 namespace {
1981 
1982 /// Provide a file wrapper with an overriden status.
1983 class FileWithFixedStatus : public File {
1984   std::unique_ptr<File> InnerFile;
1985   Status S;
1986 
1987 public:
1988   FileWithFixedStatus(std::unique_ptr<File> InnerFile, Status S)
1989       : InnerFile(std::move(InnerFile)), S(std::move(S)) {}
1990 
1991   ErrorOr<Status> status() override { return S; }
1992   ErrorOr<std::unique_ptr<llvm::MemoryBuffer>>
1993 
1994   getBuffer(const Twine &Name, int64_t FileSize, bool RequiresNullTerminator,
1995             bool IsVolatile) override {
1996     return InnerFile->getBuffer(Name, FileSize, RequiresNullTerminator,
1997                                 IsVolatile);
1998   }
1999 
2000   std::error_code close() override { return InnerFile->close(); }
2001 };
2002 
2003 } // namespace
2004 
2005 ErrorOr<std::unique_ptr<File>>
2006 RedirectingFileSystem::openFileForRead(const Twine &Path_) {
2007   SmallString<256> Path;
2008   Path_.toVector(Path);
2009 
2010   if (std::error_code EC = makeCanonical(Path))
2011     return EC;
2012 
2013   ErrorOr<RedirectingFileSystem::LookupResult> Result = lookupPath(Path);
2014   if (!Result) {
2015     if (shouldFallBackToExternalFS(Result.getError()))
2016       return ExternalFS->openFileForRead(Path);
2017     return Result.getError();
2018   }
2019 
2020   if (!Result->getExternalRedirect()) // FIXME: errc::not_a_file?
2021     return make_error_code(llvm::errc::invalid_argument);
2022 
2023   StringRef ExtRedirect = *Result->getExternalRedirect();
2024   auto *RE = cast<RedirectingFileSystem::RemapEntry>(Result->E);
2025 
2026   auto ExternalFile = ExternalFS->openFileForRead(ExtRedirect);
2027   if (!ExternalFile) {
2028     if (shouldFallBackToExternalFS(ExternalFile.getError(), Result->E))
2029       return ExternalFS->openFileForRead(Path);
2030     return ExternalFile;
2031   }
2032 
2033   auto ExternalStatus = (*ExternalFile)->status();
2034   if (!ExternalStatus)
2035     return ExternalStatus.getError();
2036 
2037   // FIXME: Update the status with the name and VFSMapped.
2038   Status S = getRedirectedFileStatus(
2039       Path, RE->useExternalName(UseExternalNames), *ExternalStatus);
2040   return std::unique_ptr<File>(
2041       std::make_unique<FileWithFixedStatus>(std::move(*ExternalFile), S));
2042 }
2043 
2044 std::error_code
2045 RedirectingFileSystem::getRealPath(const Twine &Path_,
2046                                    SmallVectorImpl<char> &Output) const {
2047   SmallString<256> Path;
2048   Path_.toVector(Path);
2049 
2050   if (std::error_code EC = makeCanonical(Path))
2051     return EC;
2052 
2053   ErrorOr<RedirectingFileSystem::LookupResult> Result = lookupPath(Path);
2054   if (!Result) {
2055     if (shouldFallBackToExternalFS(Result.getError()))
2056       return ExternalFS->getRealPath(Path, Output);
2057     return Result.getError();
2058   }
2059 
2060   // If we found FileEntry or DirectoryRemapEntry, look up the mapped
2061   // path in the external file system.
2062   if (auto ExtRedirect = Result->getExternalRedirect()) {
2063     auto P = ExternalFS->getRealPath(*ExtRedirect, Output);
2064     if (!P && shouldFallBackToExternalFS(P, Result->E)) {
2065       return ExternalFS->getRealPath(Path, Output);
2066     }
2067     return P;
2068   }
2069 
2070   // If we found a DirectoryEntry, still fall back to ExternalFS if allowed,
2071   // because directories don't have a single external contents path.
2072   return shouldUseExternalFS() ? ExternalFS->getRealPath(Path, Output)
2073                                : llvm::errc::invalid_argument;
2074 }
2075 
2076 std::unique_ptr<FileSystem>
2077 vfs::getVFSFromYAML(std::unique_ptr<MemoryBuffer> Buffer,
2078                     SourceMgr::DiagHandlerTy DiagHandler,
2079                     StringRef YAMLFilePath, void *DiagContext,
2080                     IntrusiveRefCntPtr<FileSystem> ExternalFS) {
2081   return RedirectingFileSystem::create(std::move(Buffer), DiagHandler,
2082                                        YAMLFilePath, DiagContext,
2083                                        std::move(ExternalFS));
2084 }
2085 
2086 static void getVFSEntries(RedirectingFileSystem::Entry *SrcE,
2087                           SmallVectorImpl<StringRef> &Path,
2088                           SmallVectorImpl<YAMLVFSEntry> &Entries) {
2089   auto Kind = SrcE->getKind();
2090   if (Kind == RedirectingFileSystem::EK_Directory) {
2091     auto *DE = dyn_cast<RedirectingFileSystem::DirectoryEntry>(SrcE);
2092     assert(DE && "Must be a directory");
2093     for (std::unique_ptr<RedirectingFileSystem::Entry> &SubEntry :
2094          llvm::make_range(DE->contents_begin(), DE->contents_end())) {
2095       Path.push_back(SubEntry->getName());
2096       getVFSEntries(SubEntry.get(), Path, Entries);
2097       Path.pop_back();
2098     }
2099     return;
2100   }
2101 
2102   if (Kind == RedirectingFileSystem::EK_DirectoryRemap) {
2103     auto *DR = dyn_cast<RedirectingFileSystem::DirectoryRemapEntry>(SrcE);
2104     assert(DR && "Must be a directory remap");
2105     SmallString<128> VPath;
2106     for (auto &Comp : Path)
2107       llvm::sys::path::append(VPath, Comp);
2108     Entries.push_back(
2109         YAMLVFSEntry(VPath.c_str(), DR->getExternalContentsPath()));
2110     return;
2111   }
2112 
2113   assert(Kind == RedirectingFileSystem::EK_File && "Must be a EK_File");
2114   auto *FE = dyn_cast<RedirectingFileSystem::FileEntry>(SrcE);
2115   assert(FE && "Must be a file");
2116   SmallString<128> VPath;
2117   for (auto &Comp : Path)
2118     llvm::sys::path::append(VPath, Comp);
2119   Entries.push_back(YAMLVFSEntry(VPath.c_str(), FE->getExternalContentsPath()));
2120 }
2121 
2122 void vfs::collectVFSFromYAML(std::unique_ptr<MemoryBuffer> Buffer,
2123                              SourceMgr::DiagHandlerTy DiagHandler,
2124                              StringRef YAMLFilePath,
2125                              SmallVectorImpl<YAMLVFSEntry> &CollectedEntries,
2126                              void *DiagContext,
2127                              IntrusiveRefCntPtr<FileSystem> ExternalFS) {
2128   std::unique_ptr<RedirectingFileSystem> VFS = RedirectingFileSystem::create(
2129       std::move(Buffer), DiagHandler, YAMLFilePath, DiagContext,
2130       std::move(ExternalFS));
2131   if (!VFS)
2132     return;
2133   ErrorOr<RedirectingFileSystem::LookupResult> RootResult =
2134       VFS->lookupPath("/");
2135   if (!RootResult)
2136     return;
2137   SmallVector<StringRef, 8> Components;
2138   Components.push_back("/");
2139   getVFSEntries(RootResult->E, Components, CollectedEntries);
2140 }
2141 
2142 UniqueID vfs::getNextVirtualUniqueID() {
2143   static std::atomic<unsigned> UID;
2144   unsigned ID = ++UID;
2145   // The following assumes that uint64_t max will never collide with a real
2146   // dev_t value from the OS.
2147   return UniqueID(std::numeric_limits<uint64_t>::max(), ID);
2148 }
2149 
2150 void YAMLVFSWriter::addEntry(StringRef VirtualPath, StringRef RealPath,
2151                              bool IsDirectory) {
2152   assert(sys::path::is_absolute(VirtualPath) && "virtual path not absolute");
2153   assert(sys::path::is_absolute(RealPath) && "real path not absolute");
2154   assert(!pathHasTraversal(VirtualPath) && "path traversal is not supported");
2155   Mappings.emplace_back(VirtualPath, RealPath, IsDirectory);
2156 }
2157 
2158 void YAMLVFSWriter::addFileMapping(StringRef VirtualPath, StringRef RealPath) {
2159   addEntry(VirtualPath, RealPath, /*IsDirectory=*/false);
2160 }
2161 
2162 void YAMLVFSWriter::addDirectoryMapping(StringRef VirtualPath,
2163                                         StringRef RealPath) {
2164   addEntry(VirtualPath, RealPath, /*IsDirectory=*/true);
2165 }
2166 
2167 namespace {
2168 
2169 class JSONWriter {
2170   llvm::raw_ostream &OS;
2171   SmallVector<StringRef, 16> DirStack;
2172 
2173   unsigned getDirIndent() { return 4 * DirStack.size(); }
2174   unsigned getFileIndent() { return 4 * (DirStack.size() + 1); }
2175   bool containedIn(StringRef Parent, StringRef Path);
2176   StringRef containedPart(StringRef Parent, StringRef Path);
2177   void startDirectory(StringRef Path);
2178   void endDirectory();
2179   void writeEntry(StringRef VPath, StringRef RPath);
2180 
2181 public:
2182   JSONWriter(llvm::raw_ostream &OS) : OS(OS) {}
2183 
2184   void write(ArrayRef<YAMLVFSEntry> Entries, Optional<bool> UseExternalNames,
2185              Optional<bool> IsCaseSensitive, Optional<bool> IsOverlayRelative,
2186              StringRef OverlayDir);
2187 };
2188 
2189 } // namespace
2190 
2191 bool JSONWriter::containedIn(StringRef Parent, StringRef Path) {
2192   using namespace llvm::sys;
2193 
2194   // Compare each path component.
2195   auto IParent = path::begin(Parent), EParent = path::end(Parent);
2196   for (auto IChild = path::begin(Path), EChild = path::end(Path);
2197        IParent != EParent && IChild != EChild; ++IParent, ++IChild) {
2198     if (*IParent != *IChild)
2199       return false;
2200   }
2201   // Have we exhausted the parent path?
2202   return IParent == EParent;
2203 }
2204 
2205 StringRef JSONWriter::containedPart(StringRef Parent, StringRef Path) {
2206   assert(!Parent.empty());
2207   assert(containedIn(Parent, Path));
2208   return Path.slice(Parent.size() + 1, StringRef::npos);
2209 }
2210 
2211 void JSONWriter::startDirectory(StringRef Path) {
2212   StringRef Name =
2213       DirStack.empty() ? Path : containedPart(DirStack.back(), Path);
2214   DirStack.push_back(Path);
2215   unsigned Indent = getDirIndent();
2216   OS.indent(Indent) << "{\n";
2217   OS.indent(Indent + 2) << "'type': 'directory',\n";
2218   OS.indent(Indent + 2) << "'name': \"" << llvm::yaml::escape(Name) << "\",\n";
2219   OS.indent(Indent + 2) << "'contents': [\n";
2220 }
2221 
2222 void JSONWriter::endDirectory() {
2223   unsigned Indent = getDirIndent();
2224   OS.indent(Indent + 2) << "]\n";
2225   OS.indent(Indent) << "}";
2226 
2227   DirStack.pop_back();
2228 }
2229 
2230 void JSONWriter::writeEntry(StringRef VPath, StringRef RPath) {
2231   unsigned Indent = getFileIndent();
2232   OS.indent(Indent) << "{\n";
2233   OS.indent(Indent + 2) << "'type': 'file',\n";
2234   OS.indent(Indent + 2) << "'name': \"" << llvm::yaml::escape(VPath) << "\",\n";
2235   OS.indent(Indent + 2) << "'external-contents': \""
2236                         << llvm::yaml::escape(RPath) << "\"\n";
2237   OS.indent(Indent) << "}";
2238 }
2239 
2240 void JSONWriter::write(ArrayRef<YAMLVFSEntry> Entries,
2241                        Optional<bool> UseExternalNames,
2242                        Optional<bool> IsCaseSensitive,
2243                        Optional<bool> IsOverlayRelative,
2244                        StringRef OverlayDir) {
2245   using namespace llvm::sys;
2246 
2247   OS << "{\n"
2248         "  'version': 0,\n";
2249   if (IsCaseSensitive.hasValue())
2250     OS << "  'case-sensitive': '"
2251        << (IsCaseSensitive.getValue() ? "true" : "false") << "',\n";
2252   if (UseExternalNames.hasValue())
2253     OS << "  'use-external-names': '"
2254        << (UseExternalNames.getValue() ? "true" : "false") << "',\n";
2255   bool UseOverlayRelative = false;
2256   if (IsOverlayRelative.hasValue()) {
2257     UseOverlayRelative = IsOverlayRelative.getValue();
2258     OS << "  'overlay-relative': '" << (UseOverlayRelative ? "true" : "false")
2259        << "',\n";
2260   }
2261   OS << "  'roots': [\n";
2262 
2263   if (!Entries.empty()) {
2264     const YAMLVFSEntry &Entry = Entries.front();
2265 
2266     startDirectory(
2267       Entry.IsDirectory ? Entry.VPath : path::parent_path(Entry.VPath)
2268     );
2269 
2270     StringRef RPath = Entry.RPath;
2271     if (UseOverlayRelative) {
2272       unsigned OverlayDirLen = OverlayDir.size();
2273       assert(RPath.substr(0, OverlayDirLen) == OverlayDir &&
2274              "Overlay dir must be contained in RPath");
2275       RPath = RPath.slice(OverlayDirLen, RPath.size());
2276     }
2277 
2278     bool IsCurrentDirEmpty = true;
2279     if (!Entry.IsDirectory) {
2280       writeEntry(path::filename(Entry.VPath), RPath);
2281       IsCurrentDirEmpty = false;
2282     }
2283 
2284     for (const auto &Entry : Entries.slice(1)) {
2285       StringRef Dir =
2286           Entry.IsDirectory ? Entry.VPath : path::parent_path(Entry.VPath);
2287       if (Dir == DirStack.back()) {
2288         if (!IsCurrentDirEmpty) {
2289           OS << ",\n";
2290         }
2291       } else {
2292         bool IsDirPoppedFromStack = false;
2293         while (!DirStack.empty() && !containedIn(DirStack.back(), Dir)) {
2294           OS << "\n";
2295           endDirectory();
2296           IsDirPoppedFromStack = true;
2297         }
2298         if (IsDirPoppedFromStack || !IsCurrentDirEmpty) {
2299           OS << ",\n";
2300         }
2301         startDirectory(Dir);
2302         IsCurrentDirEmpty = true;
2303       }
2304       StringRef RPath = Entry.RPath;
2305       if (UseOverlayRelative) {
2306         unsigned OverlayDirLen = OverlayDir.size();
2307         assert(RPath.substr(0, OverlayDirLen) == OverlayDir &&
2308                "Overlay dir must be contained in RPath");
2309         RPath = RPath.slice(OverlayDirLen, RPath.size());
2310       }
2311       if (!Entry.IsDirectory) {
2312         writeEntry(path::filename(Entry.VPath), RPath);
2313         IsCurrentDirEmpty = false;
2314       }
2315     }
2316 
2317     while (!DirStack.empty()) {
2318       OS << "\n";
2319       endDirectory();
2320     }
2321     OS << "\n";
2322   }
2323 
2324   OS << "  ]\n"
2325      << "}\n";
2326 }
2327 
2328 void YAMLVFSWriter::write(llvm::raw_ostream &OS) {
2329   llvm::sort(Mappings, [](const YAMLVFSEntry &LHS, const YAMLVFSEntry &RHS) {
2330     return LHS.VPath < RHS.VPath;
2331   });
2332 
2333   JSONWriter(OS).write(Mappings, UseExternalNames, IsCaseSensitive,
2334                        IsOverlayRelative, OverlayDir);
2335 }
2336 
2337 vfs::recursive_directory_iterator::recursive_directory_iterator(
2338     FileSystem &FS_, const Twine &Path, std::error_code &EC)
2339     : FS(&FS_) {
2340   directory_iterator I = FS->dir_begin(Path, EC);
2341   if (I != directory_iterator()) {
2342     State = std::make_shared<detail::RecDirIterState>();
2343     State->Stack.push(I);
2344   }
2345 }
2346 
2347 vfs::recursive_directory_iterator &
2348 recursive_directory_iterator::increment(std::error_code &EC) {
2349   assert(FS && State && !State->Stack.empty() && "incrementing past end");
2350   assert(!State->Stack.top()->path().empty() && "non-canonical end iterator");
2351   vfs::directory_iterator End;
2352 
2353   if (State->HasNoPushRequest)
2354     State->HasNoPushRequest = false;
2355   else {
2356     if (State->Stack.top()->type() == sys::fs::file_type::directory_file) {
2357       vfs::directory_iterator I = FS->dir_begin(State->Stack.top()->path(), EC);
2358       if (I != End) {
2359         State->Stack.push(I);
2360         return *this;
2361       }
2362     }
2363   }
2364 
2365   while (!State->Stack.empty() && State->Stack.top().increment(EC) == End)
2366     State->Stack.pop();
2367 
2368   if (State->Stack.empty())
2369     State.reset(); // end iterator
2370 
2371   return *this;
2372 }
2373