xref: /llvm-project/llvm/lib/Support/VirtualFileSystem.cpp (revision a903ecb4a26d8cf9a2e9e8369105682fd98f3982)
1 //===- VirtualFileSystem.cpp - Virtual File System Layer ------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file implements the VirtualFileSystem interface.
10 //
11 //===----------------------------------------------------------------------===//
12 
13 #include "llvm/Support/VirtualFileSystem.h"
14 #include "llvm/ADT/ArrayRef.h"
15 #include "llvm/ADT/DenseMap.h"
16 #include "llvm/ADT/IntrusiveRefCntPtr.h"
17 #include "llvm/ADT/Optional.h"
18 #include "llvm/ADT/STLExtras.h"
19 #include "llvm/ADT/SmallString.h"
20 #include "llvm/ADT/SmallVector.h"
21 #include "llvm/ADT/StringRef.h"
22 #include "llvm/ADT/StringSet.h"
23 #include "llvm/ADT/Twine.h"
24 #include "llvm/ADT/iterator_range.h"
25 #include "llvm/Config/llvm-config.h"
26 #include "llvm/Support/Casting.h"
27 #include "llvm/Support/Chrono.h"
28 #include "llvm/Support/Compiler.h"
29 #include "llvm/Support/Debug.h"
30 #include "llvm/Support/Errc.h"
31 #include "llvm/Support/ErrorHandling.h"
32 #include "llvm/Support/ErrorOr.h"
33 #include "llvm/Support/FileSystem.h"
34 #include "llvm/Support/FileSystem/UniqueID.h"
35 #include "llvm/Support/MemoryBuffer.h"
36 #include "llvm/Support/Path.h"
37 #include "llvm/Support/SMLoc.h"
38 #include "llvm/Support/SourceMgr.h"
39 #include "llvm/Support/YAMLParser.h"
40 #include "llvm/Support/raw_ostream.h"
41 #include <algorithm>
42 #include <atomic>
43 #include <cassert>
44 #include <cstdint>
45 #include <iterator>
46 #include <limits>
47 #include <memory>
48 #include <optional>
49 #include <string>
50 #include <system_error>
51 #include <utility>
52 #include <vector>
53 
54 using namespace llvm;
55 using namespace llvm::vfs;
56 
57 using llvm::sys::fs::file_t;
58 using llvm::sys::fs::file_status;
59 using llvm::sys::fs::file_type;
60 using llvm::sys::fs::kInvalidFile;
61 using llvm::sys::fs::perms;
62 using llvm::sys::fs::UniqueID;
63 
64 Status::Status(const file_status &Status)
65     : UID(Status.getUniqueID()), MTime(Status.getLastModificationTime()),
66       User(Status.getUser()), Group(Status.getGroup()), Size(Status.getSize()),
67       Type(Status.type()), Perms(Status.permissions()) {}
68 
69 Status::Status(const Twine &Name, UniqueID UID, sys::TimePoint<> MTime,
70                uint32_t User, uint32_t Group, uint64_t Size, file_type Type,
71                perms Perms)
72     : Name(Name.str()), UID(UID), MTime(MTime), User(User), Group(Group),
73       Size(Size), Type(Type), Perms(Perms) {}
74 
75 Status Status::copyWithNewSize(const Status &In, uint64_t NewSize) {
76   return Status(In.getName(), In.getUniqueID(), In.getLastModificationTime(),
77                 In.getUser(), In.getGroup(), NewSize, In.getType(),
78                 In.getPermissions());
79 }
80 
81 Status Status::copyWithNewName(const Status &In, const Twine &NewName) {
82   return Status(NewName, In.getUniqueID(), In.getLastModificationTime(),
83                 In.getUser(), In.getGroup(), In.getSize(), In.getType(),
84                 In.getPermissions());
85 }
86 
87 Status Status::copyWithNewName(const file_status &In, const Twine &NewName) {
88   return Status(NewName, In.getUniqueID(), In.getLastModificationTime(),
89                 In.getUser(), In.getGroup(), In.getSize(), In.type(),
90                 In.permissions());
91 }
92 
93 bool Status::equivalent(const Status &Other) const {
94   assert(isStatusKnown() && Other.isStatusKnown());
95   return getUniqueID() == Other.getUniqueID();
96 }
97 
98 bool Status::isDirectory() const { return Type == file_type::directory_file; }
99 
100 bool Status::isRegularFile() const { return Type == file_type::regular_file; }
101 
102 bool Status::isOther() const {
103   return exists() && !isRegularFile() && !isDirectory() && !isSymlink();
104 }
105 
106 bool Status::isSymlink() const { return Type == file_type::symlink_file; }
107 
108 bool Status::isStatusKnown() const { return Type != file_type::status_error; }
109 
110 bool Status::exists() const {
111   return isStatusKnown() && Type != file_type::file_not_found;
112 }
113 
114 File::~File() = default;
115 
116 FileSystem::~FileSystem() = default;
117 
118 ErrorOr<std::unique_ptr<MemoryBuffer>>
119 FileSystem::getBufferForFile(const llvm::Twine &Name, int64_t FileSize,
120                              bool RequiresNullTerminator, bool IsVolatile) {
121   auto F = openFileForRead(Name);
122   if (!F)
123     return F.getError();
124 
125   return (*F)->getBuffer(Name, FileSize, RequiresNullTerminator, IsVolatile);
126 }
127 
128 std::error_code FileSystem::makeAbsolute(SmallVectorImpl<char> &Path) const {
129   if (llvm::sys::path::is_absolute(Path))
130     return {};
131 
132   auto WorkingDir = getCurrentWorkingDirectory();
133   if (!WorkingDir)
134     return WorkingDir.getError();
135 
136   llvm::sys::fs::make_absolute(WorkingDir.get(), Path);
137   return {};
138 }
139 
140 std::error_code FileSystem::getRealPath(const Twine &Path,
141                                         SmallVectorImpl<char> &Output) const {
142   return errc::operation_not_permitted;
143 }
144 
145 std::error_code FileSystem::isLocal(const Twine &Path, bool &Result) {
146   return errc::operation_not_permitted;
147 }
148 
149 bool FileSystem::exists(const Twine &Path) {
150   auto Status = status(Path);
151   return Status && Status->exists();
152 }
153 
154 #if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
155 void FileSystem::dump() const { print(dbgs(), PrintType::RecursiveContents); }
156 #endif
157 
158 #ifndef NDEBUG
159 static bool isTraversalComponent(StringRef Component) {
160   return Component.equals("..") || Component.equals(".");
161 }
162 
163 static bool pathHasTraversal(StringRef Path) {
164   using namespace llvm::sys;
165 
166   for (StringRef Comp : llvm::make_range(path::begin(Path), path::end(Path)))
167     if (isTraversalComponent(Comp))
168       return true;
169   return false;
170 }
171 #endif
172 
173 //===-----------------------------------------------------------------------===/
174 // RealFileSystem implementation
175 //===-----------------------------------------------------------------------===/
176 
177 namespace {
178 
179 /// Wrapper around a raw file descriptor.
180 class RealFile : public File {
181   friend class RealFileSystem;
182 
183   file_t FD;
184   Status S;
185   std::string RealName;
186 
187   RealFile(file_t RawFD, StringRef NewName, StringRef NewRealPathName)
188       : FD(RawFD), S(NewName, {}, {}, {}, {}, {},
189                      llvm::sys::fs::file_type::status_error, {}),
190         RealName(NewRealPathName.str()) {
191     assert(FD != kInvalidFile && "Invalid or inactive file descriptor");
192   }
193 
194 public:
195   ~RealFile() override;
196 
197   ErrorOr<Status> status() override;
198   ErrorOr<std::string> getName() override;
199   ErrorOr<std::unique_ptr<MemoryBuffer>> getBuffer(const Twine &Name,
200                                                    int64_t FileSize,
201                                                    bool RequiresNullTerminator,
202                                                    bool IsVolatile) override;
203   std::error_code close() override;
204   void setPath(const Twine &Path) override;
205 };
206 
207 } // namespace
208 
209 RealFile::~RealFile() { close(); }
210 
211 ErrorOr<Status> RealFile::status() {
212   assert(FD != kInvalidFile && "cannot stat closed file");
213   if (!S.isStatusKnown()) {
214     file_status RealStatus;
215     if (std::error_code EC = sys::fs::status(FD, RealStatus))
216       return EC;
217     S = Status::copyWithNewName(RealStatus, S.getName());
218   }
219   return S;
220 }
221 
222 ErrorOr<std::string> RealFile::getName() {
223   return RealName.empty() ? S.getName().str() : RealName;
224 }
225 
226 ErrorOr<std::unique_ptr<MemoryBuffer>>
227 RealFile::getBuffer(const Twine &Name, int64_t FileSize,
228                     bool RequiresNullTerminator, bool IsVolatile) {
229   assert(FD != kInvalidFile && "cannot get buffer for closed file");
230   return MemoryBuffer::getOpenFile(FD, Name, FileSize, RequiresNullTerminator,
231                                    IsVolatile);
232 }
233 
234 std::error_code RealFile::close() {
235   std::error_code EC = sys::fs::closeFile(FD);
236   FD = kInvalidFile;
237   return EC;
238 }
239 
240 void RealFile::setPath(const Twine &Path) {
241   RealName = Path.str();
242   if (auto Status = status())
243     S = Status.get().copyWithNewName(Status.get(), Path);
244 }
245 
246 namespace {
247 
248 /// A file system according to your operating system.
249 /// This may be linked to the process's working directory, or maintain its own.
250 ///
251 /// Currently, its own working directory is emulated by storing the path and
252 /// sending absolute paths to llvm::sys::fs:: functions.
253 /// A more principled approach would be to push this down a level, modelling
254 /// the working dir as an llvm::sys::fs::WorkingDir or similar.
255 /// This would enable the use of openat()-style functions on some platforms.
256 class RealFileSystem : public FileSystem {
257 public:
258   explicit RealFileSystem(bool LinkCWDToProcess) {
259     if (!LinkCWDToProcess) {
260       SmallString<128> PWD, RealPWD;
261       if (llvm::sys::fs::current_path(PWD))
262         return; // Awful, but nothing to do here.
263       if (llvm::sys::fs::real_path(PWD, RealPWD))
264         WD = {PWD, PWD};
265       else
266         WD = {PWD, RealPWD};
267     }
268   }
269 
270   ErrorOr<Status> status(const Twine &Path) override;
271   ErrorOr<std::unique_ptr<File>> openFileForRead(const Twine &Path) override;
272   directory_iterator dir_begin(const Twine &Dir, std::error_code &EC) override;
273 
274   llvm::ErrorOr<std::string> getCurrentWorkingDirectory() const override;
275   std::error_code setCurrentWorkingDirectory(const Twine &Path) override;
276   std::error_code isLocal(const Twine &Path, bool &Result) override;
277   std::error_code getRealPath(const Twine &Path,
278                               SmallVectorImpl<char> &Output) const override;
279 
280 protected:
281   void printImpl(raw_ostream &OS, PrintType Type,
282                  unsigned IndentLevel) const override;
283 
284 private:
285   // If this FS has its own working dir, use it to make Path absolute.
286   // The returned twine is safe to use as long as both Storage and Path live.
287   Twine adjustPath(const Twine &Path, SmallVectorImpl<char> &Storage) const {
288     if (!WD)
289       return Path;
290     Path.toVector(Storage);
291     sys::fs::make_absolute(WD->Resolved, Storage);
292     return Storage;
293   }
294 
295   struct WorkingDirectory {
296     // The current working directory, without symlinks resolved. (echo $PWD).
297     SmallString<128> Specified;
298     // The current working directory, with links resolved. (readlink .).
299     SmallString<128> Resolved;
300   };
301   std::optional<WorkingDirectory> WD;
302 };
303 
304 } // namespace
305 
306 ErrorOr<Status> RealFileSystem::status(const Twine &Path) {
307   SmallString<256> Storage;
308   sys::fs::file_status RealStatus;
309   if (std::error_code EC =
310           sys::fs::status(adjustPath(Path, Storage), RealStatus))
311     return EC;
312   return Status::copyWithNewName(RealStatus, Path);
313 }
314 
315 ErrorOr<std::unique_ptr<File>>
316 RealFileSystem::openFileForRead(const Twine &Name) {
317   SmallString<256> RealName, Storage;
318   Expected<file_t> FDOrErr = sys::fs::openNativeFileForRead(
319       adjustPath(Name, Storage), sys::fs::OF_None, &RealName);
320   if (!FDOrErr)
321     return errorToErrorCode(FDOrErr.takeError());
322   return std::unique_ptr<File>(
323       new RealFile(*FDOrErr, Name.str(), RealName.str()));
324 }
325 
326 llvm::ErrorOr<std::string> RealFileSystem::getCurrentWorkingDirectory() const {
327   if (WD)
328     return std::string(WD->Specified.str());
329 
330   SmallString<128> Dir;
331   if (std::error_code EC = llvm::sys::fs::current_path(Dir))
332     return EC;
333   return std::string(Dir.str());
334 }
335 
336 std::error_code RealFileSystem::setCurrentWorkingDirectory(const Twine &Path) {
337   if (!WD)
338     return llvm::sys::fs::set_current_path(Path);
339 
340   SmallString<128> Absolute, Resolved, Storage;
341   adjustPath(Path, Storage).toVector(Absolute);
342   bool IsDir;
343   if (auto Err = llvm::sys::fs::is_directory(Absolute, IsDir))
344     return Err;
345   if (!IsDir)
346     return std::make_error_code(std::errc::not_a_directory);
347   if (auto Err = llvm::sys::fs::real_path(Absolute, Resolved))
348     return Err;
349   WD = {Absolute, Resolved};
350   return std::error_code();
351 }
352 
353 std::error_code RealFileSystem::isLocal(const Twine &Path, bool &Result) {
354   SmallString<256> Storage;
355   return llvm::sys::fs::is_local(adjustPath(Path, Storage), Result);
356 }
357 
358 std::error_code
359 RealFileSystem::getRealPath(const Twine &Path,
360                             SmallVectorImpl<char> &Output) const {
361   SmallString<256> Storage;
362   return llvm::sys::fs::real_path(adjustPath(Path, Storage), Output);
363 }
364 
365 void RealFileSystem::printImpl(raw_ostream &OS, PrintType Type,
366                                unsigned IndentLevel) const {
367   printIndent(OS, IndentLevel);
368   OS << "RealFileSystem using ";
369   if (WD)
370     OS << "own";
371   else
372     OS << "process";
373   OS << " CWD\n";
374 }
375 
376 IntrusiveRefCntPtr<FileSystem> vfs::getRealFileSystem() {
377   static IntrusiveRefCntPtr<FileSystem> FS(new RealFileSystem(true));
378   return FS;
379 }
380 
381 std::unique_ptr<FileSystem> vfs::createPhysicalFileSystem() {
382   return std::make_unique<RealFileSystem>(false);
383 }
384 
385 namespace {
386 
387 class RealFSDirIter : public llvm::vfs::detail::DirIterImpl {
388   llvm::sys::fs::directory_iterator Iter;
389 
390 public:
391   RealFSDirIter(const Twine &Path, std::error_code &EC) : Iter(Path, EC) {
392     if (Iter != llvm::sys::fs::directory_iterator())
393       CurrentEntry = directory_entry(Iter->path(), Iter->type());
394   }
395 
396   std::error_code increment() override {
397     std::error_code EC;
398     Iter.increment(EC);
399     CurrentEntry = (Iter == llvm::sys::fs::directory_iterator())
400                        ? directory_entry()
401                        : directory_entry(Iter->path(), Iter->type());
402     return EC;
403   }
404 };
405 
406 } // namespace
407 
408 directory_iterator RealFileSystem::dir_begin(const Twine &Dir,
409                                              std::error_code &EC) {
410   SmallString<128> Storage;
411   return directory_iterator(
412       std::make_shared<RealFSDirIter>(adjustPath(Dir, Storage), EC));
413 }
414 
415 //===-----------------------------------------------------------------------===/
416 // OverlayFileSystem implementation
417 //===-----------------------------------------------------------------------===/
418 
419 OverlayFileSystem::OverlayFileSystem(IntrusiveRefCntPtr<FileSystem> BaseFS) {
420   FSList.push_back(std::move(BaseFS));
421 }
422 
423 void OverlayFileSystem::pushOverlay(IntrusiveRefCntPtr<FileSystem> FS) {
424   FSList.push_back(FS);
425   // Synchronize added file systems by duplicating the working directory from
426   // the first one in the list.
427   FS->setCurrentWorkingDirectory(getCurrentWorkingDirectory().get());
428 }
429 
430 ErrorOr<Status> OverlayFileSystem::status(const Twine &Path) {
431   // FIXME: handle symlinks that cross file systems
432   for (iterator I = overlays_begin(), E = overlays_end(); I != E; ++I) {
433     ErrorOr<Status> Status = (*I)->status(Path);
434     if (Status || Status.getError() != llvm::errc::no_such_file_or_directory)
435       return Status;
436   }
437   return make_error_code(llvm::errc::no_such_file_or_directory);
438 }
439 
440 ErrorOr<std::unique_ptr<File>>
441 OverlayFileSystem::openFileForRead(const llvm::Twine &Path) {
442   // FIXME: handle symlinks that cross file systems
443   for (iterator I = overlays_begin(), E = overlays_end(); I != E; ++I) {
444     auto Result = (*I)->openFileForRead(Path);
445     if (Result || Result.getError() != llvm::errc::no_such_file_or_directory)
446       return Result;
447   }
448   return make_error_code(llvm::errc::no_such_file_or_directory);
449 }
450 
451 llvm::ErrorOr<std::string>
452 OverlayFileSystem::getCurrentWorkingDirectory() const {
453   // All file systems are synchronized, just take the first working directory.
454   return FSList.front()->getCurrentWorkingDirectory();
455 }
456 
457 std::error_code
458 OverlayFileSystem::setCurrentWorkingDirectory(const Twine &Path) {
459   for (auto &FS : FSList)
460     if (std::error_code EC = FS->setCurrentWorkingDirectory(Path))
461       return EC;
462   return {};
463 }
464 
465 std::error_code OverlayFileSystem::isLocal(const Twine &Path, bool &Result) {
466   for (auto &FS : FSList)
467     if (FS->exists(Path))
468       return FS->isLocal(Path, Result);
469   return errc::no_such_file_or_directory;
470 }
471 
472 std::error_code
473 OverlayFileSystem::getRealPath(const Twine &Path,
474                                SmallVectorImpl<char> &Output) const {
475   for (const auto &FS : FSList)
476     if (FS->exists(Path))
477       return FS->getRealPath(Path, Output);
478   return errc::no_such_file_or_directory;
479 }
480 
481 void OverlayFileSystem::printImpl(raw_ostream &OS, PrintType Type,
482                                   unsigned IndentLevel) const {
483   printIndent(OS, IndentLevel);
484   OS << "OverlayFileSystem\n";
485   if (Type == PrintType::Summary)
486     return;
487 
488   if (Type == PrintType::Contents)
489     Type = PrintType::Summary;
490   for (auto FS : overlays_range())
491     FS->print(OS, Type, IndentLevel + 1);
492 }
493 
494 llvm::vfs::detail::DirIterImpl::~DirIterImpl() = default;
495 
496 namespace {
497 
498 /// Combines and deduplicates directory entries across multiple file systems.
499 class CombiningDirIterImpl : public llvm::vfs::detail::DirIterImpl {
500   using FileSystemPtr = llvm::IntrusiveRefCntPtr<llvm::vfs::FileSystem>;
501 
502   /// Iterators to combine, processed in reverse order.
503   SmallVector<directory_iterator, 8> IterList;
504   /// The iterator currently being traversed.
505   directory_iterator CurrentDirIter;
506   /// The set of names already returned as entries.
507   llvm::StringSet<> SeenNames;
508 
509   /// Sets \c CurrentDirIter to the next iterator in the list, or leaves it as
510   /// is (at its end position) if we've already gone through them all.
511   std::error_code incrementIter(bool IsFirstTime) {
512     while (!IterList.empty()) {
513       CurrentDirIter = IterList.back();
514       IterList.pop_back();
515       if (CurrentDirIter != directory_iterator())
516         break; // found
517     }
518 
519     if (IsFirstTime && CurrentDirIter == directory_iterator())
520       return errc::no_such_file_or_directory;
521     return {};
522   }
523 
524   std::error_code incrementDirIter(bool IsFirstTime) {
525     assert((IsFirstTime || CurrentDirIter != directory_iterator()) &&
526            "incrementing past end");
527     std::error_code EC;
528     if (!IsFirstTime)
529       CurrentDirIter.increment(EC);
530     if (!EC && CurrentDirIter == directory_iterator())
531       EC = incrementIter(IsFirstTime);
532     return EC;
533   }
534 
535   std::error_code incrementImpl(bool IsFirstTime) {
536     while (true) {
537       std::error_code EC = incrementDirIter(IsFirstTime);
538       if (EC || CurrentDirIter == directory_iterator()) {
539         CurrentEntry = directory_entry();
540         return EC;
541       }
542       CurrentEntry = *CurrentDirIter;
543       StringRef Name = llvm::sys::path::filename(CurrentEntry.path());
544       if (SeenNames.insert(Name).second)
545         return EC; // name not seen before
546     }
547     llvm_unreachable("returned above");
548   }
549 
550 public:
551   CombiningDirIterImpl(ArrayRef<FileSystemPtr> FileSystems, std::string Dir,
552                        std::error_code &EC) {
553     for (auto FS : FileSystems) {
554       std::error_code FEC;
555       directory_iterator Iter = FS->dir_begin(Dir, FEC);
556       if (FEC && FEC != errc::no_such_file_or_directory) {
557         EC = FEC;
558         return;
559       }
560       if (!FEC)
561         IterList.push_back(Iter);
562     }
563     EC = incrementImpl(true);
564   }
565 
566   CombiningDirIterImpl(ArrayRef<directory_iterator> DirIters,
567                        std::error_code &EC)
568       : IterList(DirIters.begin(), DirIters.end()) {
569     EC = incrementImpl(true);
570   }
571 
572   std::error_code increment() override { return incrementImpl(false); }
573 };
574 
575 } // namespace
576 
577 directory_iterator OverlayFileSystem::dir_begin(const Twine &Dir,
578                                                 std::error_code &EC) {
579   directory_iterator Combined = directory_iterator(
580       std::make_shared<CombiningDirIterImpl>(FSList, Dir.str(), EC));
581   if (EC)
582     return {};
583   return Combined;
584 }
585 
586 void ProxyFileSystem::anchor() {}
587 
588 namespace llvm {
589 namespace vfs {
590 
591 namespace detail {
592 
593 enum InMemoryNodeKind {
594   IME_File,
595   IME_Directory,
596   IME_HardLink,
597   IME_SymbolicLink,
598 };
599 
600 /// The in memory file system is a tree of Nodes. Every node can either be a
601 /// file, symlink, hardlink or a directory.
602 class InMemoryNode {
603   InMemoryNodeKind Kind;
604   std::string FileName;
605 
606 public:
607   InMemoryNode(llvm::StringRef FileName, InMemoryNodeKind Kind)
608       : Kind(Kind), FileName(std::string(llvm::sys::path::filename(FileName))) {
609   }
610   virtual ~InMemoryNode() = default;
611 
612   /// Return the \p Status for this node. \p RequestedName should be the name
613   /// through which the caller referred to this node. It will override
614   /// \p Status::Name in the return value, to mimic the behavior of \p RealFile.
615   virtual Status getStatus(const Twine &RequestedName) const = 0;
616 
617   /// Get the filename of this node (the name without the directory part).
618   StringRef getFileName() const { return FileName; }
619   InMemoryNodeKind getKind() const { return Kind; }
620   virtual std::string toString(unsigned Indent) const = 0;
621 };
622 
623 class InMemoryFile : public InMemoryNode {
624   Status Stat;
625   std::unique_ptr<llvm::MemoryBuffer> Buffer;
626 
627 public:
628   InMemoryFile(Status Stat, std::unique_ptr<llvm::MemoryBuffer> Buffer)
629       : InMemoryNode(Stat.getName(), IME_File), Stat(std::move(Stat)),
630         Buffer(std::move(Buffer)) {}
631 
632   Status getStatus(const Twine &RequestedName) const override {
633     return Status::copyWithNewName(Stat, RequestedName);
634   }
635   llvm::MemoryBuffer *getBuffer() const { return Buffer.get(); }
636 
637   std::string toString(unsigned Indent) const override {
638     return (std::string(Indent, ' ') + Stat.getName() + "\n").str();
639   }
640 
641   static bool classof(const InMemoryNode *N) {
642     return N->getKind() == IME_File;
643   }
644 };
645 
646 namespace {
647 
648 class InMemoryHardLink : public InMemoryNode {
649   const InMemoryFile &ResolvedFile;
650 
651 public:
652   InMemoryHardLink(StringRef Path, const InMemoryFile &ResolvedFile)
653       : InMemoryNode(Path, IME_HardLink), ResolvedFile(ResolvedFile) {}
654   const InMemoryFile &getResolvedFile() const { return ResolvedFile; }
655 
656   Status getStatus(const Twine &RequestedName) const override {
657     return ResolvedFile.getStatus(RequestedName);
658   }
659 
660   std::string toString(unsigned Indent) const override {
661     return std::string(Indent, ' ') + "HardLink to -> " +
662            ResolvedFile.toString(0);
663   }
664 
665   static bool classof(const InMemoryNode *N) {
666     return N->getKind() == IME_HardLink;
667   }
668 };
669 
670 class InMemorySymbolicLink : public InMemoryNode {
671   std::string TargetPath;
672   Status Stat;
673 
674 public:
675   InMemorySymbolicLink(StringRef Path, StringRef TargetPath, Status Stat)
676       : InMemoryNode(Path, IME_SymbolicLink), TargetPath(std::move(TargetPath)),
677         Stat(Stat) {}
678 
679   std::string toString(unsigned Indent) const override {
680     return std::string(Indent, ' ') + "SymbolicLink to -> " + TargetPath;
681   }
682 
683   Status getStatus(const Twine &RequestedName) const override {
684     return Status::copyWithNewName(Stat, RequestedName);
685   }
686 
687   StringRef getTargetPath() const { return TargetPath; }
688 
689   static bool classof(const InMemoryNode *N) {
690     return N->getKind() == IME_SymbolicLink;
691   }
692 };
693 
694 /// Adapt a InMemoryFile for VFS' File interface.  The goal is to make
695 /// \p InMemoryFileAdaptor mimic as much as possible the behavior of
696 /// \p RealFile.
697 class InMemoryFileAdaptor : public File {
698   const InMemoryFile &Node;
699   /// The name to use when returning a Status for this file.
700   std::string RequestedName;
701 
702 public:
703   explicit InMemoryFileAdaptor(const InMemoryFile &Node,
704                                std::string RequestedName)
705       : Node(Node), RequestedName(std::move(RequestedName)) {}
706 
707   llvm::ErrorOr<Status> status() override {
708     return Node.getStatus(RequestedName);
709   }
710 
711   llvm::ErrorOr<std::unique_ptr<llvm::MemoryBuffer>>
712   getBuffer(const Twine &Name, int64_t FileSize, bool RequiresNullTerminator,
713             bool IsVolatile) override {
714     llvm::MemoryBuffer *Buf = Node.getBuffer();
715     return llvm::MemoryBuffer::getMemBuffer(
716         Buf->getBuffer(), Buf->getBufferIdentifier(), RequiresNullTerminator);
717   }
718 
719   std::error_code close() override { return {}; }
720 
721   void setPath(const Twine &Path) override { RequestedName = Path.str(); }
722 };
723 } // namespace
724 
725 class InMemoryDirectory : public InMemoryNode {
726   Status Stat;
727   llvm::StringMap<std::unique_ptr<InMemoryNode>> Entries;
728 
729 public:
730   InMemoryDirectory(Status Stat)
731       : InMemoryNode(Stat.getName(), IME_Directory), Stat(std::move(Stat)) {}
732 
733   /// Return the \p Status for this node. \p RequestedName should be the name
734   /// through which the caller referred to this node. It will override
735   /// \p Status::Name in the return value, to mimic the behavior of \p RealFile.
736   Status getStatus(const Twine &RequestedName) const override {
737     return Status::copyWithNewName(Stat, RequestedName);
738   }
739 
740   UniqueID getUniqueID() const { return Stat.getUniqueID(); }
741 
742   InMemoryNode *getChild(StringRef Name) const {
743     auto I = Entries.find(Name);
744     if (I != Entries.end())
745       return I->second.get();
746     return nullptr;
747   }
748 
749   InMemoryNode *addChild(StringRef Name, std::unique_ptr<InMemoryNode> Child) {
750     return Entries.insert(make_pair(Name, std::move(Child)))
751         .first->second.get();
752   }
753 
754   using const_iterator = decltype(Entries)::const_iterator;
755 
756   const_iterator begin() const { return Entries.begin(); }
757   const_iterator end() const { return Entries.end(); }
758 
759   std::string toString(unsigned Indent) const override {
760     std::string Result =
761         (std::string(Indent, ' ') + Stat.getName() + "\n").str();
762     for (const auto &Entry : Entries)
763       Result += Entry.second->toString(Indent + 2);
764     return Result;
765   }
766 
767   static bool classof(const InMemoryNode *N) {
768     return N->getKind() == IME_Directory;
769   }
770 };
771 
772 } // namespace detail
773 
774 // The UniqueID of in-memory files is derived from path and content.
775 // This avoids difficulties in creating exactly equivalent in-memory FSes,
776 // as often needed in multithreaded programs.
777 static sys::fs::UniqueID getUniqueID(hash_code Hash) {
778   return sys::fs::UniqueID(std::numeric_limits<uint64_t>::max(),
779                            uint64_t(size_t(Hash)));
780 }
781 static sys::fs::UniqueID getFileID(sys::fs::UniqueID Parent,
782                                    llvm::StringRef Name,
783                                    llvm::StringRef Contents) {
784   return getUniqueID(llvm::hash_combine(Parent.getFile(), Name, Contents));
785 }
786 static sys::fs::UniqueID getDirectoryID(sys::fs::UniqueID Parent,
787                                         llvm::StringRef Name) {
788   return getUniqueID(llvm::hash_combine(Parent.getFile(), Name));
789 }
790 
791 Status detail::NewInMemoryNodeInfo::makeStatus() const {
792   UniqueID UID =
793       (Type == sys::fs::file_type::directory_file)
794           ? getDirectoryID(DirUID, Name)
795           : getFileID(DirUID, Name, Buffer ? Buffer->getBuffer() : "");
796 
797   return Status(Path, UID, llvm::sys::toTimePoint(ModificationTime), User,
798                 Group, Buffer ? Buffer->getBufferSize() : 0, Type, Perms);
799 }
800 
801 InMemoryFileSystem::InMemoryFileSystem(bool UseNormalizedPaths)
802     : Root(new detail::InMemoryDirectory(
803           Status("", getDirectoryID(llvm::sys::fs::UniqueID(), ""),
804                  llvm::sys::TimePoint<>(), 0, 0, 0,
805                  llvm::sys::fs::file_type::directory_file,
806                  llvm::sys::fs::perms::all_all))),
807       UseNormalizedPaths(UseNormalizedPaths) {}
808 
809 InMemoryFileSystem::~InMemoryFileSystem() = default;
810 
811 std::string InMemoryFileSystem::toString() const {
812   return Root->toString(/*Indent=*/0);
813 }
814 
815 bool InMemoryFileSystem::addFile(const Twine &P, time_t ModificationTime,
816                                  std::unique_ptr<llvm::MemoryBuffer> Buffer,
817                                  std::optional<uint32_t> User,
818                                  std::optional<uint32_t> Group,
819                                  std::optional<llvm::sys::fs::file_type> Type,
820                                  std::optional<llvm::sys::fs::perms> Perms,
821                                  MakeNodeFn MakeNode) {
822   SmallString<128> Path;
823   P.toVector(Path);
824 
825   // Fix up relative paths. This just prepends the current working directory.
826   std::error_code EC = makeAbsolute(Path);
827   assert(!EC);
828   (void)EC;
829 
830   if (useNormalizedPaths())
831     llvm::sys::path::remove_dots(Path, /*remove_dot_dot=*/true);
832 
833   if (Path.empty())
834     return false;
835 
836   detail::InMemoryDirectory *Dir = Root.get();
837   auto I = llvm::sys::path::begin(Path), E = sys::path::end(Path);
838   const auto ResolvedUser = User.value_or(0);
839   const auto ResolvedGroup = Group.value_or(0);
840   const auto ResolvedType = Type.value_or(sys::fs::file_type::regular_file);
841   const auto ResolvedPerms = Perms.value_or(sys::fs::all_all);
842   // Any intermediate directories we create should be accessible by
843   // the owner, even if Perms says otherwise for the final path.
844   const auto NewDirectoryPerms = ResolvedPerms | sys::fs::owner_all;
845   while (true) {
846     StringRef Name = *I;
847     detail::InMemoryNode *Node = Dir->getChild(Name);
848     ++I;
849     if (!Node) {
850       if (I == E) {
851         // End of the path.
852         Dir->addChild(
853             Name, MakeNode({Dir->getUniqueID(), Path, Name, ModificationTime,
854                             std::move(Buffer), ResolvedUser, ResolvedGroup,
855                             ResolvedType, ResolvedPerms}));
856         return true;
857       }
858 
859       // Create a new directory. Use the path up to here.
860       Status Stat(
861           StringRef(Path.str().begin(), Name.end() - Path.str().begin()),
862           getDirectoryID(Dir->getUniqueID(), Name),
863           llvm::sys::toTimePoint(ModificationTime), ResolvedUser, ResolvedGroup,
864           0, sys::fs::file_type::directory_file, NewDirectoryPerms);
865       Dir = cast<detail::InMemoryDirectory>(Dir->addChild(
866           Name, std::make_unique<detail::InMemoryDirectory>(std::move(Stat))));
867       continue;
868     }
869 
870     if (auto *NewDir = dyn_cast<detail::InMemoryDirectory>(Node)) {
871       Dir = NewDir;
872     } else {
873       assert((isa<detail::InMemoryFile>(Node) ||
874               isa<detail::InMemoryHardLink>(Node)) &&
875              "Must be either file, hardlink or directory!");
876 
877       // Trying to insert a directory in place of a file.
878       if (I != E)
879         return false;
880 
881       // Return false only if the new file is different from the existing one.
882       if (auto Link = dyn_cast<detail::InMemoryHardLink>(Node)) {
883         return Link->getResolvedFile().getBuffer()->getBuffer() ==
884                Buffer->getBuffer();
885       }
886       return cast<detail::InMemoryFile>(Node)->getBuffer()->getBuffer() ==
887              Buffer->getBuffer();
888     }
889   }
890 }
891 
892 bool InMemoryFileSystem::addFile(const Twine &P, time_t ModificationTime,
893                                  std::unique_ptr<llvm::MemoryBuffer> Buffer,
894                                  std::optional<uint32_t> User,
895                                  std::optional<uint32_t> Group,
896                                  std::optional<llvm::sys::fs::file_type> Type,
897                                  std::optional<llvm::sys::fs::perms> Perms) {
898   return addFile(P, ModificationTime, std::move(Buffer), User, Group, Type,
899                  Perms,
900                  [](detail::NewInMemoryNodeInfo NNI)
901                      -> std::unique_ptr<detail::InMemoryNode> {
902                    Status Stat = NNI.makeStatus();
903                    if (Stat.getType() == sys::fs::file_type::directory_file)
904                      return std::make_unique<detail::InMemoryDirectory>(Stat);
905                    return std::make_unique<detail::InMemoryFile>(
906                        Stat, std::move(NNI.Buffer));
907                  });
908 }
909 
910 bool InMemoryFileSystem::addFileNoOwn(
911     const Twine &P, time_t ModificationTime,
912     const llvm::MemoryBufferRef &Buffer, std::optional<uint32_t> User,
913     std::optional<uint32_t> Group, std::optional<llvm::sys::fs::file_type> Type,
914     std::optional<llvm::sys::fs::perms> Perms) {
915   return addFile(P, ModificationTime, llvm::MemoryBuffer::getMemBuffer(Buffer),
916                  std::move(User), std::move(Group), std::move(Type),
917                  std::move(Perms),
918                  [](detail::NewInMemoryNodeInfo NNI)
919                      -> std::unique_ptr<detail::InMemoryNode> {
920                    Status Stat = NNI.makeStatus();
921                    if (Stat.getType() == sys::fs::file_type::directory_file)
922                      return std::make_unique<detail::InMemoryDirectory>(Stat);
923                    return std::make_unique<detail::InMemoryFile>(
924                        Stat, std::move(NNI.Buffer));
925                  });
926 }
927 
928 detail::NamedNodeOrError
929 InMemoryFileSystem::lookupNode(const Twine &P, bool FollowFinalSymlink,
930                                size_t SymlinkDepth) const {
931   SmallString<128> Path;
932   P.toVector(Path);
933 
934   // Fix up relative paths. This just prepends the current working directory.
935   std::error_code EC = makeAbsolute(Path);
936   assert(!EC);
937   (void)EC;
938 
939   if (useNormalizedPaths())
940     llvm::sys::path::remove_dots(Path, /*remove_dot_dot=*/true);
941 
942   const detail::InMemoryDirectory *Dir = Root.get();
943   if (Path.empty())
944     return detail::NamedNodeOrError(Path, Dir);
945 
946   auto I = llvm::sys::path::begin(Path), E = llvm::sys::path::end(Path);
947   while (true) {
948     detail::InMemoryNode *Node = Dir->getChild(*I);
949     ++I;
950     if (!Node)
951       return errc::no_such_file_or_directory;
952 
953     if (auto Symlink = dyn_cast<detail::InMemorySymbolicLink>(Node)) {
954       // If we're at the end of the path, and we're not following through
955       // terminal symlinks, then we're done.
956       if (I == E && !FollowFinalSymlink)
957         return detail::NamedNodeOrError(Path, Symlink);
958 
959       if (SymlinkDepth > InMemoryFileSystem::MaxSymlinkDepth)
960         return errc::no_such_file_or_directory;
961 
962       SmallString<128> TargetPath = Symlink->getTargetPath();
963       if (std::error_code EC = makeAbsolute(TargetPath))
964         return EC;
965 
966       // Keep going with the target. We always want to follow symlinks here
967       // because we're either at the end of a path that we want to follow, or
968       // not at the end of a path, in which case we need to follow the symlink
969       // regardless.
970       auto Target =
971           lookupNode(TargetPath, /*FollowFinalSymlink=*/true, SymlinkDepth + 1);
972       if (!Target || I == E)
973         return Target;
974 
975       if (!isa<detail::InMemoryDirectory>(*Target))
976         return errc::no_such_file_or_directory;
977 
978       // Otherwise, continue on the search in the symlinked directory.
979       Dir = cast<detail::InMemoryDirectory>(*Target);
980       continue;
981     }
982 
983     // Return the file if it's at the end of the path.
984     if (auto File = dyn_cast<detail::InMemoryFile>(Node)) {
985       if (I == E)
986         return detail::NamedNodeOrError(Path, File);
987       return errc::no_such_file_or_directory;
988     }
989 
990     // If Node is HardLink then return the resolved file.
991     if (auto File = dyn_cast<detail::InMemoryHardLink>(Node)) {
992       if (I == E)
993         return detail::NamedNodeOrError(Path, &File->getResolvedFile());
994       return errc::no_such_file_or_directory;
995     }
996     // Traverse directories.
997     Dir = cast<detail::InMemoryDirectory>(Node);
998     if (I == E)
999       return detail::NamedNodeOrError(Path, Dir);
1000   }
1001 }
1002 
1003 bool InMemoryFileSystem::addHardLink(const Twine &NewLink,
1004                                      const Twine &Target) {
1005   auto NewLinkNode = lookupNode(NewLink, /*FollowFinalSymlink=*/false);
1006   // Whether symlinks in the hardlink target are followed is
1007   // implementation-defined in POSIX.
1008   // We're following symlinks here to be consistent with macOS.
1009   auto TargetNode = lookupNode(Target, /*FollowFinalSymlink=*/true);
1010   // FromPath must not have been added before. ToPath must have been added
1011   // before. Resolved ToPath must be a File.
1012   if (!TargetNode || NewLinkNode || !isa<detail::InMemoryFile>(*TargetNode))
1013     return false;
1014   return addFile(NewLink, 0, nullptr, std::nullopt, std::nullopt, std::nullopt,
1015                  std::nullopt, [&](detail::NewInMemoryNodeInfo NNI) {
1016                    return std::make_unique<detail::InMemoryHardLink>(
1017                        NNI.Path.str(),
1018                        *cast<detail::InMemoryFile>(*TargetNode));
1019                  });
1020 }
1021 
1022 bool InMemoryFileSystem::addSymbolicLink(
1023     const Twine &NewLink, const Twine &Target, time_t ModificationTime,
1024     std::optional<uint32_t> User, std::optional<uint32_t> Group,
1025     std::optional<llvm::sys::fs::perms> Perms) {
1026   auto NewLinkNode = lookupNode(NewLink, /*FollowFinalSymlink=*/false);
1027   if (NewLinkNode)
1028     return false;
1029 
1030   SmallString<128> NewLinkStr, TargetStr;
1031   NewLink.toVector(NewLinkStr);
1032   Target.toVector(TargetStr);
1033 
1034   return addFile(NewLinkStr, ModificationTime, nullptr, User, Group,
1035                  sys::fs::file_type::symlink_file, Perms,
1036                  [&](detail::NewInMemoryNodeInfo NNI) {
1037                    return std::make_unique<detail::InMemorySymbolicLink>(
1038                        NewLinkStr, TargetStr, NNI.makeStatus());
1039                  });
1040 }
1041 
1042 llvm::ErrorOr<Status> InMemoryFileSystem::status(const Twine &Path) {
1043   auto Node = lookupNode(Path, /*FollowFinalSymlink=*/true);
1044   if (Node)
1045     return (*Node)->getStatus(Path);
1046   return Node.getError();
1047 }
1048 
1049 llvm::ErrorOr<std::unique_ptr<File>>
1050 InMemoryFileSystem::openFileForRead(const Twine &Path) {
1051   auto Node = lookupNode(Path,/*FollowFinalSymlink=*/true);
1052   if (!Node)
1053     return Node.getError();
1054 
1055   // When we have a file provide a heap-allocated wrapper for the memory buffer
1056   // to match the ownership semantics for File.
1057   if (auto *F = dyn_cast<detail::InMemoryFile>(*Node))
1058     return std::unique_ptr<File>(
1059         new detail::InMemoryFileAdaptor(*F, Path.str()));
1060 
1061   // FIXME: errc::not_a_file?
1062   return make_error_code(llvm::errc::invalid_argument);
1063 }
1064 
1065 /// Adaptor from InMemoryDir::iterator to directory_iterator.
1066 class InMemoryFileSystem::DirIterator : public llvm::vfs::detail::DirIterImpl {
1067   const InMemoryFileSystem *FS;
1068   detail::InMemoryDirectory::const_iterator I;
1069   detail::InMemoryDirectory::const_iterator E;
1070   std::string RequestedDirName;
1071 
1072   void setCurrentEntry() {
1073     if (I != E) {
1074       SmallString<256> Path(RequestedDirName);
1075       llvm::sys::path::append(Path, I->second->getFileName());
1076       sys::fs::file_type Type = sys::fs::file_type::type_unknown;
1077       switch (I->second->getKind()) {
1078       case detail::IME_File:
1079       case detail::IME_HardLink:
1080         Type = sys::fs::file_type::regular_file;
1081         break;
1082       case detail::IME_Directory:
1083         Type = sys::fs::file_type::directory_file;
1084         break;
1085       case detail::IME_SymbolicLink:
1086         if (auto SymlinkTarget =
1087                 FS->lookupNode(Path, /*FollowFinalSymlink=*/true)) {
1088           Path = SymlinkTarget.getName();
1089           Type = (*SymlinkTarget)->getStatus(Path).getType();
1090         }
1091         break;
1092       }
1093       CurrentEntry = directory_entry(std::string(Path.str()), Type);
1094     } else {
1095       // When we're at the end, make CurrentEntry invalid and DirIterImpl will
1096       // do the rest.
1097       CurrentEntry = directory_entry();
1098     }
1099   }
1100 
1101 public:
1102   DirIterator() = default;
1103 
1104   DirIterator(const InMemoryFileSystem *FS,
1105               const detail::InMemoryDirectory &Dir,
1106               std::string RequestedDirName)
1107       : FS(FS), I(Dir.begin()), E(Dir.end()),
1108         RequestedDirName(std::move(RequestedDirName)) {
1109     setCurrentEntry();
1110   }
1111 
1112   std::error_code increment() override {
1113     ++I;
1114     setCurrentEntry();
1115     return {};
1116   }
1117 };
1118 
1119 directory_iterator InMemoryFileSystem::dir_begin(const Twine &Dir,
1120                                                  std::error_code &EC) {
1121   auto Node = lookupNode(Dir, /*FollowFinalSymlink=*/true);
1122   if (!Node) {
1123     EC = Node.getError();
1124     return directory_iterator(std::make_shared<DirIterator>());
1125   }
1126 
1127   if (auto *DirNode = dyn_cast<detail::InMemoryDirectory>(*Node))
1128     return directory_iterator(
1129         std::make_shared<DirIterator>(this, *DirNode, Dir.str()));
1130 
1131   EC = make_error_code(llvm::errc::not_a_directory);
1132   return directory_iterator(std::make_shared<DirIterator>());
1133 }
1134 
1135 std::error_code InMemoryFileSystem::setCurrentWorkingDirectory(const Twine &P) {
1136   SmallString<128> Path;
1137   P.toVector(Path);
1138 
1139   // Fix up relative paths. This just prepends the current working directory.
1140   std::error_code EC = makeAbsolute(Path);
1141   assert(!EC);
1142   (void)EC;
1143 
1144   if (useNormalizedPaths())
1145     llvm::sys::path::remove_dots(Path, /*remove_dot_dot=*/true);
1146 
1147   if (!Path.empty())
1148     WorkingDirectory = std::string(Path.str());
1149   return {};
1150 }
1151 
1152 std::error_code
1153 InMemoryFileSystem::getRealPath(const Twine &Path,
1154                                 SmallVectorImpl<char> &Output) const {
1155   auto CWD = getCurrentWorkingDirectory();
1156   if (!CWD || CWD->empty())
1157     return errc::operation_not_permitted;
1158   Path.toVector(Output);
1159   if (auto EC = makeAbsolute(Output))
1160     return EC;
1161   llvm::sys::path::remove_dots(Output, /*remove_dot_dot=*/true);
1162   return {};
1163 }
1164 
1165 std::error_code InMemoryFileSystem::isLocal(const Twine &Path, bool &Result) {
1166   Result = false;
1167   return {};
1168 }
1169 
1170 void InMemoryFileSystem::printImpl(raw_ostream &OS, PrintType PrintContents,
1171                                    unsigned IndentLevel) const {
1172   printIndent(OS, IndentLevel);
1173   OS << "InMemoryFileSystem\n";
1174 }
1175 
1176 } // namespace vfs
1177 } // namespace llvm
1178 
1179 //===-----------------------------------------------------------------------===/
1180 // RedirectingFileSystem implementation
1181 //===-----------------------------------------------------------------------===/
1182 
1183 namespace {
1184 
1185 static llvm::sys::path::Style getExistingStyle(llvm::StringRef Path) {
1186   // Detect the path style in use by checking the first separator.
1187   llvm::sys::path::Style style = llvm::sys::path::Style::native;
1188   const size_t n = Path.find_first_of("/\\");
1189   // Can't distinguish between posix and windows_slash here.
1190   if (n != static_cast<size_t>(-1))
1191     style = (Path[n] == '/') ? llvm::sys::path::Style::posix
1192                              : llvm::sys::path::Style::windows_backslash;
1193   return style;
1194 }
1195 
1196 /// Removes leading "./" as well as path components like ".." and ".".
1197 static llvm::SmallString<256> canonicalize(llvm::StringRef Path) {
1198   // First detect the path style in use by checking the first separator.
1199   llvm::sys::path::Style style = getExistingStyle(Path);
1200 
1201   // Now remove the dots.  Explicitly specifying the path style prevents the
1202   // direction of the slashes from changing.
1203   llvm::SmallString<256> result =
1204       llvm::sys::path::remove_leading_dotslash(Path, style);
1205   llvm::sys::path::remove_dots(result, /*remove_dot_dot=*/true, style);
1206   return result;
1207 }
1208 
1209 /// Whether the error and entry specify a file/directory that was not found.
1210 static bool isFileNotFound(std::error_code EC,
1211                            RedirectingFileSystem::Entry *E = nullptr) {
1212   if (E && !isa<RedirectingFileSystem::DirectoryRemapEntry>(E))
1213     return false;
1214   return EC == llvm::errc::no_such_file_or_directory;
1215 }
1216 
1217 } // anonymous namespace
1218 
1219 
1220 RedirectingFileSystem::RedirectingFileSystem(IntrusiveRefCntPtr<FileSystem> FS)
1221     : ExternalFS(std::move(FS)) {
1222   if (ExternalFS)
1223     if (auto ExternalWorkingDirectory =
1224             ExternalFS->getCurrentWorkingDirectory()) {
1225       WorkingDirectory = *ExternalWorkingDirectory;
1226     }
1227 }
1228 
1229 /// Directory iterator implementation for \c RedirectingFileSystem's
1230 /// directory entries.
1231 class llvm::vfs::RedirectingFSDirIterImpl
1232     : public llvm::vfs::detail::DirIterImpl {
1233   std::string Dir;
1234   RedirectingFileSystem::DirectoryEntry::iterator Current, End;
1235 
1236   std::error_code incrementImpl(bool IsFirstTime) {
1237     assert((IsFirstTime || Current != End) && "cannot iterate past end");
1238     if (!IsFirstTime)
1239       ++Current;
1240     if (Current != End) {
1241       SmallString<128> PathStr(Dir);
1242       llvm::sys::path::append(PathStr, (*Current)->getName());
1243       sys::fs::file_type Type = sys::fs::file_type::type_unknown;
1244       switch ((*Current)->getKind()) {
1245       case RedirectingFileSystem::EK_Directory:
1246         [[fallthrough]];
1247       case RedirectingFileSystem::EK_DirectoryRemap:
1248         Type = sys::fs::file_type::directory_file;
1249         break;
1250       case RedirectingFileSystem::EK_File:
1251         Type = sys::fs::file_type::regular_file;
1252         break;
1253       }
1254       CurrentEntry = directory_entry(std::string(PathStr.str()), Type);
1255     } else {
1256       CurrentEntry = directory_entry();
1257     }
1258     return {};
1259   };
1260 
1261 public:
1262   RedirectingFSDirIterImpl(
1263       const Twine &Path, RedirectingFileSystem::DirectoryEntry::iterator Begin,
1264       RedirectingFileSystem::DirectoryEntry::iterator End, std::error_code &EC)
1265       : Dir(Path.str()), Current(Begin), End(End) {
1266     EC = incrementImpl(/*IsFirstTime=*/true);
1267   }
1268 
1269   std::error_code increment() override {
1270     return incrementImpl(/*IsFirstTime=*/false);
1271   }
1272 };
1273 
1274 namespace {
1275 /// Directory iterator implementation for \c RedirectingFileSystem's
1276 /// directory remap entries that maps the paths reported by the external
1277 /// file system's directory iterator back to the virtual directory's path.
1278 class RedirectingFSDirRemapIterImpl : public llvm::vfs::detail::DirIterImpl {
1279   std::string Dir;
1280   llvm::sys::path::Style DirStyle;
1281   llvm::vfs::directory_iterator ExternalIter;
1282 
1283 public:
1284   RedirectingFSDirRemapIterImpl(std::string DirPath,
1285                                 llvm::vfs::directory_iterator ExtIter)
1286       : Dir(std::move(DirPath)), DirStyle(getExistingStyle(Dir)),
1287         ExternalIter(ExtIter) {
1288     if (ExternalIter != llvm::vfs::directory_iterator())
1289       setCurrentEntry();
1290   }
1291 
1292   void setCurrentEntry() {
1293     StringRef ExternalPath = ExternalIter->path();
1294     llvm::sys::path::Style ExternalStyle = getExistingStyle(ExternalPath);
1295     StringRef File = llvm::sys::path::filename(ExternalPath, ExternalStyle);
1296 
1297     SmallString<128> NewPath(Dir);
1298     llvm::sys::path::append(NewPath, DirStyle, File);
1299 
1300     CurrentEntry = directory_entry(std::string(NewPath), ExternalIter->type());
1301   }
1302 
1303   std::error_code increment() override {
1304     std::error_code EC;
1305     ExternalIter.increment(EC);
1306     if (!EC && ExternalIter != llvm::vfs::directory_iterator())
1307       setCurrentEntry();
1308     else
1309       CurrentEntry = directory_entry();
1310     return EC;
1311   }
1312 };
1313 } // namespace
1314 
1315 llvm::ErrorOr<std::string>
1316 RedirectingFileSystem::getCurrentWorkingDirectory() const {
1317   return WorkingDirectory;
1318 }
1319 
1320 std::error_code
1321 RedirectingFileSystem::setCurrentWorkingDirectory(const Twine &Path) {
1322   // Don't change the working directory if the path doesn't exist.
1323   if (!exists(Path))
1324     return errc::no_such_file_or_directory;
1325 
1326   SmallString<128> AbsolutePath;
1327   Path.toVector(AbsolutePath);
1328   if (std::error_code EC = makeAbsolute(AbsolutePath))
1329     return EC;
1330   WorkingDirectory = std::string(AbsolutePath.str());
1331   return {};
1332 }
1333 
1334 std::error_code RedirectingFileSystem::isLocal(const Twine &Path_,
1335                                                bool &Result) {
1336   SmallString<256> Path;
1337   Path_.toVector(Path);
1338 
1339   if (std::error_code EC = makeCanonical(Path))
1340     return {};
1341 
1342   return ExternalFS->isLocal(Path, Result);
1343 }
1344 
1345 std::error_code RedirectingFileSystem::makeAbsolute(SmallVectorImpl<char> &Path) const {
1346   // is_absolute(..., Style::windows_*) accepts paths with both slash types.
1347   if (llvm::sys::path::is_absolute(Path, llvm::sys::path::Style::posix) ||
1348       llvm::sys::path::is_absolute(Path,
1349                                    llvm::sys::path::Style::windows_backslash))
1350     // This covers windows absolute path with forward slash as well, as the
1351     // forward slashes are treated as path seperation in llvm::path
1352     // regardless of what path::Style is used.
1353     return {};
1354 
1355   auto WorkingDir = getCurrentWorkingDirectory();
1356   if (!WorkingDir)
1357     return WorkingDir.getError();
1358 
1359   return makeAbsolute(WorkingDir.get(), Path);
1360 }
1361 
1362 std::error_code
1363 RedirectingFileSystem::makeAbsolute(StringRef WorkingDir,
1364                                     SmallVectorImpl<char> &Path) const {
1365   // We can't use sys::fs::make_absolute because that assumes the path style
1366   // is native and there is no way to override that.  Since we know WorkingDir
1367   // is absolute, we can use it to determine which style we actually have and
1368   // append Path ourselves.
1369   if (!WorkingDir.empty() &&
1370       !sys::path::is_absolute(WorkingDir, sys::path::Style::posix) &&
1371       !sys::path::is_absolute(WorkingDir,
1372                               sys::path::Style::windows_backslash)) {
1373     return std::error_code();
1374   }
1375   sys::path::Style style = sys::path::Style::windows_backslash;
1376   if (sys::path::is_absolute(WorkingDir, sys::path::Style::posix)) {
1377     style = sys::path::Style::posix;
1378   } else {
1379     // Distinguish between windows_backslash and windows_slash; getExistingStyle
1380     // returns posix for a path with windows_slash.
1381     if (getExistingStyle(WorkingDir) != sys::path::Style::windows_backslash)
1382       style = sys::path::Style::windows_slash;
1383   }
1384 
1385   std::string Result = std::string(WorkingDir);
1386   StringRef Dir(Result);
1387   if (!Dir.endswith(sys::path::get_separator(style))) {
1388     Result += sys::path::get_separator(style);
1389   }
1390   // backslashes '\' are legit path charactors under POSIX. Windows APIs
1391   // like CreateFile accepts forward slashes '/' as path
1392   // separator (even when mixed with backslashes). Therefore,
1393   // `Path` should be directly appended to `WorkingDir` without converting
1394   // path separator.
1395   Result.append(Path.data(), Path.size());
1396   Path.assign(Result.begin(), Result.end());
1397 
1398   return {};
1399 }
1400 
1401 directory_iterator RedirectingFileSystem::dir_begin(const Twine &Dir,
1402                                                     std::error_code &EC) {
1403   SmallString<256> Path;
1404   Dir.toVector(Path);
1405 
1406   EC = makeCanonical(Path);
1407   if (EC)
1408     return {};
1409 
1410   ErrorOr<RedirectingFileSystem::LookupResult> Result = lookupPath(Path);
1411   if (!Result) {
1412     if (Redirection != RedirectKind::RedirectOnly &&
1413         isFileNotFound(Result.getError()))
1414       return ExternalFS->dir_begin(Path, EC);
1415 
1416     EC = Result.getError();
1417     return {};
1418   }
1419 
1420   // Use status to make sure the path exists and refers to a directory.
1421   ErrorOr<Status> S = status(Path, Dir, *Result);
1422   if (!S) {
1423     if (Redirection != RedirectKind::RedirectOnly &&
1424         isFileNotFound(S.getError(), Result->E))
1425       return ExternalFS->dir_begin(Dir, EC);
1426 
1427     EC = S.getError();
1428     return {};
1429   }
1430 
1431   if (!S->isDirectory()) {
1432     EC = errc::not_a_directory;
1433     return {};
1434   }
1435 
1436   // Create the appropriate directory iterator based on whether we found a
1437   // DirectoryRemapEntry or DirectoryEntry.
1438   directory_iterator RedirectIter;
1439   std::error_code RedirectEC;
1440   if (auto ExtRedirect = Result->getExternalRedirect()) {
1441     auto RE = cast<RedirectingFileSystem::RemapEntry>(Result->E);
1442     RedirectIter = ExternalFS->dir_begin(*ExtRedirect, RedirectEC);
1443 
1444     if (!RE->useExternalName(UseExternalNames)) {
1445       // Update the paths in the results to use the virtual directory's path.
1446       RedirectIter =
1447           directory_iterator(std::make_shared<RedirectingFSDirRemapIterImpl>(
1448               std::string(Path), RedirectIter));
1449     }
1450   } else {
1451     auto DE = cast<DirectoryEntry>(Result->E);
1452     RedirectIter =
1453         directory_iterator(std::make_shared<RedirectingFSDirIterImpl>(
1454             Path, DE->contents_begin(), DE->contents_end(), RedirectEC));
1455   }
1456 
1457   if (RedirectEC) {
1458     if (RedirectEC != errc::no_such_file_or_directory) {
1459       EC = RedirectEC;
1460       return {};
1461     }
1462     RedirectIter = {};
1463   }
1464 
1465   if (Redirection == RedirectKind::RedirectOnly) {
1466     EC = RedirectEC;
1467     return RedirectIter;
1468   }
1469 
1470   std::error_code ExternalEC;
1471   directory_iterator ExternalIter = ExternalFS->dir_begin(Path, ExternalEC);
1472   if (ExternalEC) {
1473     if (ExternalEC != errc::no_such_file_or_directory) {
1474       EC = ExternalEC;
1475       return {};
1476     }
1477     ExternalIter = {};
1478   }
1479 
1480   SmallVector<directory_iterator, 2> Iters;
1481   switch (Redirection) {
1482   case RedirectKind::Fallthrough:
1483     Iters.push_back(ExternalIter);
1484     Iters.push_back(RedirectIter);
1485     break;
1486   case RedirectKind::Fallback:
1487     Iters.push_back(RedirectIter);
1488     Iters.push_back(ExternalIter);
1489     break;
1490   default:
1491     llvm_unreachable("unhandled RedirectKind");
1492   }
1493 
1494   directory_iterator Combined{
1495       std::make_shared<CombiningDirIterImpl>(Iters, EC)};
1496   if (EC)
1497     return {};
1498   return Combined;
1499 }
1500 
1501 void RedirectingFileSystem::setOverlayFileDir(StringRef Dir) {
1502   OverlayFileDir = Dir.str();
1503 }
1504 
1505 StringRef RedirectingFileSystem::getOverlayFileDir() const {
1506   return OverlayFileDir;
1507 }
1508 
1509 void RedirectingFileSystem::setFallthrough(bool Fallthrough) {
1510   if (Fallthrough) {
1511     Redirection = RedirectingFileSystem::RedirectKind::Fallthrough;
1512   } else {
1513     Redirection = RedirectingFileSystem::RedirectKind::RedirectOnly;
1514   }
1515 }
1516 
1517 void RedirectingFileSystem::setRedirection(
1518     RedirectingFileSystem::RedirectKind Kind) {
1519   Redirection = Kind;
1520 }
1521 
1522 std::vector<StringRef> RedirectingFileSystem::getRoots() const {
1523   std::vector<StringRef> R;
1524   R.reserve(Roots.size());
1525   for (const auto &Root : Roots)
1526     R.push_back(Root->getName());
1527   return R;
1528 }
1529 
1530 void RedirectingFileSystem::printImpl(raw_ostream &OS, PrintType Type,
1531                                       unsigned IndentLevel) const {
1532   printIndent(OS, IndentLevel);
1533   OS << "RedirectingFileSystem (UseExternalNames: "
1534      << (UseExternalNames ? "true" : "false") << ")\n";
1535   if (Type == PrintType::Summary)
1536     return;
1537 
1538   for (const auto &Root : Roots)
1539     printEntry(OS, Root.get(), IndentLevel);
1540 
1541   printIndent(OS, IndentLevel);
1542   OS << "ExternalFS:\n";
1543   ExternalFS->print(OS, Type == PrintType::Contents ? PrintType::Summary : Type,
1544                     IndentLevel + 1);
1545 }
1546 
1547 void RedirectingFileSystem::printEntry(raw_ostream &OS,
1548                                        RedirectingFileSystem::Entry *E,
1549                                        unsigned IndentLevel) const {
1550   printIndent(OS, IndentLevel);
1551   OS << "'" << E->getName() << "'";
1552 
1553   switch (E->getKind()) {
1554   case EK_Directory: {
1555     auto *DE = cast<RedirectingFileSystem::DirectoryEntry>(E);
1556 
1557     OS << "\n";
1558     for (std::unique_ptr<Entry> &SubEntry :
1559          llvm::make_range(DE->contents_begin(), DE->contents_end()))
1560       printEntry(OS, SubEntry.get(), IndentLevel + 1);
1561     break;
1562   }
1563   case EK_DirectoryRemap:
1564   case EK_File: {
1565     auto *RE = cast<RedirectingFileSystem::RemapEntry>(E);
1566     OS << " -> '" << RE->getExternalContentsPath() << "'";
1567     switch (RE->getUseName()) {
1568     case NK_NotSet:
1569       break;
1570     case NK_External:
1571       OS << " (UseExternalName: true)";
1572       break;
1573     case NK_Virtual:
1574       OS << " (UseExternalName: false)";
1575       break;
1576     }
1577     OS << "\n";
1578     break;
1579   }
1580   }
1581 }
1582 
1583 /// A helper class to hold the common YAML parsing state.
1584 class llvm::vfs::RedirectingFileSystemParser {
1585   yaml::Stream &Stream;
1586 
1587   void error(yaml::Node *N, const Twine &Msg) { Stream.printError(N, Msg); }
1588 
1589   // false on error
1590   bool parseScalarString(yaml::Node *N, StringRef &Result,
1591                          SmallVectorImpl<char> &Storage) {
1592     const auto *S = dyn_cast<yaml::ScalarNode>(N);
1593 
1594     if (!S) {
1595       error(N, "expected string");
1596       return false;
1597     }
1598     Result = S->getValue(Storage);
1599     return true;
1600   }
1601 
1602   // false on error
1603   bool parseScalarBool(yaml::Node *N, bool &Result) {
1604     SmallString<5> Storage;
1605     StringRef Value;
1606     if (!parseScalarString(N, Value, Storage))
1607       return false;
1608 
1609     if (Value.equals_insensitive("true") || Value.equals_insensitive("on") ||
1610         Value.equals_insensitive("yes") || Value == "1") {
1611       Result = true;
1612       return true;
1613     } else if (Value.equals_insensitive("false") ||
1614                Value.equals_insensitive("off") ||
1615                Value.equals_insensitive("no") || Value == "0") {
1616       Result = false;
1617       return true;
1618     }
1619 
1620     error(N, "expected boolean value");
1621     return false;
1622   }
1623 
1624   std::optional<RedirectingFileSystem::RedirectKind>
1625   parseRedirectKind(yaml::Node *N) {
1626     SmallString<12> Storage;
1627     StringRef Value;
1628     if (!parseScalarString(N, Value, Storage))
1629       return std::nullopt;
1630 
1631     if (Value.equals_insensitive("fallthrough")) {
1632       return RedirectingFileSystem::RedirectKind::Fallthrough;
1633     } else if (Value.equals_insensitive("fallback")) {
1634       return RedirectingFileSystem::RedirectKind::Fallback;
1635     } else if (Value.equals_insensitive("redirect-only")) {
1636       return RedirectingFileSystem::RedirectKind::RedirectOnly;
1637     }
1638     return std::nullopt;
1639   }
1640 
1641   Optional<RedirectingFileSystem::RootRelativeKind>
1642   parseRootRelativeKind(yaml::Node *N) {
1643     SmallString<12> Storage;
1644     StringRef Value;
1645     if (!parseScalarString(N, Value, Storage))
1646       return std::nullopt;
1647     if (Value.equals_insensitive("cwd")) {
1648       return RedirectingFileSystem::RootRelativeKind::CWD;
1649     } else if (Value.equals_insensitive("overlay-dir")) {
1650       return RedirectingFileSystem::RootRelativeKind::OverlayDir;
1651     }
1652     return std::nullopt;
1653   }
1654 
1655   struct KeyStatus {
1656     bool Required;
1657     bool Seen = false;
1658 
1659     KeyStatus(bool Required = false) : Required(Required) {}
1660   };
1661 
1662   using KeyStatusPair = std::pair<StringRef, KeyStatus>;
1663 
1664   // false on error
1665   bool checkDuplicateOrUnknownKey(yaml::Node *KeyNode, StringRef Key,
1666                                   DenseMap<StringRef, KeyStatus> &Keys) {
1667     if (!Keys.count(Key)) {
1668       error(KeyNode, "unknown key");
1669       return false;
1670     }
1671     KeyStatus &S = Keys[Key];
1672     if (S.Seen) {
1673       error(KeyNode, Twine("duplicate key '") + Key + "'");
1674       return false;
1675     }
1676     S.Seen = true;
1677     return true;
1678   }
1679 
1680   // false on error
1681   bool checkMissingKeys(yaml::Node *Obj, DenseMap<StringRef, KeyStatus> &Keys) {
1682     for (const auto &I : Keys) {
1683       if (I.second.Required && !I.second.Seen) {
1684         error(Obj, Twine("missing key '") + I.first + "'");
1685         return false;
1686       }
1687     }
1688     return true;
1689   }
1690 
1691 public:
1692   static RedirectingFileSystem::Entry *
1693   lookupOrCreateEntry(RedirectingFileSystem *FS, StringRef Name,
1694                       RedirectingFileSystem::Entry *ParentEntry = nullptr) {
1695     if (!ParentEntry) { // Look for a existent root
1696       for (const auto &Root : FS->Roots) {
1697         if (Name.equals(Root->getName())) {
1698           ParentEntry = Root.get();
1699           return ParentEntry;
1700         }
1701       }
1702     } else { // Advance to the next component
1703       auto *DE = dyn_cast<RedirectingFileSystem::DirectoryEntry>(ParentEntry);
1704       for (std::unique_ptr<RedirectingFileSystem::Entry> &Content :
1705            llvm::make_range(DE->contents_begin(), DE->contents_end())) {
1706         auto *DirContent =
1707             dyn_cast<RedirectingFileSystem::DirectoryEntry>(Content.get());
1708         if (DirContent && Name.equals(Content->getName()))
1709           return DirContent;
1710       }
1711     }
1712 
1713     // ... or create a new one
1714     std::unique_ptr<RedirectingFileSystem::Entry> E =
1715         std::make_unique<RedirectingFileSystem::DirectoryEntry>(
1716             Name, Status("", getNextVirtualUniqueID(),
1717                          std::chrono::system_clock::now(), 0, 0, 0,
1718                          file_type::directory_file, sys::fs::all_all));
1719 
1720     if (!ParentEntry) { // Add a new root to the overlay
1721       FS->Roots.push_back(std::move(E));
1722       ParentEntry = FS->Roots.back().get();
1723       return ParentEntry;
1724     }
1725 
1726     auto *DE = cast<RedirectingFileSystem::DirectoryEntry>(ParentEntry);
1727     DE->addContent(std::move(E));
1728     return DE->getLastContent();
1729   }
1730 
1731 private:
1732   void uniqueOverlayTree(RedirectingFileSystem *FS,
1733                          RedirectingFileSystem::Entry *SrcE,
1734                          RedirectingFileSystem::Entry *NewParentE = nullptr) {
1735     StringRef Name = SrcE->getName();
1736     switch (SrcE->getKind()) {
1737     case RedirectingFileSystem::EK_Directory: {
1738       auto *DE = cast<RedirectingFileSystem::DirectoryEntry>(SrcE);
1739       // Empty directories could be present in the YAML as a way to
1740       // describe a file for a current directory after some of its subdir
1741       // is parsed. This only leads to redundant walks, ignore it.
1742       if (!Name.empty())
1743         NewParentE = lookupOrCreateEntry(FS, Name, NewParentE);
1744       for (std::unique_ptr<RedirectingFileSystem::Entry> &SubEntry :
1745            llvm::make_range(DE->contents_begin(), DE->contents_end()))
1746         uniqueOverlayTree(FS, SubEntry.get(), NewParentE);
1747       break;
1748     }
1749     case RedirectingFileSystem::EK_DirectoryRemap: {
1750       assert(NewParentE && "Parent entry must exist");
1751       auto *DR = cast<RedirectingFileSystem::DirectoryRemapEntry>(SrcE);
1752       auto *DE = cast<RedirectingFileSystem::DirectoryEntry>(NewParentE);
1753       DE->addContent(
1754           std::make_unique<RedirectingFileSystem::DirectoryRemapEntry>(
1755               Name, DR->getExternalContentsPath(), DR->getUseName()));
1756       break;
1757     }
1758     case RedirectingFileSystem::EK_File: {
1759       assert(NewParentE && "Parent entry must exist");
1760       auto *FE = cast<RedirectingFileSystem::FileEntry>(SrcE);
1761       auto *DE = cast<RedirectingFileSystem::DirectoryEntry>(NewParentE);
1762       DE->addContent(std::make_unique<RedirectingFileSystem::FileEntry>(
1763           Name, FE->getExternalContentsPath(), FE->getUseName()));
1764       break;
1765     }
1766     }
1767   }
1768 
1769   std::unique_ptr<RedirectingFileSystem::Entry>
1770   parseEntry(yaml::Node *N, RedirectingFileSystem *FS, bool IsRootEntry) {
1771     auto *M = dyn_cast<yaml::MappingNode>(N);
1772     if (!M) {
1773       error(N, "expected mapping node for file or directory entry");
1774       return nullptr;
1775     }
1776 
1777     KeyStatusPair Fields[] = {
1778         KeyStatusPair("name", true),
1779         KeyStatusPair("type", true),
1780         KeyStatusPair("contents", false),
1781         KeyStatusPair("external-contents", false),
1782         KeyStatusPair("use-external-name", false),
1783     };
1784 
1785     DenseMap<StringRef, KeyStatus> Keys(std::begin(Fields), std::end(Fields));
1786 
1787     enum { CF_NotSet, CF_List, CF_External } ContentsField = CF_NotSet;
1788     std::vector<std::unique_ptr<RedirectingFileSystem::Entry>>
1789         EntryArrayContents;
1790     SmallString<256> ExternalContentsPath;
1791     SmallString<256> Name;
1792     yaml::Node *NameValueNode = nullptr;
1793     auto UseExternalName = RedirectingFileSystem::NK_NotSet;
1794     RedirectingFileSystem::EntryKind Kind;
1795 
1796     for (auto &I : *M) {
1797       StringRef Key;
1798       // Reuse the buffer for key and value, since we don't look at key after
1799       // parsing value.
1800       SmallString<256> Buffer;
1801       if (!parseScalarString(I.getKey(), Key, Buffer))
1802         return nullptr;
1803 
1804       if (!checkDuplicateOrUnknownKey(I.getKey(), Key, Keys))
1805         return nullptr;
1806 
1807       StringRef Value;
1808       if (Key == "name") {
1809         if (!parseScalarString(I.getValue(), Value, Buffer))
1810           return nullptr;
1811 
1812         NameValueNode = I.getValue();
1813         // Guarantee that old YAML files containing paths with ".." and "."
1814         // are properly canonicalized before read into the VFS.
1815         Name = canonicalize(Value).str();
1816       } else if (Key == "type") {
1817         if (!parseScalarString(I.getValue(), Value, Buffer))
1818           return nullptr;
1819         if (Value == "file")
1820           Kind = RedirectingFileSystem::EK_File;
1821         else if (Value == "directory")
1822           Kind = RedirectingFileSystem::EK_Directory;
1823         else if (Value == "directory-remap")
1824           Kind = RedirectingFileSystem::EK_DirectoryRemap;
1825         else {
1826           error(I.getValue(), "unknown value for 'type'");
1827           return nullptr;
1828         }
1829       } else if (Key == "contents") {
1830         if (ContentsField != CF_NotSet) {
1831           error(I.getKey(),
1832                 "entry already has 'contents' or 'external-contents'");
1833           return nullptr;
1834         }
1835         ContentsField = CF_List;
1836         auto *Contents = dyn_cast<yaml::SequenceNode>(I.getValue());
1837         if (!Contents) {
1838           // FIXME: this is only for directories, what about files?
1839           error(I.getValue(), "expected array");
1840           return nullptr;
1841         }
1842 
1843         for (auto &I : *Contents) {
1844           if (std::unique_ptr<RedirectingFileSystem::Entry> E =
1845                   parseEntry(&I, FS, /*IsRootEntry*/ false))
1846             EntryArrayContents.push_back(std::move(E));
1847           else
1848             return nullptr;
1849         }
1850       } else if (Key == "external-contents") {
1851         if (ContentsField != CF_NotSet) {
1852           error(I.getKey(),
1853                 "entry already has 'contents' or 'external-contents'");
1854           return nullptr;
1855         }
1856         ContentsField = CF_External;
1857         if (!parseScalarString(I.getValue(), Value, Buffer))
1858           return nullptr;
1859 
1860         SmallString<256> FullPath;
1861         if (FS->IsRelativeOverlay) {
1862           FullPath = FS->getOverlayFileDir();
1863           assert(!FullPath.empty() &&
1864                  "External contents prefix directory must exist");
1865           llvm::sys::path::append(FullPath, Value);
1866         } else {
1867           FullPath = Value;
1868         }
1869 
1870         // Guarantee that old YAML files containing paths with ".." and "."
1871         // are properly canonicalized before read into the VFS.
1872         FullPath = canonicalize(FullPath);
1873         ExternalContentsPath = FullPath.str();
1874       } else if (Key == "use-external-name") {
1875         bool Val;
1876         if (!parseScalarBool(I.getValue(), Val))
1877           return nullptr;
1878         UseExternalName = Val ? RedirectingFileSystem::NK_External
1879                               : RedirectingFileSystem::NK_Virtual;
1880       } else {
1881         llvm_unreachable("key missing from Keys");
1882       }
1883     }
1884 
1885     if (Stream.failed())
1886       return nullptr;
1887 
1888     // check for missing keys
1889     if (ContentsField == CF_NotSet) {
1890       error(N, "missing key 'contents' or 'external-contents'");
1891       return nullptr;
1892     }
1893     if (!checkMissingKeys(N, Keys))
1894       return nullptr;
1895 
1896     // check invalid configuration
1897     if (Kind == RedirectingFileSystem::EK_Directory &&
1898         UseExternalName != RedirectingFileSystem::NK_NotSet) {
1899       error(N, "'use-external-name' is not supported for 'directory' entries");
1900       return nullptr;
1901     }
1902 
1903     if (Kind == RedirectingFileSystem::EK_DirectoryRemap &&
1904         ContentsField == CF_List) {
1905       error(N, "'contents' is not supported for 'directory-remap' entries");
1906       return nullptr;
1907     }
1908 
1909     sys::path::Style path_style = sys::path::Style::native;
1910     if (IsRootEntry) {
1911       // VFS root entries may be in either Posix or Windows style.  Figure out
1912       // which style we have, and use it consistently.
1913       if (sys::path::is_absolute(Name, sys::path::Style::posix)) {
1914         path_style = sys::path::Style::posix;
1915       } else if (sys::path::is_absolute(Name,
1916                                         sys::path::Style::windows_backslash)) {
1917         path_style = sys::path::Style::windows_backslash;
1918       } else {
1919         // Relative VFS root entries are made absolute to either the overlay
1920         // directory, or the current working directory, then we can determine
1921         // the path style from that.
1922         std::error_code EC;
1923         if (FS->RootRelative ==
1924             RedirectingFileSystem::RootRelativeKind::OverlayDir) {
1925           StringRef FullPath = FS->getOverlayFileDir();
1926           assert(!FullPath.empty() && "Overlay file directory must exist");
1927           EC = FS->makeAbsolute(FullPath, Name);
1928           Name = canonicalize(Name);
1929         } else {
1930           EC = sys::fs::make_absolute(Name);
1931         }
1932         if (EC) {
1933           assert(NameValueNode && "Name presence should be checked earlier");
1934           error(
1935               NameValueNode,
1936               "entry with relative path at the root level is not discoverable");
1937           return nullptr;
1938         }
1939         path_style = sys::path::is_absolute(Name, sys::path::Style::posix)
1940                          ? sys::path::Style::posix
1941                          : sys::path::Style::windows_backslash;
1942       }
1943       // is::path::is_absolute(Name, sys::path::Style::windows_backslash) will
1944       // return true even if `Name` is using forward slashes. Distinguish
1945       // between windows_backslash and windows_slash.
1946       if (path_style == sys::path::Style::windows_backslash &&
1947           getExistingStyle(Name) != sys::path::Style::windows_backslash)
1948         path_style = sys::path::Style::windows_slash;
1949     }
1950 
1951     // Remove trailing slash(es), being careful not to remove the root path
1952     StringRef Trimmed = Name;
1953     size_t RootPathLen = sys::path::root_path(Trimmed, path_style).size();
1954     while (Trimmed.size() > RootPathLen &&
1955            sys::path::is_separator(Trimmed.back(), path_style))
1956       Trimmed = Trimmed.slice(0, Trimmed.size() - 1);
1957 
1958     // Get the last component
1959     StringRef LastComponent = sys::path::filename(Trimmed, path_style);
1960 
1961     std::unique_ptr<RedirectingFileSystem::Entry> Result;
1962     switch (Kind) {
1963     case RedirectingFileSystem::EK_File:
1964       Result = std::make_unique<RedirectingFileSystem::FileEntry>(
1965           LastComponent, std::move(ExternalContentsPath), UseExternalName);
1966       break;
1967     case RedirectingFileSystem::EK_DirectoryRemap:
1968       Result = std::make_unique<RedirectingFileSystem::DirectoryRemapEntry>(
1969           LastComponent, std::move(ExternalContentsPath), UseExternalName);
1970       break;
1971     case RedirectingFileSystem::EK_Directory:
1972       Result = std::make_unique<RedirectingFileSystem::DirectoryEntry>(
1973           LastComponent, std::move(EntryArrayContents),
1974           Status("", getNextVirtualUniqueID(), std::chrono::system_clock::now(),
1975                  0, 0, 0, file_type::directory_file, sys::fs::all_all));
1976       break;
1977     }
1978 
1979     StringRef Parent = sys::path::parent_path(Trimmed, path_style);
1980     if (Parent.empty())
1981       return Result;
1982 
1983     // if 'name' contains multiple components, create implicit directory entries
1984     for (sys::path::reverse_iterator I = sys::path::rbegin(Parent, path_style),
1985                                      E = sys::path::rend(Parent);
1986          I != E; ++I) {
1987       std::vector<std::unique_ptr<RedirectingFileSystem::Entry>> Entries;
1988       Entries.push_back(std::move(Result));
1989       Result = std::make_unique<RedirectingFileSystem::DirectoryEntry>(
1990           *I, std::move(Entries),
1991           Status("", getNextVirtualUniqueID(), std::chrono::system_clock::now(),
1992                  0, 0, 0, file_type::directory_file, sys::fs::all_all));
1993     }
1994     return Result;
1995   }
1996 
1997 public:
1998   RedirectingFileSystemParser(yaml::Stream &S) : Stream(S) {}
1999 
2000   // false on error
2001   bool parse(yaml::Node *Root, RedirectingFileSystem *FS) {
2002     auto *Top = dyn_cast<yaml::MappingNode>(Root);
2003     if (!Top) {
2004       error(Root, "expected mapping node");
2005       return false;
2006     }
2007 
2008     KeyStatusPair Fields[] = {
2009         KeyStatusPair("version", true),
2010         KeyStatusPair("case-sensitive", false),
2011         KeyStatusPair("use-external-names", false),
2012         KeyStatusPair("root-relative", false),
2013         KeyStatusPair("overlay-relative", false),
2014         KeyStatusPair("fallthrough", false),
2015         KeyStatusPair("redirecting-with", false),
2016         KeyStatusPair("roots", true),
2017     };
2018 
2019     DenseMap<StringRef, KeyStatus> Keys(std::begin(Fields), std::end(Fields));
2020     std::vector<std::unique_ptr<RedirectingFileSystem::Entry>> RootEntries;
2021 
2022     // Parse configuration and 'roots'
2023     for (auto &I : *Top) {
2024       SmallString<10> KeyBuffer;
2025       StringRef Key;
2026       if (!parseScalarString(I.getKey(), Key, KeyBuffer))
2027         return false;
2028 
2029       if (!checkDuplicateOrUnknownKey(I.getKey(), Key, Keys))
2030         return false;
2031 
2032       if (Key == "roots") {
2033         auto *Roots = dyn_cast<yaml::SequenceNode>(I.getValue());
2034         if (!Roots) {
2035           error(I.getValue(), "expected array");
2036           return false;
2037         }
2038 
2039         for (auto &I : *Roots) {
2040           if (std::unique_ptr<RedirectingFileSystem::Entry> E =
2041                   parseEntry(&I, FS, /*IsRootEntry*/ true))
2042             RootEntries.push_back(std::move(E));
2043           else
2044             return false;
2045         }
2046       } else if (Key == "version") {
2047         StringRef VersionString;
2048         SmallString<4> Storage;
2049         if (!parseScalarString(I.getValue(), VersionString, Storage))
2050           return false;
2051         int Version;
2052         if (VersionString.getAsInteger<int>(10, Version)) {
2053           error(I.getValue(), "expected integer");
2054           return false;
2055         }
2056         if (Version < 0) {
2057           error(I.getValue(), "invalid version number");
2058           return false;
2059         }
2060         if (Version != 0) {
2061           error(I.getValue(), "version mismatch, expected 0");
2062           return false;
2063         }
2064       } else if (Key == "case-sensitive") {
2065         if (!parseScalarBool(I.getValue(), FS->CaseSensitive))
2066           return false;
2067       } else if (Key == "overlay-relative") {
2068         if (!parseScalarBool(I.getValue(), FS->IsRelativeOverlay))
2069           return false;
2070       } else if (Key == "use-external-names") {
2071         if (!parseScalarBool(I.getValue(), FS->UseExternalNames))
2072           return false;
2073       } else if (Key == "fallthrough") {
2074         if (Keys["redirecting-with"].Seen) {
2075           error(I.getValue(),
2076                 "'fallthrough' and 'redirecting-with' are mutually exclusive");
2077           return false;
2078         }
2079 
2080         bool ShouldFallthrough = false;
2081         if (!parseScalarBool(I.getValue(), ShouldFallthrough))
2082           return false;
2083 
2084         if (ShouldFallthrough) {
2085           FS->Redirection = RedirectingFileSystem::RedirectKind::Fallthrough;
2086         } else {
2087           FS->Redirection = RedirectingFileSystem::RedirectKind::RedirectOnly;
2088         }
2089       } else if (Key == "redirecting-with") {
2090         if (Keys["fallthrough"].Seen) {
2091           error(I.getValue(),
2092                 "'fallthrough' and 'redirecting-with' are mutually exclusive");
2093           return false;
2094         }
2095 
2096         if (auto Kind = parseRedirectKind(I.getValue())) {
2097           FS->Redirection = *Kind;
2098         } else {
2099           error(I.getValue(), "expected valid redirect kind");
2100           return false;
2101         }
2102       } else if (Key == "root-relative") {
2103         if (auto Kind = parseRootRelativeKind(I.getValue())) {
2104           FS->RootRelative = *Kind;
2105         } else {
2106           error(I.getValue(), "expected valid root-relative kind");
2107           return false;
2108         }
2109       } else {
2110         llvm_unreachable("key missing from Keys");
2111       }
2112     }
2113 
2114     if (Stream.failed())
2115       return false;
2116 
2117     if (!checkMissingKeys(Top, Keys))
2118       return false;
2119 
2120     // Now that we sucessefully parsed the YAML file, canonicalize the internal
2121     // representation to a proper directory tree so that we can search faster
2122     // inside the VFS.
2123     for (auto &E : RootEntries)
2124       uniqueOverlayTree(FS, E.get());
2125 
2126     return true;
2127   }
2128 };
2129 
2130 std::unique_ptr<RedirectingFileSystem>
2131 RedirectingFileSystem::create(std::unique_ptr<MemoryBuffer> Buffer,
2132                               SourceMgr::DiagHandlerTy DiagHandler,
2133                               StringRef YAMLFilePath, void *DiagContext,
2134                               IntrusiveRefCntPtr<FileSystem> ExternalFS) {
2135   SourceMgr SM;
2136   yaml::Stream Stream(Buffer->getMemBufferRef(), SM);
2137 
2138   SM.setDiagHandler(DiagHandler, DiagContext);
2139   yaml::document_iterator DI = Stream.begin();
2140   yaml::Node *Root = DI->getRoot();
2141   if (DI == Stream.end() || !Root) {
2142     SM.PrintMessage(SMLoc(), SourceMgr::DK_Error, "expected root node");
2143     return nullptr;
2144   }
2145 
2146   RedirectingFileSystemParser P(Stream);
2147 
2148   std::unique_ptr<RedirectingFileSystem> FS(
2149       new RedirectingFileSystem(ExternalFS));
2150 
2151   if (!YAMLFilePath.empty()) {
2152     // Use the YAML path from -ivfsoverlay to compute the dir to be prefixed
2153     // to each 'external-contents' path.
2154     //
2155     // Example:
2156     //    -ivfsoverlay dummy.cache/vfs/vfs.yaml
2157     // yields:
2158     //  FS->OverlayFileDir => /<absolute_path_to>/dummy.cache/vfs
2159     //
2160     SmallString<256> OverlayAbsDir = sys::path::parent_path(YAMLFilePath);
2161     std::error_code EC = llvm::sys::fs::make_absolute(OverlayAbsDir);
2162     assert(!EC && "Overlay dir final path must be absolute");
2163     (void)EC;
2164     FS->setOverlayFileDir(OverlayAbsDir);
2165   }
2166 
2167   if (!P.parse(Root, FS.get()))
2168     return nullptr;
2169 
2170   return FS;
2171 }
2172 
2173 std::unique_ptr<RedirectingFileSystem> RedirectingFileSystem::create(
2174     ArrayRef<std::pair<std::string, std::string>> RemappedFiles,
2175     bool UseExternalNames, FileSystem &ExternalFS) {
2176   std::unique_ptr<RedirectingFileSystem> FS(
2177       new RedirectingFileSystem(&ExternalFS));
2178   FS->UseExternalNames = UseExternalNames;
2179 
2180   StringMap<RedirectingFileSystem::Entry *> Entries;
2181 
2182   for (auto &Mapping : llvm::reverse(RemappedFiles)) {
2183     SmallString<128> From = StringRef(Mapping.first);
2184     SmallString<128> To = StringRef(Mapping.second);
2185     {
2186       auto EC = ExternalFS.makeAbsolute(From);
2187       (void)EC;
2188       assert(!EC && "Could not make absolute path");
2189     }
2190 
2191     // Check if we've already mapped this file. The first one we see (in the
2192     // reverse iteration) wins.
2193     RedirectingFileSystem::Entry *&ToEntry = Entries[From];
2194     if (ToEntry)
2195       continue;
2196 
2197     // Add parent directories.
2198     RedirectingFileSystem::Entry *Parent = nullptr;
2199     StringRef FromDirectory = llvm::sys::path::parent_path(From);
2200     for (auto I = llvm::sys::path::begin(FromDirectory),
2201               E = llvm::sys::path::end(FromDirectory);
2202          I != E; ++I) {
2203       Parent = RedirectingFileSystemParser::lookupOrCreateEntry(FS.get(), *I,
2204                                                                 Parent);
2205     }
2206     assert(Parent && "File without a directory?");
2207     {
2208       auto EC = ExternalFS.makeAbsolute(To);
2209       (void)EC;
2210       assert(!EC && "Could not make absolute path");
2211     }
2212 
2213     // Add the file.
2214     auto NewFile = std::make_unique<RedirectingFileSystem::FileEntry>(
2215         llvm::sys::path::filename(From), To,
2216         UseExternalNames ? RedirectingFileSystem::NK_External
2217                          : RedirectingFileSystem::NK_Virtual);
2218     ToEntry = NewFile.get();
2219     cast<RedirectingFileSystem::DirectoryEntry>(Parent)->addContent(
2220         std::move(NewFile));
2221   }
2222 
2223   return FS;
2224 }
2225 
2226 RedirectingFileSystem::LookupResult::LookupResult(
2227     Entry *E, sys::path::const_iterator Start, sys::path::const_iterator End)
2228     : E(E) {
2229   assert(E != nullptr);
2230   // If the matched entry is a DirectoryRemapEntry, set ExternalRedirect to the
2231   // path of the directory it maps to in the external file system plus any
2232   // remaining path components in the provided iterator.
2233   if (auto *DRE = dyn_cast<RedirectingFileSystem::DirectoryRemapEntry>(E)) {
2234     SmallString<256> Redirect(DRE->getExternalContentsPath());
2235     sys::path::append(Redirect, Start, End,
2236                       getExistingStyle(DRE->getExternalContentsPath()));
2237     ExternalRedirect = std::string(Redirect);
2238   }
2239 }
2240 
2241 std::error_code
2242 RedirectingFileSystem::makeCanonical(SmallVectorImpl<char> &Path) const {
2243   if (std::error_code EC = makeAbsolute(Path))
2244     return EC;
2245 
2246   llvm::SmallString<256> CanonicalPath =
2247       canonicalize(StringRef(Path.data(), Path.size()));
2248   if (CanonicalPath.empty())
2249     return make_error_code(llvm::errc::invalid_argument);
2250 
2251   Path.assign(CanonicalPath.begin(), CanonicalPath.end());
2252   return {};
2253 }
2254 
2255 ErrorOr<RedirectingFileSystem::LookupResult>
2256 RedirectingFileSystem::lookupPath(StringRef Path) const {
2257   sys::path::const_iterator Start = sys::path::begin(Path);
2258   sys::path::const_iterator End = sys::path::end(Path);
2259   for (const auto &Root : Roots) {
2260     ErrorOr<RedirectingFileSystem::LookupResult> Result =
2261         lookupPathImpl(Start, End, Root.get());
2262     if (Result || Result.getError() != llvm::errc::no_such_file_or_directory)
2263       return Result;
2264   }
2265   return make_error_code(llvm::errc::no_such_file_or_directory);
2266 }
2267 
2268 ErrorOr<RedirectingFileSystem::LookupResult>
2269 RedirectingFileSystem::lookupPathImpl(
2270     sys::path::const_iterator Start, sys::path::const_iterator End,
2271     RedirectingFileSystem::Entry *From) const {
2272   assert(!isTraversalComponent(*Start) &&
2273          !isTraversalComponent(From->getName()) &&
2274          "Paths should not contain traversal components");
2275 
2276   StringRef FromName = From->getName();
2277 
2278   // Forward the search to the next component in case this is an empty one.
2279   if (!FromName.empty()) {
2280     if (!pathComponentMatches(*Start, FromName))
2281       return make_error_code(llvm::errc::no_such_file_or_directory);
2282 
2283     ++Start;
2284 
2285     if (Start == End) {
2286       // Match!
2287       return LookupResult(From, Start, End);
2288     }
2289   }
2290 
2291   if (isa<RedirectingFileSystem::FileEntry>(From))
2292     return make_error_code(llvm::errc::not_a_directory);
2293 
2294   if (isa<RedirectingFileSystem::DirectoryRemapEntry>(From))
2295     return LookupResult(From, Start, End);
2296 
2297   auto *DE = cast<RedirectingFileSystem::DirectoryEntry>(From);
2298   for (const std::unique_ptr<RedirectingFileSystem::Entry> &DirEntry :
2299        llvm::make_range(DE->contents_begin(), DE->contents_end())) {
2300     ErrorOr<RedirectingFileSystem::LookupResult> Result =
2301         lookupPathImpl(Start, End, DirEntry.get());
2302     if (Result || Result.getError() != llvm::errc::no_such_file_or_directory)
2303       return Result;
2304   }
2305 
2306   return make_error_code(llvm::errc::no_such_file_or_directory);
2307 }
2308 
2309 static Status getRedirectedFileStatus(const Twine &OriginalPath,
2310                                       bool UseExternalNames,
2311                                       Status ExternalStatus) {
2312   // The path has been mapped by some nested VFS and exposes an external path,
2313   // don't override it with the original path.
2314   if (ExternalStatus.ExposesExternalVFSPath)
2315     return ExternalStatus;
2316 
2317   Status S = ExternalStatus;
2318   if (!UseExternalNames)
2319     S = Status::copyWithNewName(S, OriginalPath);
2320   else
2321     S.ExposesExternalVFSPath = true;
2322   S.IsVFSMapped = true;
2323   return S;
2324 }
2325 
2326 ErrorOr<Status> RedirectingFileSystem::status(
2327     const Twine &CanonicalPath, const Twine &OriginalPath,
2328     const RedirectingFileSystem::LookupResult &Result) {
2329   if (std::optional<StringRef> ExtRedirect = Result.getExternalRedirect()) {
2330     SmallString<256> CanonicalRemappedPath((*ExtRedirect).str());
2331     if (std::error_code EC = makeCanonical(CanonicalRemappedPath))
2332       return EC;
2333 
2334     ErrorOr<Status> S = ExternalFS->status(CanonicalRemappedPath);
2335     if (!S)
2336       return S;
2337     S = Status::copyWithNewName(*S, *ExtRedirect);
2338     auto *RE = cast<RedirectingFileSystem::RemapEntry>(Result.E);
2339     return getRedirectedFileStatus(OriginalPath,
2340                                    RE->useExternalName(UseExternalNames), *S);
2341   }
2342 
2343   auto *DE = cast<RedirectingFileSystem::DirectoryEntry>(Result.E);
2344   return Status::copyWithNewName(DE->getStatus(), CanonicalPath);
2345 }
2346 
2347 ErrorOr<Status>
2348 RedirectingFileSystem::getExternalStatus(const Twine &CanonicalPath,
2349                                          const Twine &OriginalPath) const {
2350   auto Result = ExternalFS->status(CanonicalPath);
2351 
2352   // The path has been mapped by some nested VFS, don't override it with the
2353   // original path.
2354   if (!Result || Result->ExposesExternalVFSPath)
2355     return Result;
2356   return Status::copyWithNewName(Result.get(), OriginalPath);
2357 }
2358 
2359 ErrorOr<Status> RedirectingFileSystem::status(const Twine &OriginalPath) {
2360   SmallString<256> CanonicalPath;
2361   OriginalPath.toVector(CanonicalPath);
2362 
2363   if (std::error_code EC = makeCanonical(CanonicalPath))
2364     return EC;
2365 
2366   if (Redirection == RedirectKind::Fallback) {
2367     // Attempt to find the original file first, only falling back to the
2368     // mapped file if that fails.
2369     ErrorOr<Status> S = getExternalStatus(CanonicalPath, OriginalPath);
2370     if (S)
2371       return S;
2372   }
2373 
2374   ErrorOr<RedirectingFileSystem::LookupResult> Result =
2375       lookupPath(CanonicalPath);
2376   if (!Result) {
2377     // Was not able to map file, fallthrough to using the original path if
2378     // that was the specified redirection type.
2379     if (Redirection == RedirectKind::Fallthrough &&
2380         isFileNotFound(Result.getError()))
2381       return getExternalStatus(CanonicalPath, OriginalPath);
2382     return Result.getError();
2383   }
2384 
2385   ErrorOr<Status> S = status(CanonicalPath, OriginalPath, *Result);
2386   if (!S && Redirection == RedirectKind::Fallthrough &&
2387       isFileNotFound(S.getError(), Result->E)) {
2388     // Mapped the file but it wasn't found in the underlying filesystem,
2389     // fallthrough to using the original path if that was the specified
2390     // redirection type.
2391     return getExternalStatus(CanonicalPath, OriginalPath);
2392   }
2393 
2394   return S;
2395 }
2396 
2397 namespace {
2398 
2399 /// Provide a file wrapper with an overriden status.
2400 class FileWithFixedStatus : public File {
2401   std::unique_ptr<File> InnerFile;
2402   Status S;
2403 
2404 public:
2405   FileWithFixedStatus(std::unique_ptr<File> InnerFile, Status S)
2406       : InnerFile(std::move(InnerFile)), S(std::move(S)) {}
2407 
2408   ErrorOr<Status> status() override { return S; }
2409   ErrorOr<std::unique_ptr<llvm::MemoryBuffer>>
2410 
2411   getBuffer(const Twine &Name, int64_t FileSize, bool RequiresNullTerminator,
2412             bool IsVolatile) override {
2413     return InnerFile->getBuffer(Name, FileSize, RequiresNullTerminator,
2414                                 IsVolatile);
2415   }
2416 
2417   std::error_code close() override { return InnerFile->close(); }
2418 
2419   void setPath(const Twine &Path) override { S = S.copyWithNewName(S, Path); }
2420 };
2421 
2422 } // namespace
2423 
2424 ErrorOr<std::unique_ptr<File>>
2425 File::getWithPath(ErrorOr<std::unique_ptr<File>> Result, const Twine &P) {
2426   // See \c getRedirectedFileStatus - don't update path if it's exposing an
2427   // external path.
2428   if (!Result || (*Result)->status()->ExposesExternalVFSPath)
2429     return Result;
2430 
2431   ErrorOr<std::unique_ptr<File>> F = std::move(*Result);
2432   auto Name = F->get()->getName();
2433   if (Name && Name.get() != P.str())
2434     F->get()->setPath(P);
2435   return F;
2436 }
2437 
2438 ErrorOr<std::unique_ptr<File>>
2439 RedirectingFileSystem::openFileForRead(const Twine &OriginalPath) {
2440   SmallString<256> CanonicalPath;
2441   OriginalPath.toVector(CanonicalPath);
2442 
2443   if (std::error_code EC = makeCanonical(CanonicalPath))
2444     return EC;
2445 
2446   if (Redirection == RedirectKind::Fallback) {
2447     // Attempt to find the original file first, only falling back to the
2448     // mapped file if that fails.
2449     auto F = File::getWithPath(ExternalFS->openFileForRead(CanonicalPath),
2450                                OriginalPath);
2451     if (F)
2452       return F;
2453   }
2454 
2455   ErrorOr<RedirectingFileSystem::LookupResult> Result =
2456       lookupPath(CanonicalPath);
2457   if (!Result) {
2458     // Was not able to map file, fallthrough to using the original path if
2459     // that was the specified redirection type.
2460     if (Redirection == RedirectKind::Fallthrough &&
2461         isFileNotFound(Result.getError()))
2462       return File::getWithPath(ExternalFS->openFileForRead(CanonicalPath),
2463                                OriginalPath);
2464     return Result.getError();
2465   }
2466 
2467   if (!Result->getExternalRedirect()) // FIXME: errc::not_a_file?
2468     return make_error_code(llvm::errc::invalid_argument);
2469 
2470   StringRef ExtRedirect = *Result->getExternalRedirect();
2471   SmallString<256> CanonicalRemappedPath(ExtRedirect.str());
2472   if (std::error_code EC = makeCanonical(CanonicalRemappedPath))
2473     return EC;
2474 
2475   auto *RE = cast<RedirectingFileSystem::RemapEntry>(Result->E);
2476 
2477   auto ExternalFile = File::getWithPath(
2478       ExternalFS->openFileForRead(CanonicalRemappedPath), ExtRedirect);
2479   if (!ExternalFile) {
2480     if (Redirection == RedirectKind::Fallthrough &&
2481         isFileNotFound(ExternalFile.getError(), Result->E)) {
2482       // Mapped the file but it wasn't found in the underlying filesystem,
2483       // fallthrough to using the original path if that was the specified
2484       // redirection type.
2485       return File::getWithPath(ExternalFS->openFileForRead(CanonicalPath),
2486                                OriginalPath);
2487     }
2488     return ExternalFile;
2489   }
2490 
2491   auto ExternalStatus = (*ExternalFile)->status();
2492   if (!ExternalStatus)
2493     return ExternalStatus.getError();
2494 
2495   // Otherwise, the file was successfully remapped. Mark it as such. Also
2496   // replace the underlying path if the external name is being used.
2497   Status S = getRedirectedFileStatus(
2498       OriginalPath, RE->useExternalName(UseExternalNames), *ExternalStatus);
2499   return std::unique_ptr<File>(
2500       std::make_unique<FileWithFixedStatus>(std::move(*ExternalFile), S));
2501 }
2502 
2503 std::error_code
2504 RedirectingFileSystem::getRealPath(const Twine &OriginalPath,
2505                                    SmallVectorImpl<char> &Output) const {
2506   SmallString<256> CanonicalPath;
2507   OriginalPath.toVector(CanonicalPath);
2508 
2509   if (std::error_code EC = makeCanonical(CanonicalPath))
2510     return EC;
2511 
2512   if (Redirection == RedirectKind::Fallback) {
2513     // Attempt to find the original file first, only falling back to the
2514     // mapped file if that fails.
2515     std::error_code EC = ExternalFS->getRealPath(CanonicalPath, Output);
2516     if (!EC)
2517       return EC;
2518   }
2519 
2520   ErrorOr<RedirectingFileSystem::LookupResult> Result =
2521       lookupPath(CanonicalPath);
2522   if (!Result) {
2523     // Was not able to map file, fallthrough to using the original path if
2524     // that was the specified redirection type.
2525     if (Redirection == RedirectKind::Fallthrough &&
2526         isFileNotFound(Result.getError()))
2527       return ExternalFS->getRealPath(CanonicalPath, Output);
2528     return Result.getError();
2529   }
2530 
2531   // If we found FileEntry or DirectoryRemapEntry, look up the mapped
2532   // path in the external file system.
2533   if (auto ExtRedirect = Result->getExternalRedirect()) {
2534     auto P = ExternalFS->getRealPath(*ExtRedirect, Output);
2535     if (P && Redirection == RedirectKind::Fallthrough &&
2536         isFileNotFound(P, Result->E)) {
2537       // Mapped the file but it wasn't found in the underlying filesystem,
2538       // fallthrough to using the original path if that was the specified
2539       // redirection type.
2540       return ExternalFS->getRealPath(CanonicalPath, Output);
2541     }
2542     return P;
2543   }
2544 
2545   // If we found a DirectoryEntry, still fallthrough to the original path if
2546   // allowed, because directories don't have a single external contents path.
2547   if (Redirection == RedirectKind::Fallthrough)
2548     return ExternalFS->getRealPath(CanonicalPath, Output);
2549   return llvm::errc::invalid_argument;
2550 }
2551 
2552 std::unique_ptr<FileSystem>
2553 vfs::getVFSFromYAML(std::unique_ptr<MemoryBuffer> Buffer,
2554                     SourceMgr::DiagHandlerTy DiagHandler,
2555                     StringRef YAMLFilePath, void *DiagContext,
2556                     IntrusiveRefCntPtr<FileSystem> ExternalFS) {
2557   return RedirectingFileSystem::create(std::move(Buffer), DiagHandler,
2558                                        YAMLFilePath, DiagContext,
2559                                        std::move(ExternalFS));
2560 }
2561 
2562 static void getVFSEntries(RedirectingFileSystem::Entry *SrcE,
2563                           SmallVectorImpl<StringRef> &Path,
2564                           SmallVectorImpl<YAMLVFSEntry> &Entries) {
2565   auto Kind = SrcE->getKind();
2566   if (Kind == RedirectingFileSystem::EK_Directory) {
2567     auto *DE = dyn_cast<RedirectingFileSystem::DirectoryEntry>(SrcE);
2568     assert(DE && "Must be a directory");
2569     for (std::unique_ptr<RedirectingFileSystem::Entry> &SubEntry :
2570          llvm::make_range(DE->contents_begin(), DE->contents_end())) {
2571       Path.push_back(SubEntry->getName());
2572       getVFSEntries(SubEntry.get(), Path, Entries);
2573       Path.pop_back();
2574     }
2575     return;
2576   }
2577 
2578   if (Kind == RedirectingFileSystem::EK_DirectoryRemap) {
2579     auto *DR = dyn_cast<RedirectingFileSystem::DirectoryRemapEntry>(SrcE);
2580     assert(DR && "Must be a directory remap");
2581     SmallString<128> VPath;
2582     for (auto &Comp : Path)
2583       llvm::sys::path::append(VPath, Comp);
2584     Entries.push_back(
2585         YAMLVFSEntry(VPath.c_str(), DR->getExternalContentsPath()));
2586     return;
2587   }
2588 
2589   assert(Kind == RedirectingFileSystem::EK_File && "Must be a EK_File");
2590   auto *FE = dyn_cast<RedirectingFileSystem::FileEntry>(SrcE);
2591   assert(FE && "Must be a file");
2592   SmallString<128> VPath;
2593   for (auto &Comp : Path)
2594     llvm::sys::path::append(VPath, Comp);
2595   Entries.push_back(YAMLVFSEntry(VPath.c_str(), FE->getExternalContentsPath()));
2596 }
2597 
2598 void vfs::collectVFSFromYAML(std::unique_ptr<MemoryBuffer> Buffer,
2599                              SourceMgr::DiagHandlerTy DiagHandler,
2600                              StringRef YAMLFilePath,
2601                              SmallVectorImpl<YAMLVFSEntry> &CollectedEntries,
2602                              void *DiagContext,
2603                              IntrusiveRefCntPtr<FileSystem> ExternalFS) {
2604   std::unique_ptr<RedirectingFileSystem> VFS = RedirectingFileSystem::create(
2605       std::move(Buffer), DiagHandler, YAMLFilePath, DiagContext,
2606       std::move(ExternalFS));
2607   if (!VFS)
2608     return;
2609   ErrorOr<RedirectingFileSystem::LookupResult> RootResult =
2610       VFS->lookupPath("/");
2611   if (!RootResult)
2612     return;
2613   SmallVector<StringRef, 8> Components;
2614   Components.push_back("/");
2615   getVFSEntries(RootResult->E, Components, CollectedEntries);
2616 }
2617 
2618 UniqueID vfs::getNextVirtualUniqueID() {
2619   static std::atomic<unsigned> UID;
2620   unsigned ID = ++UID;
2621   // The following assumes that uint64_t max will never collide with a real
2622   // dev_t value from the OS.
2623   return UniqueID(std::numeric_limits<uint64_t>::max(), ID);
2624 }
2625 
2626 void YAMLVFSWriter::addEntry(StringRef VirtualPath, StringRef RealPath,
2627                              bool IsDirectory) {
2628   assert(sys::path::is_absolute(VirtualPath) && "virtual path not absolute");
2629   assert(sys::path::is_absolute(RealPath) && "real path not absolute");
2630   assert(!pathHasTraversal(VirtualPath) && "path traversal is not supported");
2631   Mappings.emplace_back(VirtualPath, RealPath, IsDirectory);
2632 }
2633 
2634 void YAMLVFSWriter::addFileMapping(StringRef VirtualPath, StringRef RealPath) {
2635   addEntry(VirtualPath, RealPath, /*IsDirectory=*/false);
2636 }
2637 
2638 void YAMLVFSWriter::addDirectoryMapping(StringRef VirtualPath,
2639                                         StringRef RealPath) {
2640   addEntry(VirtualPath, RealPath, /*IsDirectory=*/true);
2641 }
2642 
2643 namespace {
2644 
2645 class JSONWriter {
2646   llvm::raw_ostream &OS;
2647   SmallVector<StringRef, 16> DirStack;
2648 
2649   unsigned getDirIndent() { return 4 * DirStack.size(); }
2650   unsigned getFileIndent() { return 4 * (DirStack.size() + 1); }
2651   bool containedIn(StringRef Parent, StringRef Path);
2652   StringRef containedPart(StringRef Parent, StringRef Path);
2653   void startDirectory(StringRef Path);
2654   void endDirectory();
2655   void writeEntry(StringRef VPath, StringRef RPath);
2656 
2657 public:
2658   JSONWriter(llvm::raw_ostream &OS) : OS(OS) {}
2659 
2660   void write(ArrayRef<YAMLVFSEntry> Entries,
2661              std::optional<bool> UseExternalNames,
2662              std::optional<bool> IsCaseSensitive,
2663              std::optional<bool> IsOverlayRelative, StringRef OverlayDir);
2664 };
2665 
2666 } // namespace
2667 
2668 bool JSONWriter::containedIn(StringRef Parent, StringRef Path) {
2669   using namespace llvm::sys;
2670 
2671   // Compare each path component.
2672   auto IParent = path::begin(Parent), EParent = path::end(Parent);
2673   for (auto IChild = path::begin(Path), EChild = path::end(Path);
2674        IParent != EParent && IChild != EChild; ++IParent, ++IChild) {
2675     if (*IParent != *IChild)
2676       return false;
2677   }
2678   // Have we exhausted the parent path?
2679   return IParent == EParent;
2680 }
2681 
2682 StringRef JSONWriter::containedPart(StringRef Parent, StringRef Path) {
2683   assert(!Parent.empty());
2684   assert(containedIn(Parent, Path));
2685   return Path.slice(Parent.size() + 1, StringRef::npos);
2686 }
2687 
2688 void JSONWriter::startDirectory(StringRef Path) {
2689   StringRef Name =
2690       DirStack.empty() ? Path : containedPart(DirStack.back(), Path);
2691   DirStack.push_back(Path);
2692   unsigned Indent = getDirIndent();
2693   OS.indent(Indent) << "{\n";
2694   OS.indent(Indent + 2) << "'type': 'directory',\n";
2695   OS.indent(Indent + 2) << "'name': \"" << llvm::yaml::escape(Name) << "\",\n";
2696   OS.indent(Indent + 2) << "'contents': [\n";
2697 }
2698 
2699 void JSONWriter::endDirectory() {
2700   unsigned Indent = getDirIndent();
2701   OS.indent(Indent + 2) << "]\n";
2702   OS.indent(Indent) << "}";
2703 
2704   DirStack.pop_back();
2705 }
2706 
2707 void JSONWriter::writeEntry(StringRef VPath, StringRef RPath) {
2708   unsigned Indent = getFileIndent();
2709   OS.indent(Indent) << "{\n";
2710   OS.indent(Indent + 2) << "'type': 'file',\n";
2711   OS.indent(Indent + 2) << "'name': \"" << llvm::yaml::escape(VPath) << "\",\n";
2712   OS.indent(Indent + 2) << "'external-contents': \""
2713                         << llvm::yaml::escape(RPath) << "\"\n";
2714   OS.indent(Indent) << "}";
2715 }
2716 
2717 void JSONWriter::write(ArrayRef<YAMLVFSEntry> Entries,
2718                        std::optional<bool> UseExternalNames,
2719                        std::optional<bool> IsCaseSensitive,
2720                        std::optional<bool> IsOverlayRelative,
2721                        StringRef OverlayDir) {
2722   using namespace llvm::sys;
2723 
2724   OS << "{\n"
2725         "  'version': 0,\n";
2726   if (IsCaseSensitive)
2727     OS << "  'case-sensitive': '"
2728        << (IsCaseSensitive.value() ? "true" : "false") << "',\n";
2729   if (UseExternalNames)
2730     OS << "  'use-external-names': '"
2731        << (UseExternalNames.value() ? "true" : "false") << "',\n";
2732   bool UseOverlayRelative = false;
2733   if (IsOverlayRelative) {
2734     UseOverlayRelative = IsOverlayRelative.value();
2735     OS << "  'overlay-relative': '" << (UseOverlayRelative ? "true" : "false")
2736        << "',\n";
2737   }
2738   OS << "  'roots': [\n";
2739 
2740   if (!Entries.empty()) {
2741     const YAMLVFSEntry &Entry = Entries.front();
2742 
2743     startDirectory(
2744       Entry.IsDirectory ? Entry.VPath : path::parent_path(Entry.VPath)
2745     );
2746 
2747     StringRef RPath = Entry.RPath;
2748     if (UseOverlayRelative) {
2749       unsigned OverlayDirLen = OverlayDir.size();
2750       assert(RPath.substr(0, OverlayDirLen) == OverlayDir &&
2751              "Overlay dir must be contained in RPath");
2752       RPath = RPath.slice(OverlayDirLen, RPath.size());
2753     }
2754 
2755     bool IsCurrentDirEmpty = true;
2756     if (!Entry.IsDirectory) {
2757       writeEntry(path::filename(Entry.VPath), RPath);
2758       IsCurrentDirEmpty = false;
2759     }
2760 
2761     for (const auto &Entry : Entries.slice(1)) {
2762       StringRef Dir =
2763           Entry.IsDirectory ? Entry.VPath : path::parent_path(Entry.VPath);
2764       if (Dir == DirStack.back()) {
2765         if (!IsCurrentDirEmpty) {
2766           OS << ",\n";
2767         }
2768       } else {
2769         bool IsDirPoppedFromStack = false;
2770         while (!DirStack.empty() && !containedIn(DirStack.back(), Dir)) {
2771           OS << "\n";
2772           endDirectory();
2773           IsDirPoppedFromStack = true;
2774         }
2775         if (IsDirPoppedFromStack || !IsCurrentDirEmpty) {
2776           OS << ",\n";
2777         }
2778         startDirectory(Dir);
2779         IsCurrentDirEmpty = true;
2780       }
2781       StringRef RPath = Entry.RPath;
2782       if (UseOverlayRelative) {
2783         unsigned OverlayDirLen = OverlayDir.size();
2784         assert(RPath.substr(0, OverlayDirLen) == OverlayDir &&
2785                "Overlay dir must be contained in RPath");
2786         RPath = RPath.slice(OverlayDirLen, RPath.size());
2787       }
2788       if (!Entry.IsDirectory) {
2789         writeEntry(path::filename(Entry.VPath), RPath);
2790         IsCurrentDirEmpty = false;
2791       }
2792     }
2793 
2794     while (!DirStack.empty()) {
2795       OS << "\n";
2796       endDirectory();
2797     }
2798     OS << "\n";
2799   }
2800 
2801   OS << "  ]\n"
2802      << "}\n";
2803 }
2804 
2805 void YAMLVFSWriter::write(llvm::raw_ostream &OS) {
2806   llvm::sort(Mappings, [](const YAMLVFSEntry &LHS, const YAMLVFSEntry &RHS) {
2807     return LHS.VPath < RHS.VPath;
2808   });
2809 
2810   JSONWriter(OS).write(Mappings, UseExternalNames, IsCaseSensitive,
2811                        IsOverlayRelative, OverlayDir);
2812 }
2813 
2814 vfs::recursive_directory_iterator::recursive_directory_iterator(
2815     FileSystem &FS_, const Twine &Path, std::error_code &EC)
2816     : FS(&FS_) {
2817   directory_iterator I = FS->dir_begin(Path, EC);
2818   if (I != directory_iterator()) {
2819     State = std::make_shared<detail::RecDirIterState>();
2820     State->Stack.push(I);
2821   }
2822 }
2823 
2824 vfs::recursive_directory_iterator &
2825 recursive_directory_iterator::increment(std::error_code &EC) {
2826   assert(FS && State && !State->Stack.empty() && "incrementing past end");
2827   assert(!State->Stack.top()->path().empty() && "non-canonical end iterator");
2828   vfs::directory_iterator End;
2829 
2830   if (State->HasNoPushRequest)
2831     State->HasNoPushRequest = false;
2832   else {
2833     if (State->Stack.top()->type() == sys::fs::file_type::directory_file) {
2834       vfs::directory_iterator I = FS->dir_begin(State->Stack.top()->path(), EC);
2835       if (I != End) {
2836         State->Stack.push(I);
2837         return *this;
2838       }
2839     }
2840   }
2841 
2842   while (!State->Stack.empty() && State->Stack.top().increment(EC) == End)
2843     State->Stack.pop();
2844 
2845   if (State->Stack.empty())
2846     State.reset(); // end iterator
2847 
2848   return *this;
2849 }
2850