1 //===- VirtualFileSystem.cpp - Virtual File System Layer ------------------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file implements the VirtualFileSystem interface.
11 //
12 //===----------------------------------------------------------------------===//
13 
14 #include "llvm/Support/VirtualFileSystem.h"
15 #include "llvm/ADT/ArrayRef.h"
16 #include "llvm/ADT/DenseMap.h"
17 #include "llvm/ADT/IntrusiveRefCntPtr.h"
18 #include "llvm/ADT/None.h"
19 #include "llvm/ADT/Optional.h"
20 #include "llvm/ADT/STLExtras.h"
21 #include "llvm/ADT/SmallString.h"
22 #include "llvm/ADT/SmallVector.h"
23 #include "llvm/ADT/StringRef.h"
24 #include "llvm/ADT/StringSet.h"
25 #include "llvm/ADT/Twine.h"
26 #include "llvm/ADT/iterator_range.h"
27 #include "llvm/Config/llvm-config.h"
28 #include "llvm/Support/Casting.h"
29 #include "llvm/Support/Chrono.h"
30 #include "llvm/Support/Compiler.h"
31 #include "llvm/Support/Debug.h"
32 #include "llvm/Support/Errc.h"
33 #include "llvm/Support/ErrorHandling.h"
34 #include "llvm/Support/ErrorOr.h"
35 #include "llvm/Support/FileSystem.h"
36 #include "llvm/Support/MemoryBuffer.h"
37 #include "llvm/Support/Path.h"
38 #include "llvm/Support/Process.h"
39 #include "llvm/Support/SMLoc.h"
40 #include "llvm/Support/SourceMgr.h"
41 #include "llvm/Support/YAMLParser.h"
42 #include "llvm/Support/raw_ostream.h"
43 #include <algorithm>
44 #include <atomic>
45 #include <cassert>
46 #include <cstdint>
47 #include <iterator>
48 #include <limits>
49 #include <map>
50 #include <memory>
51 #include <mutex>
52 #include <string>
53 #include <system_error>
54 #include <utility>
55 #include <vector>
56 
57 using namespace llvm;
58 using namespace llvm::vfs;
59 
60 using llvm::sys::fs::file_status;
61 using llvm::sys::fs::file_type;
62 using llvm::sys::fs::perms;
63 using llvm::sys::fs::UniqueID;
64 
65 Status::Status(const file_status &Status)
66     : UID(Status.getUniqueID()), MTime(Status.getLastModificationTime()),
67       User(Status.getUser()), Group(Status.getGroup()), Size(Status.getSize()),
68       Type(Status.type()), Perms(Status.permissions()) {}
69 
70 Status::Status(StringRef Name, UniqueID UID, sys::TimePoint<> MTime,
71                uint32_t User, uint32_t Group, uint64_t Size, file_type Type,
72                perms Perms)
73     : Name(Name), UID(UID), MTime(MTime), User(User), Group(Group), Size(Size),
74       Type(Type), Perms(Perms) {}
75 
76 Status Status::copyWithNewName(const Status &In, StringRef NewName) {
77   return Status(NewName, In.getUniqueID(), In.getLastModificationTime(),
78                 In.getUser(), In.getGroup(), In.getSize(), In.getType(),
79                 In.getPermissions());
80 }
81 
82 Status Status::copyWithNewName(const file_status &In, StringRef NewName) {
83   return Status(NewName, In.getUniqueID(), In.getLastModificationTime(),
84                 In.getUser(), In.getGroup(), In.getSize(), In.type(),
85                 In.permissions());
86 }
87 
88 bool Status::equivalent(const Status &Other) const {
89   assert(isStatusKnown() && Other.isStatusKnown());
90   return getUniqueID() == Other.getUniqueID();
91 }
92 
93 bool Status::isDirectory() const { return Type == file_type::directory_file; }
94 
95 bool Status::isRegularFile() const { return Type == file_type::regular_file; }
96 
97 bool Status::isOther() const {
98   return exists() && !isRegularFile() && !isDirectory() && !isSymlink();
99 }
100 
101 bool Status::isSymlink() const { return Type == file_type::symlink_file; }
102 
103 bool Status::isStatusKnown() const { return Type != file_type::status_error; }
104 
105 bool Status::exists() const {
106   return isStatusKnown() && Type != file_type::file_not_found;
107 }
108 
109 File::~File() = default;
110 
111 FileSystem::~FileSystem() = default;
112 
113 ErrorOr<std::unique_ptr<MemoryBuffer>>
114 FileSystem::getBufferForFile(const llvm::Twine &Name, int64_t FileSize,
115                              bool RequiresNullTerminator, bool IsVolatile) {
116   auto F = openFileForRead(Name);
117   if (!F)
118     return F.getError();
119 
120   return (*F)->getBuffer(Name, FileSize, RequiresNullTerminator, IsVolatile);
121 }
122 
123 std::error_code FileSystem::makeAbsolute(SmallVectorImpl<char> &Path) const {
124   if (llvm::sys::path::is_absolute(Path))
125     return {};
126 
127   auto WorkingDir = getCurrentWorkingDirectory();
128   if (!WorkingDir)
129     return WorkingDir.getError();
130 
131   return llvm::sys::fs::make_absolute(WorkingDir.get(), Path);
132 }
133 
134 std::error_code FileSystem::getRealPath(const Twine &Path,
135                                         SmallVectorImpl<char> &Output) const {
136   return errc::operation_not_permitted;
137 }
138 
139 bool FileSystem::exists(const Twine &Path) {
140   auto Status = status(Path);
141   return Status && Status->exists();
142 }
143 
144 #ifndef NDEBUG
145 static bool isTraversalComponent(StringRef Component) {
146   return Component.equals("..") || Component.equals(".");
147 }
148 
149 static bool pathHasTraversal(StringRef Path) {
150   using namespace llvm::sys;
151 
152   for (StringRef Comp : llvm::make_range(path::begin(Path), path::end(Path)))
153     if (isTraversalComponent(Comp))
154       return true;
155   return false;
156 }
157 #endif
158 
159 //===-----------------------------------------------------------------------===/
160 // RealFileSystem implementation
161 //===-----------------------------------------------------------------------===/
162 
163 namespace {
164 
165 /// Wrapper around a raw file descriptor.
166 class RealFile : public File {
167   friend class RealFileSystem;
168 
169   int FD;
170   Status S;
171   std::string RealName;
172 
173   RealFile(int FD, StringRef NewName, StringRef NewRealPathName)
174       : FD(FD), S(NewName, {}, {}, {}, {}, {},
175                   llvm::sys::fs::file_type::status_error, {}),
176         RealName(NewRealPathName.str()) {
177     assert(FD >= 0 && "Invalid or inactive file descriptor");
178   }
179 
180 public:
181   ~RealFile() override;
182 
183   ErrorOr<Status> status() override;
184   ErrorOr<std::string> getName() override;
185   ErrorOr<std::unique_ptr<MemoryBuffer>> getBuffer(const Twine &Name,
186                                                    int64_t FileSize,
187                                                    bool RequiresNullTerminator,
188                                                    bool IsVolatile) override;
189   std::error_code close() override;
190 };
191 
192 } // namespace
193 
194 RealFile::~RealFile() { close(); }
195 
196 ErrorOr<Status> RealFile::status() {
197   assert(FD != -1 && "cannot stat closed file");
198   if (!S.isStatusKnown()) {
199     file_status RealStatus;
200     if (std::error_code EC = sys::fs::status(FD, RealStatus))
201       return EC;
202     S = Status::copyWithNewName(RealStatus, S.getName());
203   }
204   return S;
205 }
206 
207 ErrorOr<std::string> RealFile::getName() {
208   return RealName.empty() ? S.getName().str() : RealName;
209 }
210 
211 ErrorOr<std::unique_ptr<MemoryBuffer>>
212 RealFile::getBuffer(const Twine &Name, int64_t FileSize,
213                     bool RequiresNullTerminator, bool IsVolatile) {
214   assert(FD != -1 && "cannot get buffer for closed file");
215   return MemoryBuffer::getOpenFile(FD, Name, FileSize, RequiresNullTerminator,
216                                    IsVolatile);
217 }
218 
219 std::error_code RealFile::close() {
220   std::error_code EC = sys::Process::SafelyCloseFileDescriptor(FD);
221   FD = -1;
222   return EC;
223 }
224 
225 namespace {
226 
227 /// The file system according to your operating system.
228 class RealFileSystem : public FileSystem {
229 public:
230   ErrorOr<Status> status(const Twine &Path) override;
231   ErrorOr<std::unique_ptr<File>> openFileForRead(const Twine &Path) override;
232   directory_iterator dir_begin(const Twine &Dir, std::error_code &EC) override;
233 
234   llvm::ErrorOr<std::string> getCurrentWorkingDirectory() const override;
235   std::error_code setCurrentWorkingDirectory(const Twine &Path) override;
236   std::error_code getRealPath(const Twine &Path,
237                               SmallVectorImpl<char> &Output) const override;
238 
239 private:
240   mutable std::mutex CWDMutex;
241   mutable std::string CWDCache;
242 };
243 
244 } // namespace
245 
246 ErrorOr<Status> RealFileSystem::status(const Twine &Path) {
247   sys::fs::file_status RealStatus;
248   if (std::error_code EC = sys::fs::status(Path, RealStatus))
249     return EC;
250   return Status::copyWithNewName(RealStatus, Path.str());
251 }
252 
253 ErrorOr<std::unique_ptr<File>>
254 RealFileSystem::openFileForRead(const Twine &Name) {
255   int FD;
256   SmallString<256> RealName;
257   if (std::error_code EC =
258           sys::fs::openFileForRead(Name, FD, sys::fs::OF_None, &RealName))
259     return EC;
260   return std::unique_ptr<File>(new RealFile(FD, Name.str(), RealName.str()));
261 }
262 
263 llvm::ErrorOr<std::string> RealFileSystem::getCurrentWorkingDirectory() const {
264   std::lock_guard<std::mutex> Lock(CWDMutex);
265   if (!CWDCache.empty())
266     return CWDCache;
267   SmallString<256> Dir;
268   if (std::error_code EC = llvm::sys::fs::current_path(Dir))
269     return EC;
270   CWDCache = Dir.str();
271   return CWDCache;
272 }
273 
274 std::error_code RealFileSystem::setCurrentWorkingDirectory(const Twine &Path) {
275   // FIXME: chdir is thread hostile; on the other hand, creating the same
276   // behavior as chdir is complex: chdir resolves the path once, thus
277   // guaranteeing that all subsequent relative path operations work
278   // on the same path the original chdir resulted in. This makes a
279   // difference for example on network filesystems, where symlinks might be
280   // switched during runtime of the tool. Fixing this depends on having a
281   // file system abstraction that allows openat() style interactions.
282   if (auto EC = llvm::sys::fs::set_current_path(Path))
283     return EC;
284 
285   // Invalidate cache.
286   std::lock_guard<std::mutex> Lock(CWDMutex);
287   CWDCache.clear();
288   return std::error_code();
289 }
290 
291 std::error_code
292 RealFileSystem::getRealPath(const Twine &Path,
293                             SmallVectorImpl<char> &Output) const {
294   return llvm::sys::fs::real_path(Path, Output);
295 }
296 
297 IntrusiveRefCntPtr<FileSystem> vfs::getRealFileSystem() {
298   static IntrusiveRefCntPtr<FileSystem> FS = new RealFileSystem();
299   return FS;
300 }
301 
302 namespace {
303 
304 class RealFSDirIter : public llvm::vfs::detail::DirIterImpl {
305   llvm::sys::fs::directory_iterator Iter;
306 
307 public:
308   RealFSDirIter(const Twine &Path, std::error_code &EC) : Iter(Path, EC) {
309     if (Iter != llvm::sys::fs::directory_iterator())
310       CurrentEntry = directory_entry(Iter->path(), Iter->type());
311   }
312 
313   std::error_code increment() override {
314     std::error_code EC;
315     Iter.increment(EC);
316     CurrentEntry = (Iter == llvm::sys::fs::directory_iterator())
317                        ? directory_entry()
318                        : directory_entry(Iter->path(), Iter->type());
319     return EC;
320   }
321 };
322 
323 } // namespace
324 
325 directory_iterator RealFileSystem::dir_begin(const Twine &Dir,
326                                              std::error_code &EC) {
327   return directory_iterator(std::make_shared<RealFSDirIter>(Dir, EC));
328 }
329 
330 //===-----------------------------------------------------------------------===/
331 // OverlayFileSystem implementation
332 //===-----------------------------------------------------------------------===/
333 
334 OverlayFileSystem::OverlayFileSystem(IntrusiveRefCntPtr<FileSystem> BaseFS) {
335   FSList.push_back(std::move(BaseFS));
336 }
337 
338 void OverlayFileSystem::pushOverlay(IntrusiveRefCntPtr<FileSystem> FS) {
339   FSList.push_back(FS);
340   // Synchronize added file systems by duplicating the working directory from
341   // the first one in the list.
342   FS->setCurrentWorkingDirectory(getCurrentWorkingDirectory().get());
343 }
344 
345 ErrorOr<Status> OverlayFileSystem::status(const Twine &Path) {
346   // FIXME: handle symlinks that cross file systems
347   for (iterator I = overlays_begin(), E = overlays_end(); I != E; ++I) {
348     ErrorOr<Status> Status = (*I)->status(Path);
349     if (Status || Status.getError() != llvm::errc::no_such_file_or_directory)
350       return Status;
351   }
352   return make_error_code(llvm::errc::no_such_file_or_directory);
353 }
354 
355 ErrorOr<std::unique_ptr<File>>
356 OverlayFileSystem::openFileForRead(const llvm::Twine &Path) {
357   // FIXME: handle symlinks that cross file systems
358   for (iterator I = overlays_begin(), E = overlays_end(); I != E; ++I) {
359     auto Result = (*I)->openFileForRead(Path);
360     if (Result || Result.getError() != llvm::errc::no_such_file_or_directory)
361       return Result;
362   }
363   return make_error_code(llvm::errc::no_such_file_or_directory);
364 }
365 
366 llvm::ErrorOr<std::string>
367 OverlayFileSystem::getCurrentWorkingDirectory() const {
368   // All file systems are synchronized, just take the first working directory.
369   return FSList.front()->getCurrentWorkingDirectory();
370 }
371 
372 std::error_code
373 OverlayFileSystem::setCurrentWorkingDirectory(const Twine &Path) {
374   for (auto &FS : FSList)
375     if (std::error_code EC = FS->setCurrentWorkingDirectory(Path))
376       return EC;
377   return {};
378 }
379 
380 std::error_code
381 OverlayFileSystem::getRealPath(const Twine &Path,
382                                SmallVectorImpl<char> &Output) const {
383   for (auto &FS : FSList)
384     if (FS->exists(Path))
385       return FS->getRealPath(Path, Output);
386   return errc::no_such_file_or_directory;
387 }
388 
389 llvm::vfs::detail::DirIterImpl::~DirIterImpl() = default;
390 
391 namespace {
392 
393 class OverlayFSDirIterImpl : public llvm::vfs::detail::DirIterImpl {
394   OverlayFileSystem &Overlays;
395   std::string Path;
396   OverlayFileSystem::iterator CurrentFS;
397   directory_iterator CurrentDirIter;
398   llvm::StringSet<> SeenNames;
399 
400   std::error_code incrementFS() {
401     assert(CurrentFS != Overlays.overlays_end() && "incrementing past end");
402     ++CurrentFS;
403     for (auto E = Overlays.overlays_end(); CurrentFS != E; ++CurrentFS) {
404       std::error_code EC;
405       CurrentDirIter = (*CurrentFS)->dir_begin(Path, EC);
406       if (EC && EC != errc::no_such_file_or_directory)
407         return EC;
408       if (CurrentDirIter != directory_iterator())
409         break; // found
410     }
411     return {};
412   }
413 
414   std::error_code incrementDirIter(bool IsFirstTime) {
415     assert((IsFirstTime || CurrentDirIter != directory_iterator()) &&
416            "incrementing past end");
417     std::error_code EC;
418     if (!IsFirstTime)
419       CurrentDirIter.increment(EC);
420     if (!EC && CurrentDirIter == directory_iterator())
421       EC = incrementFS();
422     return EC;
423   }
424 
425   std::error_code incrementImpl(bool IsFirstTime) {
426     while (true) {
427       std::error_code EC = incrementDirIter(IsFirstTime);
428       if (EC || CurrentDirIter == directory_iterator()) {
429         CurrentEntry = directory_entry();
430         return EC;
431       }
432       CurrentEntry = *CurrentDirIter;
433       StringRef Name = llvm::sys::path::filename(CurrentEntry.path());
434       if (SeenNames.insert(Name).second)
435         return EC; // name not seen before
436     }
437     llvm_unreachable("returned above");
438   }
439 
440 public:
441   OverlayFSDirIterImpl(const Twine &Path, OverlayFileSystem &FS,
442                        std::error_code &EC)
443       : Overlays(FS), Path(Path.str()), CurrentFS(Overlays.overlays_begin()) {
444     CurrentDirIter = (*CurrentFS)->dir_begin(Path, EC);
445     EC = incrementImpl(true);
446   }
447 
448   std::error_code increment() override { return incrementImpl(false); }
449 };
450 
451 } // namespace
452 
453 directory_iterator OverlayFileSystem::dir_begin(const Twine &Dir,
454                                                 std::error_code &EC) {
455   return directory_iterator(
456       std::make_shared<OverlayFSDirIterImpl>(Dir, *this, EC));
457 }
458 
459 namespace llvm {
460 namespace vfs {
461 
462 namespace detail {
463 
464 enum InMemoryNodeKind { IME_File, IME_Directory, IME_HardLink };
465 
466 /// The in memory file system is a tree of Nodes. Every node can either be a
467 /// file , hardlink or a directory.
468 class InMemoryNode {
469   InMemoryNodeKind Kind;
470   std::string FileName;
471 
472 public:
473   InMemoryNode(llvm::StringRef FileName, InMemoryNodeKind Kind)
474       : Kind(Kind), FileName(llvm::sys::path::filename(FileName)) {}
475   virtual ~InMemoryNode() = default;
476 
477   /// Get the filename of this node (the name without the directory part).
478   StringRef getFileName() const { return FileName; }
479   InMemoryNodeKind getKind() const { return Kind; }
480   virtual std::string toString(unsigned Indent) const = 0;
481 };
482 
483 class InMemoryFile : public InMemoryNode {
484   Status Stat;
485   std::unique_ptr<llvm::MemoryBuffer> Buffer;
486 
487 public:
488   InMemoryFile(Status Stat, std::unique_ptr<llvm::MemoryBuffer> Buffer)
489       : InMemoryNode(Stat.getName(), IME_File), Stat(std::move(Stat)),
490         Buffer(std::move(Buffer)) {}
491 
492   /// Return the \p Status for this node. \p RequestedName should be the name
493   /// through which the caller referred to this node. It will override
494   /// \p Status::Name in the return value, to mimic the behavior of \p RealFile.
495   Status getStatus(StringRef RequestedName) const {
496     return Status::copyWithNewName(Stat, RequestedName);
497   }
498   llvm::MemoryBuffer *getBuffer() const { return Buffer.get(); }
499 
500   std::string toString(unsigned Indent) const override {
501     return (std::string(Indent, ' ') + Stat.getName() + "\n").str();
502   }
503 
504   static bool classof(const InMemoryNode *N) {
505     return N->getKind() == IME_File;
506   }
507 };
508 
509 namespace {
510 
511 class InMemoryHardLink : public InMemoryNode {
512   const InMemoryFile &ResolvedFile;
513 
514 public:
515   InMemoryHardLink(StringRef Path, const InMemoryFile &ResolvedFile)
516       : InMemoryNode(Path, IME_HardLink), ResolvedFile(ResolvedFile) {}
517   const InMemoryFile &getResolvedFile() const { return ResolvedFile; }
518 
519   std::string toString(unsigned Indent) const override {
520     return std::string(Indent, ' ') + "HardLink to -> " +
521            ResolvedFile.toString(0);
522   }
523 
524   static bool classof(const InMemoryNode *N) {
525     return N->getKind() == IME_HardLink;
526   }
527 };
528 
529 /// Adapt a InMemoryFile for VFS' File interface.  The goal is to make
530 /// \p InMemoryFileAdaptor mimic as much as possible the behavior of
531 /// \p RealFile.
532 class InMemoryFileAdaptor : public File {
533   const InMemoryFile &Node;
534   /// The name to use when returning a Status for this file.
535   std::string RequestedName;
536 
537 public:
538   explicit InMemoryFileAdaptor(const InMemoryFile &Node,
539                                std::string RequestedName)
540       : Node(Node), RequestedName(std::move(RequestedName)) {}
541 
542   llvm::ErrorOr<Status> status() override {
543     return Node.getStatus(RequestedName);
544   }
545 
546   llvm::ErrorOr<std::unique_ptr<llvm::MemoryBuffer>>
547   getBuffer(const Twine &Name, int64_t FileSize, bool RequiresNullTerminator,
548             bool IsVolatile) override {
549     llvm::MemoryBuffer *Buf = Node.getBuffer();
550     return llvm::MemoryBuffer::getMemBuffer(
551         Buf->getBuffer(), Buf->getBufferIdentifier(), RequiresNullTerminator);
552   }
553 
554   std::error_code close() override { return {}; }
555 };
556 } // namespace
557 
558 class InMemoryDirectory : public InMemoryNode {
559   Status Stat;
560   llvm::StringMap<std::unique_ptr<InMemoryNode>> Entries;
561 
562 public:
563   InMemoryDirectory(Status Stat)
564       : InMemoryNode(Stat.getName(), IME_Directory), Stat(std::move(Stat)) {}
565 
566   /// Return the \p Status for this node. \p RequestedName should be the name
567   /// through which the caller referred to this node. It will override
568   /// \p Status::Name in the return value, to mimic the behavior of \p RealFile.
569   Status getStatus(StringRef RequestedName) const {
570     return Status::copyWithNewName(Stat, RequestedName);
571   }
572   InMemoryNode *getChild(StringRef Name) {
573     auto I = Entries.find(Name);
574     if (I != Entries.end())
575       return I->second.get();
576     return nullptr;
577   }
578 
579   InMemoryNode *addChild(StringRef Name, std::unique_ptr<InMemoryNode> Child) {
580     return Entries.insert(make_pair(Name, std::move(Child)))
581         .first->second.get();
582   }
583 
584   using const_iterator = decltype(Entries)::const_iterator;
585 
586   const_iterator begin() const { return Entries.begin(); }
587   const_iterator end() const { return Entries.end(); }
588 
589   std::string toString(unsigned Indent) const override {
590     std::string Result =
591         (std::string(Indent, ' ') + Stat.getName() + "\n").str();
592     for (const auto &Entry : Entries)
593       Result += Entry.second->toString(Indent + 2);
594     return Result;
595   }
596 
597   static bool classof(const InMemoryNode *N) {
598     return N->getKind() == IME_Directory;
599   }
600 };
601 
602 namespace {
603 Status getNodeStatus(const InMemoryNode *Node, StringRef RequestedName) {
604   if (auto Dir = dyn_cast<detail::InMemoryDirectory>(Node))
605     return Dir->getStatus(RequestedName);
606   if (auto File = dyn_cast<detail::InMemoryFile>(Node))
607     return File->getStatus(RequestedName);
608   if (auto Link = dyn_cast<detail::InMemoryHardLink>(Node))
609     return Link->getResolvedFile().getStatus(RequestedName);
610   llvm_unreachable("Unknown node type");
611 }
612 } // namespace
613 } // namespace detail
614 
615 InMemoryFileSystem::InMemoryFileSystem(bool UseNormalizedPaths)
616     : Root(new detail::InMemoryDirectory(
617           Status("", getNextVirtualUniqueID(), llvm::sys::TimePoint<>(), 0, 0,
618                  0, llvm::sys::fs::file_type::directory_file,
619                  llvm::sys::fs::perms::all_all))),
620       UseNormalizedPaths(UseNormalizedPaths) {}
621 
622 InMemoryFileSystem::~InMemoryFileSystem() = default;
623 
624 std::string InMemoryFileSystem::toString() const {
625   return Root->toString(/*Indent=*/0);
626 }
627 
628 bool InMemoryFileSystem::addFile(const Twine &P, time_t ModificationTime,
629                                  std::unique_ptr<llvm::MemoryBuffer> Buffer,
630                                  Optional<uint32_t> User,
631                                  Optional<uint32_t> Group,
632                                  Optional<llvm::sys::fs::file_type> Type,
633                                  Optional<llvm::sys::fs::perms> Perms,
634                                  const detail::InMemoryFile *HardLinkTarget) {
635   SmallString<128> Path;
636   P.toVector(Path);
637 
638   // Fix up relative paths. This just prepends the current working directory.
639   std::error_code EC = makeAbsolute(Path);
640   assert(!EC);
641   (void)EC;
642 
643   if (useNormalizedPaths())
644     llvm::sys::path::remove_dots(Path, /*remove_dot_dot=*/true);
645 
646   if (Path.empty())
647     return false;
648 
649   detail::InMemoryDirectory *Dir = Root.get();
650   auto I = llvm::sys::path::begin(Path), E = sys::path::end(Path);
651   const auto ResolvedUser = User.getValueOr(0);
652   const auto ResolvedGroup = Group.getValueOr(0);
653   const auto ResolvedType = Type.getValueOr(sys::fs::file_type::regular_file);
654   const auto ResolvedPerms = Perms.getValueOr(sys::fs::all_all);
655   assert(!(HardLinkTarget && Buffer) && "HardLink cannot have a buffer");
656   // Any intermediate directories we create should be accessible by
657   // the owner, even if Perms says otherwise for the final path.
658   const auto NewDirectoryPerms = ResolvedPerms | sys::fs::owner_all;
659   while (true) {
660     StringRef Name = *I;
661     detail::InMemoryNode *Node = Dir->getChild(Name);
662     ++I;
663     if (!Node) {
664       if (I == E) {
665         // End of the path.
666         std::unique_ptr<detail::InMemoryNode> Child;
667         if (HardLinkTarget)
668           Child.reset(new detail::InMemoryHardLink(P.str(), *HardLinkTarget));
669         else {
670           // Create a new file or directory.
671           Status Stat(P.str(), getNextVirtualUniqueID(),
672                       llvm::sys::toTimePoint(ModificationTime), ResolvedUser,
673                       ResolvedGroup, Buffer->getBufferSize(), ResolvedType,
674                       ResolvedPerms);
675           if (ResolvedType == sys::fs::file_type::directory_file) {
676             Child.reset(new detail::InMemoryDirectory(std::move(Stat)));
677           } else {
678             Child.reset(
679                 new detail::InMemoryFile(std::move(Stat), std::move(Buffer)));
680           }
681         }
682         Dir->addChild(Name, std::move(Child));
683         return true;
684       }
685 
686       // Create a new directory. Use the path up to here.
687       Status Stat(
688           StringRef(Path.str().begin(), Name.end() - Path.str().begin()),
689           getNextVirtualUniqueID(), llvm::sys::toTimePoint(ModificationTime),
690           ResolvedUser, ResolvedGroup, 0, sys::fs::file_type::directory_file,
691           NewDirectoryPerms);
692       Dir = cast<detail::InMemoryDirectory>(Dir->addChild(
693           Name, llvm::make_unique<detail::InMemoryDirectory>(std::move(Stat))));
694       continue;
695     }
696 
697     if (auto *NewDir = dyn_cast<detail::InMemoryDirectory>(Node)) {
698       Dir = NewDir;
699     } else {
700       assert((isa<detail::InMemoryFile>(Node) ||
701               isa<detail::InMemoryHardLink>(Node)) &&
702              "Must be either file, hardlink or directory!");
703 
704       // Trying to insert a directory in place of a file.
705       if (I != E)
706         return false;
707 
708       // Return false only if the new file is different from the existing one.
709       if (auto Link = dyn_cast<detail::InMemoryHardLink>(Node)) {
710         return Link->getResolvedFile().getBuffer()->getBuffer() ==
711                Buffer->getBuffer();
712       }
713       return cast<detail::InMemoryFile>(Node)->getBuffer()->getBuffer() ==
714              Buffer->getBuffer();
715     }
716   }
717 }
718 
719 bool InMemoryFileSystem::addFile(const Twine &P, time_t ModificationTime,
720                                  std::unique_ptr<llvm::MemoryBuffer> Buffer,
721                                  Optional<uint32_t> User,
722                                  Optional<uint32_t> Group,
723                                  Optional<llvm::sys::fs::file_type> Type,
724                                  Optional<llvm::sys::fs::perms> Perms) {
725   return addFile(P, ModificationTime, std::move(Buffer), User, Group, Type,
726                  Perms, /*HardLinkTarget=*/nullptr);
727 }
728 
729 bool InMemoryFileSystem::addFileNoOwn(const Twine &P, time_t ModificationTime,
730                                       llvm::MemoryBuffer *Buffer,
731                                       Optional<uint32_t> User,
732                                       Optional<uint32_t> Group,
733                                       Optional<llvm::sys::fs::file_type> Type,
734                                       Optional<llvm::sys::fs::perms> Perms) {
735   return addFile(P, ModificationTime,
736                  llvm::MemoryBuffer::getMemBuffer(
737                      Buffer->getBuffer(), Buffer->getBufferIdentifier()),
738                  std::move(User), std::move(Group), std::move(Type),
739                  std::move(Perms));
740 }
741 
742 static ErrorOr<const detail::InMemoryNode *>
743 lookupInMemoryNode(const InMemoryFileSystem &FS, detail::InMemoryDirectory *Dir,
744                    const Twine &P) {
745   SmallString<128> Path;
746   P.toVector(Path);
747 
748   // Fix up relative paths. This just prepends the current working directory.
749   std::error_code EC = FS.makeAbsolute(Path);
750   assert(!EC);
751   (void)EC;
752 
753   if (FS.useNormalizedPaths())
754     llvm::sys::path::remove_dots(Path, /*remove_dot_dot=*/true);
755 
756   if (Path.empty())
757     return Dir;
758 
759   auto I = llvm::sys::path::begin(Path), E = llvm::sys::path::end(Path);
760   while (true) {
761     detail::InMemoryNode *Node = Dir->getChild(*I);
762     ++I;
763     if (!Node)
764       return errc::no_such_file_or_directory;
765 
766     // Return the file if it's at the end of the path.
767     if (auto File = dyn_cast<detail::InMemoryFile>(Node)) {
768       if (I == E)
769         return File;
770       return errc::no_such_file_or_directory;
771     }
772 
773     // If Node is HardLink then return the resolved file.
774     if (auto File = dyn_cast<detail::InMemoryHardLink>(Node)) {
775       if (I == E)
776         return &File->getResolvedFile();
777       return errc::no_such_file_or_directory;
778     }
779     // Traverse directories.
780     Dir = cast<detail::InMemoryDirectory>(Node);
781     if (I == E)
782       return Dir;
783   }
784 }
785 
786 bool InMemoryFileSystem::addHardLink(const Twine &FromPath,
787                                      const Twine &ToPath) {
788   auto FromNode = lookupInMemoryNode(*this, Root.get(), FromPath);
789   auto ToNode = lookupInMemoryNode(*this, Root.get(), ToPath);
790   // FromPath must not have been added before. ToPath must have been added
791   // before. Resolved ToPath must be a File.
792   if (!ToNode || FromNode || !isa<detail::InMemoryFile>(*ToNode))
793     return false;
794   return this->addFile(FromPath, 0, nullptr, None, None, None, None,
795                        cast<detail::InMemoryFile>(*ToNode));
796 }
797 
798 llvm::ErrorOr<Status> InMemoryFileSystem::status(const Twine &Path) {
799   auto Node = lookupInMemoryNode(*this, Root.get(), Path);
800   if (Node)
801     return detail::getNodeStatus(*Node, Path.str());
802   return Node.getError();
803 }
804 
805 llvm::ErrorOr<std::unique_ptr<File>>
806 InMemoryFileSystem::openFileForRead(const Twine &Path) {
807   auto Node = lookupInMemoryNode(*this, Root.get(), Path);
808   if (!Node)
809     return Node.getError();
810 
811   // When we have a file provide a heap-allocated wrapper for the memory buffer
812   // to match the ownership semantics for File.
813   if (auto *F = dyn_cast<detail::InMemoryFile>(*Node))
814     return std::unique_ptr<File>(
815         new detail::InMemoryFileAdaptor(*F, Path.str()));
816 
817   // FIXME: errc::not_a_file?
818   return make_error_code(llvm::errc::invalid_argument);
819 }
820 
821 namespace {
822 
823 /// Adaptor from InMemoryDir::iterator to directory_iterator.
824 class InMemoryDirIterator : public llvm::vfs::detail::DirIterImpl {
825   detail::InMemoryDirectory::const_iterator I;
826   detail::InMemoryDirectory::const_iterator E;
827   std::string RequestedDirName;
828 
829   void setCurrentEntry() {
830     if (I != E) {
831       SmallString<256> Path(RequestedDirName);
832       llvm::sys::path::append(Path, I->second->getFileName());
833       sys::fs::file_type Type;
834       switch (I->second->getKind()) {
835       case detail::IME_File:
836       case detail::IME_HardLink:
837         Type = sys::fs::file_type::regular_file;
838         break;
839       case detail::IME_Directory:
840         Type = sys::fs::file_type::directory_file;
841         break;
842       }
843       CurrentEntry = directory_entry(Path.str(), Type);
844     } else {
845       // When we're at the end, make CurrentEntry invalid and DirIterImpl will
846       // do the rest.
847       CurrentEntry = directory_entry();
848     }
849   }
850 
851 public:
852   InMemoryDirIterator() = default;
853 
854   explicit InMemoryDirIterator(const detail::InMemoryDirectory &Dir,
855                                std::string RequestedDirName)
856       : I(Dir.begin()), E(Dir.end()),
857         RequestedDirName(std::move(RequestedDirName)) {
858     setCurrentEntry();
859   }
860 
861   std::error_code increment() override {
862     ++I;
863     setCurrentEntry();
864     return {};
865   }
866 };
867 
868 } // namespace
869 
870 directory_iterator InMemoryFileSystem::dir_begin(const Twine &Dir,
871                                                  std::error_code &EC) {
872   auto Node = lookupInMemoryNode(*this, Root.get(), Dir);
873   if (!Node) {
874     EC = Node.getError();
875     return directory_iterator(std::make_shared<InMemoryDirIterator>());
876   }
877 
878   if (auto *DirNode = dyn_cast<detail::InMemoryDirectory>(*Node))
879     return directory_iterator(
880         std::make_shared<InMemoryDirIterator>(*DirNode, Dir.str()));
881 
882   EC = make_error_code(llvm::errc::not_a_directory);
883   return directory_iterator(std::make_shared<InMemoryDirIterator>());
884 }
885 
886 std::error_code InMemoryFileSystem::setCurrentWorkingDirectory(const Twine &P) {
887   SmallString<128> Path;
888   P.toVector(Path);
889 
890   // Fix up relative paths. This just prepends the current working directory.
891   std::error_code EC = makeAbsolute(Path);
892   assert(!EC);
893   (void)EC;
894 
895   if (useNormalizedPaths())
896     llvm::sys::path::remove_dots(Path, /*remove_dot_dot=*/true);
897 
898   if (!Path.empty())
899     WorkingDirectory = Path.str();
900   return {};
901 }
902 
903 std::error_code
904 InMemoryFileSystem::getRealPath(const Twine &Path,
905                                 SmallVectorImpl<char> &Output) const {
906   auto CWD = getCurrentWorkingDirectory();
907   if (!CWD || CWD->empty())
908     return errc::operation_not_permitted;
909   Path.toVector(Output);
910   if (auto EC = makeAbsolute(Output))
911     return EC;
912   llvm::sys::path::remove_dots(Output, /*remove_dot_dot=*/true);
913   return {};
914 }
915 
916 } // namespace vfs
917 } // namespace llvm
918 
919 //===-----------------------------------------------------------------------===/
920 // RedirectingFileSystem implementation
921 //===-----------------------------------------------------------------------===/
922 
923 namespace {
924 
925 enum EntryKind { EK_Directory, EK_File };
926 
927 /// A single file or directory in the VFS.
928 class Entry {
929   EntryKind Kind;
930   std::string Name;
931 
932 public:
933   Entry(EntryKind K, StringRef Name) : Kind(K), Name(Name) {}
934   virtual ~Entry() = default;
935 
936   StringRef getName() const { return Name; }
937   EntryKind getKind() const { return Kind; }
938 };
939 
940 class RedirectingDirectoryEntry : public Entry {
941   std::vector<std::unique_ptr<Entry>> Contents;
942   Status S;
943 
944 public:
945   RedirectingDirectoryEntry(StringRef Name,
946                             std::vector<std::unique_ptr<Entry>> Contents,
947                             Status S)
948       : Entry(EK_Directory, Name), Contents(std::move(Contents)),
949         S(std::move(S)) {}
950   RedirectingDirectoryEntry(StringRef Name, Status S)
951       : Entry(EK_Directory, Name), S(std::move(S)) {}
952 
953   Status getStatus() { return S; }
954 
955   void addContent(std::unique_ptr<Entry> Content) {
956     Contents.push_back(std::move(Content));
957   }
958 
959   Entry *getLastContent() const { return Contents.back().get(); }
960 
961   using iterator = decltype(Contents)::iterator;
962 
963   iterator contents_begin() { return Contents.begin(); }
964   iterator contents_end() { return Contents.end(); }
965 
966   static bool classof(const Entry *E) { return E->getKind() == EK_Directory; }
967 };
968 
969 class RedirectingFileEntry : public Entry {
970 public:
971   enum NameKind { NK_NotSet, NK_External, NK_Virtual };
972 
973 private:
974   std::string ExternalContentsPath;
975   NameKind UseName;
976 
977 public:
978   RedirectingFileEntry(StringRef Name, StringRef ExternalContentsPath,
979                        NameKind UseName)
980       : Entry(EK_File, Name), ExternalContentsPath(ExternalContentsPath),
981         UseName(UseName) {}
982 
983   StringRef getExternalContentsPath() const { return ExternalContentsPath; }
984 
985   /// whether to use the external path as the name for this file.
986   bool useExternalName(bool GlobalUseExternalName) const {
987     return UseName == NK_NotSet ? GlobalUseExternalName
988                                 : (UseName == NK_External);
989   }
990 
991   NameKind getUseName() const { return UseName; }
992 
993   static bool classof(const Entry *E) { return E->getKind() == EK_File; }
994 };
995 
996 class VFSFromYamlDirIterImpl : public llvm::vfs::detail::DirIterImpl {
997   std::string Dir;
998   RedirectingDirectoryEntry::iterator Current, End;
999 
1000   std::error_code incrementImpl();
1001 
1002 public:
1003   VFSFromYamlDirIterImpl(const Twine &Path,
1004                          RedirectingDirectoryEntry::iterator Begin,
1005                          RedirectingDirectoryEntry::iterator End,
1006                          std::error_code &EC);
1007 
1008   std::error_code increment() override;
1009 };
1010 
1011 /// A virtual file system parsed from a YAML file.
1012 ///
1013 /// Currently, this class allows creating virtual directories and mapping
1014 /// virtual file paths to existing external files, available in \c ExternalFS.
1015 ///
1016 /// The basic structure of the parsed file is:
1017 /// \verbatim
1018 /// {
1019 ///   'version': <version number>,
1020 ///   <optional configuration>
1021 ///   'roots': [
1022 ///              <directory entries>
1023 ///            ]
1024 /// }
1025 /// \endverbatim
1026 ///
1027 /// All configuration options are optional.
1028 ///   'case-sensitive': <boolean, default=true>
1029 ///   'use-external-names': <boolean, default=true>
1030 ///   'overlay-relative': <boolean, default=false>
1031 ///   'ignore-non-existent-contents': <boolean, default=true>
1032 ///
1033 /// Virtual directories are represented as
1034 /// \verbatim
1035 /// {
1036 ///   'type': 'directory',
1037 ///   'name': <string>,
1038 ///   'contents': [ <file or directory entries> ]
1039 /// }
1040 /// \endverbatim
1041 ///
1042 /// The default attributes for virtual directories are:
1043 /// \verbatim
1044 /// MTime = now() when created
1045 /// Perms = 0777
1046 /// User = Group = 0
1047 /// Size = 0
1048 /// UniqueID = unspecified unique value
1049 /// \endverbatim
1050 ///
1051 /// Re-mapped files are represented as
1052 /// \verbatim
1053 /// {
1054 ///   'type': 'file',
1055 ///   'name': <string>,
1056 ///   'use-external-name': <boolean> # Optional
1057 ///   'external-contents': <path to external file>
1058 /// }
1059 /// \endverbatim
1060 ///
1061 /// and inherit their attributes from the external contents.
1062 ///
1063 /// In both cases, the 'name' field may contain multiple path components (e.g.
1064 /// /path/to/file). However, any directory that contains more than one child
1065 /// must be uniquely represented by a directory entry.
1066 class RedirectingFileSystem : public vfs::FileSystem {
1067   friend class RedirectingFileSystemParser;
1068 
1069   /// The root(s) of the virtual file system.
1070   std::vector<std::unique_ptr<Entry>> Roots;
1071 
1072   /// The file system to use for external references.
1073   IntrusiveRefCntPtr<FileSystem> ExternalFS;
1074 
1075   /// If IsRelativeOverlay is set, this represents the directory
1076   /// path that should be prefixed to each 'external-contents' entry
1077   /// when reading from YAML files.
1078   std::string ExternalContentsPrefixDir;
1079 
1080   /// @name Configuration
1081   /// @{
1082 
1083   /// Whether to perform case-sensitive comparisons.
1084   ///
1085   /// Currently, case-insensitive matching only works correctly with ASCII.
1086   bool CaseSensitive = true;
1087 
1088   /// IsRelativeOverlay marks whether a ExternalContentsPrefixDir path must
1089   /// be prefixed in every 'external-contents' when reading from YAML files.
1090   bool IsRelativeOverlay = false;
1091 
1092   /// Whether to use to use the value of 'external-contents' for the
1093   /// names of files.  This global value is overridable on a per-file basis.
1094   bool UseExternalNames = true;
1095 
1096   /// Whether an invalid path obtained via 'external-contents' should
1097   /// cause iteration on the VFS to stop. If 'true', the VFS should ignore
1098   /// the entry and continue with the next. Allows YAML files to be shared
1099   /// across multiple compiler invocations regardless of prior existent
1100   /// paths in 'external-contents'. This global value is overridable on a
1101   /// per-file basis.
1102   bool IgnoreNonExistentContents = true;
1103   /// @}
1104 
1105   /// Virtual file paths and external files could be canonicalized without "..",
1106   /// "." and "./" in their paths. FIXME: some unittests currently fail on
1107   /// win32 when using remove_dots and remove_leading_dotslash on paths.
1108   bool UseCanonicalizedPaths =
1109 #ifdef _WIN32
1110       false;
1111 #else
1112       true;
1113 #endif
1114 
1115 private:
1116   RedirectingFileSystem(IntrusiveRefCntPtr<FileSystem> ExternalFS)
1117       : ExternalFS(std::move(ExternalFS)) {}
1118 
1119   /// Looks up the path <tt>[Start, End)</tt> in \p From, possibly
1120   /// recursing into the contents of \p From if it is a directory.
1121   ErrorOr<Entry *> lookupPath(sys::path::const_iterator Start,
1122                               sys::path::const_iterator End, Entry *From);
1123 
1124   /// Get the status of a given an \c Entry.
1125   ErrorOr<Status> status(const Twine &Path, Entry *E);
1126 
1127 public:
1128   /// Looks up \p Path in \c Roots.
1129   ErrorOr<Entry *> lookupPath(const Twine &Path);
1130 
1131   /// Parses \p Buffer, which is expected to be in YAML format and
1132   /// returns a virtual file system representing its contents.
1133   static RedirectingFileSystem *
1134   create(std::unique_ptr<MemoryBuffer> Buffer,
1135          SourceMgr::DiagHandlerTy DiagHandler, StringRef YAMLFilePath,
1136          void *DiagContext, IntrusiveRefCntPtr<FileSystem> ExternalFS);
1137 
1138   ErrorOr<Status> status(const Twine &Path) override;
1139   ErrorOr<std::unique_ptr<File>> openFileForRead(const Twine &Path) override;
1140 
1141   llvm::ErrorOr<std::string> getCurrentWorkingDirectory() const override {
1142     return ExternalFS->getCurrentWorkingDirectory();
1143   }
1144 
1145   std::error_code setCurrentWorkingDirectory(const Twine &Path) override {
1146     return ExternalFS->setCurrentWorkingDirectory(Path);
1147   }
1148 
1149   directory_iterator dir_begin(const Twine &Dir, std::error_code &EC) override {
1150     ErrorOr<Entry *> E = lookupPath(Dir);
1151     if (!E) {
1152       EC = E.getError();
1153       return {};
1154     }
1155     ErrorOr<Status> S = status(Dir, *E);
1156     if (!S) {
1157       EC = S.getError();
1158       return {};
1159     }
1160     if (!S->isDirectory()) {
1161       EC = std::error_code(static_cast<int>(errc::not_a_directory),
1162                            std::system_category());
1163       return {};
1164     }
1165 
1166     auto *D = cast<RedirectingDirectoryEntry>(*E);
1167     return directory_iterator(std::make_shared<VFSFromYamlDirIterImpl>(
1168         Dir, D->contents_begin(), D->contents_end(), EC));
1169   }
1170 
1171   void setExternalContentsPrefixDir(StringRef PrefixDir) {
1172     ExternalContentsPrefixDir = PrefixDir.str();
1173   }
1174 
1175   StringRef getExternalContentsPrefixDir() const {
1176     return ExternalContentsPrefixDir;
1177   }
1178 
1179   bool ignoreNonExistentContents() const { return IgnoreNonExistentContents; }
1180 
1181 #if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
1182   LLVM_DUMP_METHOD void dump() const {
1183     for (const auto &Root : Roots)
1184       dumpEntry(Root.get());
1185   }
1186 
1187   LLVM_DUMP_METHOD void dumpEntry(Entry *E, int NumSpaces = 0) const {
1188     StringRef Name = E->getName();
1189     for (int i = 0, e = NumSpaces; i < e; ++i)
1190       dbgs() << " ";
1191     dbgs() << "'" << Name.str().c_str() << "'"
1192            << "\n";
1193 
1194     if (E->getKind() == EK_Directory) {
1195       auto *DE = dyn_cast<RedirectingDirectoryEntry>(E);
1196       assert(DE && "Should be a directory");
1197 
1198       for (std::unique_ptr<Entry> &SubEntry :
1199            llvm::make_range(DE->contents_begin(), DE->contents_end()))
1200         dumpEntry(SubEntry.get(), NumSpaces + 2);
1201     }
1202   }
1203 #endif
1204 };
1205 
1206 /// A helper class to hold the common YAML parsing state.
1207 class RedirectingFileSystemParser {
1208   yaml::Stream &Stream;
1209 
1210   void error(yaml::Node *N, const Twine &Msg) { Stream.printError(N, Msg); }
1211 
1212   // false on error
1213   bool parseScalarString(yaml::Node *N, StringRef &Result,
1214                          SmallVectorImpl<char> &Storage) {
1215     const auto *S = dyn_cast<yaml::ScalarNode>(N);
1216 
1217     if (!S) {
1218       error(N, "expected string");
1219       return false;
1220     }
1221     Result = S->getValue(Storage);
1222     return true;
1223   }
1224 
1225   // false on error
1226   bool parseScalarBool(yaml::Node *N, bool &Result) {
1227     SmallString<5> Storage;
1228     StringRef Value;
1229     if (!parseScalarString(N, Value, Storage))
1230       return false;
1231 
1232     if (Value.equals_lower("true") || Value.equals_lower("on") ||
1233         Value.equals_lower("yes") || Value == "1") {
1234       Result = true;
1235       return true;
1236     } else if (Value.equals_lower("false") || Value.equals_lower("off") ||
1237                Value.equals_lower("no") || Value == "0") {
1238       Result = false;
1239       return true;
1240     }
1241 
1242     error(N, "expected boolean value");
1243     return false;
1244   }
1245 
1246   struct KeyStatus {
1247     bool Required;
1248     bool Seen = false;
1249 
1250     KeyStatus(bool Required = false) : Required(Required) {}
1251   };
1252 
1253   using KeyStatusPair = std::pair<StringRef, KeyStatus>;
1254 
1255   // false on error
1256   bool checkDuplicateOrUnknownKey(yaml::Node *KeyNode, StringRef Key,
1257                                   DenseMap<StringRef, KeyStatus> &Keys) {
1258     if (!Keys.count(Key)) {
1259       error(KeyNode, "unknown key");
1260       return false;
1261     }
1262     KeyStatus &S = Keys[Key];
1263     if (S.Seen) {
1264       error(KeyNode, Twine("duplicate key '") + Key + "'");
1265       return false;
1266     }
1267     S.Seen = true;
1268     return true;
1269   }
1270 
1271   // false on error
1272   bool checkMissingKeys(yaml::Node *Obj, DenseMap<StringRef, KeyStatus> &Keys) {
1273     for (const auto &I : Keys) {
1274       if (I.second.Required && !I.second.Seen) {
1275         error(Obj, Twine("missing key '") + I.first + "'");
1276         return false;
1277       }
1278     }
1279     return true;
1280   }
1281 
1282   Entry *lookupOrCreateEntry(RedirectingFileSystem *FS, StringRef Name,
1283                              Entry *ParentEntry = nullptr) {
1284     if (!ParentEntry) { // Look for a existent root
1285       for (const auto &Root : FS->Roots) {
1286         if (Name.equals(Root->getName())) {
1287           ParentEntry = Root.get();
1288           return ParentEntry;
1289         }
1290       }
1291     } else { // Advance to the next component
1292       auto *DE = dyn_cast<RedirectingDirectoryEntry>(ParentEntry);
1293       for (std::unique_ptr<Entry> &Content :
1294            llvm::make_range(DE->contents_begin(), DE->contents_end())) {
1295         auto *DirContent = dyn_cast<RedirectingDirectoryEntry>(Content.get());
1296         if (DirContent && Name.equals(Content->getName()))
1297           return DirContent;
1298       }
1299     }
1300 
1301     // ... or create a new one
1302     std::unique_ptr<Entry> E = llvm::make_unique<RedirectingDirectoryEntry>(
1303         Name,
1304         Status("", getNextVirtualUniqueID(), std::chrono::system_clock::now(),
1305                0, 0, 0, file_type::directory_file, sys::fs::all_all));
1306 
1307     if (!ParentEntry) { // Add a new root to the overlay
1308       FS->Roots.push_back(std::move(E));
1309       ParentEntry = FS->Roots.back().get();
1310       return ParentEntry;
1311     }
1312 
1313     auto *DE = dyn_cast<RedirectingDirectoryEntry>(ParentEntry);
1314     DE->addContent(std::move(E));
1315     return DE->getLastContent();
1316   }
1317 
1318   void uniqueOverlayTree(RedirectingFileSystem *FS, Entry *SrcE,
1319                          Entry *NewParentE = nullptr) {
1320     StringRef Name = SrcE->getName();
1321     switch (SrcE->getKind()) {
1322     case EK_Directory: {
1323       auto *DE = dyn_cast<RedirectingDirectoryEntry>(SrcE);
1324       assert(DE && "Must be a directory");
1325       // Empty directories could be present in the YAML as a way to
1326       // describe a file for a current directory after some of its subdir
1327       // is parsed. This only leads to redundant walks, ignore it.
1328       if (!Name.empty())
1329         NewParentE = lookupOrCreateEntry(FS, Name, NewParentE);
1330       for (std::unique_ptr<Entry> &SubEntry :
1331            llvm::make_range(DE->contents_begin(), DE->contents_end()))
1332         uniqueOverlayTree(FS, SubEntry.get(), NewParentE);
1333       break;
1334     }
1335     case EK_File: {
1336       auto *FE = dyn_cast<RedirectingFileEntry>(SrcE);
1337       assert(FE && "Must be a file");
1338       assert(NewParentE && "Parent entry must exist");
1339       auto *DE = dyn_cast<RedirectingDirectoryEntry>(NewParentE);
1340       DE->addContent(llvm::make_unique<RedirectingFileEntry>(
1341           Name, FE->getExternalContentsPath(), FE->getUseName()));
1342       break;
1343     }
1344     }
1345   }
1346 
1347   std::unique_ptr<Entry> parseEntry(yaml::Node *N, RedirectingFileSystem *FS,
1348                                     bool IsRootEntry) {
1349     auto *M = dyn_cast<yaml::MappingNode>(N);
1350     if (!M) {
1351       error(N, "expected mapping node for file or directory entry");
1352       return nullptr;
1353     }
1354 
1355     KeyStatusPair Fields[] = {
1356         KeyStatusPair("name", true),
1357         KeyStatusPair("type", true),
1358         KeyStatusPair("contents", false),
1359         KeyStatusPair("external-contents", false),
1360         KeyStatusPair("use-external-name", false),
1361     };
1362 
1363     DenseMap<StringRef, KeyStatus> Keys(std::begin(Fields), std::end(Fields));
1364 
1365     bool HasContents = false; // external or otherwise
1366     std::vector<std::unique_ptr<Entry>> EntryArrayContents;
1367     std::string ExternalContentsPath;
1368     std::string Name;
1369     yaml::Node *NameValueNode;
1370     auto UseExternalName = RedirectingFileEntry::NK_NotSet;
1371     EntryKind Kind;
1372 
1373     for (auto &I : *M) {
1374       StringRef Key;
1375       // Reuse the buffer for key and value, since we don't look at key after
1376       // parsing value.
1377       SmallString<256> Buffer;
1378       if (!parseScalarString(I.getKey(), Key, Buffer))
1379         return nullptr;
1380 
1381       if (!checkDuplicateOrUnknownKey(I.getKey(), Key, Keys))
1382         return nullptr;
1383 
1384       StringRef Value;
1385       if (Key == "name") {
1386         if (!parseScalarString(I.getValue(), Value, Buffer))
1387           return nullptr;
1388 
1389         NameValueNode = I.getValue();
1390         if (FS->UseCanonicalizedPaths) {
1391           SmallString<256> Path(Value);
1392           // Guarantee that old YAML files containing paths with ".." and "."
1393           // are properly canonicalized before read into the VFS.
1394           Path = sys::path::remove_leading_dotslash(Path);
1395           sys::path::remove_dots(Path, /*remove_dot_dot=*/true);
1396           Name = Path.str();
1397         } else {
1398           Name = Value;
1399         }
1400       } else if (Key == "type") {
1401         if (!parseScalarString(I.getValue(), Value, Buffer))
1402           return nullptr;
1403         if (Value == "file")
1404           Kind = EK_File;
1405         else if (Value == "directory")
1406           Kind = EK_Directory;
1407         else {
1408           error(I.getValue(), "unknown value for 'type'");
1409           return nullptr;
1410         }
1411       } else if (Key == "contents") {
1412         if (HasContents) {
1413           error(I.getKey(),
1414                 "entry already has 'contents' or 'external-contents'");
1415           return nullptr;
1416         }
1417         HasContents = true;
1418         auto *Contents = dyn_cast<yaml::SequenceNode>(I.getValue());
1419         if (!Contents) {
1420           // FIXME: this is only for directories, what about files?
1421           error(I.getValue(), "expected array");
1422           return nullptr;
1423         }
1424 
1425         for (auto &I : *Contents) {
1426           if (std::unique_ptr<Entry> E =
1427                   parseEntry(&I, FS, /*IsRootEntry*/ false))
1428             EntryArrayContents.push_back(std::move(E));
1429           else
1430             return nullptr;
1431         }
1432       } else if (Key == "external-contents") {
1433         if (HasContents) {
1434           error(I.getKey(),
1435                 "entry already has 'contents' or 'external-contents'");
1436           return nullptr;
1437         }
1438         HasContents = true;
1439         if (!parseScalarString(I.getValue(), Value, Buffer))
1440           return nullptr;
1441 
1442         SmallString<256> FullPath;
1443         if (FS->IsRelativeOverlay) {
1444           FullPath = FS->getExternalContentsPrefixDir();
1445           assert(!FullPath.empty() &&
1446                  "External contents prefix directory must exist");
1447           llvm::sys::path::append(FullPath, Value);
1448         } else {
1449           FullPath = Value;
1450         }
1451 
1452         if (FS->UseCanonicalizedPaths) {
1453           // Guarantee that old YAML files containing paths with ".." and "."
1454           // are properly canonicalized before read into the VFS.
1455           FullPath = sys::path::remove_leading_dotslash(FullPath);
1456           sys::path::remove_dots(FullPath, /*remove_dot_dot=*/true);
1457         }
1458         ExternalContentsPath = FullPath.str();
1459       } else if (Key == "use-external-name") {
1460         bool Val;
1461         if (!parseScalarBool(I.getValue(), Val))
1462           return nullptr;
1463         UseExternalName = Val ? RedirectingFileEntry::NK_External
1464                               : RedirectingFileEntry::NK_Virtual;
1465       } else {
1466         llvm_unreachable("key missing from Keys");
1467       }
1468     }
1469 
1470     if (Stream.failed())
1471       return nullptr;
1472 
1473     // check for missing keys
1474     if (!HasContents) {
1475       error(N, "missing key 'contents' or 'external-contents'");
1476       return nullptr;
1477     }
1478     if (!checkMissingKeys(N, Keys))
1479       return nullptr;
1480 
1481     // check invalid configuration
1482     if (Kind == EK_Directory &&
1483         UseExternalName != RedirectingFileEntry::NK_NotSet) {
1484       error(N, "'use-external-name' is not supported for directories");
1485       return nullptr;
1486     }
1487 
1488     if (IsRootEntry && !sys::path::is_absolute(Name)) {
1489       assert(NameValueNode && "Name presence should be checked earlier");
1490       error(NameValueNode,
1491             "entry with relative path at the root level is not discoverable");
1492       return nullptr;
1493     }
1494 
1495     // Remove trailing slash(es), being careful not to remove the root path
1496     StringRef Trimmed(Name);
1497     size_t RootPathLen = sys::path::root_path(Trimmed).size();
1498     while (Trimmed.size() > RootPathLen &&
1499            sys::path::is_separator(Trimmed.back()))
1500       Trimmed = Trimmed.slice(0, Trimmed.size() - 1);
1501     // Get the last component
1502     StringRef LastComponent = sys::path::filename(Trimmed);
1503 
1504     std::unique_ptr<Entry> Result;
1505     switch (Kind) {
1506     case EK_File:
1507       Result = llvm::make_unique<RedirectingFileEntry>(
1508           LastComponent, std::move(ExternalContentsPath), UseExternalName);
1509       break;
1510     case EK_Directory:
1511       Result = llvm::make_unique<RedirectingDirectoryEntry>(
1512           LastComponent, std::move(EntryArrayContents),
1513           Status("", getNextVirtualUniqueID(), std::chrono::system_clock::now(),
1514                  0, 0, 0, file_type::directory_file, sys::fs::all_all));
1515       break;
1516     }
1517 
1518     StringRef Parent = sys::path::parent_path(Trimmed);
1519     if (Parent.empty())
1520       return Result;
1521 
1522     // if 'name' contains multiple components, create implicit directory entries
1523     for (sys::path::reverse_iterator I = sys::path::rbegin(Parent),
1524                                      E = sys::path::rend(Parent);
1525          I != E; ++I) {
1526       std::vector<std::unique_ptr<Entry>> Entries;
1527       Entries.push_back(std::move(Result));
1528       Result = llvm::make_unique<RedirectingDirectoryEntry>(
1529           *I, std::move(Entries),
1530           Status("", getNextVirtualUniqueID(), std::chrono::system_clock::now(),
1531                  0, 0, 0, file_type::directory_file, sys::fs::all_all));
1532     }
1533     return Result;
1534   }
1535 
1536 public:
1537   RedirectingFileSystemParser(yaml::Stream &S) : Stream(S) {}
1538 
1539   // false on error
1540   bool parse(yaml::Node *Root, RedirectingFileSystem *FS) {
1541     auto *Top = dyn_cast<yaml::MappingNode>(Root);
1542     if (!Top) {
1543       error(Root, "expected mapping node");
1544       return false;
1545     }
1546 
1547     KeyStatusPair Fields[] = {
1548         KeyStatusPair("version", true),
1549         KeyStatusPair("case-sensitive", false),
1550         KeyStatusPair("use-external-names", false),
1551         KeyStatusPair("overlay-relative", false),
1552         KeyStatusPair("ignore-non-existent-contents", false),
1553         KeyStatusPair("roots", true),
1554     };
1555 
1556     DenseMap<StringRef, KeyStatus> Keys(std::begin(Fields), std::end(Fields));
1557     std::vector<std::unique_ptr<Entry>> RootEntries;
1558 
1559     // Parse configuration and 'roots'
1560     for (auto &I : *Top) {
1561       SmallString<10> KeyBuffer;
1562       StringRef Key;
1563       if (!parseScalarString(I.getKey(), Key, KeyBuffer))
1564         return false;
1565 
1566       if (!checkDuplicateOrUnknownKey(I.getKey(), Key, Keys))
1567         return false;
1568 
1569       if (Key == "roots") {
1570         auto *Roots = dyn_cast<yaml::SequenceNode>(I.getValue());
1571         if (!Roots) {
1572           error(I.getValue(), "expected array");
1573           return false;
1574         }
1575 
1576         for (auto &I : *Roots) {
1577           if (std::unique_ptr<Entry> E =
1578                   parseEntry(&I, FS, /*IsRootEntry*/ true))
1579             RootEntries.push_back(std::move(E));
1580           else
1581             return false;
1582         }
1583       } else if (Key == "version") {
1584         StringRef VersionString;
1585         SmallString<4> Storage;
1586         if (!parseScalarString(I.getValue(), VersionString, Storage))
1587           return false;
1588         int Version;
1589         if (VersionString.getAsInteger<int>(10, Version)) {
1590           error(I.getValue(), "expected integer");
1591           return false;
1592         }
1593         if (Version < 0) {
1594           error(I.getValue(), "invalid version number");
1595           return false;
1596         }
1597         if (Version != 0) {
1598           error(I.getValue(), "version mismatch, expected 0");
1599           return false;
1600         }
1601       } else if (Key == "case-sensitive") {
1602         if (!parseScalarBool(I.getValue(), FS->CaseSensitive))
1603           return false;
1604       } else if (Key == "overlay-relative") {
1605         if (!parseScalarBool(I.getValue(), FS->IsRelativeOverlay))
1606           return false;
1607       } else if (Key == "use-external-names") {
1608         if (!parseScalarBool(I.getValue(), FS->UseExternalNames))
1609           return false;
1610       } else if (Key == "ignore-non-existent-contents") {
1611         if (!parseScalarBool(I.getValue(), FS->IgnoreNonExistentContents))
1612           return false;
1613       } else {
1614         llvm_unreachable("key missing from Keys");
1615       }
1616     }
1617 
1618     if (Stream.failed())
1619       return false;
1620 
1621     if (!checkMissingKeys(Top, Keys))
1622       return false;
1623 
1624     // Now that we sucessefully parsed the YAML file, canonicalize the internal
1625     // representation to a proper directory tree so that we can search faster
1626     // inside the VFS.
1627     for (auto &E : RootEntries)
1628       uniqueOverlayTree(FS, E.get());
1629 
1630     return true;
1631   }
1632 };
1633 
1634 } // namespace
1635 
1636 RedirectingFileSystem *
1637 RedirectingFileSystem::create(std::unique_ptr<MemoryBuffer> Buffer,
1638                               SourceMgr::DiagHandlerTy DiagHandler,
1639                               StringRef YAMLFilePath, void *DiagContext,
1640                               IntrusiveRefCntPtr<FileSystem> ExternalFS) {
1641   SourceMgr SM;
1642   yaml::Stream Stream(Buffer->getMemBufferRef(), SM);
1643 
1644   SM.setDiagHandler(DiagHandler, DiagContext);
1645   yaml::document_iterator DI = Stream.begin();
1646   yaml::Node *Root = DI->getRoot();
1647   if (DI == Stream.end() || !Root) {
1648     SM.PrintMessage(SMLoc(), SourceMgr::DK_Error, "expected root node");
1649     return nullptr;
1650   }
1651 
1652   RedirectingFileSystemParser P(Stream);
1653 
1654   std::unique_ptr<RedirectingFileSystem> FS(
1655       new RedirectingFileSystem(std::move(ExternalFS)));
1656 
1657   if (!YAMLFilePath.empty()) {
1658     // Use the YAML path from -ivfsoverlay to compute the dir to be prefixed
1659     // to each 'external-contents' path.
1660     //
1661     // Example:
1662     //    -ivfsoverlay dummy.cache/vfs/vfs.yaml
1663     // yields:
1664     //  FS->ExternalContentsPrefixDir => /<absolute_path_to>/dummy.cache/vfs
1665     //
1666     SmallString<256> OverlayAbsDir = sys::path::parent_path(YAMLFilePath);
1667     std::error_code EC = llvm::sys::fs::make_absolute(OverlayAbsDir);
1668     assert(!EC && "Overlay dir final path must be absolute");
1669     (void)EC;
1670     FS->setExternalContentsPrefixDir(OverlayAbsDir);
1671   }
1672 
1673   if (!P.parse(Root, FS.get()))
1674     return nullptr;
1675 
1676   return FS.release();
1677 }
1678 
1679 ErrorOr<Entry *> RedirectingFileSystem::lookupPath(const Twine &Path_) {
1680   SmallString<256> Path;
1681   Path_.toVector(Path);
1682 
1683   // Handle relative paths
1684   if (std::error_code EC = makeAbsolute(Path))
1685     return EC;
1686 
1687   // Canonicalize path by removing ".", "..", "./", etc components. This is
1688   // a VFS request, do bot bother about symlinks in the path components
1689   // but canonicalize in order to perform the correct entry search.
1690   if (UseCanonicalizedPaths) {
1691     Path = sys::path::remove_leading_dotslash(Path);
1692     sys::path::remove_dots(Path, /*remove_dot_dot=*/true);
1693   }
1694 
1695   if (Path.empty())
1696     return make_error_code(llvm::errc::invalid_argument);
1697 
1698   sys::path::const_iterator Start = sys::path::begin(Path);
1699   sys::path::const_iterator End = sys::path::end(Path);
1700   for (const auto &Root : Roots) {
1701     ErrorOr<Entry *> Result = lookupPath(Start, End, Root.get());
1702     if (Result || Result.getError() != llvm::errc::no_such_file_or_directory)
1703       return Result;
1704   }
1705   return make_error_code(llvm::errc::no_such_file_or_directory);
1706 }
1707 
1708 ErrorOr<Entry *>
1709 RedirectingFileSystem::lookupPath(sys::path::const_iterator Start,
1710                                   sys::path::const_iterator End, Entry *From) {
1711 #ifndef _WIN32
1712   assert(!isTraversalComponent(*Start) &&
1713          !isTraversalComponent(From->getName()) &&
1714          "Paths should not contain traversal components");
1715 #else
1716   // FIXME: this is here to support windows, remove it once canonicalized
1717   // paths become globally default.
1718   if (Start->equals("."))
1719     ++Start;
1720 #endif
1721 
1722   StringRef FromName = From->getName();
1723 
1724   // Forward the search to the next component in case this is an empty one.
1725   if (!FromName.empty()) {
1726     if (CaseSensitive ? !Start->equals(FromName)
1727                       : !Start->equals_lower(FromName))
1728       // failure to match
1729       return make_error_code(llvm::errc::no_such_file_or_directory);
1730 
1731     ++Start;
1732 
1733     if (Start == End) {
1734       // Match!
1735       return From;
1736     }
1737   }
1738 
1739   auto *DE = dyn_cast<RedirectingDirectoryEntry>(From);
1740   if (!DE)
1741     return make_error_code(llvm::errc::not_a_directory);
1742 
1743   for (const std::unique_ptr<Entry> &DirEntry :
1744        llvm::make_range(DE->contents_begin(), DE->contents_end())) {
1745     ErrorOr<Entry *> Result = lookupPath(Start, End, DirEntry.get());
1746     if (Result || Result.getError() != llvm::errc::no_such_file_or_directory)
1747       return Result;
1748   }
1749   return make_error_code(llvm::errc::no_such_file_or_directory);
1750 }
1751 
1752 static Status getRedirectedFileStatus(const Twine &Path, bool UseExternalNames,
1753                                       Status ExternalStatus) {
1754   Status S = ExternalStatus;
1755   if (!UseExternalNames)
1756     S = Status::copyWithNewName(S, Path.str());
1757   S.IsVFSMapped = true;
1758   return S;
1759 }
1760 
1761 ErrorOr<Status> RedirectingFileSystem::status(const Twine &Path, Entry *E) {
1762   assert(E != nullptr);
1763   if (auto *F = dyn_cast<RedirectingFileEntry>(E)) {
1764     ErrorOr<Status> S = ExternalFS->status(F->getExternalContentsPath());
1765     assert(!S || S->getName() == F->getExternalContentsPath());
1766     if (S)
1767       return getRedirectedFileStatus(Path, F->useExternalName(UseExternalNames),
1768                                      *S);
1769     return S;
1770   } else { // directory
1771     auto *DE = cast<RedirectingDirectoryEntry>(E);
1772     return Status::copyWithNewName(DE->getStatus(), Path.str());
1773   }
1774 }
1775 
1776 ErrorOr<Status> RedirectingFileSystem::status(const Twine &Path) {
1777   ErrorOr<Entry *> Result = lookupPath(Path);
1778   if (!Result)
1779     return Result.getError();
1780   return status(Path, *Result);
1781 }
1782 
1783 namespace {
1784 
1785 /// Provide a file wrapper with an overriden status.
1786 class FileWithFixedStatus : public File {
1787   std::unique_ptr<File> InnerFile;
1788   Status S;
1789 
1790 public:
1791   FileWithFixedStatus(std::unique_ptr<File> InnerFile, Status S)
1792       : InnerFile(std::move(InnerFile)), S(std::move(S)) {}
1793 
1794   ErrorOr<Status> status() override { return S; }
1795   ErrorOr<std::unique_ptr<llvm::MemoryBuffer>>
1796 
1797   getBuffer(const Twine &Name, int64_t FileSize, bool RequiresNullTerminator,
1798             bool IsVolatile) override {
1799     return InnerFile->getBuffer(Name, FileSize, RequiresNullTerminator,
1800                                 IsVolatile);
1801   }
1802 
1803   std::error_code close() override { return InnerFile->close(); }
1804 };
1805 
1806 } // namespace
1807 
1808 ErrorOr<std::unique_ptr<File>>
1809 RedirectingFileSystem::openFileForRead(const Twine &Path) {
1810   ErrorOr<Entry *> E = lookupPath(Path);
1811   if (!E)
1812     return E.getError();
1813 
1814   auto *F = dyn_cast<RedirectingFileEntry>(*E);
1815   if (!F) // FIXME: errc::not_a_file?
1816     return make_error_code(llvm::errc::invalid_argument);
1817 
1818   auto Result = ExternalFS->openFileForRead(F->getExternalContentsPath());
1819   if (!Result)
1820     return Result;
1821 
1822   auto ExternalStatus = (*Result)->status();
1823   if (!ExternalStatus)
1824     return ExternalStatus.getError();
1825 
1826   // FIXME: Update the status with the name and VFSMapped.
1827   Status S = getRedirectedFileStatus(Path, F->useExternalName(UseExternalNames),
1828                                      *ExternalStatus);
1829   return std::unique_ptr<File>(
1830       llvm::make_unique<FileWithFixedStatus>(std::move(*Result), S));
1831 }
1832 
1833 IntrusiveRefCntPtr<FileSystem>
1834 vfs::getVFSFromYAML(std::unique_ptr<MemoryBuffer> Buffer,
1835                     SourceMgr::DiagHandlerTy DiagHandler,
1836                     StringRef YAMLFilePath, void *DiagContext,
1837                     IntrusiveRefCntPtr<FileSystem> ExternalFS) {
1838   return RedirectingFileSystem::create(std::move(Buffer), DiagHandler,
1839                                        YAMLFilePath, DiagContext,
1840                                        std::move(ExternalFS));
1841 }
1842 
1843 static void getVFSEntries(Entry *SrcE, SmallVectorImpl<StringRef> &Path,
1844                           SmallVectorImpl<YAMLVFSEntry> &Entries) {
1845   auto Kind = SrcE->getKind();
1846   if (Kind == EK_Directory) {
1847     auto *DE = dyn_cast<RedirectingDirectoryEntry>(SrcE);
1848     assert(DE && "Must be a directory");
1849     for (std::unique_ptr<Entry> &SubEntry :
1850          llvm::make_range(DE->contents_begin(), DE->contents_end())) {
1851       Path.push_back(SubEntry->getName());
1852       getVFSEntries(SubEntry.get(), Path, Entries);
1853       Path.pop_back();
1854     }
1855     return;
1856   }
1857 
1858   assert(Kind == EK_File && "Must be a EK_File");
1859   auto *FE = dyn_cast<RedirectingFileEntry>(SrcE);
1860   assert(FE && "Must be a file");
1861   SmallString<128> VPath;
1862   for (auto &Comp : Path)
1863     llvm::sys::path::append(VPath, Comp);
1864   Entries.push_back(YAMLVFSEntry(VPath.c_str(), FE->getExternalContentsPath()));
1865 }
1866 
1867 void vfs::collectVFSFromYAML(std::unique_ptr<MemoryBuffer> Buffer,
1868                              SourceMgr::DiagHandlerTy DiagHandler,
1869                              StringRef YAMLFilePath,
1870                              SmallVectorImpl<YAMLVFSEntry> &CollectedEntries,
1871                              void *DiagContext,
1872                              IntrusiveRefCntPtr<FileSystem> ExternalFS) {
1873   RedirectingFileSystem *VFS = RedirectingFileSystem::create(
1874       std::move(Buffer), DiagHandler, YAMLFilePath, DiagContext,
1875       std::move(ExternalFS));
1876   ErrorOr<Entry *> RootE = VFS->lookupPath("/");
1877   if (!RootE)
1878     return;
1879   SmallVector<StringRef, 8> Components;
1880   Components.push_back("/");
1881   getVFSEntries(*RootE, Components, CollectedEntries);
1882 }
1883 
1884 UniqueID vfs::getNextVirtualUniqueID() {
1885   static std::atomic<unsigned> UID;
1886   unsigned ID = ++UID;
1887   // The following assumes that uint64_t max will never collide with a real
1888   // dev_t value from the OS.
1889   return UniqueID(std::numeric_limits<uint64_t>::max(), ID);
1890 }
1891 
1892 void YAMLVFSWriter::addFileMapping(StringRef VirtualPath, StringRef RealPath) {
1893   assert(sys::path::is_absolute(VirtualPath) && "virtual path not absolute");
1894   assert(sys::path::is_absolute(RealPath) && "real path not absolute");
1895   assert(!pathHasTraversal(VirtualPath) && "path traversal is not supported");
1896   Mappings.emplace_back(VirtualPath, RealPath);
1897 }
1898 
1899 namespace {
1900 
1901 class JSONWriter {
1902   llvm::raw_ostream &OS;
1903   SmallVector<StringRef, 16> DirStack;
1904 
1905   unsigned getDirIndent() { return 4 * DirStack.size(); }
1906   unsigned getFileIndent() { return 4 * (DirStack.size() + 1); }
1907   bool containedIn(StringRef Parent, StringRef Path);
1908   StringRef containedPart(StringRef Parent, StringRef Path);
1909   void startDirectory(StringRef Path);
1910   void endDirectory();
1911   void writeEntry(StringRef VPath, StringRef RPath);
1912 
1913 public:
1914   JSONWriter(llvm::raw_ostream &OS) : OS(OS) {}
1915 
1916   void write(ArrayRef<YAMLVFSEntry> Entries, Optional<bool> UseExternalNames,
1917              Optional<bool> IsCaseSensitive, Optional<bool> IsOverlayRelative,
1918              Optional<bool> IgnoreNonExistentContents, StringRef OverlayDir);
1919 };
1920 
1921 } // namespace
1922 
1923 bool JSONWriter::containedIn(StringRef Parent, StringRef Path) {
1924   using namespace llvm::sys;
1925 
1926   // Compare each path component.
1927   auto IParent = path::begin(Parent), EParent = path::end(Parent);
1928   for (auto IChild = path::begin(Path), EChild = path::end(Path);
1929        IParent != EParent && IChild != EChild; ++IParent, ++IChild) {
1930     if (*IParent != *IChild)
1931       return false;
1932   }
1933   // Have we exhausted the parent path?
1934   return IParent == EParent;
1935 }
1936 
1937 StringRef JSONWriter::containedPart(StringRef Parent, StringRef Path) {
1938   assert(!Parent.empty());
1939   assert(containedIn(Parent, Path));
1940   return Path.slice(Parent.size() + 1, StringRef::npos);
1941 }
1942 
1943 void JSONWriter::startDirectory(StringRef Path) {
1944   StringRef Name =
1945       DirStack.empty() ? Path : containedPart(DirStack.back(), Path);
1946   DirStack.push_back(Path);
1947   unsigned Indent = getDirIndent();
1948   OS.indent(Indent) << "{\n";
1949   OS.indent(Indent + 2) << "'type': 'directory',\n";
1950   OS.indent(Indent + 2) << "'name': \"" << llvm::yaml::escape(Name) << "\",\n";
1951   OS.indent(Indent + 2) << "'contents': [\n";
1952 }
1953 
1954 void JSONWriter::endDirectory() {
1955   unsigned Indent = getDirIndent();
1956   OS.indent(Indent + 2) << "]\n";
1957   OS.indent(Indent) << "}";
1958 
1959   DirStack.pop_back();
1960 }
1961 
1962 void JSONWriter::writeEntry(StringRef VPath, StringRef RPath) {
1963   unsigned Indent = getFileIndent();
1964   OS.indent(Indent) << "{\n";
1965   OS.indent(Indent + 2) << "'type': 'file',\n";
1966   OS.indent(Indent + 2) << "'name': \"" << llvm::yaml::escape(VPath) << "\",\n";
1967   OS.indent(Indent + 2) << "'external-contents': \""
1968                         << llvm::yaml::escape(RPath) << "\"\n";
1969   OS.indent(Indent) << "}";
1970 }
1971 
1972 void JSONWriter::write(ArrayRef<YAMLVFSEntry> Entries,
1973                        Optional<bool> UseExternalNames,
1974                        Optional<bool> IsCaseSensitive,
1975                        Optional<bool> IsOverlayRelative,
1976                        Optional<bool> IgnoreNonExistentContents,
1977                        StringRef OverlayDir) {
1978   using namespace llvm::sys;
1979 
1980   OS << "{\n"
1981         "  'version': 0,\n";
1982   if (IsCaseSensitive.hasValue())
1983     OS << "  'case-sensitive': '"
1984        << (IsCaseSensitive.getValue() ? "true" : "false") << "',\n";
1985   if (UseExternalNames.hasValue())
1986     OS << "  'use-external-names': '"
1987        << (UseExternalNames.getValue() ? "true" : "false") << "',\n";
1988   bool UseOverlayRelative = false;
1989   if (IsOverlayRelative.hasValue()) {
1990     UseOverlayRelative = IsOverlayRelative.getValue();
1991     OS << "  'overlay-relative': '" << (UseOverlayRelative ? "true" : "false")
1992        << "',\n";
1993   }
1994   if (IgnoreNonExistentContents.hasValue())
1995     OS << "  'ignore-non-existent-contents': '"
1996        << (IgnoreNonExistentContents.getValue() ? "true" : "false") << "',\n";
1997   OS << "  'roots': [\n";
1998 
1999   if (!Entries.empty()) {
2000     const YAMLVFSEntry &Entry = Entries.front();
2001     startDirectory(path::parent_path(Entry.VPath));
2002 
2003     StringRef RPath = Entry.RPath;
2004     if (UseOverlayRelative) {
2005       unsigned OverlayDirLen = OverlayDir.size();
2006       assert(RPath.substr(0, OverlayDirLen) == OverlayDir &&
2007              "Overlay dir must be contained in RPath");
2008       RPath = RPath.slice(OverlayDirLen, RPath.size());
2009     }
2010 
2011     writeEntry(path::filename(Entry.VPath), RPath);
2012 
2013     for (const auto &Entry : Entries.slice(1)) {
2014       StringRef Dir = path::parent_path(Entry.VPath);
2015       if (Dir == DirStack.back())
2016         OS << ",\n";
2017       else {
2018         while (!DirStack.empty() && !containedIn(DirStack.back(), Dir)) {
2019           OS << "\n";
2020           endDirectory();
2021         }
2022         OS << ",\n";
2023         startDirectory(Dir);
2024       }
2025       StringRef RPath = Entry.RPath;
2026       if (UseOverlayRelative) {
2027         unsigned OverlayDirLen = OverlayDir.size();
2028         assert(RPath.substr(0, OverlayDirLen) == OverlayDir &&
2029                "Overlay dir must be contained in RPath");
2030         RPath = RPath.slice(OverlayDirLen, RPath.size());
2031       }
2032       writeEntry(path::filename(Entry.VPath), RPath);
2033     }
2034 
2035     while (!DirStack.empty()) {
2036       OS << "\n";
2037       endDirectory();
2038     }
2039     OS << "\n";
2040   }
2041 
2042   OS << "  ]\n"
2043      << "}\n";
2044 }
2045 
2046 void YAMLVFSWriter::write(llvm::raw_ostream &OS) {
2047   llvm::sort(Mappings, [](const YAMLVFSEntry &LHS, const YAMLVFSEntry &RHS) {
2048     return LHS.VPath < RHS.VPath;
2049   });
2050 
2051   JSONWriter(OS).write(Mappings, UseExternalNames, IsCaseSensitive,
2052                        IsOverlayRelative, IgnoreNonExistentContents,
2053                        OverlayDir);
2054 }
2055 
2056 VFSFromYamlDirIterImpl::VFSFromYamlDirIterImpl(
2057     const Twine &_Path, RedirectingDirectoryEntry::iterator Begin,
2058     RedirectingDirectoryEntry::iterator End, std::error_code &EC)
2059     : Dir(_Path.str()), Current(Begin), End(End) {
2060   EC = incrementImpl();
2061 }
2062 
2063 std::error_code VFSFromYamlDirIterImpl::increment() {
2064   assert(Current != End && "cannot iterate past end");
2065   ++Current;
2066   return incrementImpl();
2067 }
2068 
2069 std::error_code VFSFromYamlDirIterImpl::incrementImpl() {
2070   while (Current != End) {
2071     SmallString<128> PathStr(Dir);
2072     llvm::sys::path::append(PathStr, (*Current)->getName());
2073     sys::fs::file_type Type;
2074     switch ((*Current)->getKind()) {
2075     case EK_Directory:
2076       Type = sys::fs::file_type::directory_file;
2077       break;
2078     case EK_File:
2079       Type = sys::fs::file_type::regular_file;
2080       break;
2081     }
2082     CurrentEntry = directory_entry(PathStr.str(), Type);
2083     break;
2084   }
2085 
2086   if (Current == End)
2087     CurrentEntry = directory_entry();
2088   return {};
2089 }
2090 
2091 vfs::recursive_directory_iterator::recursive_directory_iterator(
2092     FileSystem &FS_, const Twine &Path, std::error_code &EC)
2093     : FS(&FS_) {
2094   directory_iterator I = FS->dir_begin(Path, EC);
2095   if (I != directory_iterator()) {
2096     State = std::make_shared<IterState>();
2097     State->push(I);
2098   }
2099 }
2100 
2101 vfs::recursive_directory_iterator &
2102 recursive_directory_iterator::increment(std::error_code &EC) {
2103   assert(FS && State && !State->empty() && "incrementing past end");
2104   assert(!State->top()->path().empty() && "non-canonical end iterator");
2105   vfs::directory_iterator End;
2106   if (State->top()->type() == sys::fs::file_type::directory_file) {
2107     vfs::directory_iterator I = FS->dir_begin(State->top()->path(), EC);
2108     if (I != End) {
2109       State->push(I);
2110       return *this;
2111     }
2112   }
2113 
2114   while (!State->empty() && State->top().increment(EC) == End)
2115     State->pop();
2116 
2117   if (State->empty())
2118     State.reset(); // end iterator
2119 
2120   return *this;
2121 }
2122