1 //===- VirtualFileSystem.h - Virtual File System Layer ----------*- C++ -*-===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 // 9 /// \file 10 /// Defines the virtual file system interface vfs::FileSystem. 11 // 12 //===----------------------------------------------------------------------===// 13 14 #ifndef LLVM_SUPPORT_VIRTUALFILESYSTEM_H 15 #define LLVM_SUPPORT_VIRTUALFILESYSTEM_H 16 17 #include "llvm/ADT/IntrusiveRefCntPtr.h" 18 #include "llvm/ADT/None.h" 19 #include "llvm/ADT/Optional.h" 20 #include "llvm/ADT/SmallVector.h" 21 #include "llvm/ADT/StringRef.h" 22 #include "llvm/ADT/Twine.h" 23 #include "llvm/Support/Chrono.h" 24 #include "llvm/Support/ErrorOr.h" 25 #include "llvm/Support/FileSystem.h" 26 #include "llvm/Support/Path.h" 27 #include "llvm/Support/SourceMgr.h" 28 #include <cassert> 29 #include <cstdint> 30 #include <ctime> 31 #include <memory> 32 #include <stack> 33 #include <string> 34 #include <system_error> 35 #include <utility> 36 #include <vector> 37 38 namespace llvm { 39 40 class MemoryBuffer; 41 42 namespace vfs { 43 44 /// The result of a \p status operation. 45 class Status { 46 std::string Name; 47 llvm::sys::fs::UniqueID UID; 48 llvm::sys::TimePoint<> MTime; 49 uint32_t User; 50 uint32_t Group; 51 uint64_t Size; 52 llvm::sys::fs::file_type Type = llvm::sys::fs::file_type::status_error; 53 llvm::sys::fs::perms Perms; 54 55 public: 56 // FIXME: remove when files support multiple names 57 bool IsVFSMapped = false; 58 59 Status() = default; 60 Status(const llvm::sys::fs::file_status &Status); 61 Status(const Twine &Name, llvm::sys::fs::UniqueID UID, 62 llvm::sys::TimePoint<> MTime, uint32_t User, uint32_t Group, 63 uint64_t Size, llvm::sys::fs::file_type Type, 64 llvm::sys::fs::perms Perms); 65 66 /// Get a copy of a Status with a different name. 67 static Status copyWithNewName(const Status &In, const Twine &NewName); 68 static Status copyWithNewName(const llvm::sys::fs::file_status &In, 69 const Twine &NewName); 70 71 /// Returns the name that should be used for this file or directory. getName()72 StringRef getName() const { return Name; } 73 74 /// @name Status interface from llvm::sys::fs 75 /// @{ getType()76 llvm::sys::fs::file_type getType() const { return Type; } getPermissions()77 llvm::sys::fs::perms getPermissions() const { return Perms; } getLastModificationTime()78 llvm::sys::TimePoint<> getLastModificationTime() const { return MTime; } getUniqueID()79 llvm::sys::fs::UniqueID getUniqueID() const { return UID; } getUser()80 uint32_t getUser() const { return User; } getGroup()81 uint32_t getGroup() const { return Group; } getSize()82 uint64_t getSize() const { return Size; } 83 /// @} 84 /// @name Status queries 85 /// These are static queries in llvm::sys::fs. 86 /// @{ 87 bool equivalent(const Status &Other) const; 88 bool isDirectory() const; 89 bool isRegularFile() const; 90 bool isOther() const; 91 bool isSymlink() const; 92 bool isStatusKnown() const; 93 bool exists() const; 94 /// @} 95 }; 96 97 /// Represents an open file. 98 class File { 99 public: 100 /// Destroy the file after closing it (if open). 101 /// Sub-classes should generally call close() inside their destructors. We 102 /// cannot do that from the base class, since close is virtual. 103 virtual ~File(); 104 105 /// Get the status of the file. 106 virtual llvm::ErrorOr<Status> status() = 0; 107 108 /// Get the name of the file getName()109 virtual llvm::ErrorOr<std::string> getName() { 110 if (auto Status = status()) 111 return Status->getName().str(); 112 else 113 return Status.getError(); 114 } 115 116 /// Get the contents of the file as a \p MemoryBuffer. 117 virtual llvm::ErrorOr<std::unique_ptr<llvm::MemoryBuffer>> 118 getBuffer(const Twine &Name, int64_t FileSize = -1, 119 bool RequiresNullTerminator = true, bool IsVolatile = false) = 0; 120 121 /// Closes the file. 122 virtual std::error_code close() = 0; 123 }; 124 125 /// A member of a directory, yielded by a directory_iterator. 126 /// Only information available on most platforms is included. 127 class directory_entry { 128 std::string Path; 129 llvm::sys::fs::file_type Type = llvm::sys::fs::file_type::type_unknown; 130 131 public: 132 directory_entry() = default; directory_entry(std::string Path,llvm::sys::fs::file_type Type)133 directory_entry(std::string Path, llvm::sys::fs::file_type Type) 134 : Path(std::move(Path)), Type(Type) {} 135 path()136 llvm::StringRef path() const { return Path; } type()137 llvm::sys::fs::file_type type() const { return Type; } 138 }; 139 140 namespace detail { 141 142 /// An interface for virtual file systems to provide an iterator over the 143 /// (non-recursive) contents of a directory. 144 struct DirIterImpl { 145 virtual ~DirIterImpl(); 146 147 /// Sets \c CurrentEntry to the next entry in the directory on success, 148 /// to directory_entry() at end, or returns a system-defined \c error_code. 149 virtual std::error_code increment() = 0; 150 151 directory_entry CurrentEntry; 152 }; 153 154 } // namespace detail 155 156 /// An input iterator over the entries in a virtual path, similar to 157 /// llvm::sys::fs::directory_iterator. 158 class directory_iterator { 159 std::shared_ptr<detail::DirIterImpl> Impl; // Input iterator semantics on copy 160 161 public: directory_iterator(std::shared_ptr<detail::DirIterImpl> I)162 directory_iterator(std::shared_ptr<detail::DirIterImpl> I) 163 : Impl(std::move(I)) { 164 assert(Impl.get() != nullptr && "requires non-null implementation"); 165 if (Impl->CurrentEntry.path().empty()) 166 Impl.reset(); // Normalize the end iterator to Impl == nullptr. 167 } 168 169 /// Construct an 'end' iterator. 170 directory_iterator() = default; 171 172 /// Equivalent to operator++, with an error code. increment(std::error_code & EC)173 directory_iterator &increment(std::error_code &EC) { 174 assert(Impl && "attempting to increment past end"); 175 EC = Impl->increment(); 176 if (Impl->CurrentEntry.path().empty()) 177 Impl.reset(); // Normalize the end iterator to Impl == nullptr. 178 return *this; 179 } 180 181 const directory_entry &operator*() const { return Impl->CurrentEntry; } 182 const directory_entry *operator->() const { return &Impl->CurrentEntry; } 183 184 bool operator==(const directory_iterator &RHS) const { 185 if (Impl && RHS.Impl) 186 return Impl->CurrentEntry.path() == RHS.Impl->CurrentEntry.path(); 187 return !Impl && !RHS.Impl; 188 } 189 bool operator!=(const directory_iterator &RHS) const { 190 return !(*this == RHS); 191 } 192 }; 193 194 class FileSystem; 195 196 namespace detail { 197 198 /// Keeps state for the recursive_directory_iterator. 199 struct RecDirIterState { 200 std::stack<directory_iterator, std::vector<directory_iterator>> Stack; 201 bool HasNoPushRequest = false; 202 }; 203 204 } // end namespace detail 205 206 /// An input iterator over the recursive contents of a virtual path, 207 /// similar to llvm::sys::fs::recursive_directory_iterator. 208 class recursive_directory_iterator { 209 FileSystem *FS; 210 std::shared_ptr<detail::RecDirIterState> 211 State; // Input iterator semantics on copy. 212 213 public: 214 recursive_directory_iterator(FileSystem &FS, const Twine &Path, 215 std::error_code &EC); 216 217 /// Construct an 'end' iterator. 218 recursive_directory_iterator() = default; 219 220 /// Equivalent to operator++, with an error code. 221 recursive_directory_iterator &increment(std::error_code &EC); 222 223 const directory_entry &operator*() const { return *State->Stack.top(); } 224 const directory_entry *operator->() const { return &*State->Stack.top(); } 225 226 bool operator==(const recursive_directory_iterator &Other) const { 227 return State == Other.State; // identity 228 } 229 bool operator!=(const recursive_directory_iterator &RHS) const { 230 return !(*this == RHS); 231 } 232 233 /// Gets the current level. Starting path is at level 0. level()234 int level() const { 235 assert(!State->Stack.empty() && 236 "Cannot get level without any iteration state"); 237 return State->Stack.size() - 1; 238 } 239 no_push()240 void no_push() { State->HasNoPushRequest = true; } 241 }; 242 243 /// The virtual file system interface. 244 class FileSystem : public llvm::ThreadSafeRefCountedBase<FileSystem> { 245 public: 246 virtual ~FileSystem(); 247 248 /// Get the status of the entry at \p Path, if one exists. 249 virtual llvm::ErrorOr<Status> status(const Twine &Path) = 0; 250 251 /// Get a \p File object for the file at \p Path, if one exists. 252 virtual llvm::ErrorOr<std::unique_ptr<File>> 253 openFileForRead(const Twine &Path) = 0; 254 255 /// This is a convenience method that opens a file, gets its content and then 256 /// closes the file. 257 llvm::ErrorOr<std::unique_ptr<llvm::MemoryBuffer>> 258 getBufferForFile(const Twine &Name, int64_t FileSize = -1, 259 bool RequiresNullTerminator = true, bool IsVolatile = false); 260 261 /// Get a directory_iterator for \p Dir. 262 /// \note The 'end' iterator is directory_iterator(). 263 virtual directory_iterator dir_begin(const Twine &Dir, 264 std::error_code &EC) = 0; 265 266 /// Set the working directory. This will affect all following operations on 267 /// this file system and may propagate down for nested file systems. 268 virtual std::error_code setCurrentWorkingDirectory(const Twine &Path) = 0; 269 270 /// Get the working directory of this file system. 271 virtual llvm::ErrorOr<std::string> getCurrentWorkingDirectory() const = 0; 272 273 /// Gets real path of \p Path e.g. collapse all . and .. patterns, resolve 274 /// symlinks. For real file system, this uses `llvm::sys::fs::real_path`. 275 /// This returns errc::operation_not_permitted if not implemented by subclass. 276 virtual std::error_code getRealPath(const Twine &Path, 277 SmallVectorImpl<char> &Output) const; 278 279 /// Check whether a file exists. Provided for convenience. 280 bool exists(const Twine &Path); 281 282 /// Is the file mounted on a local filesystem? 283 virtual std::error_code isLocal(const Twine &Path, bool &Result); 284 285 /// Make \a Path an absolute path. 286 /// 287 /// Makes \a Path absolute using the current directory if it is not already. 288 /// An empty \a Path will result in the current directory. 289 /// 290 /// /absolute/path => /absolute/path 291 /// relative/../path => <current-directory>/relative/../path 292 /// 293 /// \param Path A path that is modified to be an absolute path. 294 /// \returns success if \a path has been made absolute, otherwise a 295 /// platform-specific error_code. 296 virtual std::error_code makeAbsolute(SmallVectorImpl<char> &Path) const; 297 }; 298 299 /// Gets an \p vfs::FileSystem for the 'real' file system, as seen by 300 /// the operating system. 301 /// The working directory is linked to the process's working directory. 302 /// (This is usually thread-hostile). 303 IntrusiveRefCntPtr<FileSystem> getRealFileSystem(); 304 305 /// Create an \p vfs::FileSystem for the 'real' file system, as seen by 306 /// the operating system. 307 /// It has its own working directory, independent of (but initially equal to) 308 /// that of the process. 309 std::unique_ptr<FileSystem> createPhysicalFileSystem(); 310 311 /// A file system that allows overlaying one \p AbstractFileSystem on top 312 /// of another. 313 /// 314 /// Consists of a stack of >=1 \p FileSystem objects, which are treated as being 315 /// one merged file system. When there is a directory that exists in more than 316 /// one file system, the \p OverlayFileSystem contains a directory containing 317 /// the union of their contents. The attributes (permissions, etc.) of the 318 /// top-most (most recently added) directory are used. When there is a file 319 /// that exists in more than one file system, the file in the top-most file 320 /// system overrides the other(s). 321 class OverlayFileSystem : public FileSystem { 322 using FileSystemList = SmallVector<IntrusiveRefCntPtr<FileSystem>, 1>; 323 324 /// The stack of file systems, implemented as a list in order of 325 /// their addition. 326 FileSystemList FSList; 327 328 public: 329 OverlayFileSystem(IntrusiveRefCntPtr<FileSystem> Base); 330 331 /// Pushes a file system on top of the stack. 332 void pushOverlay(IntrusiveRefCntPtr<FileSystem> FS); 333 334 llvm::ErrorOr<Status> status(const Twine &Path) override; 335 llvm::ErrorOr<std::unique_ptr<File>> 336 openFileForRead(const Twine &Path) override; 337 directory_iterator dir_begin(const Twine &Dir, std::error_code &EC) override; 338 llvm::ErrorOr<std::string> getCurrentWorkingDirectory() const override; 339 std::error_code setCurrentWorkingDirectory(const Twine &Path) override; 340 std::error_code isLocal(const Twine &Path, bool &Result) override; 341 std::error_code getRealPath(const Twine &Path, 342 SmallVectorImpl<char> &Output) const override; 343 344 using iterator = FileSystemList::reverse_iterator; 345 using const_iterator = FileSystemList::const_reverse_iterator; 346 using reverse_iterator = FileSystemList::iterator; 347 using const_reverse_iterator = FileSystemList::const_iterator; 348 349 /// Get an iterator pointing to the most recently added file system. overlays_begin()350 iterator overlays_begin() { return FSList.rbegin(); } overlays_begin()351 const_iterator overlays_begin() const { return FSList.rbegin(); } 352 353 /// Get an iterator pointing one-past the least recently added file system. overlays_end()354 iterator overlays_end() { return FSList.rend(); } overlays_end()355 const_iterator overlays_end() const { return FSList.rend(); } 356 357 /// Get an iterator pointing to the least recently added file system. overlays_rbegin()358 reverse_iterator overlays_rbegin() { return FSList.begin(); } overlays_rbegin()359 const_reverse_iterator overlays_rbegin() const { return FSList.begin(); } 360 361 /// Get an iterator pointing one-past the most recently added file system. overlays_rend()362 reverse_iterator overlays_rend() { return FSList.end(); } overlays_rend()363 const_reverse_iterator overlays_rend() const { return FSList.end(); } 364 }; 365 366 /// By default, this delegates all calls to the underlying file system. This 367 /// is useful when derived file systems want to override some calls and still 368 /// proxy other calls. 369 class ProxyFileSystem : public FileSystem { 370 public: ProxyFileSystem(IntrusiveRefCntPtr<FileSystem> FS)371 explicit ProxyFileSystem(IntrusiveRefCntPtr<FileSystem> FS) 372 : FS(std::move(FS)) {} 373 status(const Twine & Path)374 llvm::ErrorOr<Status> status(const Twine &Path) override { 375 return FS->status(Path); 376 } 377 llvm::ErrorOr<std::unique_ptr<File>> openFileForRead(const Twine & Path)378 openFileForRead(const Twine &Path) override { 379 return FS->openFileForRead(Path); 380 } dir_begin(const Twine & Dir,std::error_code & EC)381 directory_iterator dir_begin(const Twine &Dir, std::error_code &EC) override { 382 return FS->dir_begin(Dir, EC); 383 } getCurrentWorkingDirectory()384 llvm::ErrorOr<std::string> getCurrentWorkingDirectory() const override { 385 return FS->getCurrentWorkingDirectory(); 386 } setCurrentWorkingDirectory(const Twine & Path)387 std::error_code setCurrentWorkingDirectory(const Twine &Path) override { 388 return FS->setCurrentWorkingDirectory(Path); 389 } getRealPath(const Twine & Path,SmallVectorImpl<char> & Output)390 std::error_code getRealPath(const Twine &Path, 391 SmallVectorImpl<char> &Output) const override { 392 return FS->getRealPath(Path, Output); 393 } isLocal(const Twine & Path,bool & Result)394 std::error_code isLocal(const Twine &Path, bool &Result) override { 395 return FS->isLocal(Path, Result); 396 } 397 398 protected: getUnderlyingFS()399 FileSystem &getUnderlyingFS() { return *FS; } 400 401 private: 402 IntrusiveRefCntPtr<FileSystem> FS; 403 404 virtual void anchor(); 405 }; 406 407 namespace detail { 408 409 class InMemoryDirectory; 410 class InMemoryFile; 411 412 } // namespace detail 413 414 /// An in-memory file system. 415 class InMemoryFileSystem : public FileSystem { 416 std::unique_ptr<detail::InMemoryDirectory> Root; 417 std::string WorkingDirectory; 418 bool UseNormalizedPaths = true; 419 420 /// If HardLinkTarget is non-null, a hardlink is created to the To path which 421 /// must be a file. If it is null then it adds the file as the public addFile. 422 bool addFile(const Twine &Path, time_t ModificationTime, 423 std::unique_ptr<llvm::MemoryBuffer> Buffer, 424 Optional<uint32_t> User, Optional<uint32_t> Group, 425 Optional<llvm::sys::fs::file_type> Type, 426 Optional<llvm::sys::fs::perms> Perms, 427 const detail::InMemoryFile *HardLinkTarget); 428 429 public: 430 explicit InMemoryFileSystem(bool UseNormalizedPaths = true); 431 ~InMemoryFileSystem() override; 432 433 /// Add a file containing a buffer or a directory to the VFS with a 434 /// path. The VFS owns the buffer. If present, User, Group, Type 435 /// and Perms apply to the newly-created file or directory. 436 /// \return true if the file or directory was successfully added, 437 /// false if the file or directory already exists in the file system with 438 /// different contents. 439 bool addFile(const Twine &Path, time_t ModificationTime, 440 std::unique_ptr<llvm::MemoryBuffer> Buffer, 441 Optional<uint32_t> User = None, Optional<uint32_t> Group = None, 442 Optional<llvm::sys::fs::file_type> Type = None, 443 Optional<llvm::sys::fs::perms> Perms = None); 444 445 /// Add a hard link to a file. 446 /// Here hard links are not intended to be fully equivalent to the classical 447 /// filesystem. Both the hard link and the file share the same buffer and 448 /// status (and thus have the same UniqueID). Because of this there is no way 449 /// to distinguish between the link and the file after the link has been 450 /// added. 451 /// 452 /// The To path must be an existing file or a hardlink. The From file must not 453 /// have been added before. The To Path must not be a directory. The From Node 454 /// is added as a hard link which points to the resolved file of To Node. 455 /// \return true if the above condition is satisfied and hardlink was 456 /// successfully created, false otherwise. 457 bool addHardLink(const Twine &From, const Twine &To); 458 459 /// Add a buffer to the VFS with a path. The VFS does not own the buffer. 460 /// If present, User, Group, Type and Perms apply to the newly-created file 461 /// or directory. 462 /// \return true if the file or directory was successfully added, 463 /// false if the file or directory already exists in the file system with 464 /// different contents. 465 bool addFileNoOwn(const Twine &Path, time_t ModificationTime, 466 llvm::MemoryBuffer *Buffer, Optional<uint32_t> User = None, 467 Optional<uint32_t> Group = None, 468 Optional<llvm::sys::fs::file_type> Type = None, 469 Optional<llvm::sys::fs::perms> Perms = None); 470 471 std::string toString() const; 472 473 /// Return true if this file system normalizes . and .. in paths. useNormalizedPaths()474 bool useNormalizedPaths() const { return UseNormalizedPaths; } 475 476 llvm::ErrorOr<Status> status(const Twine &Path) override; 477 llvm::ErrorOr<std::unique_ptr<File>> 478 openFileForRead(const Twine &Path) override; 479 directory_iterator dir_begin(const Twine &Dir, std::error_code &EC) override; 480 getCurrentWorkingDirectory()481 llvm::ErrorOr<std::string> getCurrentWorkingDirectory() const override { 482 return WorkingDirectory; 483 } 484 /// Canonicalizes \p Path by combining with the current working 485 /// directory and normalizing the path (e.g. remove dots). If the current 486 /// working directory is not set, this returns errc::operation_not_permitted. 487 /// 488 /// This doesn't resolve symlinks as they are not supported in in-memory file 489 /// system. 490 std::error_code getRealPath(const Twine &Path, 491 SmallVectorImpl<char> &Output) const override; 492 std::error_code isLocal(const Twine &Path, bool &Result) override; 493 std::error_code setCurrentWorkingDirectory(const Twine &Path) override; 494 }; 495 496 /// Get a globally unique ID for a virtual file or directory. 497 llvm::sys::fs::UniqueID getNextVirtualUniqueID(); 498 499 /// Gets a \p FileSystem for a virtual file system described in YAML 500 /// format. 501 IntrusiveRefCntPtr<FileSystem> 502 getVFSFromYAML(std::unique_ptr<llvm::MemoryBuffer> Buffer, 503 llvm::SourceMgr::DiagHandlerTy DiagHandler, 504 StringRef YAMLFilePath, void *DiagContext = nullptr, 505 IntrusiveRefCntPtr<FileSystem> ExternalFS = getRealFileSystem()); 506 507 struct YAMLVFSEntry { 508 template <typename T1, typename T2> YAMLVFSEntryYAMLVFSEntry509 YAMLVFSEntry(T1 &&VPath, T2 &&RPath) 510 : VPath(std::forward<T1>(VPath)), RPath(std::forward<T2>(RPath)) {} 511 std::string VPath; 512 std::string RPath; 513 }; 514 515 class VFSFromYamlDirIterImpl; 516 class RedirectingFileSystemParser; 517 518 /// A virtual file system parsed from a YAML file. 519 /// 520 /// Currently, this class allows creating virtual directories and mapping 521 /// virtual file paths to existing external files, available in \c ExternalFS. 522 /// 523 /// The basic structure of the parsed file is: 524 /// \verbatim 525 /// { 526 /// 'version': <version number>, 527 /// <optional configuration> 528 /// 'roots': [ 529 /// <directory entries> 530 /// ] 531 /// } 532 /// \endverbatim 533 /// 534 /// All configuration options are optional. 535 /// 'case-sensitive': <boolean, default=(true for Posix, false for Windows)> 536 /// 'use-external-names': <boolean, default=true> 537 /// 'overlay-relative': <boolean, default=false> 538 /// 'fallthrough': <boolean, default=true> 539 /// 540 /// Virtual directories are represented as 541 /// \verbatim 542 /// { 543 /// 'type': 'directory', 544 /// 'name': <string>, 545 /// 'contents': [ <file or directory entries> ] 546 /// } 547 /// \endverbatim 548 /// 549 /// The default attributes for virtual directories are: 550 /// \verbatim 551 /// MTime = now() when created 552 /// Perms = 0777 553 /// User = Group = 0 554 /// Size = 0 555 /// UniqueID = unspecified unique value 556 /// \endverbatim 557 /// 558 /// Re-mapped files are represented as 559 /// \verbatim 560 /// { 561 /// 'type': 'file', 562 /// 'name': <string>, 563 /// 'use-external-name': <boolean> # Optional 564 /// 'external-contents': <path to external file> 565 /// } 566 /// \endverbatim 567 /// 568 /// and inherit their attributes from the external contents. 569 /// 570 /// In both cases, the 'name' field may contain multiple path components (e.g. 571 /// /path/to/file). However, any directory that contains more than one child 572 /// must be uniquely represented by a directory entry. 573 class RedirectingFileSystem : public vfs::FileSystem { 574 public: 575 enum EntryKind { EK_Directory, EK_File }; 576 577 /// A single file or directory in the VFS. 578 class Entry { 579 EntryKind Kind; 580 std::string Name; 581 582 public: Entry(EntryKind K,StringRef Name)583 Entry(EntryKind K, StringRef Name) : Kind(K), Name(Name) {} 584 virtual ~Entry() = default; 585 getName()586 StringRef getName() const { return Name; } getKind()587 EntryKind getKind() const { return Kind; } 588 }; 589 590 class RedirectingDirectoryEntry : public Entry { 591 std::vector<std::unique_ptr<Entry>> Contents; 592 Status S; 593 594 public: RedirectingDirectoryEntry(StringRef Name,std::vector<std::unique_ptr<Entry>> Contents,Status S)595 RedirectingDirectoryEntry(StringRef Name, 596 std::vector<std::unique_ptr<Entry>> Contents, 597 Status S) 598 : Entry(EK_Directory, Name), Contents(std::move(Contents)), 599 S(std::move(S)) {} RedirectingDirectoryEntry(StringRef Name,Status S)600 RedirectingDirectoryEntry(StringRef Name, Status S) 601 : Entry(EK_Directory, Name), S(std::move(S)) {} 602 getStatus()603 Status getStatus() { return S; } 604 addContent(std::unique_ptr<Entry> Content)605 void addContent(std::unique_ptr<Entry> Content) { 606 Contents.push_back(std::move(Content)); 607 } 608 getLastContent()609 Entry *getLastContent() const { return Contents.back().get(); } 610 611 using iterator = decltype(Contents)::iterator; 612 contents_begin()613 iterator contents_begin() { return Contents.begin(); } contents_end()614 iterator contents_end() { return Contents.end(); } 615 classof(const Entry * E)616 static bool classof(const Entry *E) { return E->getKind() == EK_Directory; } 617 }; 618 619 class RedirectingFileEntry : public Entry { 620 public: 621 enum NameKind { NK_NotSet, NK_External, NK_Virtual }; 622 623 private: 624 std::string ExternalContentsPath; 625 NameKind UseName; 626 627 public: RedirectingFileEntry(StringRef Name,StringRef ExternalContentsPath,NameKind UseName)628 RedirectingFileEntry(StringRef Name, StringRef ExternalContentsPath, 629 NameKind UseName) 630 : Entry(EK_File, Name), ExternalContentsPath(ExternalContentsPath), 631 UseName(UseName) {} 632 getExternalContentsPath()633 StringRef getExternalContentsPath() const { return ExternalContentsPath; } 634 635 /// whether to use the external path as the name for this file. useExternalName(bool GlobalUseExternalName)636 bool useExternalName(bool GlobalUseExternalName) const { 637 return UseName == NK_NotSet ? GlobalUseExternalName 638 : (UseName == NK_External); 639 } 640 getUseName()641 NameKind getUseName() const { return UseName; } 642 classof(const Entry * E)643 static bool classof(const Entry *E) { return E->getKind() == EK_File; } 644 }; 645 646 private: 647 friend class VFSFromYamlDirIterImpl; 648 friend class RedirectingFileSystemParser; 649 shouldUseExternalFS()650 bool shouldUseExternalFS() const { 651 return ExternalFSValidWD && IsFallthrough; 652 } 653 654 // In a RedirectingFileSystem, keys can be specified in Posix or Windows 655 // style (or even a mixture of both), so this comparison helper allows 656 // slashes (representing a root) to match backslashes (and vice versa). Note 657 // that, other than the root, patch components should not contain slashes or 658 // backslashes. pathComponentMatches(llvm::StringRef lhs,llvm::StringRef rhs)659 bool pathComponentMatches(llvm::StringRef lhs, llvm::StringRef rhs) const { 660 if ((CaseSensitive ? lhs.equals(rhs) : lhs.equals_lower(rhs))) 661 return true; 662 return (lhs == "/" && rhs == "\\") || (lhs == "\\" && rhs == "/"); 663 } 664 665 /// The root(s) of the virtual file system. 666 std::vector<std::unique_ptr<Entry>> Roots; 667 668 /// The current working directory of the file system. 669 std::string WorkingDirectory; 670 671 /// Whether the current working directory is valid for the external FS. 672 bool ExternalFSValidWD = false; 673 674 /// The file system to use for external references. 675 IntrusiveRefCntPtr<FileSystem> ExternalFS; 676 677 /// If IsRelativeOverlay is set, this represents the directory 678 /// path that should be prefixed to each 'external-contents' entry 679 /// when reading from YAML files. 680 std::string ExternalContentsPrefixDir; 681 682 /// @name Configuration 683 /// @{ 684 685 /// Whether to perform case-sensitive comparisons. 686 /// 687 /// Currently, case-insensitive matching only works correctly with ASCII. 688 bool CaseSensitive = 689 #ifdef _WIN32 690 false; 691 #else 692 true; 693 #endif 694 695 /// IsRelativeOverlay marks whether a ExternalContentsPrefixDir path must 696 /// be prefixed in every 'external-contents' when reading from YAML files. 697 bool IsRelativeOverlay = false; 698 699 /// Whether to use to use the value of 'external-contents' for the 700 /// names of files. This global value is overridable on a per-file basis. 701 bool UseExternalNames = true; 702 703 /// Whether to attempt a file lookup in external file system after it wasn't 704 /// found in VFS. 705 bool IsFallthrough = true; 706 /// @} 707 708 /// Virtual file paths and external files could be canonicalized without "..", 709 /// "." and "./" in their paths. FIXME: some unittests currently fail on 710 /// win32 when using remove_dots and remove_leading_dotslash on paths. 711 bool UseCanonicalizedPaths = 712 #ifdef _WIN32 713 false; 714 #else 715 true; 716 #endif 717 718 RedirectingFileSystem(IntrusiveRefCntPtr<FileSystem> ExternalFS); 719 720 /// Looks up the path <tt>[Start, End)</tt> in \p From, possibly 721 /// recursing into the contents of \p From if it is a directory. 722 ErrorOr<Entry *> lookupPath(llvm::sys::path::const_iterator Start, 723 llvm::sys::path::const_iterator End, 724 Entry *From) const; 725 726 /// Get the status of a given an \c Entry. 727 ErrorOr<Status> status(const Twine &Path, Entry *E); 728 729 public: 730 /// Looks up \p Path in \c Roots. 731 ErrorOr<Entry *> lookupPath(const Twine &Path) const; 732 733 /// Parses \p Buffer, which is expected to be in YAML format and 734 /// returns a virtual file system representing its contents. 735 static RedirectingFileSystem * 736 create(std::unique_ptr<MemoryBuffer> Buffer, 737 SourceMgr::DiagHandlerTy DiagHandler, StringRef YAMLFilePath, 738 void *DiagContext, IntrusiveRefCntPtr<FileSystem> ExternalFS); 739 740 ErrorOr<Status> status(const Twine &Path) override; 741 ErrorOr<std::unique_ptr<File>> openFileForRead(const Twine &Path) override; 742 743 std::error_code getRealPath(const Twine &Path, 744 SmallVectorImpl<char> &Output) const override; 745 746 llvm::ErrorOr<std::string> getCurrentWorkingDirectory() const override; 747 748 std::error_code setCurrentWorkingDirectory(const Twine &Path) override; 749 750 std::error_code isLocal(const Twine &Path, bool &Result) override; 751 752 std::error_code makeAbsolute(SmallVectorImpl<char> &Path) const override; 753 754 directory_iterator dir_begin(const Twine &Dir, std::error_code &EC) override; 755 756 void setExternalContentsPrefixDir(StringRef PrefixDir); 757 758 StringRef getExternalContentsPrefixDir() const; 759 760 void dump(raw_ostream &OS) const; 761 void dumpEntry(raw_ostream &OS, Entry *E, int NumSpaces = 0) const; 762 #if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP) 763 LLVM_DUMP_METHOD void dump() const; 764 #endif 765 }; 766 767 /// Collect all pairs of <virtual path, real path> entries from the 768 /// \p YAMLFilePath. This is used by the module dependency collector to forward 769 /// the entries into the reproducer output VFS YAML file. 770 void collectVFSFromYAML( 771 std::unique_ptr<llvm::MemoryBuffer> Buffer, 772 llvm::SourceMgr::DiagHandlerTy DiagHandler, StringRef YAMLFilePath, 773 SmallVectorImpl<YAMLVFSEntry> &CollectedEntries, 774 void *DiagContext = nullptr, 775 IntrusiveRefCntPtr<FileSystem> ExternalFS = getRealFileSystem()); 776 777 class YAMLVFSWriter { 778 std::vector<YAMLVFSEntry> Mappings; 779 Optional<bool> IsCaseSensitive; 780 Optional<bool> IsOverlayRelative; 781 Optional<bool> UseExternalNames; 782 std::string OverlayDir; 783 784 public: 785 YAMLVFSWriter() = default; 786 787 void addFileMapping(StringRef VirtualPath, StringRef RealPath); 788 setCaseSensitivity(bool CaseSensitive)789 void setCaseSensitivity(bool CaseSensitive) { 790 IsCaseSensitive = CaseSensitive; 791 } 792 setUseExternalNames(bool UseExtNames)793 void setUseExternalNames(bool UseExtNames) { UseExternalNames = UseExtNames; } 794 setOverlayDir(StringRef OverlayDirectory)795 void setOverlayDir(StringRef OverlayDirectory) { 796 IsOverlayRelative = true; 797 OverlayDir.assign(OverlayDirectory.str()); 798 } 799 getMappings()800 const std::vector<YAMLVFSEntry> &getMappings() const { return Mappings; } 801 802 void write(llvm::raw_ostream &OS); 803 }; 804 805 } // namespace vfs 806 } // namespace llvm 807 808 #endif // LLVM_SUPPORT_VIRTUALFILESYSTEM_H 809