316 lines
		
	
	
		
			10 KiB
		
	
	
	
		
			C++
		
	
	
	
			
		
		
	
	
			316 lines
		
	
	
		
			10 KiB
		
	
	
	
		
			C++
		
	
	
	
| //===-- FileCollector.cpp ---------------------------------------*- C++ -*-===//
 | |
| //
 | |
| // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 | |
| // See https://llvm.org/LICENSE.txt for license information.
 | |
| // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
 | |
| //
 | |
| //===----------------------------------------------------------------------===//
 | |
| 
 | |
| #include "llvm/Support/FileCollector.h"
 | |
| #include "llvm/ADT/SmallString.h"
 | |
| #include "llvm/ADT/Twine.h"
 | |
| #include "llvm/Support/FileSystem.h"
 | |
| #include "llvm/Support/Path.h"
 | |
| #include "llvm/Support/Process.h"
 | |
| 
 | |
| using namespace llvm;
 | |
| 
 | |
| FileCollectorBase::FileCollectorBase() = default;
 | |
| FileCollectorBase::~FileCollectorBase() = default;
 | |
| 
 | |
| void FileCollectorBase::addFile(const Twine &File) {
 | |
|   std::lock_guard<std::mutex> lock(Mutex);
 | |
|   std::string FileStr = File.str();
 | |
|   if (markAsSeen(FileStr))
 | |
|     addFileImpl(FileStr);
 | |
| }
 | |
| 
 | |
| void FileCollectorBase::addDirectory(const Twine &Dir) {
 | |
|   assert(sys::fs::is_directory(Dir));
 | |
|   std::error_code EC;
 | |
|   addDirectoryImpl(Dir, vfs::getRealFileSystem(), EC);
 | |
| }
 | |
| 
 | |
| static bool isCaseSensitivePath(StringRef Path) {
 | |
|   SmallString<256> TmpDest = Path, UpperDest, RealDest;
 | |
| 
 | |
|   // Remove component traversals, links, etc.
 | |
|   if (sys::fs::real_path(Path, TmpDest))
 | |
|     return true; // Current default value in vfs.yaml
 | |
|   Path = TmpDest;
 | |
| 
 | |
|   // Change path to all upper case and ask for its real path, if the latter
 | |
|   // exists and is equal to path, it's not case sensitive. Default to case
 | |
|   // sensitive in the absence of real_path, since this is the YAMLVFSWriter
 | |
|   // default.
 | |
|   UpperDest = Path.upper();
 | |
|   if (!sys::fs::real_path(UpperDest, RealDest) && Path.equals(RealDest))
 | |
|     return false;
 | |
|   return true;
 | |
| }
 | |
| 
 | |
| FileCollector::FileCollector(std::string Root, std::string OverlayRoot)
 | |
|     : Root(std::move(Root)), OverlayRoot(std::move(OverlayRoot)) {
 | |
| }
 | |
| 
 | |
| void FileCollector::PathCanonicalizer::updateWithRealPath(
 | |
|     SmallVectorImpl<char> &Path) {
 | |
|   StringRef SrcPath(Path.begin(), Path.size());
 | |
|   StringRef Filename = sys::path::filename(SrcPath);
 | |
|   StringRef Directory = sys::path::parent_path(SrcPath);
 | |
| 
 | |
|   // Use real_path to fix any symbolic link component present in the directory
 | |
|   // part of the path, caching the search because computing the real path is
 | |
|   // expensive.
 | |
|   SmallString<256> RealPath;
 | |
|   auto DirWithSymlink = CachedDirs.find(Directory);
 | |
|   if (DirWithSymlink == CachedDirs.end()) {
 | |
|     // FIXME: Should this be a call to FileSystem::getRealpath(), in some
 | |
|     // cases? What if there is nothing on disk?
 | |
|     if (sys::fs::real_path(Directory, RealPath))
 | |
|       return;
 | |
|     CachedDirs[Directory] = std::string(RealPath.str());
 | |
|   } else {
 | |
|     RealPath = DirWithSymlink->second;
 | |
|   }
 | |
| 
 | |
|   // Finish recreating the path by appending the original filename, since we
 | |
|   // don't need to resolve symlinks in the filename.
 | |
|   //
 | |
|   // FIXME: If we can cope with this, maybe we can cope without calling
 | |
|   // getRealPath() at all when there's no ".." component.
 | |
|   sys::path::append(RealPath, Filename);
 | |
| 
 | |
|   // Swap to create the output.
 | |
|   Path.swap(RealPath);
 | |
| }
 | |
| 
 | |
| /// Make Path absolute.
 | |
| static void makeAbsolute(SmallVectorImpl<char> &Path) {
 | |
|   // We need an absolute src path to append to the root.
 | |
|   sys::fs::make_absolute(Path);
 | |
| 
 | |
|   // Canonicalize src to a native path to avoid mixed separator styles.
 | |
|   sys::path::native(Path);
 | |
| 
 | |
|   // Remove redundant leading "./" pieces and consecutive separators.
 | |
|   Path.erase(Path.begin(), sys::path::remove_leading_dotslash(
 | |
|                                StringRef(Path.begin(), Path.size()))
 | |
|                                .begin());
 | |
| }
 | |
| 
 | |
| FileCollector::PathCanonicalizer::PathStorage
 | |
| FileCollector::PathCanonicalizer::canonicalize(StringRef SrcPath) {
 | |
|   PathStorage Paths;
 | |
|   Paths.VirtualPath = SrcPath;
 | |
|   makeAbsolute(Paths.VirtualPath);
 | |
| 
 | |
|   // If a ".." component is present after a symlink component, remove_dots may
 | |
|   // lead to the wrong real destination path. Let the source be canonicalized
 | |
|   // like that but make sure we always use the real path for the destination.
 | |
|   Paths.CopyFrom = Paths.VirtualPath;
 | |
|   updateWithRealPath(Paths.CopyFrom);
 | |
| 
 | |
|   // Canonicalize the virtual path by removing "..", "." components.
 | |
|   sys::path::remove_dots(Paths.VirtualPath, /*remove_dot_dot=*/true);
 | |
| 
 | |
|   return Paths;
 | |
| }
 | |
| 
 | |
| void FileCollector::addFileImpl(StringRef SrcPath) {
 | |
|   PathCanonicalizer::PathStorage Paths = Canonicalizer.canonicalize(SrcPath);
 | |
| 
 | |
|   SmallString<256> DstPath = StringRef(Root);
 | |
|   sys::path::append(DstPath, sys::path::relative_path(Paths.CopyFrom));
 | |
| 
 | |
|   // Always map a canonical src path to its real path into the YAML, by doing
 | |
|   // this we map different virtual src paths to the same entry in the VFS
 | |
|   // overlay, which is a way to emulate symlink inside the VFS; this is also
 | |
|   // needed for correctness, not doing that can lead to module redefinition
 | |
|   // errors.
 | |
|   addFileToMapping(Paths.VirtualPath, DstPath);
 | |
| }
 | |
| 
 | |
| llvm::vfs::directory_iterator
 | |
| FileCollector::addDirectoryImpl(const llvm::Twine &Dir,
 | |
|                                 IntrusiveRefCntPtr<vfs::FileSystem> FS,
 | |
|                                 std::error_code &EC) {
 | |
|   auto It = FS->dir_begin(Dir, EC);
 | |
|   if (EC)
 | |
|     return It;
 | |
|   addFile(Dir);
 | |
|   for (; !EC && It != llvm::vfs::directory_iterator(); It.increment(EC)) {
 | |
|     if (It->type() == sys::fs::file_type::regular_file ||
 | |
|         It->type() == sys::fs::file_type::directory_file ||
 | |
|         It->type() == sys::fs::file_type::symlink_file) {
 | |
|       addFile(It->path());
 | |
|     }
 | |
|   }
 | |
|   if (EC)
 | |
|     return It;
 | |
|   // Return a new iterator.
 | |
|   return FS->dir_begin(Dir, EC);
 | |
| }
 | |
| 
 | |
| /// Set the access and modification time for the given file from the given
 | |
| /// status object.
 | |
| static std::error_code
 | |
| copyAccessAndModificationTime(StringRef Filename,
 | |
|                               const sys::fs::file_status &Stat) {
 | |
|   int FD;
 | |
| 
 | |
|   if (auto EC =
 | |
|           sys::fs::openFileForWrite(Filename, FD, sys::fs::CD_OpenExisting))
 | |
|     return EC;
 | |
| 
 | |
|   if (auto EC = sys::fs::setLastAccessAndModificationTime(
 | |
|           FD, Stat.getLastAccessedTime(), Stat.getLastModificationTime()))
 | |
|     return EC;
 | |
| 
 | |
|   if (auto EC = sys::Process::SafelyCloseFileDescriptor(FD))
 | |
|     return EC;
 | |
| 
 | |
|   return {};
 | |
| }
 | |
| 
 | |
| std::error_code FileCollector::copyFiles(bool StopOnError) {
 | |
|   auto Err = sys::fs::create_directories(Root, /*IgnoreExisting=*/true);
 | |
|   if (Err) {
 | |
|     return Err;
 | |
|   }
 | |
| 
 | |
|   std::lock_guard<std::mutex> lock(Mutex);
 | |
| 
 | |
|   for (auto &entry : VFSWriter.getMappings()) {
 | |
|     // Get the status of the original file/directory.
 | |
|     sys::fs::file_status Stat;
 | |
|     if (std::error_code EC = sys::fs::status(entry.VPath, Stat)) {
 | |
|       if (StopOnError)
 | |
|         return EC;
 | |
|       continue;
 | |
|     }
 | |
| 
 | |
|     // Continue if the file doesn't exist.
 | |
|     if (Stat.type() == sys::fs::file_type::file_not_found)
 | |
|       continue;
 | |
| 
 | |
|     // Create directory tree.
 | |
|     if (std::error_code EC =
 | |
|             sys::fs::create_directories(sys::path::parent_path(entry.RPath),
 | |
|                                         /*IgnoreExisting=*/true)) {
 | |
|       if (StopOnError)
 | |
|         return EC;
 | |
|     }
 | |
| 
 | |
|     if (Stat.type() == sys::fs::file_type::directory_file) {
 | |
|       // Construct a directory when it's just a directory entry.
 | |
|       if (std::error_code EC =
 | |
|               sys::fs::create_directories(entry.RPath,
 | |
|                                           /*IgnoreExisting=*/true)) {
 | |
|         if (StopOnError)
 | |
|           return EC;
 | |
|       }
 | |
|       continue;
 | |
|     }
 | |
| 
 | |
|     // Copy file over.
 | |
|     if (std::error_code EC = sys::fs::copy_file(entry.VPath, entry.RPath)) {
 | |
|       if (StopOnError)
 | |
|         return EC;
 | |
|     }
 | |
| 
 | |
|     // Copy over permissions.
 | |
|     if (auto perms = sys::fs::getPermissions(entry.VPath)) {
 | |
|       if (std::error_code EC = sys::fs::setPermissions(entry.RPath, *perms)) {
 | |
|         if (StopOnError)
 | |
|           return EC;
 | |
|       }
 | |
|     }
 | |
| 
 | |
|     // Copy over modification time.
 | |
|     copyAccessAndModificationTime(entry.RPath, Stat);
 | |
|   }
 | |
|   return {};
 | |
| }
 | |
| 
 | |
| std::error_code FileCollector::writeMapping(StringRef MappingFile) {
 | |
|   std::lock_guard<std::mutex> lock(Mutex);
 | |
| 
 | |
|   VFSWriter.setOverlayDir(OverlayRoot);
 | |
|   VFSWriter.setCaseSensitivity(isCaseSensitivePath(OverlayRoot));
 | |
|   VFSWriter.setUseExternalNames(false);
 | |
| 
 | |
|   std::error_code EC;
 | |
|   raw_fd_ostream os(MappingFile, EC, sys::fs::OF_TextWithCRLF);
 | |
|   if (EC)
 | |
|     return EC;
 | |
| 
 | |
|   VFSWriter.write(os);
 | |
| 
 | |
|   return {};
 | |
| }
 | |
| 
 | |
| namespace llvm {
 | |
| 
 | |
| class FileCollectorFileSystem : public vfs::FileSystem {
 | |
| public:
 | |
|   explicit FileCollectorFileSystem(IntrusiveRefCntPtr<vfs::FileSystem> FS,
 | |
|                                    std::shared_ptr<FileCollector> Collector)
 | |
|       : FS(std::move(FS)), Collector(std::move(Collector)) {}
 | |
| 
 | |
|   llvm::ErrorOr<llvm::vfs::Status> status(const Twine &Path) override {
 | |
|     auto Result = FS->status(Path);
 | |
|     if (Result && Result->exists())
 | |
|       Collector->addFile(Path);
 | |
|     return Result;
 | |
|   }
 | |
| 
 | |
|   llvm::ErrorOr<std::unique_ptr<llvm::vfs::File>>
 | |
|   openFileForRead(const Twine &Path) override {
 | |
|     auto Result = FS->openFileForRead(Path);
 | |
|     if (Result && *Result)
 | |
|       Collector->addFile(Path);
 | |
|     return Result;
 | |
|   }
 | |
| 
 | |
|   llvm::vfs::directory_iterator dir_begin(const llvm::Twine &Dir,
 | |
|                                           std::error_code &EC) override {
 | |
|     return Collector->addDirectoryImpl(Dir, FS, EC);
 | |
|   }
 | |
| 
 | |
|   std::error_code getRealPath(const Twine &Path,
 | |
|                               SmallVectorImpl<char> &Output) const override {
 | |
|     auto EC = FS->getRealPath(Path, Output);
 | |
|     if (!EC) {
 | |
|       Collector->addFile(Path);
 | |
|       if (Output.size() > 0)
 | |
|         Collector->addFile(Output);
 | |
|     }
 | |
|     return EC;
 | |
|   }
 | |
| 
 | |
|   std::error_code isLocal(const Twine &Path, bool &Result) override {
 | |
|     return FS->isLocal(Path, Result);
 | |
|   }
 | |
| 
 | |
|   llvm::ErrorOr<std::string> getCurrentWorkingDirectory() const override {
 | |
|     return FS->getCurrentWorkingDirectory();
 | |
|   }
 | |
| 
 | |
|   std::error_code setCurrentWorkingDirectory(const llvm::Twine &Path) override {
 | |
|     return FS->setCurrentWorkingDirectory(Path);
 | |
|   }
 | |
| 
 | |
| private:
 | |
|   IntrusiveRefCntPtr<vfs::FileSystem> FS;
 | |
|   std::shared_ptr<FileCollector> Collector;
 | |
| };
 | |
| 
 | |
| } // namespace llvm
 | |
| 
 | |
| IntrusiveRefCntPtr<vfs::FileSystem>
 | |
| FileCollector::createCollectorVFS(IntrusiveRefCntPtr<vfs::FileSystem> BaseFS,
 | |
|                                   std::shared_ptr<FileCollector> Collector) {
 | |
|   return new FileCollectorFileSystem(std::move(BaseFS), std::move(Collector));
 | |
| }
 |