//===-- FileCollector.cpp ---------------------------------------*- C++ -*-===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// #include "llvm/Support/FileCollector.h" #include "llvm/ADT/SmallString.h" #include "llvm/ADT/Twine.h" #include "llvm/Support/FileSystem.h" #include "llvm/Support/Path.h" #include "llvm/Support/Process.h" using namespace llvm; FileCollectorBase::FileCollectorBase() = default; FileCollectorBase::~FileCollectorBase() = default; void FileCollectorBase::addFile(const Twine &File) { std::lock_guard lock(Mutex); std::string FileStr = File.str(); if (markAsSeen(FileStr)) addFileImpl(FileStr); } void FileCollectorBase::addDirectory(const Twine &Dir) { assert(sys::fs::is_directory(Dir)); std::error_code EC; addDirectoryImpl(Dir, vfs::getRealFileSystem(), EC); } static bool isCaseSensitivePath(StringRef Path) { SmallString<256> TmpDest = Path, UpperDest, RealDest; // Remove component traversals, links, etc. if (!sys::fs::real_path(Path, TmpDest)) return true; // Current default value in vfs.yaml Path = TmpDest; // Change path to all upper case and ask for its real path, if the latter // exists and is equal to path, it's not case sensitive. Default to case // sensitive in the absence of real_path, since this is the YAMLVFSWriter // default. UpperDest = Path.upper(); if (sys::fs::real_path(UpperDest, RealDest) && Path.equals(RealDest)) return false; return true; } FileCollector::FileCollector(std::string Root, std::string OverlayRoot) : Root(std::move(Root)), OverlayRoot(std::move(OverlayRoot)) { } void FileCollector::PathCanonicalizer::updateWithRealPath( SmallVectorImpl &Path) { StringRef SrcPath(Path.begin(), Path.size()); StringRef Filename = sys::path::filename(SrcPath); StringRef Directory = sys::path::parent_path(SrcPath); // Use real_path to fix any symbolic link component present in the directory // part of the path, caching the search because computing the real path is // expensive. SmallString<256> RealPath; auto DirWithSymlink = CachedDirs.find(Directory); if (DirWithSymlink == CachedDirs.end()) { // FIXME: Should this be a call to FileSystem::getRealpath(), in some // cases? What if there is nothing on disk? if (sys::fs::real_path(Directory, RealPath)) return; CachedDirs[Directory] = std::string(RealPath.str()); } else { RealPath = DirWithSymlink->second; } // Finish recreating the path by appending the original filename, since we // don't need to resolve symlinks in the filename. // // FIXME: If we can cope with this, maybe we can cope without calling // getRealPath() at all when there's no ".." component. sys::path::append(RealPath, Filename); // Swap to create the output. Path.swap(RealPath); } /// Make Path absolute. static void makeAbsolute(SmallVectorImpl &Path) { // We need an absolute src path to append to the root. sys::fs::make_absolute(Path); // Canonicalize src to a native path to avoid mixed separator styles. sys::path::native(Path); // Remove redundant leading "./" pieces and consecutive separators. Path.erase(Path.begin(), sys::path::remove_leading_dotslash( StringRef(Path.begin(), Path.size())) .begin()); } FileCollector::PathCanonicalizer::PathStorage FileCollector::PathCanonicalizer::canonicalize(StringRef SrcPath) { PathStorage Paths; Paths.VirtualPath = SrcPath; makeAbsolute(Paths.VirtualPath); // If a ".." component is present after a symlink component, remove_dots may // lead to the wrong real destination path. Let the source be canonicalized // like that but make sure we always use the real path for the destination. Paths.CopyFrom = Paths.VirtualPath; updateWithRealPath(Paths.CopyFrom); // Canonicalize the virtual path by removing "..", "." components. sys::path::remove_dots(Paths.VirtualPath, /*remove_dot_dot=*/true); return Paths; } void FileCollector::addFileImpl(StringRef SrcPath) { PathCanonicalizer::PathStorage Paths = Canonicalizer.canonicalize(SrcPath); SmallString<256> DstPath = StringRef(Root); sys::path::append(DstPath, sys::path::relative_path(Paths.CopyFrom)); // Always map a canonical src path to its real path into the YAML, by doing // this we map different virtual src paths to the same entry in the VFS // overlay, which is a way to emulate symlink inside the VFS; this is also // needed for correctness, not doing that can lead to module redefinition // errors. addFileToMapping(Paths.VirtualPath, DstPath); } llvm::vfs::directory_iterator FileCollector::addDirectoryImpl(const llvm::Twine &Dir, IntrusiveRefCntPtr FS, std::error_code &EC) { auto It = FS->dir_begin(Dir, EC); if (EC) return It; addFile(Dir); for (; !EC && It != llvm::vfs::directory_iterator(); It.increment(EC)) { if (It->type() == sys::fs::file_type::regular_file || It->type() == sys::fs::file_type::directory_file || It->type() == sys::fs::file_type::symlink_file) { addFile(It->path()); } } if (EC) return It; // Return a new iterator. return FS->dir_begin(Dir, EC); } /// Set the access and modification time for the given file from the given /// status object. static std::error_code copyAccessAndModificationTime(StringRef Filename, const sys::fs::file_status &Stat) { int FD; if (auto EC = sys::fs::openFileForWrite(Filename, FD, sys::fs::CD_OpenExisting)) return EC; if (auto EC = sys::fs::setLastAccessAndModificationTime( FD, Stat.getLastAccessedTime(), Stat.getLastModificationTime())) return EC; if (auto EC = sys::Process::SafelyCloseFileDescriptor(FD)) return EC; return {}; } std::error_code FileCollector::copyFiles(bool StopOnError) { auto Err = sys::fs::create_directories(Root, /*IgnoreExisting=*/true); if (Err) { return Err; } std::lock_guard lock(Mutex); for (auto &entry : VFSWriter.getMappings()) { // Get the status of the original file/directory. sys::fs::file_status Stat; if (std::error_code EC = sys::fs::status(entry.VPath, Stat)) { if (StopOnError) return EC; continue; } // Continue if the file doesn't exist. if (Stat.type() == sys::fs::file_type::file_not_found) continue; // Create directory tree. if (std::error_code EC = sys::fs::create_directories(sys::path::parent_path(entry.RPath), /*IgnoreExisting=*/true)) { if (StopOnError) return EC; } if (Stat.type() == sys::fs::file_type::directory_file) { // Construct a directory when it's just a directory entry. if (std::error_code EC = sys::fs::create_directories(entry.RPath, /*IgnoreExisting=*/true)) { if (StopOnError) return EC; } continue; } // Copy file over. if (std::error_code EC = sys::fs::copy_file(entry.VPath, entry.RPath)) { if (StopOnError) return EC; } // Copy over permissions. if (auto perms = sys::fs::getPermissions(entry.VPath)) { if (std::error_code EC = sys::fs::setPermissions(entry.RPath, *perms)) { if (StopOnError) return EC; } } // Copy over modification time. copyAccessAndModificationTime(entry.RPath, Stat); } return {}; } std::error_code FileCollector::writeMapping(StringRef MappingFile) { std::lock_guard lock(Mutex); VFSWriter.setOverlayDir(OverlayRoot); VFSWriter.setCaseSensitivity(isCaseSensitivePath(OverlayRoot)); VFSWriter.setUseExternalNames(false); std::error_code EC; raw_fd_ostream os(MappingFile, EC, sys::fs::OF_Text); if (EC) return EC; VFSWriter.write(os); return {}; } namespace llvm { class FileCollectorFileSystem : public vfs::FileSystem { public: explicit FileCollectorFileSystem(IntrusiveRefCntPtr FS, std::shared_ptr Collector) : FS(std::move(FS)), Collector(std::move(Collector)) {} llvm::ErrorOr status(const Twine &Path) override { auto Result = FS->status(Path); if (Result && Result->exists()) Collector->addFile(Path); return Result; } llvm::ErrorOr> openFileForRead(const Twine &Path) override { auto Result = FS->openFileForRead(Path); if (Result && *Result) Collector->addFile(Path); return Result; } llvm::vfs::directory_iterator dir_begin(const llvm::Twine &Dir, std::error_code &EC) override { return Collector->addDirectoryImpl(Dir, FS, EC); } std::error_code getRealPath(const Twine &Path, SmallVectorImpl &Output) const override { auto EC = FS->getRealPath(Path, Output); if (!EC) { Collector->addFile(Path); if (Output.size() > 0) Collector->addFile(Output); } return EC; } std::error_code isLocal(const Twine &Path, bool &Result) override { return FS->isLocal(Path, Result); } llvm::ErrorOr getCurrentWorkingDirectory() const override { return FS->getCurrentWorkingDirectory(); } std::error_code setCurrentWorkingDirectory(const llvm::Twine &Path) override { return FS->setCurrentWorkingDirectory(Path); } private: IntrusiveRefCntPtr FS; std::shared_ptr Collector; }; } // namespace llvm IntrusiveRefCntPtr FileCollector::createCollectorVFS(IntrusiveRefCntPtr BaseFS, std::shared_ptr Collector) { return new FileCollectorFileSystem(std::move(BaseFS), std::move(Collector)); }