123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317 |
- //===-- FileCollector.cpp ---------------------------------------*- C++ -*-===//
- //
- // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
- // See https://llvm.org/LICENSE.txt for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- //
- //===----------------------------------------------------------------------===//
- #include "llvm/Support/FileCollector.h"
- #include "llvm/ADT/SmallString.h"
- #include "llvm/ADT/Twine.h"
- #include "llvm/Support/FileSystem.h"
- #include "llvm/Support/Path.h"
- #include "llvm/Support/Process.h"
- using namespace llvm;
- FileCollectorBase::FileCollectorBase() = default;
- FileCollectorBase::~FileCollectorBase() = default;
- void FileCollectorBase::addFile(const Twine &File) {
- std::lock_guard<std::mutex> lock(Mutex);
- std::string FileStr = File.str();
- if (markAsSeen(FileStr))
- addFileImpl(FileStr);
- }
- void FileCollectorBase::addDirectory(const Twine &Dir) {
- assert(sys::fs::is_directory(Dir));
- std::error_code EC;
- addDirectoryImpl(Dir, vfs::getRealFileSystem(), EC);
- }
- static bool isCaseSensitivePath(StringRef Path) {
- SmallString<256> TmpDest = Path, UpperDest, RealDest;
- // Remove component traversals, links, etc.
- if (sys::fs::real_path(Path, TmpDest))
- return true; // Current default value in vfs.yaml
- Path = TmpDest;
- // Change path to all upper case and ask for its real path, if the latter
- // exists and is equal to path, it's not case sensitive. Default to case
- // sensitive in the absence of real_path, since this is the YAMLVFSWriter
- // default.
- UpperDest = Path.upper();
- if (!sys::fs::real_path(UpperDest, RealDest) && Path.equals(RealDest))
- return false;
- return true;
- }
- FileCollector::FileCollector(std::string Root, std::string OverlayRoot)
- : Root(Root), OverlayRoot(OverlayRoot) {
- assert(sys::path::is_absolute(Root) && "Root not absolute");
- assert(sys::path::is_absolute(OverlayRoot) && "OverlayRoot not absolute");
- }
- void FileCollector::PathCanonicalizer::updateWithRealPath(
- SmallVectorImpl<char> &Path) {
- StringRef SrcPath(Path.begin(), Path.size());
- StringRef Filename = sys::path::filename(SrcPath);
- StringRef Directory = sys::path::parent_path(SrcPath);
- // Use real_path to fix any symbolic link component present in the directory
- // part of the path, caching the search because computing the real path is
- // expensive.
- SmallString<256> RealPath;
- auto DirWithSymlink = CachedDirs.find(Directory);
- if (DirWithSymlink == CachedDirs.end()) {
- // FIXME: Should this be a call to FileSystem::getRealpath(), in some
- // cases? What if there is nothing on disk?
- if (sys::fs::real_path(Directory, RealPath))
- return;
- CachedDirs[Directory] = std::string(RealPath.str());
- } else {
- RealPath = DirWithSymlink->second;
- }
- // Finish recreating the path by appending the original filename, since we
- // don't need to resolve symlinks in the filename.
- //
- // FIXME: If we can cope with this, maybe we can cope without calling
- // getRealPath() at all when there's no ".." component.
- sys::path::append(RealPath, Filename);
- // Swap to create the output.
- Path.swap(RealPath);
- }
- /// Make Path absolute.
- static void makeAbsolute(SmallVectorImpl<char> &Path) {
- // We need an absolute src path to append to the root.
- sys::fs::make_absolute(Path);
- // Canonicalize src to a native path to avoid mixed separator styles.
- sys::path::native(Path);
- // Remove redundant leading "./" pieces and consecutive separators.
- Path.erase(Path.begin(), sys::path::remove_leading_dotslash(
- StringRef(Path.begin(), Path.size()))
- .begin());
- }
- FileCollector::PathCanonicalizer::PathStorage
- FileCollector::PathCanonicalizer::canonicalize(StringRef SrcPath) {
- PathStorage Paths;
- Paths.VirtualPath = SrcPath;
- makeAbsolute(Paths.VirtualPath);
- // If a ".." component is present after a symlink component, remove_dots may
- // lead to the wrong real destination path. Let the source be canonicalized
- // like that but make sure we always use the real path for the destination.
- Paths.CopyFrom = Paths.VirtualPath;
- updateWithRealPath(Paths.CopyFrom);
- // Canonicalize the virtual path by removing "..", "." components.
- sys::path::remove_dots(Paths.VirtualPath, /*remove_dot_dot=*/true);
- return Paths;
- }
- void FileCollector::addFileImpl(StringRef SrcPath) {
- PathCanonicalizer::PathStorage Paths = Canonicalizer.canonicalize(SrcPath);
- SmallString<256> DstPath = StringRef(Root);
- sys::path::append(DstPath, sys::path::relative_path(Paths.CopyFrom));
- // Always map a canonical src path to its real path into the YAML, by doing
- // this we map different virtual src paths to the same entry in the VFS
- // overlay, which is a way to emulate symlink inside the VFS; this is also
- // needed for correctness, not doing that can lead to module redefinition
- // errors.
- addFileToMapping(Paths.VirtualPath, DstPath);
- }
- llvm::vfs::directory_iterator
- FileCollector::addDirectoryImpl(const llvm::Twine &Dir,
- IntrusiveRefCntPtr<vfs::FileSystem> FS,
- std::error_code &EC) {
- auto It = FS->dir_begin(Dir, EC);
- if (EC)
- return It;
- addFile(Dir);
- for (; !EC && It != llvm::vfs::directory_iterator(); It.increment(EC)) {
- if (It->type() == sys::fs::file_type::regular_file ||
- It->type() == sys::fs::file_type::directory_file ||
- It->type() == sys::fs::file_type::symlink_file) {
- addFile(It->path());
- }
- }
- if (EC)
- return It;
- // Return a new iterator.
- return FS->dir_begin(Dir, EC);
- }
- /// Set the access and modification time for the given file from the given
- /// status object.
- static std::error_code
- copyAccessAndModificationTime(StringRef Filename,
- const sys::fs::file_status &Stat) {
- int FD;
- if (auto EC =
- sys::fs::openFileForWrite(Filename, FD, sys::fs::CD_OpenExisting))
- return EC;
- if (auto EC = sys::fs::setLastAccessAndModificationTime(
- FD, Stat.getLastAccessedTime(), Stat.getLastModificationTime()))
- return EC;
- if (auto EC = sys::Process::SafelyCloseFileDescriptor(FD))
- return EC;
- return {};
- }
- std::error_code FileCollector::copyFiles(bool StopOnError) {
- auto Err = sys::fs::create_directories(Root, /*IgnoreExisting=*/true);
- if (Err) {
- return Err;
- }
- std::lock_guard<std::mutex> lock(Mutex);
- for (auto &entry : VFSWriter.getMappings()) {
- // Get the status of the original file/directory.
- sys::fs::file_status Stat;
- if (std::error_code EC = sys::fs::status(entry.VPath, Stat)) {
- if (StopOnError)
- return EC;
- continue;
- }
- // Continue if the file doesn't exist.
- if (Stat.type() == sys::fs::file_type::file_not_found)
- continue;
- // Create directory tree.
- if (std::error_code EC =
- sys::fs::create_directories(sys::path::parent_path(entry.RPath),
- /*IgnoreExisting=*/true)) {
- if (StopOnError)
- return EC;
- }
- if (Stat.type() == sys::fs::file_type::directory_file) {
- // Construct a directory when it's just a directory entry.
- if (std::error_code EC =
- sys::fs::create_directories(entry.RPath,
- /*IgnoreExisting=*/true)) {
- if (StopOnError)
- return EC;
- }
- continue;
- }
- // Copy file over.
- if (std::error_code EC = sys::fs::copy_file(entry.VPath, entry.RPath)) {
- if (StopOnError)
- return EC;
- }
- // Copy over permissions.
- if (auto perms = sys::fs::getPermissions(entry.VPath)) {
- if (std::error_code EC = sys::fs::setPermissions(entry.RPath, *perms)) {
- if (StopOnError)
- return EC;
- }
- }
- // Copy over modification time.
- copyAccessAndModificationTime(entry.RPath, Stat);
- }
- return {};
- }
- std::error_code FileCollector::writeMapping(StringRef MappingFile) {
- std::lock_guard<std::mutex> lock(Mutex);
- VFSWriter.setOverlayDir(OverlayRoot);
- VFSWriter.setCaseSensitivity(isCaseSensitivePath(OverlayRoot));
- VFSWriter.setUseExternalNames(false);
- std::error_code EC;
- raw_fd_ostream os(MappingFile, EC, sys::fs::OF_TextWithCRLF);
- if (EC)
- return EC;
- VFSWriter.write(os);
- return {};
- }
- namespace llvm {
- class FileCollectorFileSystem : public vfs::FileSystem {
- public:
- explicit FileCollectorFileSystem(IntrusiveRefCntPtr<vfs::FileSystem> FS,
- std::shared_ptr<FileCollector> Collector)
- : FS(std::move(FS)), Collector(std::move(Collector)) {}
- llvm::ErrorOr<llvm::vfs::Status> status(const Twine &Path) override {
- auto Result = FS->status(Path);
- if (Result && Result->exists())
- Collector->addFile(Path);
- return Result;
- }
- llvm::ErrorOr<std::unique_ptr<llvm::vfs::File>>
- openFileForRead(const Twine &Path) override {
- auto Result = FS->openFileForRead(Path);
- if (Result && *Result)
- Collector->addFile(Path);
- return Result;
- }
- llvm::vfs::directory_iterator dir_begin(const llvm::Twine &Dir,
- std::error_code &EC) override {
- return Collector->addDirectoryImpl(Dir, FS, EC);
- }
- std::error_code getRealPath(const Twine &Path,
- SmallVectorImpl<char> &Output) const override {
- auto EC = FS->getRealPath(Path, Output);
- if (!EC) {
- Collector->addFile(Path);
- if (Output.size() > 0)
- Collector->addFile(Output);
- }
- return EC;
- }
- std::error_code isLocal(const Twine &Path, bool &Result) override {
- return FS->isLocal(Path, Result);
- }
- llvm::ErrorOr<std::string> getCurrentWorkingDirectory() const override {
- return FS->getCurrentWorkingDirectory();
- }
- std::error_code setCurrentWorkingDirectory(const llvm::Twine &Path) override {
- return FS->setCurrentWorkingDirectory(Path);
- }
- private:
- IntrusiveRefCntPtr<vfs::FileSystem> FS;
- std::shared_ptr<FileCollector> Collector;
- };
- } // namespace llvm
- IntrusiveRefCntPtr<vfs::FileSystem>
- FileCollector::createCollectorVFS(IntrusiveRefCntPtr<vfs::FileSystem> BaseFS,
- std::shared_ptr<FileCollector> Collector) {
- return new FileCollectorFileSystem(std::move(BaseFS), std::move(Collector));
- }
|