From a16fe65b724538eb346322ec7aa88ac029881907 Mon Sep 17 00:00:00 2001 From: Rui Ueyama Date: Wed, 1 Nov 2017 21:38:14 +0000 Subject: [PATCH] Rewrite FileOutputBuffer as two separate classes. This patch is to rewrite FileOutputBuffer as two separate classes; one for file-backed output buffer and the other for memory-backed output buffer. I think the new code is easier to follow because two different implementations are now actually separated as different classes. Unlike the previous implementation, the class that does not replace the final output file using rename(2) does not create a temporary file at all. Instead, it allocates memory using mmap(2) and use it. I think this is an improvement because it is now guaranteed that the temporary memory region doesn't trigger any I/O and there's now zero chance to leave a temporary file behind. Also, it shouldn't impose new restrictions because were using mmap IO too. Differential Revision: https://reviews.llvm.org/D39449 llvm-svn: 317127 --- llvm/include/llvm/Support/FileOutputBuffer.h | 34 +--- llvm/lib/Support/FileOutputBuffer.cpp | 204 +++++++++++-------- 2 files changed, 130 insertions(+), 108 deletions(-) diff --git a/llvm/include/llvm/Support/FileOutputBuffer.h b/llvm/include/llvm/Support/FileOutputBuffer.h index 2c054c75374b..8db64098c368 100644 --- a/llvm/include/llvm/Support/FileOutputBuffer.h +++ b/llvm/include/llvm/Support/FileOutputBuffer.h @@ -30,7 +30,6 @@ namespace llvm { /// not committed, the file will be deleted in the FileOutputBuffer destructor. class FileOutputBuffer { public: - enum { F_executable = 1 /// set the 'x' bit on the resulting file }; @@ -42,48 +41,33 @@ public: create(StringRef FilePath, size_t Size, unsigned Flags = 0); /// Returns a pointer to the start of the buffer. - uint8_t *getBufferStart() { - return (uint8_t*)Region->data(); - } + virtual uint8_t *getBufferStart() const = 0; /// Returns a pointer to the end of the buffer. - uint8_t *getBufferEnd() { - return (uint8_t*)Region->data() + Region->size(); - } + virtual uint8_t *getBufferEnd() const = 0; /// Returns size of the buffer. - size_t getBufferSize() const { - return Region->size(); - } + virtual size_t getBufferSize() const = 0; /// Returns path where file will show up if buffer is committed. - StringRef getPath() const { - return FinalPath; - } + StringRef getPath() const { return FinalPath; } /// Flushes the content of the buffer to its file and deallocates the /// buffer. If commit() is not called before this object's destructor /// is called, the file is deleted in the destructor. The optional parameter /// is used if it turns out you want the file size to be smaller than /// initially requested. - std::error_code commit(); + virtual std::error_code commit() = 0; /// If this object was previously committed, the destructor just deletes /// this object. If this object was not committed, the destructor /// deallocates the buffer and the target file is never written. - ~FileOutputBuffer(); + virtual ~FileOutputBuffer() {} -private: - FileOutputBuffer(const FileOutputBuffer &) = delete; - FileOutputBuffer &operator=(const FileOutputBuffer &) = delete; +protected: + FileOutputBuffer(StringRef Path) : FinalPath(Path) {} - FileOutputBuffer(std::unique_ptr R, - StringRef Path, StringRef TempPath, bool IsRegular); - - std::unique_ptr Region; - SmallString<128> FinalPath; - SmallString<128> TempPath; - bool IsRegular; + std::string FinalPath; }; } // end namespace llvm diff --git a/llvm/lib/Support/FileOutputBuffer.cpp b/llvm/lib/Support/FileOutputBuffer.cpp index d9c9f8234e26..1e20b01fc4aa 100644 --- a/llvm/lib/Support/FileOutputBuffer.cpp +++ b/llvm/lib/Support/FileOutputBuffer.cpp @@ -15,6 +15,7 @@ #include "llvm/ADT/STLExtras.h" #include "llvm/ADT/SmallString.h" #include "llvm/Support/Errc.h" +#include "llvm/Support/Memory.h" #include "llvm/Support/Path.h" #include "llvm/Support/Signals.h" #include @@ -25,110 +26,147 @@ #include #endif -using llvm::sys::fs::mapped_file_region; +using namespace llvm; +using namespace llvm::sys; -namespace llvm { -FileOutputBuffer::FileOutputBuffer(std::unique_ptr R, - StringRef Path, StringRef TmpPath, - bool IsRegular) - : Region(std::move(R)), FinalPath(Path), TempPath(TmpPath), - IsRegular(IsRegular) {} +// A FileOutputBuffer which creates a temporary file in the same directory +// as the final output file. The final output file is atomically replaced +// with the temporary file on commit(). +class OnDiskBuffer : public FileOutputBuffer { +public: + OnDiskBuffer(StringRef Path, StringRef TempPath, + std::unique_ptr Buf) + : FileOutputBuffer(Path), Buffer(std::move(Buf)), TempPath(TempPath) {} -FileOutputBuffer::~FileOutputBuffer() { - // Close the mapping before deleting the temp file, so that the removal - // succeeds. - Region.reset(); - sys::fs::remove(Twine(TempPath)); -} + static ErrorOr> + create(StringRef Path, size_t Size, unsigned Mode); -ErrorOr> -FileOutputBuffer::create(StringRef FilePath, size_t Size, unsigned Flags) { - // Check file is not a regular file, in which case we cannot remove it. - sys::fs::file_status Stat; - std::error_code EC = sys::fs::status(FilePath, Stat); - bool IsRegular = true; - switch (Stat.type()) { - case sys::fs::file_type::file_not_found: - // If file does not exist, we'll create one. - break; - case sys::fs::file_type::regular_file: { - // If file is not currently writable, error out. - // FIXME: There is no sys::fs:: api for checking this. - // FIXME: In posix, you use the access() call to check this. - } - break; - case sys::fs::file_type::directory_file: - return errc::is_a_directory; - default: - if (EC) - return EC; - IsRegular = false; + uint8_t *getBufferStart() const override { return (uint8_t *)Buffer->data(); } + + uint8_t *getBufferEnd() const override { + return (uint8_t *)Buffer->data() + Buffer->size(); } - SmallString<128> TempFilePath; + size_t getBufferSize() const override { return Buffer->size(); } + + std::error_code commit() override { + // Unmap buffer, letting OS flush dirty pages to file on disk. + Buffer.reset(); + + // Atomically replace the existing file with the new one. + auto EC = fs::rename(TempPath, FinalPath); + sys::DontRemoveFileOnSignal(TempPath); + return EC; + } + + ~OnDiskBuffer() override { + // Close the mapping before deleting the temp file, so that the removal + // succeeds. + Buffer.reset(); + fs::remove(TempPath); + } + +private: + std::unique_ptr Buffer; + std::string TempPath; +}; + +// A FileOutputBuffer which keeps data in memory and writes to the final +// output file on commit(). This is used only when we cannot use OnDiskBuffer. +class InMemoryBuffer : public FileOutputBuffer { +public: + InMemoryBuffer(StringRef Path, MemoryBlock Buf, unsigned Mode) + : FileOutputBuffer(Path), Buffer(Buf), Mode(Mode) {} + + static ErrorOr> + create(StringRef Path, size_t Size, unsigned Mode) { + std::error_code EC; + MemoryBlock MB = Memory::allocateMappedMemory( + Size, nullptr, sys::Memory::MF_READ | sys::Memory::MF_WRITE, EC); + if (EC) + return EC; + return llvm::make_unique(Path, MB, Mode); + } + + uint8_t *getBufferStart() const override { return (uint8_t *)Buffer.base(); } + + uint8_t *getBufferEnd() const override { + return (uint8_t *)Buffer.base() + Buffer.size(); + } + + size_t getBufferSize() const override { return Buffer.size(); } + + std::error_code commit() override { + int FD; + std::error_code EC; + if (auto EC = openFileForWrite(FinalPath, FD, fs::F_None, Mode)) + return EC; + raw_fd_ostream OS(FD, /*shouldClose=*/true, /*unbuffered=*/true); + OS << StringRef((const char *)Buffer.base(), Buffer.size()); + return std::error_code(); + } + +private: + OwningMemoryBlock Buffer; + unsigned Mode; +}; + +ErrorOr> +OnDiskBuffer::create(StringRef Path, size_t Size, unsigned Mode) { + // Create new file in same directory but with random name. + SmallString<128> TempPath; int FD; - if (IsRegular) { - unsigned Mode = sys::fs::all_read | sys::fs::all_write; - // If requested, make the output file executable. - if (Flags & F_executable) - Mode |= sys::fs::all_exe; - // Create new file in same directory but with random name. - EC = sys::fs::createUniqueFile(Twine(FilePath) + ".tmp%%%%%%%", FD, - TempFilePath, Mode); - } else { - // Create a temporary file. Since this is a special file, we will not move - // it and the new file can be in another filesystem. This avoids trying to - // create a temporary file in /dev when outputting to /dev/null for example. - EC = sys::fs::createTemporaryFile(sys::path::filename(FilePath), "", FD, - TempFilePath); - } - - if (EC) + if (auto EC = fs::createUniqueFile(Path + ".tmp%%%%%%%", FD, TempPath, Mode)) return EC; - sys::RemoveFileOnSignal(TempFilePath); + sys::RemoveFileOnSignal(TempPath); #ifndef LLVM_ON_WIN32 // On Windows, CreateFileMapping (the mmap function on Windows) // automatically extends the underlying file. We don't need to // extend the file beforehand. _chsize (ftruncate on Windows) is // pretty slow just like it writes specified amount of bytes, - // so we should avoid calling that. - EC = sys::fs::resize_file(FD, Size); - if (EC) + // so we should avoid calling that function. + if (auto EC = fs::resize_file(FD, Size)) return EC; #endif - auto MappedFile = llvm::make_unique( - FD, mapped_file_region::readwrite, Size, 0, EC); - int Ret = close(FD); + // Mmap it. + std::error_code EC; + auto MappedFile = llvm::make_unique( + FD, fs::mapped_file_region::readwrite, Size, 0, EC); + close(FD); if (EC) return EC; - if (Ret) - return std::error_code(errno, std::generic_category()); - - std::unique_ptr Buf(new FileOutputBuffer( - std::move(MappedFile), FilePath, TempFilePath, IsRegular)); - return std::move(Buf); + return llvm::make_unique(Path, TempPath, std::move(MappedFile)); } -std::error_code FileOutputBuffer::commit() { - // Unmap buffer, letting OS flush dirty pages to file on disk. - Region.reset(); +// Create an instance of FileOutputBuffer. +ErrorOr> +FileOutputBuffer::create(StringRef Path, size_t Size, unsigned Flags) { + unsigned Mode = fs::all_read | fs::all_write; + if (Flags & F_executable) + Mode |= fs::all_exe; - std::error_code EC; - if (IsRegular) { - // Atomically replace the existing file with the new one. - EC = sys::fs::rename(Twine(TempPath), Twine(FinalPath)); - sys::DontRemoveFileOnSignal(TempPath); - } else { - EC = sys::fs::copy_file(TempPath, FinalPath); - std::error_code RMEC = sys::fs::remove(TempPath); - sys::DontRemoveFileOnSignal(TempPath); - if (RMEC) - return RMEC; + fs::file_status Stat; + fs::status(Path, Stat); + + // Usually, we want to create OnDiskBuffer to create a temporary file in + // the same directory as the destination file and atomically replaces it + // by rename(2). + // + // However, if the destination file is a special file, we don't want to + // use rename (e.g. we don't want to replace /dev/null with a regular + // file.) If that's the case, we create an in-memory buffer, open the + // destination file and write to it on commit(). + switch (Stat.type()) { + case fs::file_type::directory_file: + return errc::is_a_directory; + case fs::file_type::regular_file: + case fs::file_type::file_not_found: + case fs::file_type::status_error: + return OnDiskBuffer::create(Path, Size, Mode); + default: + return InMemoryBuffer::create(Path, Size, Mode); } - - return EC; } -} // namespace