2012-08-01 10:29:50 +08:00
|
|
|
//===- FileOutputBuffer.cpp - File Output Buffer ----------------*- C++ -*-===//
|
|
|
|
//
|
2019-01-19 16:50:56 +08:00
|
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
2012-08-01 10:29:50 +08:00
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
//
|
|
|
|
// Utility for creating an in-memory buffer that will be written to a file.
|
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
2015-01-14 19:23:27 +08:00
|
|
|
#include "llvm/Support/FileOutputBuffer.h"
|
2015-03-24 02:07:13 +08:00
|
|
|
#include "llvm/ADT/STLExtras.h"
|
|
|
|
#include "llvm/Support/Errc.h"
|
2020-05-28 21:37:17 +08:00
|
|
|
#include "llvm/Support/FileSystem.h"
|
2017-11-02 05:38:14 +08:00
|
|
|
#include "llvm/Support/Memory.h"
|
2017-01-10 05:52:35 +08:00
|
|
|
#include "llvm/Support/Path.h"
|
2014-06-13 01:38:55 +08:00
|
|
|
#include <system_error>
|
2012-08-01 10:29:50 +08:00
|
|
|
|
2014-12-12 04:12:55 +08:00
|
|
|
#if !defined(_MSC_VER) && !defined(__MINGW32__)
|
|
|
|
#include <unistd.h>
|
|
|
|
#else
|
|
|
|
#include <io.h>
|
|
|
|
#endif
|
|
|
|
|
2017-11-02 05:38:14 +08:00
|
|
|
using namespace llvm;
|
|
|
|
using namespace llvm::sys;
|
2012-08-01 10:29:50 +08:00
|
|
|
|
2017-11-24 22:55:41 +08:00
|
|
|
namespace {
|
2017-11-02 05:38:14 +08:00
|
|
|
// A FileOutputBuffer which creates a temporary file in the same directory
|
|
|
|
// as the final output file. The final output file is atomically replaced
|
|
|
|
// with the temporary file on commit().
|
|
|
|
class OnDiskBuffer : public FileOutputBuffer {
|
|
|
|
public:
|
2017-11-14 02:33:44 +08:00
|
|
|
OnDiskBuffer(StringRef Path, fs::TempFile Temp,
|
2017-11-02 05:38:14 +08:00
|
|
|
std::unique_ptr<fs::mapped_file_region> Buf)
|
2017-11-14 02:33:44 +08:00
|
|
|
: FileOutputBuffer(Path), Buffer(std::move(Buf)), Temp(std::move(Temp)) {}
|
2012-08-01 10:29:50 +08:00
|
|
|
|
2017-11-02 05:38:14 +08:00
|
|
|
uint8_t *getBufferStart() const override { return (uint8_t *)Buffer->data(); }
|
|
|
|
|
|
|
|
uint8_t *getBufferEnd() const override {
|
|
|
|
return (uint8_t *)Buffer->data() + Buffer->size();
|
2012-08-01 10:29:50 +08:00
|
|
|
}
|
|
|
|
|
2017-11-02 05:38:14 +08:00
|
|
|
size_t getBufferSize() const override { return Buffer->size(); }
|
|
|
|
|
2017-11-08 09:50:29 +08:00
|
|
|
Error commit() override {
|
2017-11-02 05:38:14 +08:00
|
|
|
// Unmap buffer, letting OS flush dirty pages to file on disk.
|
|
|
|
Buffer.reset();
|
|
|
|
|
|
|
|
// Atomically replace the existing file with the new one.
|
2017-11-14 02:33:44 +08:00
|
|
|
return Temp.keep(FinalPath);
|
2017-01-10 05:52:35 +08:00
|
|
|
}
|
|
|
|
|
2017-11-02 05:38:14 +08:00
|
|
|
~OnDiskBuffer() override {
|
|
|
|
// Close the mapping before deleting the temp file, so that the removal
|
|
|
|
// succeeds.
|
|
|
|
Buffer.reset();
|
2017-11-14 02:33:44 +08:00
|
|
|
consumeError(Temp.discard());
|
2017-11-02 05:38:14 +08:00
|
|
|
}
|
|
|
|
|
2018-08-25 02:36:22 +08:00
|
|
|
void discard() override {
|
|
|
|
// Delete the temp file if it still was open, but keeping the mapping
|
|
|
|
// active.
|
|
|
|
consumeError(Temp.discard());
|
|
|
|
}
|
|
|
|
|
2017-11-02 05:38:14 +08:00
|
|
|
private:
|
|
|
|
std::unique_ptr<fs::mapped_file_region> Buffer;
|
2017-11-14 02:33:44 +08:00
|
|
|
fs::TempFile Temp;
|
2017-11-02 05:38:14 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
// A FileOutputBuffer which keeps data in memory and writes to the final
|
|
|
|
// output file on commit(). This is used only when we cannot use OnDiskBuffer.
|
|
|
|
class InMemoryBuffer : public FileOutputBuffer {
|
|
|
|
public:
|
2019-05-21 04:53:05 +08:00
|
|
|
InMemoryBuffer(StringRef Path, MemoryBlock Buf, std::size_t BufSize,
|
|
|
|
unsigned Mode)
|
|
|
|
: FileOutputBuffer(Path), Buffer(Buf), BufferSize(BufSize),
|
|
|
|
Mode(Mode) {}
|
2017-11-02 05:38:14 +08:00
|
|
|
|
|
|
|
uint8_t *getBufferStart() const override { return (uint8_t *)Buffer.base(); }
|
|
|
|
|
|
|
|
uint8_t *getBufferEnd() const override {
|
2019-05-21 04:53:05 +08:00
|
|
|
return (uint8_t *)Buffer.base() + BufferSize;
|
2017-11-02 05:38:14 +08:00
|
|
|
}
|
|
|
|
|
2019-05-21 04:53:05 +08:00
|
|
|
size_t getBufferSize() const override { return BufferSize; }
|
2017-11-02 05:38:14 +08:00
|
|
|
|
2017-11-08 09:50:29 +08:00
|
|
|
Error commit() override {
|
2019-01-23 02:44:04 +08:00
|
|
|
if (FinalPath == "-") {
|
2019-05-21 04:53:05 +08:00
|
|
|
llvm::outs() << StringRef((const char *)Buffer.base(), BufferSize);
|
2019-01-23 02:44:04 +08:00
|
|
|
llvm::outs().flush();
|
|
|
|
return Error::success();
|
|
|
|
}
|
|
|
|
|
2018-06-08 03:58:58 +08:00
|
|
|
using namespace sys::fs;
|
2017-11-02 05:38:14 +08:00
|
|
|
int FD;
|
|
|
|
std::error_code EC;
|
2018-06-08 04:07:08 +08:00
|
|
|
if (auto EC =
|
|
|
|
openFileForWrite(FinalPath, FD, CD_CreateAlways, OF_None, Mode))
|
2017-11-08 09:50:29 +08:00
|
|
|
return errorCodeToError(EC);
|
2017-11-02 05:38:14 +08:00
|
|
|
raw_fd_ostream OS(FD, /*shouldClose=*/true, /*unbuffered=*/true);
|
2019-05-21 04:53:05 +08:00
|
|
|
OS << StringRef((const char *)Buffer.base(), BufferSize);
|
2017-11-08 09:50:29 +08:00
|
|
|
return Error::success();
|
2017-11-02 05:38:14 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
private:
|
2019-05-21 04:53:05 +08:00
|
|
|
// Buffer may actually contain a larger memory block than BufferSize
|
2017-11-02 05:38:14 +08:00
|
|
|
OwningMemoryBlock Buffer;
|
2019-05-21 04:53:05 +08:00
|
|
|
size_t BufferSize;
|
2017-11-02 05:38:14 +08:00
|
|
|
unsigned Mode;
|
|
|
|
};
|
2017-11-24 22:55:41 +08:00
|
|
|
} // namespace
|
2017-11-02 05:38:14 +08:00
|
|
|
|
2017-11-09 06:57:48 +08:00
|
|
|
// Allocates Size bytes of readable and writable mapped memory and wraps it
// in an InMemoryBuffer that targets Path. An allocation failure is returned
// as an Error.
static Expected<std::unique_ptr<InMemoryBuffer>>
createInMemoryBuffer(StringRef Path, size_t Size, unsigned Mode) {
  const unsigned Protection = sys::Memory::MF_READ | sys::Memory::MF_WRITE;

  std::error_code AllocEC;
  MemoryBlock Block =
      Memory::allocateMappedMemory(Size, nullptr, Protection, AllocEC);
  if (!AllocEC)
    return std::make_unique<InMemoryBuffer>(Path, Block, Size, Mode);
  return errorCodeToError(AllocEC);
}
|
|
|
|
|
2019-01-23 05:49:56 +08:00
|
|
|
// Creates a temporary file named after Path, sizes it to Size bytes and maps
// it read/write. Returns an OnDiskBuffer on success. If the mapping step
// fails, the temporary file is discarded and an in-memory buffer is returned
// instead. Failures to create or resize the temporary file are returned as
// an Error.
static Expected<std::unique_ptr<FileOutputBuffer>>
createOnDiskBuffer(StringRef Path, size_t Size, unsigned Mode) {
  Expected<fs::TempFile> TempOrErr =
      fs::TempFile::create(Path + ".tmp%%%%%%%", Mode);
  if (!TempOrErr)
    return TempOrErr.takeError();
  fs::TempFile Temp = std::move(*TempOrErr);

#ifndef _WIN32
  // The file is only pre-sized on non-Windows hosts. On Windows,
  // CreateFileMapping (the mmap equivalent) extends the underlying file
  // automatically, and _chsize (the ftruncate equivalent) is about as slow
  // as writing that many bytes, so the call is skipped there.
  if (std::error_code ResizeEC = fs::resize_file(Temp.FD, Size)) {
    consumeError(Temp.discard());
    return errorCodeToError(ResizeEC);
  }
#endif

  // Map the temporary file. mapped_file_region takes a native file handle,
  // so the integer descriptor is converted first.
  std::error_code MapEC;
  auto Region = std::make_unique<fs::mapped_file_region>(
      fs::convertFDToNativeFile(Temp.FD), fs::mapped_file_region::readwrite,
      Size, 0, MapEC);

  // mmap(2) can fail if the underlying filesystem does not support it. In
  // that case, fall back to an in-memory buffer as the last resort.
  if (MapEC) {
    consumeError(Temp.discard());
    return createInMemoryBuffer(Path, Size, Mode);
  }

  return std::make_unique<OnDiskBuffer>(Path, std::move(Temp),
                                        std::move(Region));
}
|
2012-08-01 10:29:50 +08:00
|
|
|
|
2017-11-02 05:38:14 +08:00
|
|
|
// Create an instance of FileOutputBuffer.
|
2017-11-08 09:05:44 +08:00
|
|
|
Expected<std::unique_ptr<FileOutputBuffer>>
|
2017-11-02 05:38:14 +08:00
|
|
|
FileOutputBuffer::create(StringRef Path, size_t Size, unsigned Flags) {
|
2019-01-23 02:44:04 +08:00
|
|
|
// Handle "-" as stdout just like llvm::raw_ostream does.
|
|
|
|
if (Path == "-")
|
|
|
|
return createInMemoryBuffer("-", Size, /*Mode=*/0);
|
|
|
|
|
2017-11-02 05:38:14 +08:00
|
|
|
unsigned Mode = fs::all_read | fs::all_write;
|
|
|
|
if (Flags & F_executable)
|
|
|
|
Mode |= fs::all_exe;
|
2012-12-04 06:09:52 +08:00
|
|
|
|
2020-05-05 00:45:41 +08:00
|
|
|
// If Size is zero, don't use mmap which will fail with EINVAL.
|
|
|
|
if (Size == 0)
|
|
|
|
return createInMemoryBuffer(Path, Size, Mode);
|
|
|
|
|
2017-11-02 05:38:14 +08:00
|
|
|
fs::file_status Stat;
|
|
|
|
fs::status(Path, Stat);
|
2012-12-04 06:09:52 +08:00
|
|
|
|
2017-11-02 05:38:14 +08:00
|
|
|
// Usually, we want to create OnDiskBuffer to create a temporary file in
|
|
|
|
// the same directory as the destination file and atomically replaces it
|
|
|
|
// by rename(2).
|
|
|
|
//
|
|
|
|
// However, if the destination file is a special file, we don't want to
|
|
|
|
// use rename (e.g. we don't want to replace /dev/null with a regular
|
|
|
|
// file.) If that's the case, we create an in-memory buffer, open the
|
|
|
|
// destination file and write to it on commit().
|
|
|
|
switch (Stat.type()) {
|
|
|
|
case fs::file_type::directory_file:
|
2017-11-08 09:05:44 +08:00
|
|
|
return errorCodeToError(errc::is_a_directory);
|
2017-11-02 05:38:14 +08:00
|
|
|
case fs::file_type::regular_file:
|
|
|
|
case fs::file_type::file_not_found:
|
|
|
|
case fs::file_type::status_error:
|
[LLD][ELF] Support --[no-]mmap-output-file with F_no_mmap
Summary:
Add a flag `F_no_mmap` to `FileOutputBuffer` to support
`--[no-]mmap-output-file` in ELF LLD. LLD currently explicitly ignores
this flag for compatibility with GNU ld and gold.
We need this flag to speed up link time for large binaries in certain
scenarios. When we link some of our larger binaries we find that LLD
takes 50+ GB of memory, which causes memory pressure. The memory
pressure causes the VM to flush dirty pages of the output file to disk.
This is normally okay, since we should be flushing cold pages. However,
when using BtrFS with compression we need to write 128KB at a time when
we flush a page. If any page in that 128KB block is written again, then
it must be flushed a second time, and so on. Since LLD doesn't write
sequentially this causes write amplification. The same 128KB block will
end up being flushed multiple times, causing the linker to many times
more IO than necessary. We've observed 3-5x faster builds with
-no-mmap-output-file when we hit this scenario.
The bad scenario only applies to compressed filesystems, which group
together multiple pages into a single compressed block. I've tested
BtrFS, but the problem will be present for any compressed filesystem
on Linux, since it is caused by the VM.
Silently ignoring --no-mmap-output-file caused a silent regression when
we switched from gold to lld. We pass --no-mmap-output-file to fix this
edge case, but since lld silently ignored the flag we didn't realize it
wasn't being respected.
Benchmark building a 9 GB binary that exposes this edge case. I linked 3
times with --mmap-output-file and 3 times with --no-mmap-output-file and
took the average. The machine has 24 cores @ 2.4 GHz, 112 GB of RAM,
BtrFS mounted with -compress-force=zstd, and an 80% full disk.
| Mode | Time |
|---------|-------|
| mmap | 894 s |
| no mmap | 126 s |
When compression is disabled, BtrFS performs just as well with and
without mmap on this benchmark.
I was unable to reproduce the regression with any binaries in
lld-speed-test.
Reviewed By: ruiu, MaskRay
Differential Revision: https://reviews.llvm.org/D69294
2019-10-30 06:46:22 +08:00
|
|
|
if (Flags & F_no_mmap)
|
|
|
|
return createInMemoryBuffer(Path, Size, Mode);
|
|
|
|
else
|
|
|
|
return createOnDiskBuffer(Path, Size, Mode);
|
2017-11-02 05:38:14 +08:00
|
|
|
default:
|
2017-11-09 06:57:48 +08:00
|
|
|
return createInMemoryBuffer(Path, Size, Mode);
|
2017-11-02 05:38:14 +08:00
|
|
|
}
|
2012-08-01 10:29:50 +08:00
|
|
|
}
|