mirror of
https://github.com/tkuschel/bees.git
synced 2025-11-17 23:09:14 +01:00
Get rid of the thread-local TempFiles and use Pool instead. This eliminates a potential FD leak when the loadavg governor repeatedly creates and destroys threads. With the old per-thread TempFiles, we were guaranteed to have exclusive ownership of the TempFile object within the current thread. Pool is somewhat stricter: it only guarantees ownership while the checked-out Handle exists. Adjust the users of TempFile objects to ensure they hold the Handle object until they are finished using the TempFile. It appears that maintaining large, heavily-reflinked, long-lived temporary files costs more than truncating after every use: btrfs has to write multiple references to the temporary file's extents, then some commits later, remove references as the temporary file is deleted or truncated. Using the temporary file in a dedupe operation flushes the data to disk, so nothing is saved by pretending that there is writeback pipelining and trying to avoid flushes in truncate. Pool provides usage tracking and a checkin callback, so use it to truncate the temporary file immediately after every use. Redesign TempFile so that every instance creates exactly one Fd which persists over the lifetime of the TempFile object. Provide a reset() method which resets the file back to the initial state and call it from the Pool checkin callback. This makes TempFile's lifetime equivalent to its Fd's lifetime, which simplifies interactions with FdCache and Roots. This change means we can now blacklist temporary files without having an effective memory leak, so do that. We also have a reason to ever remove something from the blacklist, so add a method for that too. In order to move to extent-centric addressing, we need to be able to reliably open temporary files by root and inode number. Previously we would place TempFile fd's into the cache with insert_root_ino, but the cache would be cleared periodically, and it would not be possible to reopen temporary files after that happened. Now that the TempFile's lifetime is the same as the TempFile Fd's lifetime, we can have TempFile manage a separate FileId -> Fd map in Roots which is unaffected by the periodic cache clearing. BeesRoots::open_root_ino_nocache will check this map before attempting to open the file via btrfs root+ino lookup, and return it through the cache as if Roots had opened the file via btrfs. Hold a reference to BeesRoots in BeesTempFile because the usual way to get such a reference now throws an exception in BeesTempFile's destructor. These changes make method BeesTempFile::create() and all methods named insert_root_ino unnecessary, so delete them. We construct and destroy TempFiles much less often now, so make their constructor and destructor more informative. Signed-off-by: Zygo Blaxell <bees@furryterror.org>
917 lines
22 KiB
C++
917 lines
22 KiB
C++
#include "bees.h"
|
|
|
|
#include "crucible/limits.h"
|
|
#include "crucible/process.h"
|
|
#include "crucible/string.h"
|
|
#include "crucible/task.h"
|
|
|
|
#include <cctype>
|
|
#include <cmath>
|
|
#include <cstdio>
|
|
|
|
#include <iostream>
|
|
#include <memory>
|
|
#include <sstream>
|
|
|
|
// PRIx64
|
|
#include <inttypes.h>
|
|
|
|
#include <sched.h>
|
|
#include <sys/fanotify.h>
|
|
|
|
#include <linux/fs.h>
|
|
#include <sys/ioctl.h>
|
|
|
|
// setrlimit
|
|
#include <sys/time.h>
|
|
#include <sys/resource.h>
|
|
|
|
#include <getopt.h>
|
|
|
|
using namespace crucible;
|
|
using namespace std;
|
|
|
|
int bees_log_level = 8;
|
|
|
|
void
|
|
do_cmd_help(char *argv[])
|
|
{
|
|
fprintf(stderr, BEES_USAGE, argv[0]);
|
|
}
|
|
|
|
// tracing ----------------------------------------
|
|
|
|
thread_local BeesTracer *BeesTracer::tl_next_tracer = nullptr;
|
|
thread_local bool BeesTracer::tl_silent = false;
|
|
|
|
BeesTracer::~BeesTracer()
|
|
{
|
|
if (!tl_silent && current_exception()) {
|
|
try {
|
|
m_func();
|
|
} catch (exception &e) {
|
|
BEESLOGNOTICE("Nested exception: " << e.what());
|
|
} catch (...) {
|
|
BEESLOGNOTICE("Nested exception ...");
|
|
}
|
|
if (!m_next_tracer) {
|
|
BEESLOGNOTICE("--- END TRACE --- exception ---");
|
|
}
|
|
}
|
|
tl_next_tracer = m_next_tracer;
|
|
if (!m_next_tracer) {
|
|
tl_silent = false;
|
|
}
|
|
}
|
|
|
|
BeesTracer::BeesTracer(function<void()> f, bool silent) :
|
|
m_func(f)
|
|
{
|
|
m_next_tracer = tl_next_tracer;
|
|
tl_next_tracer = this;
|
|
tl_silent = silent;
|
|
}
|
|
|
|
void
|
|
BeesTracer::trace_now()
|
|
{
|
|
BeesTracer *tp = tl_next_tracer;
|
|
BEESLOGNOTICE("--- BEGIN TRACE ---");
|
|
while (tp) {
|
|
tp->m_func();
|
|
tp = tp->m_next_tracer;
|
|
}
|
|
BEESLOGNOTICE("--- END TRACE ---");
|
|
}
|
|
|
|
bool
|
|
BeesTracer::get_silent()
|
|
{
|
|
return tl_silent;
|
|
}
|
|
|
|
void
|
|
BeesTracer::set_silent()
|
|
{
|
|
tl_silent = true;
|
|
}
|
|
|
|
thread_local BeesNote *BeesNote::tl_next = nullptr;
|
|
mutex BeesNote::s_mutex;
|
|
map<pid_t, BeesNote*> BeesNote::s_status;
|
|
thread_local string BeesNote::tl_name;
|
|
|
|
BeesNote::~BeesNote()
|
|
{
|
|
tl_next = m_prev;
|
|
unique_lock<mutex> lock(s_mutex);
|
|
if (tl_next) {
|
|
s_status[crucible::gettid()] = tl_next;
|
|
} else {
|
|
s_status.erase(crucible::gettid());
|
|
}
|
|
}
|
|
|
|
BeesNote::BeesNote(function<void(ostream &os)> f) :
|
|
m_func(f)
|
|
{
|
|
m_name = get_name();
|
|
m_prev = tl_next;
|
|
tl_next = this;
|
|
unique_lock<mutex> lock(s_mutex);
|
|
s_status[crucible::gettid()] = tl_next;
|
|
}
|
|
|
|
void
|
|
BeesNote::set_name(const string &name)
|
|
{
|
|
tl_name = name;
|
|
catch_all([&]() {
|
|
DIE_IF_MINUS_ERRNO(pthread_setname_np(pthread_self(), name.c_str()));
|
|
});
|
|
}
|
|
|
|
string
|
|
BeesNote::get_name()
|
|
{
|
|
// Use explicit name if given
|
|
if (!tl_name.empty()) {
|
|
return tl_name;
|
|
}
|
|
|
|
// Try a Task name. If there is one, return it, but do not
|
|
// remember it. Each output message may be a different Task.
|
|
// The current task is thread_local so we don't need to worry
|
|
// about it being destroyed under us.
|
|
auto current_task = Task::current_task();
|
|
if (current_task) {
|
|
return current_task.title();
|
|
}
|
|
|
|
// OK try the pthread name next.
|
|
char buf[24];
|
|
memset(buf, '\0', sizeof(buf));
|
|
int err = pthread_getname_np(pthread_self(), buf, sizeof(buf));
|
|
if (err) {
|
|
return string("pthread_getname_np: ") + strerror(err);
|
|
}
|
|
buf[sizeof(buf) - 1] = '\0';
|
|
|
|
// thread_getname_np returns process name
|
|
// ...by default? ...for the main thread?
|
|
// ...except during exception handling?
|
|
// ...randomly?
|
|
return buf;
|
|
}
|
|
|
|
BeesNote::ThreadStatusMap
|
|
BeesNote::get_status()
|
|
{
|
|
unique_lock<mutex> lock(s_mutex);
|
|
ThreadStatusMap rv;
|
|
for (auto t : s_status) {
|
|
ostringstream oss;
|
|
if (!t.second->m_name.empty()) {
|
|
oss << t.second->m_name << ": ";
|
|
}
|
|
if (t.second->m_timer.age() > BEES_TOO_LONG) {
|
|
oss << "[" << t.second->m_timer << "s] ";
|
|
}
|
|
t.second->m_func(oss);
|
|
rv[t.first] = oss.str();
|
|
}
|
|
return rv;
|
|
}
|
|
|
|
// static inline helpers ----------------------------------------
|
|
|
|
string
|
|
pretty(double d)
|
|
{
|
|
static const char * units[] = { "", "K", "M", "G", "T", "P", "E" };
|
|
static const char * *units_stop = units + sizeof(units) / sizeof(units[0]) - 1;
|
|
const char * *unit = units;
|
|
while (d >= 1024 && unit < units_stop) {
|
|
d /= 1024;
|
|
++unit;
|
|
}
|
|
ostringstream oss;
|
|
oss << (round(d * 1000.0) / 1000.0) << *unit;
|
|
return oss.str();
|
|
}
|
|
|
|
// ostream operators ----------------------------------------
|
|
|
|
template <class T>
|
|
ostream &
|
|
operator<<(ostream &os, const BeesStatTmpl<T> &bs)
|
|
{
|
|
unique_lock<mutex> lock(bs.m_mutex);
|
|
bool first = true;
|
|
string last_tag;
|
|
for (auto i : bs.m_stats_map) {
|
|
if (i.second == 0) {
|
|
continue;
|
|
}
|
|
string tag = i.first.substr(0, i.first.find_first_of("_"));
|
|
if (!last_tag.empty() && tag != last_tag) {
|
|
os << "\n\t";
|
|
} else if (!first) {
|
|
os << " ";
|
|
}
|
|
last_tag = tag;
|
|
first = false;
|
|
os << i.first << "=" << i.second;
|
|
}
|
|
return os;
|
|
}
|
|
|
|
// other ----------------------------------------
|
|
|
|
template <class T>
|
|
T&
|
|
BeesStatTmpl<T>::at(string idx)
|
|
{
|
|
if (!m_stats_map.count(idx)) {
|
|
m_stats_map[idx] = 0;
|
|
}
|
|
return m_stats_map[idx];
|
|
}
|
|
|
|
template <class T>
|
|
T
|
|
BeesStatTmpl<T>::at(string idx) const
|
|
{
|
|
unique_lock<mutex> lock(m_mutex);
|
|
auto rv = m_stats_map.at(idx);
|
|
return rv;
|
|
}
|
|
|
|
template <class T>
|
|
void
|
|
BeesStatTmpl<T>::add_count(string idx, size_t amount)
|
|
{
|
|
unique_lock<mutex> lock(m_mutex);
|
|
if (!m_stats_map.count(idx)) {
|
|
m_stats_map[idx] = amount;
|
|
} else {
|
|
m_stats_map[idx] += amount;
|
|
}
|
|
}
|
|
|
|
template <class T>
|
|
BeesStatTmpl<T>::BeesStatTmpl(const BeesStatTmpl &that)
|
|
{
|
|
if (&that == this) return;
|
|
unique_lock<mutex> lock(m_mutex);
|
|
unique_lock<mutex> lock2(that.m_mutex);
|
|
m_stats_map = that.m_stats_map;
|
|
}
|
|
|
|
template <class T>
|
|
BeesStatTmpl<T> &
|
|
BeesStatTmpl<T>::operator=(const BeesStatTmpl<T> &that)
|
|
{
|
|
if (&that == this) return *this;
|
|
unique_lock<mutex> lock(m_mutex);
|
|
unique_lock<mutex> lock2(that.m_mutex);
|
|
m_stats_map = that.m_stats_map;
|
|
return *this;
|
|
}
|
|
|
|
BeesStats BeesStats::s_global;
|
|
|
|
BeesStats
|
|
BeesStats::operator-(const BeesStats &that) const
|
|
{
|
|
if (&that == this) return BeesStats();
|
|
|
|
unique_lock<mutex> this_lock(m_mutex);
|
|
BeesStats this_copy;
|
|
this_copy.m_stats_map = m_stats_map;
|
|
this_lock.unlock();
|
|
|
|
unique_lock<mutex> that_lock(that.m_mutex);
|
|
BeesStats that_copy;
|
|
that_copy.m_stats_map = that.m_stats_map;
|
|
that_lock.unlock();
|
|
|
|
for (auto i : that.m_stats_map) {
|
|
if (i.second != 0) {
|
|
this_copy.at(i.first) -= i.second;
|
|
}
|
|
}
|
|
return this_copy;
|
|
}
|
|
|
|
BeesRates
|
|
BeesStats::operator/(double d) const
|
|
{
|
|
BeesRates rv;
|
|
unique_lock<mutex> lock(m_mutex);
|
|
for (auto i : m_stats_map) {
|
|
rv.m_stats_map[i.first] = ceil(i.second / d * 1000) / 1000;
|
|
}
|
|
return rv;
|
|
}
|
|
|
|
BeesStats::operator bool() const
|
|
{
|
|
unique_lock<mutex> lock(m_mutex);
|
|
for (auto i : m_stats_map) {
|
|
if (i.second != 0) {
|
|
return true;
|
|
}
|
|
}
|
|
return false;
|
|
}
|
|
|
|
BeesTooLong::BeesTooLong(const string &s, double limit) :
|
|
m_limit(limit),
|
|
m_func([s](ostream &os) { os << s; })
|
|
{
|
|
}
|
|
|
|
BeesTooLong::BeesTooLong(const func_type &func, double limit) :
|
|
m_limit(limit),
|
|
m_func(func)
|
|
{
|
|
}
|
|
|
|
void
|
|
BeesTooLong::check() const
|
|
{
|
|
if (age() > m_limit) {
|
|
ostringstream oss;
|
|
m_func(oss);
|
|
BEESLOGWARN("PERFORMANCE: " << *this << " sec: " << oss.str());
|
|
}
|
|
}
|
|
|
|
BeesTooLong::~BeesTooLong()
|
|
{
|
|
check();
|
|
}
|
|
|
|
BeesTooLong &
|
|
BeesTooLong::operator=(const func_type &f)
|
|
{
|
|
m_func = f;
|
|
return *this;
|
|
}
|
|
|
|
void
|
|
bees_sync(int fd)
|
|
{
|
|
Timer sync_timer;
|
|
BEESNOTE("syncing " << name_fd(fd));
|
|
BEESTOOLONG("syncing " << name_fd(fd));
|
|
DIE_IF_NON_ZERO(fsync(fd));
|
|
BEESCOUNT(sync_count);
|
|
BEESCOUNTADD(sync_ms, sync_timer.age() * 1000);
|
|
}
|
|
|
|
BeesStringFile::BeesStringFile(Fd dir_fd, string name, size_t limit) :
|
|
m_dir_fd(dir_fd),
|
|
m_name(name),
|
|
m_limit(limit)
|
|
{
|
|
BEESLOGINFO("BeesStringFile " << name_fd(m_dir_fd) << "/" << m_name << " max size " << pretty(m_limit));
|
|
}
|
|
|
|
void
|
|
BeesStringFile::name(const string &new_name)
|
|
{
|
|
m_name = new_name;
|
|
}
|
|
|
|
string
|
|
BeesStringFile::name() const
|
|
{
|
|
return m_name;
|
|
}
|
|
|
|
string
|
|
BeesStringFile::read()
|
|
{
|
|
BEESNOTE("opening " << m_name << " in " << name_fd(m_dir_fd));
|
|
Fd fd(openat(m_dir_fd, m_name.c_str(), FLAGS_OPEN_FILE));
|
|
if (!fd) {
|
|
return string();
|
|
}
|
|
|
|
BEESNOTE("sizing " << m_name << " in " << name_fd(m_dir_fd));
|
|
Stat st(fd);
|
|
THROW_CHECK1(out_of_range, st.st_size, st.st_size > 0);
|
|
THROW_CHECK1(out_of_range, st.st_size, st.st_size < ranged_cast<off_t>(m_limit));
|
|
|
|
BEESNOTE("reading " << m_name << " in " << name_fd(m_dir_fd));
|
|
return read_string(fd, st.st_size);
|
|
}
|
|
|
|
void
|
|
BeesStringFile::write(string contents)
|
|
{
|
|
THROW_CHECK2(out_of_range, contents.size(), m_limit, contents.size() < m_limit);
|
|
auto tmpname = m_name + ".tmp";
|
|
|
|
BEESNOTE("unlinking " << tmpname << " in " << name_fd(m_dir_fd));
|
|
unlinkat(m_dir_fd, tmpname.c_str(), 0);
|
|
// ignore error
|
|
|
|
BEESNOTE("closing " << tmpname << " in " << name_fd(m_dir_fd));
|
|
{
|
|
Fd ofd = openat_or_die(m_dir_fd, tmpname, FLAGS_CREATE_FILE, S_IRUSR | S_IWUSR);
|
|
BEESNOTE("writing " << tmpname << " in " << name_fd(m_dir_fd));
|
|
write_or_die(ofd, contents);
|
|
#if 0
|
|
// This triggers too many btrfs bugs. I wish I was kidding.
|
|
// Forget snapshots, balance, compression, and dedup:
|
|
// the system call you have to fear on btrfs is fsync().
|
|
// Also note that when bees renames a temporary over an
|
|
// existing file, it flushes the temporary, so we get
|
|
// the right behavior if we just do nothing here
|
|
// (except when the file is first created; however,
|
|
// in that case the result is the same as if the file
|
|
// did not exist, was empty, or was filled with garbage).
|
|
BEESNOTE("fsyncing " << tmpname << " in " << name_fd(m_dir_fd));
|
|
DIE_IF_NON_ZERO(fsync(ofd));
|
|
#endif
|
|
}
|
|
BEESNOTE("renaming " << tmpname << " to " << m_name << " in FD " << name_fd(m_dir_fd));
|
|
BEESTRACE("renaming " << tmpname << " to " << m_name << " in FD " << name_fd(m_dir_fd));
|
|
renameat_or_die(m_dir_fd, tmpname, m_dir_fd, m_name);
|
|
}
|
|
|
|
void
|
|
BeesTempFile::resize(off_t offset)
|
|
{
|
|
BEESTOOLONG("Resizing temporary file to " << to_hex(offset));
|
|
BEESNOTE("Resizing temporary file " << name_fd(m_fd) << " to " << to_hex(offset));
|
|
BEESTRACE("Resizing temporary file " << name_fd(m_fd) << " to " << to_hex(offset));
|
|
|
|
// Truncate
|
|
Timer resize_timer;
|
|
DIE_IF_NON_ZERO(ftruncate(m_fd, offset));
|
|
BEESCOUNT(tmp_resize);
|
|
|
|
// Success
|
|
m_end_offset = offset;
|
|
|
|
// Count time spent here
|
|
BEESCOUNTADD(tmp_resize_ms, resize_timer.age() * 1000);
|
|
}
|
|
|
|
void
|
|
BeesTempFile::reset()
|
|
{
|
|
// Always leave first block empty to avoid creating a file with an inline extent
|
|
resize(BLOCK_SIZE_CLONE);
|
|
}
|
|
|
|
|
|
BeesTempFile::~BeesTempFile()
|
|
{
|
|
BEESLOGDEBUG("destroying temporary file " << this << " in " << m_ctx->root_path() << " fd " << name_fd(m_fd));
|
|
|
|
// Remove this file from open_root_ino lookup table
|
|
m_roots->erase_tmpfile(m_fd);
|
|
|
|
// Remove from blacklist
|
|
m_ctx->blacklist_erase(BeesFileId(m_fd));
|
|
}
|
|
|
|
BeesTempFile::BeesTempFile(shared_ptr<BeesContext> ctx) :
|
|
m_ctx(ctx),
|
|
m_roots(ctx->roots()),
|
|
m_end_offset(0)
|
|
{
|
|
BEESLOGDEBUG("creating temporary file " << this << " in " << m_ctx->root_path());
|
|
BEESNOTE("creating temporary file in " << m_ctx->root_path());
|
|
BEESTOOLONG("creating temporary file in " << m_ctx->root_path());
|
|
|
|
Timer create_timer;
|
|
DIE_IF_MINUS_ONE(m_fd = openat(m_ctx->root_fd(), ".", FLAGS_OPEN_TMPFILE, S_IRUSR | S_IWUSR));
|
|
BEESCOUNT(tmp_create);
|
|
|
|
// Don't include this file in new extent scans
|
|
m_ctx->blacklist_insert(BeesFileId(m_fd));
|
|
|
|
// Add this file to open_root_ino lookup table
|
|
m_roots->insert_tmpfile(m_fd);
|
|
|
|
// Set compression attribute
|
|
BEESTRACE("Getting FS_COMPR_FL on m_fd " << name_fd(m_fd));
|
|
int flags = ioctl_iflags_get(m_fd);
|
|
flags |= FS_COMPR_FL;
|
|
BEESTRACE("Setting FS_COMPR_FL on m_fd " << name_fd(m_fd) << " flags " << to_hex(flags));
|
|
ioctl_iflags_set(m_fd, flags);
|
|
|
|
// Count time spent here
|
|
BEESCOUNTADD(tmp_create_ms, create_timer.age() * 1000);
|
|
|
|
// Set initial size
|
|
reset();
|
|
}
|
|
|
|
void
|
|
BeesTempFile::realign()
|
|
{
|
|
if (m_end_offset > BLOCK_SIZE_MAX_TEMP_FILE) {
|
|
BEESLOGINFO("temporary file size " << to_hex(m_end_offset) << " > max " << BLOCK_SIZE_MAX_TEMP_FILE);
|
|
BEESCOUNT(tmp_trunc);
|
|
reset();
|
|
return;
|
|
}
|
|
if (m_end_offset & BLOCK_MASK_CLONE) {
|
|
// BEESTRACE("temporary file size " << to_hex(m_end_offset) << " not aligned");
|
|
BEESCOUNT(tmp_realign);
|
|
reset();
|
|
return;
|
|
}
|
|
// OK as is
|
|
BEESCOUNT(tmp_aligned);
|
|
}
|
|
|
|
BeesFileRange
|
|
BeesTempFile::make_hole(off_t count)
|
|
{
|
|
THROW_CHECK1(invalid_argument, count, count > 0);
|
|
realign();
|
|
|
|
BEESTRACE("make hole at " << m_end_offset);
|
|
|
|
auto end = m_end_offset + count;
|
|
BeesFileRange rv(m_fd, m_end_offset, end);
|
|
|
|
resize(end);
|
|
|
|
BEESTRACE("created temporary hole " << rv);
|
|
BEESCOUNT(tmp_hole);
|
|
return rv;
|
|
}
|
|
|
|
BeesFileRange
|
|
BeesTempFile::make_copy(const BeesFileRange &src)
|
|
{
|
|
BEESLOGINFO("copy: " << src);
|
|
BEESNOTE("Copying " << src);
|
|
BEESTRACE("Copying " << src);
|
|
|
|
THROW_CHECK1(invalid_argument, src, src.size() > 0);
|
|
|
|
// FIEMAP used to give us garbage data, e.g. distinct adjacent
|
|
// extents merged into a single entry in the FIEMAP output.
|
|
// FIEMAP didn't stop giving us garbage data, we just stopped
|
|
// using FIEMAP.
|
|
// We shouldn't get absurdly large extents any more; however,
|
|
// it's still a problem if we do, so bail out and leave a trace
|
|
// in the log.
|
|
THROW_CHECK1(invalid_argument, src, src.size() < BLOCK_SIZE_MAX_TEMP_FILE);
|
|
|
|
realign();
|
|
|
|
auto begin = m_end_offset;
|
|
auto end = m_end_offset + src.size();
|
|
resize(end);
|
|
|
|
Timer copy_timer;
|
|
BeesFileRange rv(m_fd, begin, end);
|
|
BEESTRACE("copying to: " << rv);
|
|
BEESNOTE("copying " << src << " to " << rv);
|
|
|
|
auto src_p = src.begin();
|
|
auto dst_p = begin;
|
|
|
|
bool did_block_write = false;
|
|
while (dst_p < end) {
|
|
auto len = min(BLOCK_SIZE_CLONE, end - dst_p);
|
|
BeesBlockData bbd(src.fd(), src_p, len);
|
|
// Don't fill in holes
|
|
if (bbd.is_data_zero()) {
|
|
BEESCOUNT(tmp_block_zero);
|
|
} else {
|
|
BEESNOTE("copying " << src << " to " << rv << "\n"
|
|
"\tpwrite " << bbd << " to " << name_fd(m_fd) << " offset " << to_hex(dst_p) << " len " << len);
|
|
pwrite_or_die(m_fd, bbd.data().data(), len, dst_p);
|
|
did_block_write = true;
|
|
BEESCOUNT(tmp_block);
|
|
BEESCOUNTADD(tmp_bytes, len);
|
|
}
|
|
src_p += len;
|
|
dst_p += len;
|
|
}
|
|
BEESCOUNTADD(tmp_copy_ms, copy_timer.age() * 1000);
|
|
|
|
if (did_block_write) {
|
|
#if 0
|
|
// There were a lot of kernel bugs leading to lockups.
|
|
// Most of them are fixed now.
|
|
// Unnecessary sync makes us slow, but maybe it has some robustness utility.
|
|
// TODO: make this configurable.
|
|
bees_sync(m_fd);
|
|
#endif
|
|
}
|
|
|
|
BEESCOUNT(tmp_copy);
|
|
return rv;
|
|
}
|
|
|
|
static
|
|
ostream &
|
|
operator<<(ostream &os, const siginfo_t &si)
|
|
{
|
|
return os << "siginfo_t { "
|
|
<< "signo = " << si.si_signo << " (" << signal_ntoa(si.si_signo) << "), "
|
|
<< "errno = " << si.si_errno << ", "
|
|
<< "code = " << si.si_code << ", "
|
|
// << "trapno = " << si.si_trapno << ", "
|
|
<< "pid = " << si.si_pid << ", "
|
|
<< "uid = " << si.si_uid << ", "
|
|
<< "status = " << si.si_status << ", "
|
|
<< "utime = " << si.si_utime << ", "
|
|
<< "stime = " << si.si_stime << ", "
|
|
// << "value = " << si.si_value << ", "
|
|
<< "int = " << si.si_int << ", "
|
|
<< "ptr = " << si.si_ptr << ", "
|
|
<< "overrun = " << si.si_overrun << ", "
|
|
<< "timerid = " << si.si_timerid << ", "
|
|
<< "addr = " << si.si_addr << ", "
|
|
<< "band = " << si.si_band << ", "
|
|
<< "fd = " << si.si_fd << ", "
|
|
<< "addr_lsb = " << si.si_addr_lsb << ", "
|
|
// << "lower = " << si.si_lower << ", "
|
|
// << "upper = " << si.si_upper << ", "
|
|
// << "pkey = " << si.si_pkey << ", "
|
|
<< "call_addr = " << si.si_call_addr << ", "
|
|
<< "syscall = " << si.si_syscall << ", "
|
|
<< "arch = " << si.si_arch
|
|
<< " }";
|
|
}
|
|
|
|
static sigset_t new_sigset, old_sigset;
|
|
|
|
void
|
|
block_term_signal()
|
|
{
|
|
BEESLOGDEBUG("Masking signals");
|
|
|
|
DIE_IF_NON_ZERO(sigemptyset(&new_sigset));
|
|
DIE_IF_NON_ZERO(sigaddset(&new_sigset, SIGTERM));
|
|
DIE_IF_NON_ZERO(sigaddset(&new_sigset, SIGINT));
|
|
DIE_IF_NON_ZERO(sigprocmask(SIG_BLOCK, &new_sigset, &old_sigset));
|
|
}
|
|
|
|
void
|
|
wait_for_term_signal()
|
|
{
|
|
BEESNOTE("waiting for signals");
|
|
BEESLOGDEBUG("Waiting for signals...");
|
|
siginfo_t info;
|
|
|
|
// Ironically, sigwaitinfo can be interrupted by a signal.
|
|
while (true) {
|
|
const int rv = sigwaitinfo(&new_sigset, &info);
|
|
if (rv == -1) {
|
|
if (errno == EINTR) {
|
|
BEESLOGDEBUG("Restarting sigwaitinfo");
|
|
continue;
|
|
}
|
|
THROW_ERRNO("sigwaitinfo errno = " << errno);
|
|
} else {
|
|
BEESLOGNOTICE("Received signal " << rv << " info " << info);
|
|
// Unblock so we die immediately if signalled again
|
|
DIE_IF_NON_ZERO(sigprocmask(SIG_BLOCK, &old_sigset, &new_sigset));
|
|
break;
|
|
}
|
|
}
|
|
BEESLOGDEBUG("Signal catcher exiting");
|
|
}
|
|
|
|
int
|
|
bees_main(int argc, char *argv[])
|
|
{
|
|
set_catch_explainer([&](string s) {
|
|
if (BeesTracer::get_silent()) {
|
|
BEESLOGDEBUG("exception (ignored): " << s);
|
|
BEESCOUNT(exception_caught_silent);
|
|
} else {
|
|
BEESLOGNOTICE("\n\n*** EXCEPTION ***\n\t" << s << "\n***\n");
|
|
BEESCOUNT(exception_caught);
|
|
}
|
|
});
|
|
|
|
// The thread name for the main function is also what the kernel
|
|
// Oops messages call the entire process. So even though this
|
|
// thread's proper title is "main", let's call it "bees".
|
|
BeesNote::set_name("bees");
|
|
BEESNOTE("main");
|
|
|
|
THROW_CHECK1(invalid_argument, argc, argc >= 0);
|
|
|
|
// Have to block signals now before we create a bunch of threads
|
|
// so the threads will also have the signals blocked.
|
|
block_term_signal();
|
|
|
|
// Create a context so we can apply configuration to it
|
|
shared_ptr<BeesContext> bc = make_shared<BeesContext>();
|
|
|
|
string cwd(readlink_or_die("/proc/self/cwd"));
|
|
|
|
// Defaults
|
|
bool chatter_prefix_timestamp = true;
|
|
double thread_factor = 0;
|
|
unsigned thread_count = 0;
|
|
unsigned thread_min = 0;
|
|
double load_target = 0;
|
|
bool workaround_btrfs_send = false;
|
|
BeesRoots::ScanMode root_scan_mode = BeesRoots::SCAN_MODE_ZERO;
|
|
|
|
// Configure getopt_long
|
|
static const struct option long_options[] = {
|
|
{ "thread-factor", required_argument, NULL, 'C' },
|
|
{ "thread-min", required_argument, NULL, 'G' },
|
|
{ "strip-paths", no_argument, NULL, 'P' },
|
|
{ "no-timestamps", no_argument, NULL, 'T' },
|
|
{ "workaround-btrfs-send", no_argument, NULL, 'a' },
|
|
{ "thread-count", required_argument, NULL, 'c' },
|
|
{ "loadavg-target", required_argument, NULL, 'g' },
|
|
{ "help", no_argument, NULL, 'h' },
|
|
{ "scan-mode", required_argument, NULL, 'm' },
|
|
{ "absolute-paths", no_argument, NULL, 'p' },
|
|
{ "timestamps", no_argument, NULL, 't' },
|
|
{ "verbose", required_argument, NULL, 'v' },
|
|
{ 0, 0, 0, 0 },
|
|
};
|
|
|
|
// Build getopt_long's short option list from the long_options table.
|
|
// While we're at it, make sure we didn't duplicate any options.
|
|
string getopt_list;
|
|
set<decltype(option::val)> option_vals;
|
|
for (const struct option *op = long_options; op->val; ++op) {
|
|
THROW_CHECK1(runtime_error, op->val, !option_vals.count(op->val));
|
|
option_vals.insert(op->val);
|
|
if ((op->val & 0xff) != op->val) {
|
|
continue;
|
|
}
|
|
getopt_list += op->val;
|
|
if (op->has_arg == required_argument) {
|
|
getopt_list += ':';
|
|
}
|
|
}
|
|
|
|
// Parse options
|
|
int c;
|
|
while (true) {
|
|
int option_index = 0;
|
|
|
|
c = getopt_long(argc, argv, getopt_list.c_str(), long_options, &option_index);
|
|
if (-1 == c) {
|
|
break;
|
|
}
|
|
|
|
switch (c) {
|
|
|
|
case 'C':
|
|
thread_factor = stod(optarg);
|
|
break;
|
|
case 'G':
|
|
thread_min = stoul(optarg);
|
|
break;
|
|
case 'P':
|
|
crucible::set_relative_path(cwd);
|
|
break;
|
|
case 'T':
|
|
chatter_prefix_timestamp = false;
|
|
break;
|
|
case 'a':
|
|
workaround_btrfs_send = true;
|
|
break;
|
|
case 'c':
|
|
thread_count = stoul(optarg);
|
|
break;
|
|
case 'g':
|
|
load_target = stod(optarg);
|
|
break;
|
|
case 'm':
|
|
root_scan_mode = static_cast<BeesRoots::ScanMode>(stoul(optarg));
|
|
break;
|
|
case 'p':
|
|
crucible::set_relative_path("");
|
|
break;
|
|
case 't':
|
|
chatter_prefix_timestamp = true;
|
|
break;
|
|
case 'v':
|
|
{
|
|
int new_log_level = stoul(optarg);
|
|
THROW_CHECK1(out_of_range, new_log_level, new_log_level <= 8);
|
|
THROW_CHECK1(out_of_range, new_log_level, new_log_level >= 0);
|
|
bees_log_level = new_log_level;
|
|
BEESLOGNOTICE("log level set to " << bees_log_level);
|
|
}
|
|
break;
|
|
|
|
case 'h':
|
|
default:
|
|
do_cmd_help(argv);
|
|
return EXIT_FAILURE;
|
|
}
|
|
}
|
|
|
|
if (optind + 1 != argc) {
|
|
BEESLOGERR("Only one filesystem path per bees process");
|
|
return EXIT_FAILURE;
|
|
}
|
|
|
|
Chatter::enable_timestamp(chatter_prefix_timestamp);
|
|
|
|
if (!relative_path().empty()) {
|
|
BEESLOGINFO("using relative path " << relative_path() << "\n");
|
|
}
|
|
|
|
BEESLOGINFO("setting rlimit NOFILE to " << BEES_OPEN_FILE_LIMIT);
|
|
|
|
struct rlimit lim = {
|
|
.rlim_cur = BEES_OPEN_FILE_LIMIT,
|
|
.rlim_max = BEES_OPEN_FILE_LIMIT,
|
|
};
|
|
int rv = setrlimit(RLIMIT_NOFILE, &lim);
|
|
if (rv) {
|
|
BEESLOGINFO("setrlimit(RLIMIT_NOFILE, { " << lim.rlim_cur << " }): " << strerror(errno));
|
|
};
|
|
|
|
// Set up worker thread pool
|
|
THROW_CHECK1(out_of_range, thread_factor, thread_factor >= 0);
|
|
if (thread_count < 1) {
|
|
if (thread_factor == 0) {
|
|
thread_factor = BEES_DEFAULT_THREAD_FACTOR;
|
|
}
|
|
thread_count = max(1U, static_cast<unsigned>(ceil(thread::hardware_concurrency() * thread_factor)));
|
|
if (thread_count > BEES_DEFAULT_THREAD_LIMIT) {
|
|
BEESLOGNOTICE("Limiting computed thread count to " << BEES_DEFAULT_THREAD_LIMIT);
|
|
BEESLOGNOTICE("Use --thread-count to override this limit");
|
|
thread_count = BEES_DEFAULT_THREAD_LIMIT;
|
|
}
|
|
}
|
|
|
|
if (load_target != 0) {
|
|
BEESLOGNOTICE("setting load average target to " << load_target);
|
|
BEESLOGNOTICE("setting worker thread pool minimum size to " << thread_min);
|
|
TaskMaster::set_thread_min_count(thread_min);
|
|
}
|
|
TaskMaster::set_loadavg_target(load_target);
|
|
|
|
BEESLOGNOTICE("setting worker thread pool maximum size to " << thread_count);
|
|
TaskMaster::set_thread_count(thread_count);
|
|
|
|
// Set root path
|
|
string root_path = argv[optind++];
|
|
BEESLOGNOTICE("setting root path to '" << root_path << "'");
|
|
bc->set_root_path(root_path);
|
|
|
|
// Workaround for btrfs send
|
|
bc->roots()->set_workaround_btrfs_send(workaround_btrfs_send);
|
|
|
|
// Set root scan mode
|
|
bc->roots()->set_scan_mode(root_scan_mode);
|
|
|
|
// Start crawlers
|
|
bc->start();
|
|
|
|
// Now we just wait forever
|
|
wait_for_term_signal();
|
|
|
|
// Shut it down
|
|
bc->stop();
|
|
|
|
// That is all.
|
|
return EXIT_SUCCESS;
|
|
}
|
|
|
|
int
|
|
main(int argc, char *argv[])
|
|
{
|
|
cerr << "bees version " << BEES_VERSION << endl;
|
|
|
|
if (argc < 2) {
|
|
do_cmd_help(argv);
|
|
return EXIT_FAILURE;
|
|
}
|
|
|
|
int rv = 1;
|
|
catch_and_explain([&]() {
|
|
rv = bees_main(argc, argv);
|
|
});
|
|
BEESLOGNOTICE("Exiting with status " << rv << " " << (rv ? "(failure)" : "(success)"));
|
|
return rv;
|
|
}
|
|
|
|
// instantiate templates for linkage ----------------------------------------
|
|
|
|
template class BeesStatTmpl<uint64_t>;
|
|
template ostream & operator<<(ostream &os, const BeesStatTmpl<uint64_t> &bs);
|
|
|
|
template class BeesStatTmpl<double>;
|
|
template ostream & operator<<(ostream &os, const BeesStatTmpl<double> &bs);
|