dragonfly/server/db_slice.cc

396 lines
9.8 KiB
C++

// Copyright 2021, Roman Gershman. All rights reserved.
// See LICENSE for licensing terms.
//
#include "server/db_slice.h"
extern "C" {
#include "redis/object.h"
}
#include <boost/fiber/fiber.hpp>
#include <boost/fiber/operations.hpp>
#include "base/logging.h"
#include "server/engine_shard_set.h"
#include "util/fiber_sched_algo.h"
#include "util/proactor_base.h"
namespace dfly {
using namespace boost;
using namespace std;
using namespace util;
#define ADD(x) (x) += o.x
DbStats& DbStats::operator+=(const DbStats& o) {
ADD(key_count);
ADD(expire_count);
ADD(bucket_count);
ADD(inline_keys);
ADD(obj_memory_usage);
ADD(table_mem_usage);
return *this;
}
SliceEvents& SliceEvents::operator+=(const SliceEvents& o) {
ADD(evicted_entries);
return *this;
}
#undef ADD
DbSlice::DbSlice(uint32_t index, EngineShard* owner) : shard_id_(index), owner_(owner) {
db_arr_.emplace_back();
CreateDb(0);
}
DbSlice::~DbSlice() {
// we do not need this code but it's easier to debug in case we encounter
// memory allocation bugs during delete operations.
for (auto& db : db_arr_) {
if (!db)
continue;
db.reset();
}
}
auto DbSlice::GetStats() const -> Stats {
Stats s;
s.events = events_;
for (const auto& db : db_arr_) {
if (!db)
continue;
s.db.key_count += db->main_table.size();
s.db.bucket_count += db->main_table.bucket_count();
s.db.expire_count += db->expire_table.size();
s.db.obj_memory_usage += db->stats.obj_memory_usage;
s.db.inline_keys += db->stats.inline_keys;
s.db.table_mem_usage += (db->main_table.mem_usage() + db->expire_table.mem_usage());
}
return s;
}
void DbSlice::Reserve(DbIndex db_ind, size_t key_size) {
ActivateDb(db_ind);
auto& db = db_arr_[db_ind];
DCHECK(db);
db->main_table.Reserve(key_size);
}
auto DbSlice::Find(DbIndex db_index, string_view key, unsigned req_obj_type) const
-> OpResult<MainIterator> {
auto it = FindExt(db_index, key).first;
if (!IsValid(it))
return OpStatus::KEY_NOTFOUND;
if (it->second.ObjType() != req_obj_type) {
return OpStatus::WRONG_TYPE;
}
return it;
}
pair<MainIterator, ExpireIterator> DbSlice::FindExt(DbIndex db_ind, string_view key) const {
DCHECK(IsDbValid(db_ind));
auto& db = db_arr_[db_ind];
MainIterator it = db->main_table.Find(key);
if (!IsValid(it)) {
return make_pair(it, ExpireIterator{});
}
if (it->second.HasExpire()) { // check expiry state
return ExpireIfNeeded(db_ind, it);
}
return make_pair(it, ExpireIterator{});
}
OpResult<pair<MainIterator, unsigned>> DbSlice::FindFirst(DbIndex db_index, const ArgSlice& args) {
DCHECK(!args.empty());
for (unsigned i = 0; i < args.size(); ++i) {
string_view s = args[i];
OpResult<MainIterator> res = Find(db_index, s, OBJ_LIST);
if (res)
return make_pair(res.value(), i);
if (res.status() != OpStatus::KEY_NOTFOUND)
return res.status();
}
VLOG(1) << "FindFirst " << args.front() << " not found";
return OpStatus::KEY_NOTFOUND;
}
auto DbSlice::AddOrFind(DbIndex db_index, string_view key) -> pair<MainIterator, bool> {
DCHECK(IsDbValid(db_index));
auto& db = db_arr_[db_index];
CompactObj co_key{key};
auto [it, inserted] = db->main_table.Insert(std::move(co_key), PrimeValue{});
if (inserted) { // new entry
db->stats.inline_keys += it->first.IsInline();
db->stats.obj_memory_usage += it->first.MallocUsed();
it.SetVersion(NextVersion());
return make_pair(it, true);
}
auto& existing = it;
DCHECK(IsValid(existing));
if (existing->second.HasExpire()) {
auto expire_it = db->expire_table.Find(existing->first);
CHECK(IsValid(expire_it));
if (expire_it->second <= now_ms_) {
db->expire_table.Erase(expire_it);
// Keep the entry but reset the object.
db->stats.obj_memory_usage -= existing->second.MallocUsed();
existing->second.Reset();
return make_pair(existing, true);
}
}
return make_pair(existing, false);
}
void DbSlice::ActivateDb(DbIndex db_ind) {
if (db_arr_.size() <= db_ind)
db_arr_.resize(db_ind + 1);
CreateDb(db_ind);
}
void DbSlice::CreateDb(DbIndex index) {
auto& db = db_arr_[index];
if (!db) {
db.reset(new DbWrapper);
}
}
bool DbSlice::Del(DbIndex db_ind, MainIterator it) {
auto& db = db_arr_[db_ind];
if (!IsValid(it)) {
return false;
}
if (it->second.HasExpire()) {
CHECK_EQ(1u, db->expire_table.Erase(it->first));
}
db->stats.inline_keys -= it->first.IsInline();
db->stats.obj_memory_usage -= (it->first.MallocUsed() + it->second.MallocUsed());
db->main_table.Erase(it);
return true;
}
size_t DbSlice::FlushDb(DbIndex db_ind) {
auto flush_single = [this](DbIndex id) {
auto& db = db_arr_[id];
CHECK(db);
size_t removed = db->main_table.size();
db->main_table.Clear();
db->expire_table.Clear();
db->stats.inline_keys = 0;
db->stats.obj_memory_usage = 0;
return removed;
};
if (db_ind != kDbAll) {
CHECK_LT(db_ind, db_arr_.size());
return flush_single(db_ind);
}
size_t removed = 0;
for (size_t i = 0; i < db_arr_.size(); ++i) {
if (db_arr_[i]) {
removed += flush_single(i);
}
}
return removed;
}
// Returns true if a state has changed, false otherwise.
bool DbSlice::Expire(DbIndex db_ind, MainIterator it, uint64_t at) {
auto& db = db_arr_[db_ind];
if (at == 0 && it->second.HasExpire()) {
CHECK_EQ(1u, db->expire_table.Erase(it->first));
it->second.SetExpire(false);
return true;
}
if (!it->second.HasExpire() && at) {
CHECK(db->expire_table.Insert(it->first.AsRef(), at).second);
it->second.SetExpire(true);
return true;
}
return false;
}
void DbSlice::AddNew(DbIndex db_ind, string_view key, PrimeValue obj, uint64_t expire_at_ms) {
CHECK(AddIfNotExist(db_ind, key, std::move(obj), expire_at_ms));
}
bool DbSlice::AddIfNotExist(DbIndex db_ind, string_view key, PrimeValue obj,
uint64_t expire_at_ms) {
DCHECK(!obj.IsRef());
auto& db = db_arr_[db_ind];
CompactObj co_key{key};
auto [new_entry, success] = db->main_table.Insert(std::move(co_key), std::move(obj));
if (!success)
return false; // in this case obj won't be moved and will be destroyed during unwinding.
new_entry.SetVersion(NextVersion());
db->stats.inline_keys += new_entry->first.IsInline();
db->stats.obj_memory_usage += (new_entry->first.MallocUsed() + new_entry->second.MallocUsed());
if (expire_at_ms) {
new_entry->second.SetExpire(true);
CHECK(db->expire_table.Insert(new_entry->first.AsRef(), expire_at_ms).second);
}
return true;
}
size_t DbSlice::DbSize(DbIndex db_ind) const {
DCHECK_LT(db_ind, db_array_size());
if (IsDbValid(db_ind)) {
return db_arr_[db_ind]->main_table.size();
}
return 0;
}
bool DbSlice::Acquire(IntentLock::Mode mode, const KeyLockArgs& lock_args) {
DCHECK(!lock_args.args.empty());
auto& lt = db_arr_[lock_args.db_index]->lock_table;
bool lock_acquired = true;
if (lock_args.args.size() == 1) {
lock_acquired = lt[lock_args.args.front()].Acquire(mode);
} else {
uniq_keys_.clear();
for (size_t i = 0; i < lock_args.args.size(); i += lock_args.key_step) {
auto s = lock_args.args[i];
if (uniq_keys_.insert(s).second) {
bool res = lt[s].Acquire(mode);
lock_acquired &= res;
}
}
}
DVLOG(2) << "Acquire " << IntentLock::ModeName(mode) << " for " << lock_args.args[0]
<< " has_acquired: " << lock_acquired;
return lock_acquired;
}
void DbSlice::Release(IntentLock::Mode mode, const KeyLockArgs& lock_args) {
if (lock_args.args.size() == 1) {
Release(mode, lock_args.db_index, lock_args.args.front(), 1);
} else {
auto& lt = db_arr_[lock_args.db_index]->lock_table;
uniq_keys_.clear();
for (size_t i = 0; i < lock_args.args.size(); i += lock_args.key_step) {
auto s = lock_args.args[i];
if (uniq_keys_.insert(s).second) {
auto it = lt.find(s);
CHECK(it != lt.end());
it->second.Release(mode);
if (it->second.IsFree()) {
lt.erase(it);
}
}
}
DVLOG(1) << "Release " << IntentLock::ModeName(mode) << " for " << lock_args.args[0];
}
}
void DbSlice::Release(IntentLock::Mode mode, DbIndex db_index, string_view key, unsigned count) {
DVLOG(1) << "Release " << IntentLock::ModeName(mode) << " " << count << " for " << key;
auto& lt = db_arr_[db_index]->lock_table;
auto it = lt.find(key);
CHECK(it != lt.end()) << key;
it->second.Release(mode, count);
if (it->second.IsFree()) {
lt.erase(it);
}
}
bool DbSlice::CheckLock(IntentLock::Mode mode, const KeyLockArgs& lock_args) const {
DCHECK(!lock_args.args.empty());
const auto& lt = db_arr_[lock_args.db_index]->lock_table;
for (size_t i = 0; i < lock_args.args.size(); i += lock_args.key_step) {
auto s = lock_args.args[i];
auto it = lt.find(s);
if (it != lt.end() && !it->second.Check(mode)) {
return false;
}
}
return true;
}
void DbSlice::PreUpdate(DbIndex db_ind, MainIterator it) {
auto& db = db_arr_[db_ind];
db->stats.obj_memory_usage -= it->second.MallocUsed();
it.SetVersion(NextVersion());
}
void DbSlice::PostUpdate(DbIndex db_ind, MainIterator it) {
auto& db = db_arr_[db_ind];
db->stats.obj_memory_usage += it->second.MallocUsed();
}
pair<MainIterator, ExpireIterator> DbSlice::ExpireIfNeeded(DbIndex db_ind, MainIterator it) const {
DCHECK(it->second.HasExpire());
auto& db = db_arr_[db_ind];
auto expire_it = db->expire_table.Find(it->first);
CHECK(IsValid(expire_it));
if (expire_it->second > now_ms_)
return make_pair(it, expire_it);
db->expire_table.Erase(expire_it);
db->stats.inline_keys -= it->first.IsInline();
db->stats.obj_memory_usage -= (it->first.MallocUsed() + it->second.MallocUsed());
db->main_table.Erase(it);
return make_pair(MainIterator{}, ExpireIterator{});
}
} // namespace dfly