mirror of
https://github.com/ceph/ceph
synced 2025-04-06 17:44:22 +00:00
rgw: reshard complete handling, use multiple locks
to reduce contention. Also, fix completions cleanup. Signed-off-by: Yehuda Sadeh <yehuda@redhat.com>
This commit is contained in:
parent
da1f5bc910
commit
94e3c380ab
@ -3383,7 +3383,9 @@ int RGWRados::get_max_chunk_size(const string& placement_rule, const rgw_obj& ob
|
|||||||
class RGWIndexCompletionManager;
|
class RGWIndexCompletionManager;
|
||||||
|
|
||||||
struct complete_op_data {
|
struct complete_op_data {
|
||||||
|
Mutex lock{"complete_op_data"};
|
||||||
AioCompletion *rados_completion{nullptr};
|
AioCompletion *rados_completion{nullptr};
|
||||||
|
int manager_shard_id{-1};
|
||||||
RGWIndexCompletionManager *manager{nullptr};
|
RGWIndexCompletionManager *manager{nullptr};
|
||||||
rgw_obj obj;
|
rgw_obj obj;
|
||||||
RGWModifyOp op;
|
RGWModifyOp op;
|
||||||
@ -3394,6 +3396,13 @@ struct complete_op_data {
|
|||||||
list<cls_rgw_obj_key> remove_objs;
|
list<cls_rgw_obj_key> remove_objs;
|
||||||
bool log_op;
|
bool log_op;
|
||||||
uint16_t bilog_op;
|
uint16_t bilog_op;
|
||||||
|
|
||||||
|
bool stopped{false};
|
||||||
|
|
||||||
|
void stop() {
|
||||||
|
Mutex::Locker l(lock);
|
||||||
|
stopped = true;
|
||||||
|
}
|
||||||
};
|
};
|
||||||
|
|
||||||
class RGWIndexCompletionThread : public RGWRadosThread {
|
class RGWIndexCompletionThread : public RGWRadosThread {
|
||||||
@ -3472,20 +3481,43 @@ int RGWIndexCompletionThread::process()
|
|||||||
|
|
||||||
class RGWIndexCompletionManager {
|
class RGWIndexCompletionManager {
|
||||||
RGWRados *store{nullptr};
|
RGWRados *store{nullptr};
|
||||||
Mutex lock{"RGWIndexCompletionManager::lock"};
|
vector<Mutex *> locks;
|
||||||
set<complete_op_data *> completions;
|
vector<set<complete_op_data *> > completions;
|
||||||
|
|
||||||
RGWIndexCompletionThread *completion_thread{nullptr};
|
RGWIndexCompletionThread *completion_thread{nullptr};
|
||||||
|
|
||||||
|
int num_shards;
|
||||||
|
|
||||||
|
atomic_t cur_shard;
|
||||||
|
|
||||||
|
|
||||||
public:
|
public:
|
||||||
RGWIndexCompletionManager(RGWRados *_store) : store(_store) {}
|
RGWIndexCompletionManager(RGWRados *_store) : store(_store) {
|
||||||
~RGWIndexCompletionManager() {
|
num_shards = store->ctx()->_conf->rgw_thread_pool_size;
|
||||||
stop();
|
|
||||||
|
for (int i = 0; i < num_shards; i++) {
|
||||||
|
char buf[64];
|
||||||
|
snprintf(buf, sizeof(buf), "RGWIndexCompletionManager::lock::%d", i);
|
||||||
|
locks.push_back(new Mutex(buf));
|
||||||
}
|
}
|
||||||
|
|
||||||
void create_completion(AioCompletion *rados_completion,
|
completions.resize(num_shards);
|
||||||
const rgw_obj& obj,
|
}
|
||||||
|
~RGWIndexCompletionManager() {
|
||||||
|
stop();
|
||||||
|
|
||||||
|
for (auto l : locks) {
|
||||||
|
delete l;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
int next_shard() {
|
||||||
|
int result = cur_shard.read() % num_shards;
|
||||||
|
cur_shard.inc();
|
||||||
|
return result;
|
||||||
|
}
|
||||||
|
|
||||||
|
void create_completion(const rgw_obj& obj,
|
||||||
RGWModifyOp op, string& tag,
|
RGWModifyOp op, string& tag,
|
||||||
rgw_bucket_entry_ver& ver,
|
rgw_bucket_entry_ver& ver,
|
||||||
const cls_rgw_obj_key& key,
|
const cls_rgw_obj_key& key,
|
||||||
@ -3510,17 +3542,31 @@ public:
|
|||||||
delete completion_thread;
|
delete completion_thread;
|
||||||
}
|
}
|
||||||
|
|
||||||
Mutex::Locker l(lock);
|
for (int i = 0; i < num_shards; ++i) {
|
||||||
for (auto c : completions) {
|
Mutex::Locker l(*locks[i]);
|
||||||
c->rados_completion->release();
|
for (auto c : completions[i]) {
|
||||||
delete c;
|
Mutex::Locker cl(c->lock);
|
||||||
|
c->stop();
|
||||||
|
}
|
||||||
}
|
}
|
||||||
completions.clear();
|
completions.clear();
|
||||||
}
|
}
|
||||||
};
|
};
|
||||||
|
|
||||||
void RGWIndexCompletionManager::create_completion(AioCompletion *rados_completion,
|
static void obj_complete_cb(completion_t cb, void *arg)
|
||||||
const rgw_obj& obj,
|
{
|
||||||
|
complete_op_data *completion = (complete_op_data *)arg;
|
||||||
|
completion->lock.Lock();
|
||||||
|
if (completion->stopped) {
|
||||||
|
completion->lock.Unlock(); /* can drop lock, no one else is referencing us */
|
||||||
|
delete completion;
|
||||||
|
}
|
||||||
|
((complete_op_data *)arg)->manager->handle_completion(cb, completion);
|
||||||
|
completion->lock.Unlock();
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
void RGWIndexCompletionManager::create_completion(const rgw_obj& obj,
|
||||||
RGWModifyOp op, string& tag,
|
RGWModifyOp op, string& tag,
|
||||||
rgw_bucket_entry_ver& ver,
|
rgw_bucket_entry_ver& ver,
|
||||||
const cls_rgw_obj_key& key,
|
const cls_rgw_obj_key& key,
|
||||||
@ -3531,7 +3577,9 @@ void RGWIndexCompletionManager::create_completion(AioCompletion *rados_completio
|
|||||||
{
|
{
|
||||||
complete_op_data *entry = new complete_op_data;
|
complete_op_data *entry = new complete_op_data;
|
||||||
|
|
||||||
entry->rados_completion = rados_completion;
|
int shard_id = next_shard();
|
||||||
|
|
||||||
|
entry->manager_shard_id = shard_id;
|
||||||
entry->manager = this;
|
entry->manager = this;
|
||||||
entry->obj = obj;
|
entry->obj = obj;
|
||||||
entry->op = op;
|
entry->op = op;
|
||||||
@ -3545,21 +3593,26 @@ void RGWIndexCompletionManager::create_completion(AioCompletion *rados_completio
|
|||||||
|
|
||||||
*result = entry;
|
*result = entry;
|
||||||
|
|
||||||
Mutex::Locker l(lock);
|
entry->rados_completion = librados::Rados::aio_create_completion(entry, NULL, obj_complete_cb);
|
||||||
completions.insert(entry);
|
|
||||||
|
Mutex::Locker l(*locks[shard_id]);
|
||||||
|
completions[shard_id].insert(entry);
|
||||||
}
|
}
|
||||||
|
|
||||||
void RGWIndexCompletionManager::handle_completion(completion_t cb, complete_op_data *arg)
|
void RGWIndexCompletionManager::handle_completion(completion_t cb, complete_op_data *arg)
|
||||||
{
|
{
|
||||||
|
int shard_id = arg->manager_shard_id;
|
||||||
{
|
{
|
||||||
Mutex::Locker l(lock);
|
Mutex::Locker l(*locks[shard_id]);
|
||||||
|
|
||||||
auto iter = completions.find(arg);
|
auto& comps = completions[shard_id];
|
||||||
if (iter == completions.end()) {
|
|
||||||
|
auto iter = comps.find(arg);
|
||||||
|
if (iter == comps.end()) {
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
|
|
||||||
completions.erase(iter);
|
comps.erase(iter);
|
||||||
}
|
}
|
||||||
|
|
||||||
int r = rados_aio_get_return_value(cb);
|
int r = rados_aio_get_return_value(cb);
|
||||||
@ -12420,11 +12473,6 @@ int RGWRados::cls_obj_prepare_op(BucketShard& bs, RGWModifyOp op, string& tag,
|
|||||||
return bs.index_ctx.operate(bs.bucket_obj, &o);
|
return bs.index_ctx.operate(bs.bucket_obj, &o);
|
||||||
}
|
}
|
||||||
|
|
||||||
static void obj_complete_cb(completion_t cb, void *arg)
|
|
||||||
{
|
|
||||||
((complete_op_data *)arg)->manager->handle_completion(cb, (complete_op_data *)arg);
|
|
||||||
}
|
|
||||||
|
|
||||||
int RGWRados::cls_obj_complete_op(BucketShard& bs, const rgw_obj& obj, RGWModifyOp op, string& tag,
|
int RGWRados::cls_obj_complete_op(BucketShard& bs, const rgw_obj& obj, RGWModifyOp op, string& tag,
|
||||||
int64_t pool, uint64_t epoch,
|
int64_t pool, uint64_t epoch,
|
||||||
rgw_bucket_dir_entry& ent, RGWObjCategory category,
|
rgw_bucket_dir_entry& ent, RGWObjCategory category,
|
||||||
@ -12462,11 +12510,10 @@ int RGWRados::cls_obj_complete_op(BucketShard& bs, const rgw_obj& obj, RGWModify
|
|||||||
get_zone().log_data, bilog_flags, zones_trace);
|
get_zone().log_data, bilog_flags, zones_trace);
|
||||||
|
|
||||||
complete_op_data *arg;
|
complete_op_data *arg;
|
||||||
AioCompletion *c = librados::Rados::aio_create_completion(arg, NULL, obj_complete_cb);
|
index_completion_manager->create_completion(obj, op, tag, ver, key, dir_meta, ro,
|
||||||
index_completion_manager->create_completion(c, obj, op, tag, ver, key, dir_meta, ro,
|
|
||||||
get_zone().log_data, bilog_flags, &arg);
|
get_zone().log_data, bilog_flags, &arg);
|
||||||
int ret = bs.index_ctx.aio_operate(bs.bucket_obj, c, &o);
|
int ret = bs.index_ctx.aio_operate(bs.bucket_obj, arg->rados_completion, &o);
|
||||||
c->release();
|
arg->rados_completion->release();
|
||||||
return ret;
|
return ret;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user