Add a new KV wrapper GenericObjectMap

Now we already have DBObjectMap which implement ObjectMap and other
interfaces, and ObjectMap.h implied that ObjectMap is used to encapsulates
the FileStore key value store. There exists limitation in current DBObjectMap
implementation, such as lacking of "coll_t" in "key", complicated prefix
hard-coded and inflexible extending.

So in order to provide a more flexible API and clear implementation to wrap KV
store, I copy the origin DBObjectMap and redesign the partial implementation.
Adding "coll_t" argument to all API and export "prefix" to callers. Prefixes
are divided into two parts "INTERN" and "USER". "INTERN" keys used by self to
manage and "USER" keys are managed by callers. Besides above, misc fixes are
imported such as more clear member function name and extendible header
structure.

Signed-off-by: Haomai Wang <haomaiwang@gmail.com>
This commit is contained in:
Haomai Wang 2014-01-29 17:46:00 +08:00
parent 2a737d841e
commit 8fb366f089
3 changed files with 1581 additions and 0 deletions

View File

@ -79,6 +79,7 @@ SUBSYS(osd, 0, 5)
SUBSYS(optracker, 0, 5)
SUBSYS(objclass, 0, 5)
SUBSYS(filestore, 1, 3)
SUBSYS(keyvaluestore, 1, 3)
SUBSYS(journal, 1, 3)
SUBSYS(ms, 0, 5)
SUBSYS(mon, 1, 5)

1112
src/os/GenericObjectMap.cc Normal file

File diff suppressed because it is too large Load Diff

468
src/os/GenericObjectMap.h Normal file
View File

@ -0,0 +1,468 @@
// -*- mode:C++; tab-width:8; c-basic-offset:2; indent-tabs-mode:t -*-
// vim: ts=8 sw=2 smarttab
/*
* Ceph - scalable distributed file system
*
* Copyright (C) 2013 UnitedStack <haomai@unitedstack.com>
*
* Author: Haomai Wang <haomaiwang@gmail.com>
*
* This is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License version 2.1, as published by the Free Software
* Foundation. See file COPYING.
*
*/
#ifndef CEPH_GENERICOBJECTMAP_H
#define CEPH_GENERICOBJECTMAP_H
#include "include/buffer.h"
#include <set>
#include <map>
#include <string>
#include <vector>
#include <boost/scoped_ptr.hpp>
#include "include/memory.h"
#include "ObjectMap.h"
#include "KeyValueDB.h"
#include "osd/osd_types.h"
#include "common/Mutex.h"
#include "common/Cond.h"
/**
* Genericobjectmap: Provide with key/value associated to ghobject_t APIs to caller
* and avoid concerning too much. Wrap and combine KeyValueDB/ObjectMap APIs
* with ghobject_t and adding clone capacity.
*
* Prefix space structure:
*
* - GHOBJECT_TO_SEQ: Contains leaf mapping from ghobject_t->Header(including
* hobj.seq and related metadata)
* - INTERN_PREFIX: GLOBAL_STATE_KEY - contains the global state
* @see State
* @see write_state
* @see init
* @see generate_new_header
* - INTERN_PREFIX + header_key(header->seq) + COMPLETE_PREFIX: see below
* - INTERN_PREFIX + header_key(header->seq) + PARENT_KEY
* : used to store parent header(same as headers in GHOBJECT_TO_SEQ)
* - USER_PREFIX + header_key(header->seq) + [CUSTOM_PREFIX]
* : key->value which set by callers
*
* For each node (represented by a header), we
* store three mappings: the key mapping, the complete mapping, and the parent.
* The complete mapping (COMPLETE_PREFIX space) is key->key. Each x->y entry in
* this mapping indicates that the key mapping contains all entries on [x,y).
* Note, max string is represented by "", so ""->"" indicates that the parent
* is unnecessary (@see rm_keys). When looking up a key not contained in the
* the complete set, we have to check the parent if we don't find it in the
* key set. During rm_keys, we copy keys from the parent and update the
* complete set to reflect the change @see rm_keys.
*/
// This class only provide basic read capacity, suggest inherit it to
// implement write transaction to use it. @see StripObjectMap
class GenericObjectMap {
public:
boost::scoped_ptr<KeyValueDB> db;
/**
* Serializes access to next_seq as well as the in_use set
*/
Mutex header_lock;
Cond header_cond;
Cond map_header_cond;
/**
* Set of headers currently in use
*/
set<uint64_t> in_use;
set<ghobject_t> map_header_in_use;
GenericObjectMap(KeyValueDB *db) : db(db), header_lock("GenericObjectMap") {}
int get(
const coll_t &cid,
const ghobject_t &oid,
const string &prefix,
map<string, bufferlist> *out
);
int get_keys(
const coll_t &cid,
const ghobject_t &oid,
const string &prefix,
set<string> *keys
);
int get_values(
const coll_t &cid,
const ghobject_t &oid,
const string &prefix,
const set<string> &keys,
map<string, bufferlist> *out
);
int check_keys(
const coll_t &cid,
const ghobject_t &oid,
const string &prefix,
const set<string> &keys,
set<string> *out
);
/// Read initial state from backing store
int init(bool upgrade = false);
/// Upgrade store to current version
int upgrade() {return 0;}
/// Consistency check, debug, there must be no parallel writes
bool check(std::ostream &out);
/// Util, list all objects, there must be no other concurrent access
int list_objects(const coll_t &cid, ghobject_t start, int max,
vector<ghobject_t> *objs, ///< [out] objects
ghobject_t *next);
ObjectMap::ObjectMapIterator get_iterator(const coll_t &cid,
const ghobject_t &oid,
const string &prefix);
KeyValueDB::Transaction get_transaction() { return db->get_transaction(); }
int submit_transaction(KeyValueDB::Transaction t) {
return db->submit_transaction(t);
}
/// persistent state for store @see generate_header
struct State {
__u8 v;
uint64_t seq;
State() : v(0), seq(1) {}
State(uint64_t seq) : v(0), seq(seq) {}
void encode(bufferlist &bl) const {
ENCODE_START(1, 1, bl);
::encode(v, bl);
::encode(seq, bl);
ENCODE_FINISH(bl);
}
void decode(bufferlist::iterator &bl) {
DECODE_START(1, bl);
::decode(v, bl);
::decode(seq, bl);
DECODE_FINISH(bl);
}
void dump(Formatter *f) const {
f->dump_unsigned("seq", seq);
}
static void generate_test_instances(list<State*> &o) {
o.push_back(new State(0));
o.push_back(new State(20));
}
} state;
struct _Header {
uint64_t seq;
uint64_t parent;
uint64_t num_children;
coll_t cid;
ghobject_t oid;
// Used by successor
bufferlist data;
void encode(bufferlist &bl) const {
ENCODE_START(1, 1, bl);
::encode(seq, bl);
::encode(parent, bl);
::encode(num_children, bl);
::encode(cid, bl);
::encode(oid, bl);
::encode(data, bl);
ENCODE_FINISH(bl);
}
void decode(bufferlist::iterator &bl) {
DECODE_START(1, bl);
::decode(seq, bl);
::decode(parent, bl);
::decode(num_children, bl);
::decode(cid, bl);
::decode(oid, bl);
::decode(data, bl);
DECODE_FINISH(bl);
}
void dump(Formatter *f) const {
f->dump_unsigned("seq", seq);
f->dump_unsigned("parent", parent);
f->dump_unsigned("num_children", num_children);
f->dump_stream("coll") << cid;
f->dump_stream("oid") << oid;
}
_Header() : seq(0), parent(0), num_children(1) {}
};
typedef ceph::shared_ptr<_Header> Header;
Header lookup_header(const coll_t &cid, const ghobject_t &oid) {
Mutex::Locker l(header_lock);
return _lookup_header(cid, oid);
}
/// Lookup or create header for c oid
Header lookup_create_header(const coll_t &cid, const ghobject_t &oid,
KeyValueDB::Transaction t);
/// Set leaf node for c and oid to the value of header
void set_header(const coll_t &cid, const ghobject_t &oid, _Header header,
KeyValueDB::Transaction t);
// Move all modify member function to "protect", in order to indicate these
// should be made use of by sub-class
void set_keys(
const Header header,
const string &prefix,
const map<string, bufferlist> &set,
KeyValueDB::Transaction t
);
int clear(
const Header header,
KeyValueDB::Transaction t
);
int rm_keys(
const Header header,
const string &prefix,
const set<string> &to_clear,
KeyValueDB::Transaction t
);
void clone(
const Header origin_header,
const coll_t &cid,
const ghobject_t &target,
KeyValueDB::Transaction t,
Header *old_header,
Header *new_header
);
void rename(
const Header header,
const coll_t &cid,
const ghobject_t &target,
KeyValueDB::Transaction t
);
/// Ensure that all previous operations are durable
int sync(const Header header, KeyValueDB::Transaction t);
static const string GLOBAL_STATE_KEY;
static const string PARENT_KEY;
static const string USER_PREFIX;
static const string INTERN_PREFIX;
static const string PARENT_PREFIX;
static const string COMPLETE_PREFIX;
static const string GHOBJECT_TO_SEQ_PREFIX;
static const string GHOBJECT_KEY_SEP_S;
static const char GHOBJECT_KEY_SEP_C;
private:
/// Implicit lock on Header->seq
static string header_key(const coll_t &cid);
static string header_key(const coll_t &cid, const ghobject_t &oid);
static bool parse_header_key(const string &in, coll_t *c, ghobject_t *oid);
string seq_key(uint64_t seq) {
char buf[100];
snprintf(buf, sizeof(buf), "%.*" PRId64, (int)(2*sizeof(seq)), seq);
return string(buf);
}
string user_prefix(Header header, const string &prefix);
string complete_prefix(Header header);
string parent_seq_prefix(uint64_t seq);
class EmptyIteratorImpl : public ObjectMap::ObjectMapIteratorImpl {
public:
int seek_to_first() { return 0; }
int seek_to_last() { return 0; }
int upper_bound(const string &after) { return 0; }
int lower_bound(const string &to) { return 0; }
bool valid() { return false; }
int next() { assert(0); return 0; }
string key() { assert(0); return ""; }
bufferlist value() { assert(0); return bufferlist(); }
int status() { return 0; }
};
/// Iterator
class GenericObjectMapIteratorImpl : public ObjectMap::ObjectMapIteratorImpl {
public:
GenericObjectMap *map;
/// NOTE: implicit lock on header->seq AND for all ancestors
Header header;
/// parent_iter == NULL iff no parent
ceph::shared_ptr<GenericObjectMapIteratorImpl> parent_iter;
KeyValueDB::Iterator key_iter;
KeyValueDB::Iterator complete_iter;
/// cur_iter points to currently valid iterator
ceph::shared_ptr<ObjectMap::ObjectMapIteratorImpl> cur_iter;
int r;
/// init() called, key_iter, complete_iter, parent_iter filled in
bool ready;
/// past end
bool invalid;
string prefix;
GenericObjectMapIteratorImpl(GenericObjectMap *map, Header header,
const string &_prefix) : map(map), header(header), r(0), ready(false),
invalid(true), prefix(_prefix) { }
int seek_to_first();
int seek_to_last();
int upper_bound(const string &after);
int lower_bound(const string &to);
bool valid();
int next();
string key();
bufferlist value();
int status();
bool on_parent() {
return cur_iter == parent_iter;
}
/// skips to next valid parent entry
int next_parent();
/// Tests whether to_test is in complete region
int in_complete_region(const string &to_test, ///[in] key to test
string *begin, ///[out] beginning of region
string *end ///[out] end of region
); ///< @returns true if to_test is in the complete region, else false
private:
int init();
bool valid_parent();
int adjust();
};
typedef ceph::shared_ptr<GenericObjectMapIteratorImpl> GenericObjectMapIterator;
GenericObjectMapIterator _get_iterator(Header header, string prefix) {
return GenericObjectMapIterator(new GenericObjectMapIteratorImpl(this, header, prefix));
}
/// Removes node corresponding to header
void clear_header(Header header, KeyValueDB::Transaction t);
/// Set node containing input to new contents
void set_parent_header(Header input, KeyValueDB::Transaction t);
/// Remove leaf node corresponding to oid in c
void remove_header(const coll_t &cid, const ghobject_t &oid, Header header,
KeyValueDB::Transaction t);
/**
* Generate new header for c oid with new seq number
*
* Has the side effect of syncronously saving the new GenericObjectMap state
*/
Header _generate_new_header(const coll_t &cid, const ghobject_t &oid,
Header parent, KeyValueDB::Transaction t);
Header generate_new_header(const coll_t &cid, const ghobject_t &oid,
Header parent, KeyValueDB::Transaction t) {
Mutex::Locker l(header_lock);
return _generate_new_header(cid, oid, parent, t);
}
// Lookup leaf header for c oid
Header _lookup_header(const coll_t &cid, const ghobject_t &oid);
// Lookup header node for input
Header lookup_parent(Header input);
// Scan keys in header into out_keys and out_values (if nonnull)
int scan(Header header, const string &prefix, const set<string> &in_keys,
set<string> *out_keys, map<string, bufferlist> *out_values);
// Remove header and all related prefixes
int _clear(Header header, KeyValueDB::Transaction t);
// Adds to t operations necessary to add new_complete to the complete set
int merge_new_complete(Header header, const map<string, string> &new_complete,
GenericObjectMapIterator iter, KeyValueDB::Transaction t);
// Writes out State (mainly next_seq)
int write_state(KeyValueDB::Transaction _t);
// 0 if the complete set now contains all of key space, < 0 on error, 1 else
int need_parent(GenericObjectMapIterator iter);
// Copies header entry from parent @see rm_keys
int copy_up_header(Header header, KeyValueDB::Transaction t);
// Sets header @see set_header
void _set_header(Header header, const bufferlist &bl,
KeyValueDB::Transaction t);
/**
* Removes map header lock once Header is out of scope
* @see lookup_header
*/
class RemoveMapHeaderOnDelete {
public:
GenericObjectMap *db;
coll_t cid;
ghobject_t oid;
RemoveMapHeaderOnDelete(GenericObjectMap *db, const coll_t &cid,
const ghobject_t &oid) :
db(db), cid(cid), oid(oid) {}
void operator() (_Header *header) {
Mutex::Locker l(db->header_lock);
db->map_header_in_use.erase(oid);
db->map_header_cond.Signal();
delete header;
}
};
/**
* Removes header seq lock once Header is out of scope
* @see lookup_parent
* @see generate_new_header
*/
class RemoveOnDelete {
public:
GenericObjectMap *db;
RemoveOnDelete(GenericObjectMap *db) :
db(db) {}
void operator() (_Header *header) {
Mutex::Locker l(db->header_lock);
db->in_use.erase(header->seq);
db->header_cond.Signal();
delete header;
}
};
friend class RemoveOnDelete;
};
WRITE_CLASS_ENCODER(GenericObjectMap::_Header)
WRITE_CLASS_ENCODER(GenericObjectMap::State)
#endif