mirror of
https://github.com/ceph/ceph
synced 2025-01-27 13:34:31 +00:00
07ac5d3e74
git-svn-id: https://ceph.svn.sf.net/svnroot/ceph@1068 29311d96-e01e-0410-9327-a35deaab8ce9
758 lines
20 KiB
C++
758 lines
20 KiB
C++
// -*- mode:C++; tab-width:8; c-basic-offset:2; indent-tabs-mode:t -*-
|
|
/*
|
|
* Ceph - scalable distributed file system
|
|
*
|
|
* Copyright (C) 2004-2006 Sage Weil <sage@newdream.net>
|
|
*
|
|
* This is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
* License version 2.1, as published by the Free Software
|
|
* Foundation. See file COPYING.
|
|
*
|
|
*/
|
|
|
|
|
|
|
|
#ifndef __CINODE_H
|
|
#define __CINODE_H
|
|
|
|
#include "config.h"
|
|
#include "include/types.h"
|
|
#include "include/lru.h"
|
|
|
|
#include "CDentry.h"
|
|
#include "Lock.h"
|
|
#include "Capability.h"
|
|
|
|
#include "mdstypes.h"
|
|
|
|
#include <cassert>
|
|
#include <list>
|
|
#include <vector>
|
|
#include <set>
|
|
#include <map>
|
|
#include <iostream>
|
|
using namespace std;
|
|
|
|
|
|
|
|
|
|
|
|
// pins for keeping an item in cache (and debugging)
|
|
#define CINODE_PIN_DIR 0
|
|
#define CINODE_PIN_CACHED 1
|
|
#define CINODE_PIN_DIRTY 2 // must flush
|
|
#define CINODE_PIN_PROXY 3 // can't expire yet
|
|
#define CINODE_PIN_WAITER 4 // waiter
|
|
|
|
#define CINODE_PIN_CAPS 5 // local fh's
|
|
|
|
#define CINODE_PIN_DNDIRTY 7 // dentry is dirty
|
|
|
|
#define CINODE_PIN_AUTHPIN 8
|
|
#define CINODE_PIN_IMPORTING 9 // multipurpose, for importing
|
|
#define CINODE_PIN_REQUEST 10 // request is logging, finishing
|
|
#define CINODE_PIN_RENAMESRC 11 // pinned on dest for foreign rename
|
|
#define CINODE_PIN_ANCHORING 12
|
|
|
|
#define CINODE_PIN_OPENINGDIR 13
|
|
|
|
#define CINODE_PIN_DENTRYLOCK 14
|
|
|
|
#define CINODE_NUM_PINS 15
|
|
|
|
static char *cinode_pin_names[CINODE_NUM_PINS] = {
|
|
"dir",
|
|
"cached",
|
|
"dirty",
|
|
"proxy",
|
|
"waiter",
|
|
"caps",
|
|
"--",
|
|
"dndirty",
|
|
"authpin",
|
|
"imping",
|
|
"request",
|
|
"rensrc",
|
|
"anching",
|
|
"opdir",
|
|
"dnlock"
|
|
};
|
|
|
|
|
|
|
|
|
|
|
|
|
|
// wait reasons
|
|
#define CINODE_WAIT_AUTHPINNABLE CDIR_WAIT_UNFREEZE
|
|
// waiters: write_hard_start, read_file_start, write_file_start (mdcache)
|
|
// handle_client_chmod, handle_client_touch (mds)
|
|
// trigger: (see CDIR_WAIT_UNFREEZE)
|
|
#define CINODE_WAIT_GETREPLICA (1<<11) // update/replicate individual inode
|
|
// waiters: import_dentry_inode
|
|
// trigger: handle_inode_replicate_ack
|
|
|
|
#define CINODE_WAIT_DIR (1<<13)
|
|
// waiters: traverse_path
|
|
// triggers: handle_disocver_reply
|
|
|
|
#define CINODE_WAIT_LINK (1<<14) // as in remotely nlink++
|
|
#define CINODE_WAIT_ANCHORED (1<<15)
|
|
#define CINODE_WAIT_UNLINK (1<<16) // as in remotely nlink--
|
|
|
|
#define CINODE_WAIT_HARDR (1<<17) // 131072
|
|
#define CINODE_WAIT_HARDW (1<<18) // 262...
|
|
#define CINODE_WAIT_HARDB (1<<19)
|
|
#define CINODE_WAIT_HARDRWB (CINODE_WAIT_HARDR|CINODE_WAIT_HARDW|CINODE_WAIT_HARDB)
|
|
#define CINODE_WAIT_HARDSTABLE (1<<20)
|
|
#define CINODE_WAIT_HARDNORD (1<<21)
|
|
#define CINODE_WAIT_FILER (1<<22)
|
|
#define CINODE_WAIT_FILEW (1<<23)
|
|
#define CINODE_WAIT_FILEB (1<<24)
|
|
#define CINODE_WAIT_FILERWB (CINODE_WAIT_FILER|CINODE_WAIT_FILEW|CINODE_WAIT_FILEB)
|
|
#define CINODE_WAIT_FILESTABLE (1<<25)
|
|
#define CINODE_WAIT_FILENORD (1<<26)
|
|
#define CINODE_WAIT_FILENOWR (1<<27)
|
|
|
|
#define CINODE_WAIT_RENAMEACK (1<<28)
|
|
#define CINODE_WAIT_RENAMENOTIFYACK (1<<29)
|
|
|
|
#define CINODE_WAIT_CAPS (1<<30)
|
|
|
|
|
|
|
|
|
|
#define CINODE_WAIT_ANY 0xffffffff
|
|
|
|
|
|
// state
|
|
#define CINODE_STATE_AUTH (1<<0)
|
|
#define CINODE_STATE_ROOT (1<<1)
|
|
|
|
#define CINODE_STATE_DIRTY (1<<2)
|
|
#define CINODE_STATE_UNSAFE (1<<3) // not logged yet
|
|
#define CINODE_STATE_DANGLING (1<<4) // delete me when i expire; i have no dentry
|
|
#define CINODE_STATE_UNLINKING (1<<5)
|
|
#define CINODE_STATE_PROXY (1<<6) // can't expire yet
|
|
#define CINODE_STATE_EXPORTING (1<<7) // on nonauth bystander.
|
|
|
|
#define CINODE_STATE_ANCHORING (1<<8)
|
|
|
|
#define CINODE_STATE_OPENINGDIR (1<<9)
|
|
|
|
//#define CINODE_STATE_RENAMING (1<<8) // moving me
|
|
//#define CINODE_STATE_RENAMINGTO (1<<9) // rename target (will be unlinked)
|
|
|
|
|
|
// misc
|
|
#define CINODE_EXPORT_NONCE 1 // nonce given to replicas created by export
|
|
#define CINODE_HASHREPLICA_NONCE 1 // hashed inodes that are duped ???FIXME???
|
|
|
|
class Context;
|
|
class CDentry;
|
|
class CDir;
|
|
class MDS;
|
|
class Message;
|
|
class CInode;
|
|
class CInodeDiscover;
|
|
class MDCache;
|
|
|
|
//class MInodeSyncStart;
|
|
|
|
ostream& operator<<(ostream& out, CInode& in);
|
|
|
|
|
|
extern int cinode_pins[CINODE_NUM_PINS]; // counts
|
|
|
|
|
|
// cached inode wrapper
|
|
class CInode : public LRUObject {
|
|
public:
|
|
MDCache *mdcache;
|
|
|
|
inode_t inode; // the inode itself
|
|
|
|
CDir *dir; // directory, if we have it opened.
|
|
string symlink; // symlink dest, if symlink
|
|
|
|
// inode metadata locks
|
|
CLock hardlock;
|
|
CLock filelock;
|
|
|
|
protected:
|
|
int ref; // reference count
|
|
set<int> ref_set;
|
|
version_t parent_dir_version; // parent dir version when i was last touched.
|
|
version_t committing_version;
|
|
version_t committed_version;
|
|
|
|
unsigned state;
|
|
|
|
// parent dentries in cache
|
|
CDentry *parent; // primary link
|
|
set<CDentry*> remote_parents; // if hard linked
|
|
|
|
// -- distributed caching
|
|
set<int> cached_by; // [auth] mds's that cache me.
|
|
/* NOTE: on replicas, this doubles as replicated_by, but the
|
|
cached_by_* access methods below should NOT be used in those
|
|
cases, as the semantics are different! */
|
|
map<int,int> cached_by_nonce; // [auth] nonce issued to each replica
|
|
int replica_nonce; // [replica] defined on replica
|
|
|
|
int dangling_auth; // explicit auth, when dangling.
|
|
|
|
int num_request_pins;
|
|
|
|
// waiters
|
|
multimap<int, Context*> waiting;
|
|
|
|
// file capabilities
|
|
map<int, Capability> client_caps; // client -> caps
|
|
|
|
map<int, int> mds_caps_wanted; // [auth] mds -> caps wanted
|
|
int replica_caps_wanted; // [replica] what i've requested from auth
|
|
utime_t replica_caps_wanted_keep_until;
|
|
|
|
|
|
private:
|
|
// lock nesting
|
|
int auth_pins;
|
|
int nested_auth_pins;
|
|
|
|
public:
|
|
meta_load_t popularity[MDS_NPOP];
|
|
|
|
// friends
|
|
friend class Server;
|
|
friend class Locker;
|
|
friend class Migrator;
|
|
friend class MDCache;
|
|
friend class CDir;
|
|
friend class CInodeExport;
|
|
friend class CInodeDiscover;
|
|
|
|
public:
|
|
// ---------------------------
|
|
CInode(MDCache *c, bool auth=true);
|
|
~CInode();
|
|
|
|
|
|
// -- accessors --
|
|
bool is_file() { return ((inode.mode & INODE_TYPE_MASK) == INODE_MODE_FILE) ? true:false; }
|
|
bool is_symlink() { return ((inode.mode & INODE_TYPE_MASK) == INODE_MODE_SYMLINK) ? true:false; }
|
|
bool is_dir() { return ((inode.mode & INODE_TYPE_MASK) == INODE_MODE_DIR) ? true:false; }
|
|
|
|
bool is_anchored() { return inode.anchored; }
|
|
|
|
bool is_root() { return state & CINODE_STATE_ROOT; }
|
|
bool is_proxy() { return state & CINODE_STATE_PROXY; }
|
|
|
|
bool is_auth() { return state & CINODE_STATE_AUTH; }
|
|
void set_auth(bool auth);
|
|
bool is_replica() { return !is_auth(); }
|
|
int get_replica_nonce() { assert(!is_auth()); return replica_nonce; }
|
|
|
|
inodeno_t ino() { return inode.ino; }
|
|
inode_t& get_inode() { return inode; }
|
|
CDentry* get_parent_dn() { return parent; }
|
|
CDir *get_parent_dir();
|
|
CInode *get_parent_inode();
|
|
CInode *get_realm_root(); // import, hash, or root
|
|
|
|
CDir *get_or_open_dir(MDS *mds);
|
|
CDir *set_dir(CDir *newdir);
|
|
|
|
bool dir_is_auth();
|
|
|
|
|
|
|
|
// -- misc --
|
|
void make_path(string& s);
|
|
void make_anchor_trace(vector<class Anchor*>& trace);
|
|
|
|
|
|
|
|
// -- state --
|
|
unsigned get_state() { return state; }
|
|
void state_clear(unsigned mask) { state &= ~mask; }
|
|
void state_set(unsigned mask) { state |= mask; }
|
|
unsigned state_test(unsigned mask) { return state & mask; }
|
|
|
|
bool is_unsafe() { return state & CINODE_STATE_UNSAFE; }
|
|
bool is_dangling() { return state & CINODE_STATE_DANGLING; }
|
|
bool is_unlinking() { return state & CINODE_STATE_UNLINKING; }
|
|
|
|
void mark_unsafe() { state |= CINODE_STATE_UNSAFE; }
|
|
void mark_safe() { state &= ~CINODE_STATE_UNSAFE; }
|
|
|
|
// -- state encoding --
|
|
//void encode_basic_state(bufferlist& r);
|
|
//void decode_basic_state(bufferlist& r, int& off);
|
|
|
|
|
|
void encode_file_state(bufferlist& r);
|
|
void decode_file_state(bufferlist& r, int& off);
|
|
|
|
void encode_hard_state(bufferlist& r);
|
|
void decode_hard_state(bufferlist& r, int& off);
|
|
|
|
|
|
// -- dirtyness --
|
|
version_t get_version() { return inode.version; }
|
|
version_t get_parent_dir_version() { return parent_dir_version; }
|
|
void float_parent_dir_version(version_t ge) {
|
|
if (parent_dir_version < ge)
|
|
parent_dir_version = ge;
|
|
}
|
|
version_t get_committing_version() { return committing_version; }
|
|
version_t get_last_committed_version() { return committed_version; }
|
|
void set_committing_version(version_t v) { committing_version = v; }
|
|
void set_committed_version() {
|
|
committed_version = committing_version;
|
|
committing_version = 0;
|
|
}
|
|
|
|
bool is_dirty() { return state & CINODE_STATE_DIRTY; }
|
|
bool is_clean() { return !is_dirty(); }
|
|
|
|
void mark_dirty();
|
|
void mark_clean();
|
|
|
|
|
|
|
|
// -- cached_by -- to be used ONLY when we're authoritative or cacheproxy
|
|
bool is_cached_by_anyone() { return !cached_by.empty(); }
|
|
bool is_cached_by(int mds) { return cached_by.count(mds); }
|
|
int num_cached_by() { return cached_by.size(); }
|
|
// cached_by_add returns a nonce
|
|
int cached_by_add(int mds) {
|
|
int nonce = 1;
|
|
if (is_cached_by(mds)) { // already had it?
|
|
nonce = get_cached_by_nonce(mds) + 1; // new nonce (+1)
|
|
dout(10) << *this << " issuing new nonce " << nonce << " to mds" << mds << endl;
|
|
cached_by_nonce.erase(mds);
|
|
} else {
|
|
if (cached_by.empty())
|
|
get(CINODE_PIN_CACHED);
|
|
cached_by.insert(mds);
|
|
}
|
|
cached_by_nonce.insert(pair<int,int>(mds,nonce)); // first! serial of 1.
|
|
return nonce; // default nonce
|
|
}
|
|
void cached_by_add(int mds, int nonce) {
|
|
if (cached_by.empty())
|
|
get(CINODE_PIN_CACHED);
|
|
cached_by.insert(mds);
|
|
cached_by_nonce.insert(pair<int,int>(mds,nonce));
|
|
}
|
|
int get_cached_by_nonce(int mds) {
|
|
map<int,int>::iterator it = cached_by_nonce.find(mds);
|
|
return it->second;
|
|
}
|
|
void cached_by_remove(int mds) {
|
|
//if (!is_cached_by(mds)) return;
|
|
assert(is_cached_by(mds));
|
|
|
|
cached_by.erase(mds);
|
|
cached_by_nonce.erase(mds);
|
|
if (cached_by.empty())
|
|
put(CINODE_PIN_CACHED);
|
|
}
|
|
void cached_by_clear() {
|
|
if (cached_by.size())
|
|
put(CINODE_PIN_CACHED);
|
|
cached_by.clear();
|
|
cached_by_nonce.clear();
|
|
}
|
|
set<int>::iterator cached_by_begin() { return cached_by.begin(); }
|
|
set<int>::iterator cached_by_end() { return cached_by.end(); }
|
|
set<int>& get_cached_by() { return cached_by; }
|
|
|
|
CInodeDiscover* replicate_to(int rep);
|
|
|
|
|
|
// -- waiting --
|
|
bool waiting_for(int tag);
|
|
void add_waiter(int tag, Context *c);
|
|
void take_waiting(int tag, list<Context*>& ls);
|
|
void finish_waiting(int mask, int result = 0);
|
|
|
|
|
|
// -- caps -- (new)
|
|
// client caps
|
|
map<int,Capability>& get_client_caps() { return client_caps; }
|
|
void add_client_cap(int client, Capability& cap) {
|
|
if (client_caps.empty())
|
|
get(CINODE_PIN_CAPS);
|
|
assert(client_caps.count(client) == 0);
|
|
client_caps[client] = cap;
|
|
}
|
|
void remove_client_cap(int client) {
|
|
assert(client_caps.count(client) == 1);
|
|
client_caps.erase(client);
|
|
if (client_caps.empty())
|
|
put(CINODE_PIN_CAPS);
|
|
}
|
|
Capability* get_client_cap(int client) {
|
|
if (client_caps.count(client))
|
|
return &client_caps[client];
|
|
return 0;
|
|
}
|
|
/*
|
|
void set_client_caps(map<int,Capability>& cl) {
|
|
if (client_caps.empty() && !cl.empty())
|
|
get(CINODE_PIN_CAPS);
|
|
client_caps.clear();
|
|
client_caps = cl;
|
|
}
|
|
*/
|
|
void take_client_caps(map<int,Capability>& cl) {
|
|
if (!client_caps.empty())
|
|
put(CINODE_PIN_CAPS);
|
|
cl = client_caps;
|
|
client_caps.clear();
|
|
}
|
|
void merge_client_caps(map<int,Capability>& cl, set<int>& new_client_caps) {
|
|
if (client_caps.empty() && !cl.empty())
|
|
get(CINODE_PIN_CAPS);
|
|
for (map<int,Capability>::iterator it = cl.begin();
|
|
it != cl.end();
|
|
it++) {
|
|
new_client_caps.insert(it->first);
|
|
if (client_caps.count(it->first)) {
|
|
// merge
|
|
client_caps[it->first].merge(it->second);
|
|
} else {
|
|
// new
|
|
client_caps[it->first] = it->second;
|
|
}
|
|
}
|
|
}
|
|
|
|
// caps issued, wanted
|
|
int get_caps_issued() {
|
|
int c = 0;
|
|
for (map<int,Capability>::iterator it = client_caps.begin();
|
|
it != client_caps.end();
|
|
it++)
|
|
c |= it->second.issued();
|
|
return c;
|
|
}
|
|
int get_caps_wanted() {
|
|
int w = 0;
|
|
for (map<int,Capability>::iterator it = client_caps.begin();
|
|
it != client_caps.end();
|
|
it++) {
|
|
w |= it->second.wanted();
|
|
//cout << " get_caps_wanted client " << it->first << " " << cap_string(it->second.wanted()) << endl;
|
|
}
|
|
if (is_auth())
|
|
for (map<int,int>::iterator it = mds_caps_wanted.begin();
|
|
it != mds_caps_wanted.end();
|
|
it++) {
|
|
w |= it->second;
|
|
//cout << " get_caps_wanted mds " << it->first << " " << cap_string(it->second) << endl;
|
|
}
|
|
return w;
|
|
}
|
|
|
|
|
|
void replicate_relax_locks() {
|
|
assert(is_auth());
|
|
assert(!is_cached_by_anyone());
|
|
dout(10) << " relaxing locks on " << *this << endl;
|
|
|
|
if (hardlock.get_state() == LOCK_LOCK &&
|
|
!hardlock.is_used()) {
|
|
dout(10) << " hard now sync " << *this << endl;
|
|
hardlock.set_state(LOCK_SYNC);
|
|
}
|
|
if (filelock.get_state() == LOCK_LOCK) {
|
|
if (!filelock.is_used() &&
|
|
(get_caps_issued() & CAP_FILE_WR) == 0) {
|
|
filelock.set_state(LOCK_SYNC);
|
|
dout(10) << " file now sync " << *this << endl;
|
|
} else {
|
|
dout(10) << " can't relax filelock on " << *this << endl;
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
// -- authority --
|
|
int authority();
|
|
|
|
|
|
// -- auth pins --
|
|
int is_auth_pinned() {
|
|
return auth_pins;
|
|
}
|
|
int adjust_nested_auth_pins(int a);
|
|
bool can_auth_pin();
|
|
void auth_pin();
|
|
void auth_unpin();
|
|
|
|
|
|
// -- freeze --
|
|
bool is_frozen();
|
|
bool is_frozen_dir();
|
|
bool is_freezing();
|
|
|
|
|
|
// -- reference counting --
|
|
|
|
/* these can be pinned any # of times, and are
|
|
linked to an active_request, so they're automatically cleaned
|
|
up when a request is finished. pin at will! */
|
|
void request_pin_get() {
|
|
if (num_request_pins == 0) get(CINODE_PIN_REQUEST);
|
|
num_request_pins++;
|
|
}
|
|
void request_pin_put() {
|
|
num_request_pins--;
|
|
if (num_request_pins == 0) put(CINODE_PIN_REQUEST);
|
|
assert(num_request_pins >= 0);
|
|
}
|
|
|
|
|
|
bool is_pinned() { return ref > 0; }
|
|
set<int>& get_ref_set() { return ref_set; }
|
|
void put(int by) {
|
|
cinode_pins[by]--;
|
|
if (ref == 0 || ref_set.count(by) != 1) {
|
|
dout(7) << " bad put " << *this << " by " << by << " " << cinode_pin_names[by] << " was " << ref << " (" << ref_set << ")" << endl;
|
|
assert(ref_set.count(by) == 1);
|
|
assert(ref > 0);
|
|
}
|
|
ref--;
|
|
ref_set.erase(by);
|
|
if (ref == 0)
|
|
lru_unpin();
|
|
dout(7) << " put " << *this << " by " << by << " " << cinode_pin_names[by] << " now " << ref << " (" << ref_set << ")" << endl;
|
|
}
|
|
void get(int by) {
|
|
cinode_pins[by]++;
|
|
if (ref == 0)
|
|
lru_pin();
|
|
if (ref_set.count(by)) {
|
|
dout(7) << " bad get " << *this << " by " << by << " " << cinode_pin_names[by] << " was " << ref << " (" << ref_set << ")" << endl;
|
|
assert(ref_set.count(by) == 0);
|
|
}
|
|
ref++;
|
|
ref_set.insert(by);
|
|
dout(7) << " get " << *this << " by " << by << " " << cinode_pin_names[by] << " now " << ref << " (" << ref_set << ")" << endl;
|
|
}
|
|
bool is_pinned_by(int by) {
|
|
return ref_set.count(by);
|
|
}
|
|
|
|
// -- hierarchy stuff --
|
|
void set_primary_parent(CDentry *p) {
|
|
parent = p;
|
|
}
|
|
void remove_primary_parent(CDentry *dn) {
|
|
assert(dn == parent);
|
|
parent = 0;
|
|
}
|
|
void add_remote_parent(CDentry *p) {
|
|
remote_parents.insert(p);
|
|
}
|
|
void remove_remote_parent(CDentry *p) {
|
|
remote_parents.erase(p);
|
|
}
|
|
int num_remote_parents() {
|
|
return remote_parents.size();
|
|
}
|
|
|
|
|
|
/*
|
|
// for giving to clients
|
|
void get_dist_spec(set<int>& ls, int auth, timepair_t& now) {
|
|
if (( is_dir() && popularity[MDS_POP_CURDOM].get(now) > g_conf.mds_bal_replicate_threshold) ||
|
|
(!is_dir() && popularity[MDS_POP_JUSTME].get(now) > g_conf.mds_bal_replicate_threshold)) {
|
|
//if (!cached_by.empty() && inode.ino > 1) dout(1) << "distributed spec for " << *this << endl;
|
|
ls = cached_by;
|
|
}
|
|
}
|
|
*/
|
|
|
|
// dbg
|
|
void dump(int d = 0);
|
|
};
|
|
|
|
|
|
|
|
|
|
// -- encoded state
|
|
|
|
// discover
|
|
|
|
class CInodeDiscover {
|
|
|
|
inode_t inode;
|
|
int replica_nonce;
|
|
|
|
int hardlock_state;
|
|
int filelock_state;
|
|
|
|
public:
|
|
CInodeDiscover() {}
|
|
CInodeDiscover(CInode *in, int nonce) {
|
|
inode = in->inode;
|
|
replica_nonce = nonce;
|
|
|
|
hardlock_state = in->hardlock.get_replica_state();
|
|
filelock_state = in->filelock.get_replica_state();
|
|
}
|
|
|
|
inodeno_t get_ino() { return inode.ino; }
|
|
int get_replica_nonce() { return replica_nonce; }
|
|
|
|
void update_inode(CInode *in) {
|
|
in->inode = inode;
|
|
|
|
in->replica_nonce = replica_nonce;
|
|
in->hardlock.set_state(hardlock_state);
|
|
in->filelock.set_state(filelock_state);
|
|
}
|
|
|
|
void _encode(bufferlist& bl) {
|
|
bl.append((char*)&inode, sizeof(inode));
|
|
bl.append((char*)&replica_nonce, sizeof(replica_nonce));
|
|
bl.append((char*)&hardlock_state, sizeof(hardlock_state));
|
|
bl.append((char*)&filelock_state, sizeof(filelock_state));
|
|
}
|
|
|
|
void _decode(bufferlist& bl, int& off) {
|
|
bl.copy(off,sizeof(inode_t), (char*)&inode);
|
|
off += sizeof(inode_t);
|
|
bl.copy(off, sizeof(int), (char*)&replica_nonce);
|
|
off += sizeof(int);
|
|
bl.copy(off, sizeof(hardlock_state), (char*)&hardlock_state);
|
|
off += sizeof(hardlock_state);
|
|
bl.copy(off, sizeof(filelock_state), (char*)&filelock_state);
|
|
off += sizeof(filelock_state);
|
|
}
|
|
|
|
};
|
|
|
|
|
|
// export
|
|
|
|
class CInodeExport {
|
|
|
|
struct {
|
|
inode_t inode;
|
|
meta_load_t popularity_justme;
|
|
meta_load_t popularity_curdom;
|
|
bool is_dirty; // dirty inode?
|
|
|
|
int num_caps;
|
|
} st;
|
|
|
|
set<int> cached_by;
|
|
map<int,int> cached_by_nonce;
|
|
map<int,Capability> cap_map;
|
|
|
|
CLock hardlock,filelock;
|
|
//int remaining_issued;
|
|
|
|
public:
|
|
CInodeExport() {}
|
|
CInodeExport(CInode *in) {
|
|
st.inode = in->inode;
|
|
st.is_dirty = in->is_dirty();
|
|
cached_by = in->cached_by;
|
|
cached_by_nonce = in->cached_by_nonce;
|
|
|
|
hardlock = in->hardlock;
|
|
filelock = in->filelock;
|
|
|
|
st.popularity_justme.take( in->popularity[MDS_POP_JUSTME] );
|
|
st.popularity_curdom.take( in->popularity[MDS_POP_CURDOM] );
|
|
in->popularity[MDS_POP_ANYDOM] -= st.popularity_curdom;
|
|
in->popularity[MDS_POP_NESTED] -= st.popularity_curdom;
|
|
|
|
// steal WRITER caps from inode
|
|
in->take_client_caps(cap_map);
|
|
//remaining_issued = in->get_caps_issued();
|
|
}
|
|
~CInodeExport() {
|
|
}
|
|
|
|
inodeno_t get_ino() { return st.inode.ino; }
|
|
|
|
void update_inode(CInode *in, set<int>& new_client_caps) {
|
|
in->inode = st.inode;
|
|
|
|
in->popularity[MDS_POP_JUSTME] += st.popularity_justme;
|
|
in->popularity[MDS_POP_CURDOM] += st.popularity_curdom;
|
|
in->popularity[MDS_POP_ANYDOM] += st.popularity_curdom;
|
|
in->popularity[MDS_POP_NESTED] += st.popularity_curdom;
|
|
|
|
if (st.is_dirty) {
|
|
in->mark_dirty();
|
|
}
|
|
|
|
in->cached_by.clear();
|
|
in->cached_by = cached_by;
|
|
in->cached_by_nonce = cached_by_nonce;
|
|
if (!cached_by.empty())
|
|
in->get(CINODE_PIN_CACHED);
|
|
|
|
in->hardlock = hardlock;
|
|
in->filelock = filelock;
|
|
|
|
// caps
|
|
in->merge_client_caps(cap_map, new_client_caps);
|
|
}
|
|
|
|
void _encode(bufferlist& bl) {
|
|
st.num_caps = cap_map.size();
|
|
bl.append((char*)&st, sizeof(st));
|
|
|
|
// cached_by + nonce
|
|
::_encode(cached_by, bl);
|
|
::_encode(cached_by_nonce, bl);
|
|
|
|
hardlock.encode_state(bl);
|
|
filelock.encode_state(bl);
|
|
|
|
// caps
|
|
for (map<int,Capability>::iterator it = cap_map.begin();
|
|
it != cap_map.end();
|
|
it++) {
|
|
bl.append((char*)&it->first, sizeof(it->first));
|
|
it->second._encode(bl);
|
|
}
|
|
}
|
|
|
|
int _decode(bufferlist& bl, int off = 0) {
|
|
bl.copy(off, sizeof(st), (char*)&st);
|
|
off += sizeof(st);
|
|
|
|
::_decode(cached_by, bl, off);
|
|
::_decode(cached_by_nonce, bl, off);
|
|
|
|
hardlock.decode_state(bl, off);
|
|
filelock.decode_state(bl, off);
|
|
|
|
// caps
|
|
for (int i=0; i<st.num_caps; i++) {
|
|
int c;
|
|
bl.copy(off, sizeof(c), (char*)&c);
|
|
off += sizeof(c);
|
|
cap_map[c]._decode(bl, off);
|
|
}
|
|
|
|
return off;
|
|
}
|
|
};
|
|
|
|
|
|
|
|
|
|
#endif
|