mars/mars_light.c

1829 lines
46 KiB
C
Raw Normal View History

2011-02-23 20:48:06 +00:00
// (c) 2011 Thomas Schoebel-Theuer / 1&1 Internet AG
//#define BRICK_DEBUGGING
//#define MARS_DEBUGGING
//#define IO_DEBUGGING // here means: display full statistics
#include <linux/kernel.h>
#include <linux/module.h>
#include <linux/string.h>
#include <linux/debug_locks.h>
#include <linux/major.h>
#include <linux/genhd.h>
#include <linux/blkdev.h>
#define _STRATEGY
#include "mars.h"
#include <linux/kthread.h>
#include <linux/wait.h>
// used brick types
#include "mars_server.h"
#include "mars_client.h"
#include "mars_copy.h"
#include "mars_device_aio.h"
#include "mars_trans_logger.h"
#include "mars_if_device.h"
static struct task_struct *main_thread = NULL;
2011-02-28 18:00:32 +00:00
typedef int (*light_worker_fn)(void *buf, struct mars_dent *dent);
2011-02-23 20:48:06 +00:00
struct light_class {
char *cl_name;
int cl_len;
char cl_type;
bool cl_hostcontext;
bool cl_serial;
int cl_father;
light_worker_fn cl_forward;
light_worker_fn cl_backward;
};
///////////////////////////////////////////////////////////////////////
// internal helpers
#define MARS_DELIM ','
2011-02-28 18:00:32 +00:00
static int _parse_args(struct mars_dent *dent, char *str, int count)
2011-02-23 20:48:06 +00:00
{
int i;
int status = -EINVAL;
if (!str)
goto done;
if (!dent->d_args) {
dent->d_args = kstrdup(str, GFP_MARS);
if (!dent->d_args) {
status = -ENOMEM;
goto done;
}
}
for (i = 0; i < count; i++) {
char *tmp;
int len;
if (!*str)
goto done;
if (i == count-1) {
len = strlen(str);
} else {
char *tmp = strchr(str, MARS_DELIM);
if (!tmp)
goto done;
len = (tmp - str);
}
tmp = kzalloc(len+1, GFP_MARS);
if (!tmp) {
status = -ENOMEM;
goto done;
}
if (dent->d_argv[i]) {
kfree(dent->d_argv[i]);
}
dent->d_argv[i] = tmp;
strncpy(dent->d_argv[i], str, len);
dent->d_argv[i][len] = '\0';
str += len;
if (i != count-1)
str++;
}
status = 0;
done:
if (status < 0) {
MARS_ERR("bad syntax '%s' (should have %d args), status = %d\n", dent->d_args ? dent->d_args : "", count, status);
}
return status;
}
2011-02-25 11:46:38 +00:00
///////////////////////////////////////////////////////////////////////
static
2011-03-01 09:34:36 +00:00
int __make_copy(
struct mars_global *global,
struct mars_dent *parent,
struct mars_dent *belongs,
const char *path,
const char *argv[],
loff_t start_pos,
struct copy_brick **__copy)
2011-02-25 11:46:38 +00:00
{
struct mars_brick *copy;
struct copy_brick *_copy;
struct mars_output *output[2] = {};
struct mars_info info[2] = {};
int i;
int status = -1;
for (i = 0; i < 2; i++) {
const char *target = argv[i];
2011-03-01 09:34:36 +00:00
struct mars_brick *new;
new =
make_brick_all(global,
parent,
parent,
10 * HZ,
target,
(const struct generic_brick_type*)&device_aio_brick_type,
(const struct generic_brick_type*[]){},
target,
(const char *[]){},
0);
2011-02-25 11:46:38 +00:00
if (!new) {
MARS_DBG("cannot instantiate\n");
goto done;
}
output[i] = new->outputs[0];
}
2011-03-01 09:34:36 +00:00
copy =
make_brick_all(global,
parent,
belongs,
0,
path,
(const struct generic_brick_type*)&copy_brick_type,
(const struct generic_brick_type*[]){NULL,NULL,NULL,NULL},
"/copy",
(const char *[]){argv[0],argv[0],argv[1],argv[1]},
4);
2011-02-25 11:46:38 +00:00
if (!copy) {
2011-03-01 09:34:36 +00:00
MARS_DBG("fail '%s'\n", path);
goto done;
2011-02-25 11:46:38 +00:00
}
2011-02-27 14:17:58 +00:00
copy->log_level = 2;
2011-02-25 11:46:38 +00:00
_copy = (void*)copy;
if (__copy)
*__copy = _copy;
/* Determine the copy area, switch on when necessary
*/
if (!copy->power.button && copy->power.led_off) {
for (i = 0; i < 2; i++) {
status = output[i]->ops->mars_get_info(output[i], &info[i]);
if (status < 0) {
MARS_ERR("cannot determine current size of '%s'\n", argv[i]);
goto done;
}
}
_copy->copy_start = info[1].current_size;
if (start_pos != -1) {
_copy->copy_start = start_pos;
if (unlikely(info[0].current_size != info[1].current_size)) {
MARS_ERR("oops, devices have different size %lld != %lld at '%s'\n", info[0].current_size, info[1].current_size, parent->d_path);
status = -EINVAL;
goto done;
}
if (unlikely(start_pos > info[0].current_size)) {
MARS_ERR("bad start position %lld is larger than actual size %lld on '%s'\n", start_pos, info[0].current_size, parent->d_path);
status = -EINVAL;
goto done;
}
}
MARS_DBG("copy_start = %lld\n", _copy->copy_start);
_copy->copy_end = info[0].current_size;
MARS_DBG("copy_end = %lld\n", _copy->copy_end);
if (_copy->copy_start < _copy->copy_end) {
2011-03-01 09:34:36 +00:00
status = mars_power_button_recursive((void*)copy, true, 10 * HZ);
2011-02-25 11:46:38 +00:00
MARS_DBG("copy switch status = %d\n", status);
}
}
status = 0;
done:
MARS_DBG("status = %d\n", status);
return status;
}
2011-02-23 20:48:06 +00:00
///////////////////////////////////////////////////////////////////////
// remote workers
struct mars_peerinfo {
2011-02-24 16:37:32 +00:00
struct mars_global *global;
2011-02-23 20:48:06 +00:00
char *peer;
char *path;
struct socket *socket;
struct task_struct *thread;
wait_queue_head_t event;
light_worker_fn worker;
int maxdepth;
};
2011-02-24 16:37:32 +00:00
static
2011-02-28 18:00:32 +00:00
int _update_file(struct mars_global *global, struct mars_dent *parent, const char *peer, const char *path)
2011-02-24 16:37:32 +00:00
{
2011-02-27 14:17:58 +00:00
char tmp[MARS_PATH_MAX] = {};
2011-02-24 16:37:32 +00:00
const char *argv[2] = { tmp, path};
int status = 0;
2011-03-01 09:34:36 +00:00
snprintf(tmp, sizeof(tmp), "%s@%s", path, peer);
2011-02-24 16:37:32 +00:00
2011-03-01 09:34:36 +00:00
status = __make_copy(global, parent, parent, tmp, argv, -1, NULL);
2011-02-24 16:37:32 +00:00
return status;
}
static
int _is_peer_logfile(const char *name, const char *id)
{
int len = strlen(name);
int idlen = id ? strlen(id) : 4 + 9 + 1;
if (len <= idlen ||
2011-02-28 09:04:16 +00:00
strncmp(name, "log-", 4) != 0) {
MARS_DBG("not a logfile at all: '%s'\n", name);
2011-02-24 16:37:32 +00:00
return false;
}
2011-02-28 09:04:16 +00:00
if (id &&
name[len - idlen - 1] == '-' &&
strncmp(name + len - idlen, id, idlen) == 0) {
MARS_DBG("not a peer logfile: '%s'\n", name);
return false;
}
MARS_DBG("found peer logfile: '%s'\n", name);
2011-02-24 16:37:32 +00:00
return true;
}
static
2011-02-28 18:00:32 +00:00
int run_bones(void *buf, struct mars_dent *dent)
2011-02-23 20:48:06 +00:00
{
int status = 0;
2011-02-24 16:37:32 +00:00
struct mars_peerinfo *peer = buf;
2011-02-27 14:17:58 +00:00
struct kstat local_stat = {};
bool stat_ok;
bool update_mtime = true;
bool update_ctime = true;
2011-02-24 16:37:32 +00:00
if (!strncmp(dent->d_name, ".tmp", 4)) {
goto done;
}
if (!strncmp(dent->d_name, "ignore", 6)) {
goto done;
}
2011-02-27 14:17:58 +00:00
status = mars_lstat(dent->d_path, &local_stat);
stat_ok = (status >= 0);
if (stat_ok) {
update_mtime = timespec_compare(&dent->new_stat.mtime, &local_stat.mtime) > 0;
update_ctime = timespec_compare(&dent->new_stat.ctime, &local_stat.ctime) > 0;
//MARS_DBG("timestamps '%s' remote = %ld.%09ld local = %ld.%09ld\n", dent->d_path, dent->new_stat.mtime.tv_sec, dent->new_stat.mtime.tv_nsec, local_stat.mtime.tv_sec, local_stat.mtime.tv_nsec);
if ((dent->new_stat.mode & S_IRWXU) !=
(local_stat.mode & S_IRWXU) &&
update_ctime) {
mode_t newmode = local_stat.mode;
MARS_DBG("chmod '%s' 0x%xd -> 0x%xd\n", dent->d_path, newmode & S_IRWXU, dent->new_stat.mode & S_IRWXU);
newmode &= ~S_IRWXU;
newmode |= (dent->new_stat.mode & S_IRWXU);
mars_chmod(dent->d_path, newmode);
mars_trigger();
}
if (dent->new_stat.uid != local_stat.uid && update_ctime) {
MARS_DBG("lchown '%s' %d -> %d\n", dent->d_path, local_stat.uid, dent->new_stat.uid);
mars_lchown(dent->d_path, dent->new_stat.uid);
mars_trigger();
}
}
2011-02-23 20:48:06 +00:00
if (S_ISDIR(dent->new_stat.mode)) {
if (strncmp(dent->d_name, "resource-", 9)) {
MARS_DBG("ignoring directory '%s'\n", dent->d_path);
2011-02-24 16:37:32 +00:00
goto done;
}
2011-02-27 14:17:58 +00:00
if (!stat_ok) {
2011-02-24 16:37:32 +00:00
status = mars_mkdir(dent->d_path);
MARS_DBG("create directory '%s' status = %d\n", dent->d_path, status);
2011-02-27 14:17:58 +00:00
mars_chmod(dent->d_path, dent->new_stat.mode);
mars_lchown(dent->d_path, dent->new_stat.uid);
2011-02-23 20:48:06 +00:00
}
} else if (S_ISLNK(dent->new_stat.mode) && dent->new_link) {
2011-02-27 14:17:58 +00:00
if (!stat_ok || update_mtime) {
status = mars_symlink(dent->new_link, dent->d_path, &dent->new_stat.mtime, dent->new_stat.uid);
2011-02-24 16:37:32 +00:00
MARS_DBG("create symlink '%s' -> '%s' status = %d\n", dent->d_path, dent->new_link, status);
2011-02-27 14:17:58 +00:00
mars_trigger();
2011-02-24 16:37:32 +00:00
}
} else if (S_ISREG(dent->new_stat.mode) && _is_peer_logfile(dent->d_name, my_id())) {
loff_t src_size = dent->new_stat.size;
2011-02-27 14:17:58 +00:00
if (!stat_ok || local_stat.size < src_size) {
2011-02-24 16:37:32 +00:00
status = _update_file(peer->global, dent->d_parent, peer->peer, dent->d_path);
2011-02-28 09:04:16 +00:00
MARS_DBG("update '%s' from peer '%s' status = %d\n", dent->d_path, peer->peer, status);
2011-02-24 16:37:32 +00:00
if (status >= 0) {
struct mars_dent *local_alias;
int len = dent->d_pathlen;
2011-02-27 14:17:58 +00:00
char tmp[MARS_PATH_MAX];
2011-02-24 16:37:32 +00:00
char *test;
for (test = dent->d_path + len - 1; *test != '-' && len > 0; test--, len--) /*skip*/;
memcpy(tmp, dent->d_path, len);
strncpy(tmp + len, my_id(), sizeof(tmp) - len);
MARS_DBG("local alias for '%s' is '%s'\n", dent->d_path, tmp);
local_alias = mars_find_dent((void*)peer->global, tmp);
if (!local_alias) {
2011-02-27 14:17:58 +00:00
status = mars_symlink(dent->d_name, tmp, &dent->new_stat.mtime, 0);
2011-02-24 16:37:32 +00:00
MARS_DBG("create alias '%s' -> '%s' status = %d\n", tmp, dent->d_name, status);
2011-02-27 14:17:58 +00:00
mars_trigger();
2011-02-24 16:37:32 +00:00
}
}
}
2011-02-23 20:48:06 +00:00
} else {
MARS_DBG("ignoring '%s'\n", dent->d_path);
}
2011-02-24 16:37:32 +00:00
done:
2011-02-23 20:48:06 +00:00
return status;
}
///////////////////////////////////////////////////////////////////////
// remote working infrastructure
2011-02-24 16:37:32 +00:00
static
void _peer_cleanup(struct mars_peerinfo *peer)
2011-02-23 20:48:06 +00:00
{
if (peer->socket) {
kernel_sock_shutdown(peer->socket, SHUT_WR);
peer->socket = NULL;
}
//...
}
2011-02-24 16:37:32 +00:00
static
int remote_thread(void *data)
2011-02-23 20:48:06 +00:00
{
struct mars_peerinfo *peer = data;
2011-02-24 16:37:32 +00:00
char *real_peer;
2011-02-23 20:48:06 +00:00
struct sockaddr_storage sockaddr = {};
int status;
if (!peer)
return -1;
2011-02-27 14:17:58 +00:00
real_peer = mars_translate_hostname(peer->global, peer->peer);
2011-02-24 16:37:32 +00:00
MARS_INF("-------- remote thread starting on peer '%s' (%s)\n", peer->peer, real_peer);
2011-02-23 20:48:06 +00:00
//fake_mm();
2011-02-24 16:37:32 +00:00
status = mars_create_sockaddr(&sockaddr, real_peer);
2011-02-23 20:48:06 +00:00
if (unlikely(status < 0)) {
2011-02-24 16:37:32 +00:00
MARS_ERR("unusable remote address '%s' (%s)\n", real_peer, peer->peer);
2011-02-23 20:48:06 +00:00
goto done;
}
while (!kthread_should_stop()) {
LIST_HEAD(tmp_list);
struct mars_cmd cmd = {
.cmd_code = CMD_GETENTS,
.cmd_str1 = peer->path,
.cmd_int1 = peer->maxdepth,
};
if (!peer->socket) {
status = mars_create_socket(&peer->socket, &sockaddr, false);
if (unlikely(status < 0)) {
peer->socket = NULL;
2011-02-24 16:37:32 +00:00
MARS_INF("no connection to '%s'\n", real_peer);
2011-02-23 20:48:06 +00:00
msleep(5000);
continue;
}
2011-02-24 16:37:32 +00:00
MARS_DBG("successfully opened socket to '%s'\n", real_peer);
2011-02-23 20:48:06 +00:00
continue;
}
status = mars_send_struct(&peer->socket, &cmd, mars_cmd_meta);
if (unlikely(status < 0)) {
MARS_ERR("communication error on send, status = %d\n", status);
_peer_cleanup(peer);
msleep(5000);
continue;
}
status = mars_recv_dent_list(&peer->socket, &tmp_list);
if (unlikely(status < 0)) {
MARS_ERR("communication error on receive, status = %d\n", status);
_peer_cleanup(peer);
msleep(5000);
continue;
}
2011-02-24 16:37:32 +00:00
//MARS_DBG("AHA!!!!!!!!!!!!!!!!!!!!\n");
2011-02-23 20:48:06 +00:00
{
struct list_head *tmp;
for (tmp = tmp_list.next; tmp != &tmp_list; tmp = tmp->next) {
2011-03-01 09:34:36 +00:00
struct mars_dent *dent = container_of(tmp, struct mars_dent, dent_link);
2011-02-23 20:48:06 +00:00
if (!dent->d_path) {
MARS_DBG("NULL\n");
continue;
}
2011-02-24 16:37:32 +00:00
//MARS_DBG("path = '%s'\n", dent->d_path);
2011-02-23 20:48:06 +00:00
if (!peer->worker)
continue;
status = peer->worker(peer, dent);
2011-02-24 16:37:32 +00:00
//MARS_DBG("path = '%s' worker status = %d\n", dent->d_path, status);
2011-02-23 20:48:06 +00:00
}
}
2011-03-01 09:34:36 +00:00
mars_free_dent_all(&tmp_list);
2011-02-23 20:48:06 +00:00
if (!kthread_should_stop())
msleep(10 * 1000);
}
MARS_INF("-------- remote thread terminating\n");
_peer_cleanup(peer);
done:
//cleanup_mm();
2011-02-24 16:37:32 +00:00
peer->thread = NULL;
if (real_peer)
kfree(real_peer);
2011-02-23 20:48:06 +00:00
return 0;
}
///////////////////////////////////////////////////////////////////////
// helpers for worker functions
2011-02-28 18:00:32 +00:00
static int _kill_peer(void *buf, struct mars_dent *dent)
2011-02-23 20:48:06 +00:00
{
struct mars_global *global = buf;
struct mars_peerinfo *peer = dent->d_private;
if (global->global_power.button) {
return 0;
}
if (!peer) {
return 0;
}
if (!peer->thread) {
MARS_ERR("oops, remote thread is not running - doing cleanup myself\n");
_peer_cleanup(peer);
dent->d_private = NULL;
return -1;
}
kthread_stop(peer->thread);
dent->d_private = NULL;
return 0;
}
2011-02-28 18:00:32 +00:00
static int _make_peer(void *buf, struct mars_dent *dent, char *mypeer, char *path, light_worker_fn worker)
2011-02-23 20:48:06 +00:00
{
static int serial = 0;
struct mars_global *global = buf;
struct mars_peerinfo *peer;
int status = 0;
if (!global->global_power.button || !dent->d_parent || !dent->new_link) {
return 0;
}
if (!mypeer) {
status = _parse_args(dent, dent->new_link, 1);
if (status < 0)
goto done;
mypeer = dent->d_argv[0];
}
MARS_DBG("peer '%s'\n", mypeer);
if (!dent->d_private) {
dent->d_private = kzalloc(sizeof(struct mars_peerinfo), GFP_MARS);
if (!dent->d_private) {
MARS_ERR("no memory for peer structure\n");
return -1;
}
peer = dent->d_private;
2011-02-24 16:37:32 +00:00
peer->global = global;
2011-02-23 20:48:06 +00:00
peer->peer = mypeer;
peer->path = path;
peer->worker = worker;
peer->maxdepth = 2;
init_waitqueue_head(&peer->event);
}
peer = dent->d_private;
if (!peer->thread) {
peer->thread = kthread_create(remote_thread, peer, "mars_remote%d", serial++);
if (unlikely(IS_ERR(peer->thread))) {
MARS_ERR("cannot start peer thread, status = %d\n", (int)PTR_ERR(peer->thread));
peer->thread = NULL;
return -1;
}
2011-02-24 16:37:32 +00:00
MARS_DBG("starting peer thread\n");
2011-02-23 20:48:06 +00:00
wake_up_process(peer->thread);
}
done:
return status;
}
2011-02-28 18:00:32 +00:00
static int _kill_remote(void *buf, struct mars_dent *dent)
2011-02-23 20:48:06 +00:00
{
return _kill_peer(buf, dent);
}
2011-02-28 18:00:32 +00:00
static int _make_remote(void *buf, struct mars_dent *dent)
2011-02-23 20:48:06 +00:00
{
return _make_peer(buf, dent, NULL, "/mars", NULL);
}
2011-02-28 18:00:32 +00:00
static int kill_scan(void *buf, struct mars_dent *dent)
2011-02-23 20:48:06 +00:00
{
return _kill_peer(buf, dent);
}
2011-02-28 18:00:32 +00:00
static int make_scan(void *buf, struct mars_dent *dent)
2011-02-23 20:48:06 +00:00
{
2011-02-24 16:37:32 +00:00
MARS_DBG("path = '%s' peer = '%s'\n", dent->d_path, dent->d_rest);
if (!strcmp(dent->d_rest, my_id())) {
return 0;
}
return _make_peer(buf, dent, dent->d_rest, "/mars", run_bones);
2011-02-23 20:48:06 +00:00
}
static
2011-02-28 18:00:32 +00:00
int kill_all(void *buf, struct mars_dent *dent)
2011-02-23 20:48:06 +00:00
{
struct mars_global *global = buf;
2011-02-27 14:17:58 +00:00
if (global->global_power.button &&
(!dent->d_kill_inactive || dent->d_activate)) {
2011-02-23 20:48:06 +00:00
return 0;
}
2011-03-01 09:34:36 +00:00
mars_kill_dent(dent);
return 0;
2011-02-23 20:48:06 +00:00
}
///////////////////////////////////////////////////////////////////////
// handlers / helpers for logfile rotation
struct mars_rotate {
2011-02-28 18:00:32 +00:00
struct mars_dent *replay_link;
struct mars_dent *aio_dent;
2011-02-23 20:48:06 +00:00
struct device_aio_brick *aio_brick;
struct mars_info aio_info;
struct trans_logger_brick *trans_brick;
2011-02-28 18:00:32 +00:00
struct mars_dent *relevant_log;
struct mars_dent *current_log;
struct mars_dent *prev_log;
struct mars_dent *next_log;
2011-02-23 20:48:06 +00:00
long long last_jiffies;
loff_t start_pos;
loff_t end_pos;
int max_sequence;
bool has_error;
bool do_replay;
bool is_primary;
bool create_once;
};
static
void _create_new_logfile(char *path)
{
struct file *f;
const int flags = O_RDWR | O_CREAT | O_EXCL;
const int prot = 0600;
mm_segment_t oldfs;
oldfs = get_fs();
set_fs(get_ds());
f = filp_open(path, flags, prot);
set_fs(oldfs);
if (f) {
filp_close(f, NULL);
MARS_DBG("created empty logfile '%s'\n", path);
mars_trigger();
}
}
static
2011-02-28 18:00:32 +00:00
int _update_link(struct mars_rotate *rot, struct mars_dent *parent, int sequence, loff_t pos)
2011-02-23 20:48:06 +00:00
{
struct timespec now = {};
2011-02-27 14:17:58 +00:00
char old[MARS_PATH_MAX] = {};
char new[MARS_PATH_MAX] = {};
2011-02-23 20:48:06 +00:00
int status = 0;
snprintf(old, sizeof(old), "log-%09d-%s,%lld", sequence, my_id(), pos);
snprintf(new, sizeof(new), "%s/replay-%s", parent->d_path, my_id());
get_lamport(&now);
2011-02-27 14:17:58 +00:00
status = mars_symlink(old, new, &now, 0);
2011-02-23 20:48:06 +00:00
if (status < 0) {
MARS_ERR("cannot create symlink '%s' -> '%s' status = %d\n", old, new, status);
} else {
MARS_DBG("make symlink '%s' -> '%s' status = %d\n", old, new, status);
}
if (status >= 0) {
rot->last_jiffies = jiffies;
}
return status;
}
/* This must be called once at every round of logfile checking.
*/
static
2011-02-28 18:00:32 +00:00
int make_log_init(void *buf, struct mars_dent *parent)
2011-02-23 20:48:06 +00:00
{
struct mars_global *global = buf;
struct mars_brick *aio_brick;
struct mars_brick *trans_brick;
struct mars_rotate *rot = parent->d_private;
2011-02-28 18:00:32 +00:00
struct mars_dent *replay_link;
struct mars_dent *aio_dent;
2011-02-23 20:48:06 +00:00
struct mars_output *output;
2011-03-01 09:34:36 +00:00
char *replay_path = NULL;
char *aio_path = NULL;
2011-02-23 20:48:06 +00:00
int status;
if (!rot) {
rot = kzalloc(sizeof(struct mars_rotate), GFP_MARS);
parent->d_private = rot;
if (!rot) {
MARS_ERR("cannot allocate rot structure\n");
status = -ENOMEM;
goto done;
}
}
rot->replay_link = NULL;
rot->aio_dent = NULL;
rot->aio_brick = NULL;
rot->relevant_log = NULL;
rot->prev_log = NULL;
rot->next_log = NULL;
rot->max_sequence = 0;
rot->has_error = false;
/* Fetch the replay status symlink.
* It must exist, and its value will control everything.
*/
2011-03-01 09:34:36 +00:00
replay_path = path_make(parent, "/replay-%s", my_id());
if (unlikely(!replay_path)) {
MARS_ERR("cannot make path\n");
status = -ENOMEM;
goto done;
}
2011-02-23 20:48:06 +00:00
2011-03-01 09:34:36 +00:00
replay_link = (void*)mars_find_dent(global, replay_path);
if (unlikely(!replay_link || !replay_link->new_link)) {
MARS_ERR("replay status symlink '%s' does not exist (%p)\n", replay_path, replay_link);
2011-02-23 20:48:06 +00:00
status = -ENOENT;
goto done;
}
status = _parse_args(replay_link, replay_link->new_link, 2);
2011-03-01 09:34:36 +00:00
if (unlikely(status < 0)) {
2011-02-23 20:48:06 +00:00
goto done;
}
rot->replay_link = replay_link;
/* Fetch the referenced AIO dentry.
*/
2011-03-01 09:34:36 +00:00
aio_path = path_make(parent, "/%s", replay_link->d_argv[0]);
if (unlikely(!aio_path)) {
MARS_ERR("cannot make path\n");
status = -ENOMEM;
goto done;
}
2011-02-23 20:48:06 +00:00
2011-03-01 09:34:36 +00:00
aio_dent = (void*)mars_find_dent(global, aio_path);
2011-02-23 20:48:06 +00:00
if (unlikely(!aio_dent)) {
2011-03-01 09:34:36 +00:00
MARS_ERR("logfile '%s' does not exist\n", aio_path);
2011-02-23 20:48:06 +00:00
status = -ENOENT;
if (rot->is_primary) { // try to create an empty logfile
2011-03-01 09:34:36 +00:00
_create_new_logfile(aio_path);
2011-02-23 20:48:06 +00:00
}
goto done;
}
rot->aio_dent = aio_dent;
/* Fetch / make the AIO brick instance
*/
2011-03-01 09:34:36 +00:00
aio_brick =
make_brick_all(global,
NULL,
parent,
1 * HZ,
aio_path,
(const struct generic_brick_type*)&device_aio_brick_type,
(const struct generic_brick_type*[]){},
"%s/%s",
(const char *[]){},
0,
parent->d_path,
replay_link->d_argv[0]);
2011-02-23 20:48:06 +00:00
if (!aio_brick) {
2011-03-01 09:34:36 +00:00
MARS_ERR("cannot access '%s'\n", aio_path);
status = -EIO;
goto done;
2011-02-23 20:48:06 +00:00
}
rot->aio_brick = (void*)aio_brick;
/* Fetch the actual logfile size
*/
output = aio_brick->outputs[0];
status = output->ops->mars_get_info(output, &rot->aio_info);
if (status < 0) {
2011-03-01 09:34:36 +00:00
MARS_ERR("cannot get info on '%s'\n", aio_path);
2011-02-23 20:48:06 +00:00
goto done;
}
2011-03-01 09:34:36 +00:00
MARS_DBG("logfile '%s' size = %lld\n", aio_path, rot->aio_info.current_size);
2011-02-23 20:48:06 +00:00
2011-03-01 09:34:36 +00:00
/* Fetch / make the transaction logger.
* We deliberately "forget" to connect the log input here.
* Will be carried out later in make_log().
* The final switch-on will be started in make_log_finalize().
2011-02-23 20:48:06 +00:00
*/
2011-03-01 09:34:36 +00:00
trans_brick =
make_brick_all(global,
parent,
parent,
0,
aio_path,
(const struct generic_brick_type*)&trans_logger_brick_type,
(const struct generic_brick_type*[]){(const struct generic_brick_type*)&device_aio_brick_type},
"/logger",
(const char *[]){"/data-%s"},
1,
my_id());
status = -ENOENT;
2011-02-23 20:48:06 +00:00
if (!trans_brick) {
2011-03-01 09:34:36 +00:00
goto done;
2011-02-23 20:48:06 +00:00
}
rot->trans_brick = (void*)trans_brick;
/* For safety, default is to try an (unnecessary) replay in case
* something goes wrong later.
*/
rot->do_replay = true;
status = 0;
done:
2011-03-01 09:34:36 +00:00
if (aio_path)
kfree(aio_path);
if (replay_path)
kfree(replay_path);
2011-02-23 20:48:06 +00:00
return status;
}
/* Internal helper. Return codes:
* ret < 0 : error
* ret == 0 : not relevant
* ret == 1 : relevant, no transaction replay
* ret == 2 : relevant for transaction replay
* ret == 3 : relevant for appending
*/
static
2011-02-28 18:00:32 +00:00
int _check_logging_status(struct mars_global *global, struct mars_dent *dent, long long *oldpos, long long *newpos)
2011-02-23 20:48:06 +00:00
{
2011-02-28 18:00:32 +00:00
struct mars_dent *parent = dent->d_parent;
2011-02-23 20:48:06 +00:00
struct mars_rotate *rot = parent->d_private;
int status = -EINVAL;
CHECK_PTR(rot, done);
status = 0;
if (!rot->replay_link || !rot->aio_dent || !rot->aio_brick) {
//MARS_DBG("nothing to do on '%s'\n", dent->d_path);
goto done;
}
if (rot->aio_dent->d_serial != dent->d_serial) {
//MARS_DBG("serial number %d not relevant\n", dent->d_serial);
goto done;
}
if (sscanf(rot->replay_link->d_argv[1], "%lld", oldpos) != 1) {
MARS_ERR("bad position argument '%s'\n", rot->replay_link->d_argv[1]);
status = -EINVAL;
goto done;
}
if (unlikely(rot->aio_info.current_size < *oldpos)) {
MARS_ERR("oops, bad replay position attempted in logfile '%s' (file length %lld should never be smaller than requested position %lld, is your filesystem corrupted?) => please repair this by hand\n", rot->aio_dent->d_path, rot->aio_info.current_size, *oldpos);
status = -EINVAL;
goto done;
}
if (rot->aio_info.current_size > *oldpos) {
MARS_INF("transaction log replay is necessary on '%s' from %lld to %lld\n", rot->aio_dent->d_path, *oldpos, rot->aio_info.current_size);
*newpos = rot->aio_info.current_size;
status = 2;
} else if (rot->aio_info.current_size > 0) {
MARS_INF("transaction log '%s' is already applied (would be usable for appending at position %lld, but a fresh log is needed for safety reasons)\n", rot->aio_dent->d_path, *oldpos);
*newpos = rot->aio_info.current_size;
status = 1;
} else if (!rot->is_primary) {
MARS_INF("empty transaction log '%s' would be usable, but I am not primary\n", rot->aio_dent->d_path);
status = 0;
} else {
MARS_INF("empty transaction log '%s' is usable for me as a primary node\n", rot->aio_dent->d_path);
status = 3;
}
done:
return status;
}
/* Note: this is strictly called in d_serial order.
* This is important!
*/
static
2011-02-28 18:00:32 +00:00
int make_log(void *buf, struct mars_dent *dent)
2011-02-23 20:48:06 +00:00
{
struct mars_global *global = buf;
2011-02-28 18:00:32 +00:00
struct mars_dent *parent = dent->d_parent;
2011-02-23 20:48:06 +00:00
struct mars_rotate *rot = parent->d_private;
struct trans_logger_brick *trans_brick;
2011-02-28 18:00:32 +00:00
struct mars_dent *prev_log;
2011-02-23 20:48:06 +00:00
loff_t start_pos = 0;
loff_t end_pos = 0;
int status = -EINVAL;
CHECK_PTR(rot, err);
status = 0;
trans_brick = rot->trans_brick;
if (!global->global_power.button || !dent->d_parent || !trans_brick || rot->has_error) {
2011-03-01 09:34:36 +00:00
MARS_DBG("nothing to do rot_error = %d\n", rot->has_error);
2011-02-23 20:48:06 +00:00
goto done;
}
if (dent->d_serial > rot->max_sequence) {
rot->max_sequence = dent->d_serial;
}
/* Check for consecutiveness of logfiles
*/
prev_log = rot->next_log;
if (prev_log && prev_log->d_serial + 1 != dent->d_serial) {
MARS_ERR("transaction logs are not consecutive at '%s' (%d ~> %d)\n", dent->d_path, prev_log->d_serial, dent->d_serial);
status = -EINVAL;
goto done;
}
/* Skip any logfiles after the relevant one.
* This should happen only when replaying multiple logfiles
* in sequence, or when starting a new logfile for writing.
*/
if (rot->relevant_log) {
if (rot->do_replay) {
status = 0;
goto ok;
}
if (rot->aio_dent->new_stat.size > 0) {
MARS_ERR("oops, the new logfile '%s' is not empty -- for safety, I will not use it -- log rotation is disabled now\n", dent->d_path);
status = -EINVAL;
goto done;
}
MARS_DBG("considering next logfile '%s' for rotation\n", dent->d_path);
}
/* Find current logging status.
*/
status = _check_logging_status(global, dent, &start_pos, &end_pos);
if (status < 0) {
goto done;
}
/* Relevant or not?
*/
switch (status) {
case 0: // not relevant
goto ok;
case 1: // relevant, but transaction replay already finished
if (!trans_brick->power.button && !trans_brick->power.led_on && trans_brick->power.led_off) {
_update_link(rot, dent->d_parent, dent->d_serial + 1, 0);
mars_trigger();
}
status = -EAGAIN;
goto done;
case 2: // relevant for transaction replay
MARS_DBG("replaying transaction log '%s' from %lld to %lld\n", dent->d_path, start_pos, end_pos);
rot->do_replay = true;
rot->start_pos = start_pos;
rot->end_pos = end_pos;
rot->relevant_log = dent;
break;
case 3: // relevant for appending
MARS_DBG("appending to transaction log '%s'\n", dent->d_path);
rot->do_replay = false;
rot->start_pos = 0;
rot->end_pos = 0;
rot->relevant_log = dent;
break;
default:
MARS_ERR("bad internal status %d\n", status);
status = -EINVAL;
goto done;
}
ok:
/* All ok: switch over the indicators.
*/
rot->prev_log = rot->next_log;
rot->next_log = dent;
done:
if (status < 0) {
rot->has_error = true;
}
err:
return status;
}
static
int _start_trans(struct mars_rotate *rot)
{
struct trans_logger_brick *trans_brick = rot->trans_brick;
int status = 0;
if (trans_brick->power.button) {
goto done;
}
/* Internal safety checks
*/
status = -EINVAL;
if (unlikely(!rot->aio_brick || !rot->relevant_log)) {
MARS_ERR("something is missing, this should not happen\n");
goto done;
}
/* For safety, disconnect old connection first
*/
if (trans_brick->inputs[1]->connect) {
(void)generic_disconnect((void*)trans_brick->inputs[1]);
}
/* Connect to new transaction log
*/
status = generic_connect((void*)trans_brick->inputs[1], (void*)rot->aio_brick->outputs[0]);
if (status < 0) {
goto done;
}
/* Supply all relevant parameters
*/
trans_brick->sequence = rot->relevant_log->d_serial;
trans_brick->do_replay = rot->do_replay;
trans_brick->current_pos = rot->start_pos;
trans_brick->start_pos = rot->start_pos;
trans_brick->end_pos = rot->end_pos;
/* Switch on....
*/
2011-02-28 18:00:32 +00:00
status = mars_power_button((void*)trans_brick, true);
2011-02-23 20:48:06 +00:00
MARS_DBG("status = %d\n", status);
done:
return status;
}
static
int _stop_trans(struct mars_rotate *rot)
{
struct trans_logger_brick *trans_brick = rot->trans_brick;
int status = 0;
if (!trans_brick->power.button) {
goto done;
}
/* Switch off....
*/
2011-02-28 18:00:32 +00:00
status = mars_power_button((void*)trans_brick, false);
2011-02-23 20:48:06 +00:00
MARS_DBG("status = %d\n", status);
if (status < 0) {
goto done;
}
/* Disconnect old connection
*/
if (trans_brick->inputs[1]->connect && trans_brick->power.led_off) {
(void)generic_disconnect((void*)trans_brick->inputs[1]);
}
done:
return status;
}
static
2011-02-28 18:00:32 +00:00
int make_log_finalize(struct mars_global *global, struct mars_dent *parent)
2011-02-23 20:48:06 +00:00
{
struct mars_rotate *rot = parent->d_private;
struct trans_logger_brick *trans_brick;
int status = -EINVAL;
CHECK_PTR(rot, done);
trans_brick = rot->trans_brick;
status = 0;
if (!trans_brick) {
MARS_DBG("nothing to do\n");
goto done;
}
/* Stopping is also possible in case of errors
*/
if (trans_brick->power.button && trans_brick->power.led_on && !trans_brick->power.led_off) {
bool do_stop =
(rot->do_replay || trans_brick->do_replay)
? (trans_brick->current_pos == trans_brick->end_pos)
: (rot->relevant_log && rot->relevant_log != rot->current_log);
MARS_DBG("do_stop = %d\n", (int)do_stop);
if (do_stop || (long long)jiffies > rot->last_jiffies + 5 * HZ) {
status = _update_link(rot, parent, trans_brick->sequence, trans_brick->current_pos);
}
if (do_stop) {
status = _stop_trans(rot);
}
goto done;
}
/* Special case: after a fresh start, when no logfile exists,
* create one. This is a thin exception from the rule that
* normally userspace should control what happens in MARS.
*/
if (!rot->relevant_log && rot->is_primary && !rot->has_error && rot->max_sequence > 0 && !rot->create_once) { // try to create an empty logfile
2011-02-27 14:17:58 +00:00
char tmp[MARS_PATH_MAX] = {};
2011-02-23 20:48:06 +00:00
snprintf(tmp, sizeof(tmp), "%s/log-%09d-%s", parent->d_path, rot->max_sequence + 1, my_id());
_create_new_logfile(tmp);
rot->create_once = true;
msleep(1000);
goto done;
}
/* Starting is only possible when no error ocurred.
*/
if (!rot->relevant_log || rot->has_error) {
MARS_DBG("nothing to do\n");
goto done;
}
/* Start when necessary
*/
if (!trans_brick->power.button && !trans_brick->power.led_on && trans_brick->power.led_off) {
bool do_start = (!rot->do_replay || rot->start_pos != rot->end_pos);
MARS_DBG("do_start = %d\n", (int)do_start);
if (do_start) {
status = _start_trans(rot);
rot->current_log = rot->relevant_log;
}
} else {
MARS_DBG("trans_brick %d %d %d\n", trans_brick->power.button, trans_brick->power.led_on, trans_brick->power.led_off);
}
done:
return status;
}
///////////////////////////////////////////////////////////////////////
// specific handlers
static
2011-02-28 18:00:32 +00:00
int make_primary(void *buf, struct mars_dent *dent)
2011-02-23 20:48:06 +00:00
{
2011-02-28 18:00:32 +00:00
struct mars_dent *parent;
2011-02-27 14:17:58 +00:00
struct mars_rotate *rot;
2011-02-23 20:48:06 +00:00
int status = -EINVAL;
2011-02-27 14:17:58 +00:00
parent = dent->d_parent;
CHECK_PTR(parent, done);
rot = parent->d_private;
2011-02-23 20:48:06 +00:00
CHECK_PTR(rot, done);
rot->is_primary = (dent->new_link && !strcmp(dent->new_link, my_id()));
status = 0;
done:
return status;
}
static
2011-02-28 18:00:32 +00:00
int make_aio(void *buf, struct mars_dent *dent)
2011-02-23 20:48:06 +00:00
{
struct mars_global *global = buf;
struct mars_brick *brick;
struct device_aio_brick *_brick;
2011-02-27 14:17:58 +00:00
int status = 0;
2011-02-23 20:48:06 +00:00
2011-02-27 14:17:58 +00:00
if (!global->global_power.button || !dent->d_activate) {
goto done;
2011-02-23 20:48:06 +00:00
}
if (mars_find_brick(global, &device_aio_brick_type, dent->d_path)) {
2011-02-27 14:17:58 +00:00
goto done;
2011-02-23 20:48:06 +00:00
}
2011-02-27 14:17:58 +00:00
dent->d_kill_inactive = true;
2011-03-01 09:34:36 +00:00
brick =
make_brick_all(global,
NULL,
dent->d_parent,
10 * HZ,
dent->d_path,
(const struct generic_brick_type*)&device_aio_brick_type,
(const struct generic_brick_type*[]){},
dent->d_path,
(const char *[]){},
0);
2011-02-27 14:17:58 +00:00
if (unlikely(!brick)) {
status = -ENXIO;
goto done;
}
2011-02-23 20:48:06 +00:00
brick->outputs[0]->output_name = dent->d_path;
_brick = (void*)brick;
_brick->outputs[0]->o_fdsync = true;
2011-02-28 18:00:32 +00:00
status = mars_power_button((void*)brick, true);
2011-02-23 20:48:06 +00:00
if (status < 0) {
2011-02-28 18:00:32 +00:00
kill_all(buf, dent);
2011-02-23 20:48:06 +00:00
}
2011-02-27 14:17:58 +00:00
done:
2011-02-23 20:48:06 +00:00
return status;
}
2011-02-28 18:00:32 +00:00
static int make_dev(void *buf, struct mars_dent *dent)
2011-02-23 20:48:06 +00:00
{
struct mars_global *global = buf;
2011-02-28 18:00:32 +00:00
struct mars_dent *parent = dent->d_parent;
2011-02-23 20:48:06 +00:00
struct mars_rotate *rot = parent->d_private;
struct mars_brick *dev_brick;
int status = 0;
if (!global->global_power.button || !dent->d_parent || !dent->new_link) {
MARS_DBG("nothing to do\n");
goto done;
}
status = make_log_finalize(global, dent->d_parent);
if (status < 0) {
MARS_DBG("logger not initialized\n");
goto done;
}
if (!rot || !rot->is_primary) {
MARS_DBG("I am not primary, don't show the device\n");
goto done;
}
if (!rot->trans_brick || rot->trans_brick->do_replay || !rot->trans_brick->power.led_on || rot->trans_brick->power.led_off) {
MARS_DBG("transaction logger not ready for writing\n");
goto done;
}
status = _parse_args(dent, dent->new_link, 1);
if (status < 0) {
2011-03-01 09:34:36 +00:00
MARS_DBG("fail\n");
2011-02-23 20:48:06 +00:00
goto done;
}
2011-03-01 09:34:36 +00:00
dev_brick =
make_brick_all(global,
dent->d_parent,
dent,
10 * HZ,
dent->d_path,
(const struct generic_brick_type*)&if_device_brick_type,
(const struct generic_brick_type*[]){(const struct generic_brick_type*)&trans_logger_brick_type},
dent->d_argv[0],
(const char *[]){"/logger"},
1);
2011-02-23 20:48:06 +00:00
if (!dev_brick) {
2011-03-01 09:34:36 +00:00
MARS_DBG("fail\n");
return -1;
2011-02-23 20:48:06 +00:00
}
2011-02-27 14:17:58 +00:00
dev_brick->log_level = 1;
2011-02-23 20:48:06 +00:00
done:
return status;
}
2011-02-28 18:00:32 +00:00
static int _make_direct(void *buf, struct mars_dent *dent)
2011-02-23 20:48:06 +00:00
{
struct mars_global *global = buf;
struct mars_brick *brick;
int status;
if (!global->global_power.button || !dent->d_parent || !dent->new_link) {
return 0;
}
status = _parse_args(dent, dent->new_link, 2);
if (status < 0) {
goto done;
}
2011-03-01 09:34:36 +00:00
brick =
make_brick_all(global,
dent->d_parent,
dent,
10 * HZ,
dent->d_argv[0],
(const struct generic_brick_type*)&device_aio_brick_type,
(const struct generic_brick_type*[]){},
dent->d_argv[0],
(const char *[]){},
0);
status = -1;
2011-02-23 20:48:06 +00:00
if (!brick) {
2011-03-01 09:34:36 +00:00
MARS_DBG("fail\n");
goto done;
2011-02-23 20:48:06 +00:00
}
2011-03-01 09:34:36 +00:00
brick =
make_brick_all(global,
dent->d_parent,
dent,
10 * HZ,
dent->d_argv[1],
(const struct generic_brick_type*)&if_device_brick_type,
(const struct generic_brick_type*[]){NULL},
dent->d_argv[1],
(const char *[]){dent->d_argv[0]},
1);
status = -1;
2011-02-23 20:48:06 +00:00
if (!brick) {
2011-03-01 09:34:36 +00:00
MARS_DBG("fail\n");
goto done;
2011-02-23 20:48:06 +00:00
}
2011-03-01 09:34:36 +00:00
2011-02-23 20:48:06 +00:00
status = 0;
done:
MARS_DBG("status = %d\n", status);
return status;
}
2011-02-28 18:00:32 +00:00
static int _make_copy(void *buf, struct mars_dent *dent)
2011-02-23 20:48:06 +00:00
{
2011-02-25 11:46:38 +00:00
struct mars_global *global = buf;
int status;
2011-02-23 20:48:06 +00:00
2011-02-25 11:46:38 +00:00
if (!global->global_power.button || !dent->d_parent || !dent->new_link) {
return 0;
2011-02-23 20:48:06 +00:00
}
2011-02-25 11:46:38 +00:00
status = _parse_args(dent, dent->new_link, 2);
if (status < 0) {
goto done;
2011-02-23 20:48:06 +00:00
}
2011-03-01 09:34:36 +00:00
status = __make_copy(global, dent->d_parent, dent, dent->d_path, (const char**)dent->d_argv, -1, NULL);
2011-02-23 20:48:06 +00:00
done:
MARS_DBG("status = %d\n", status);
return status;
}
2011-02-28 18:00:32 +00:00
static int make_sync(void *buf, struct mars_dent *dent)
2011-02-23 20:48:06 +00:00
{
struct mars_global *global = buf;
2011-02-25 11:46:38 +00:00
loff_t start_pos = 0;
2011-02-28 18:00:32 +00:00
struct mars_dent *connect_dent;
2011-02-25 11:46:38 +00:00
char *peer;
struct copy_brick *copy = NULL;
2011-02-27 14:17:58 +00:00
char src[MARS_PATH_MAX];
char dst[MARS_PATH_MAX];
2011-02-25 11:46:38 +00:00
const char *argv[2] = { src, dst };
2011-02-23 20:48:06 +00:00
int status;
2011-02-27 14:17:58 +00:00
if (!global->global_power.button || !dent->d_activate || !dent->d_parent || !dent->new_link) {
2011-02-23 20:48:06 +00:00
return 0;
}
2011-02-25 11:46:38 +00:00
/* Analyze replay position
*/
status = sscanf(dent->new_link, "%lld", &start_pos);
if (status != 1) {
MARS_ERR("bad syncstatus symlink syntax '%s' (%s)\n", dent->new_link, dent->d_path);
status = -EINVAL;
goto done;
}
2011-02-27 14:17:58 +00:00
dent->d_kill_inactive = true;
2011-02-25 11:46:38 +00:00
/* Determine peer
*/
snprintf(src, sizeof(src), "%s/connect-%s", dent->d_parent->d_path, my_id());
connect_dent = (void*)mars_find_dent(global, src);
if (!connect_dent || !connect_dent->new_link) {
MARS_ERR("cannot determine peer, symlink '%s' is missing\n", src);
status = -ENOENT;
2011-02-23 20:48:06 +00:00
goto done;
}
2011-02-27 14:17:58 +00:00
connect_dent->d_kill_inactive = true;
if (!connect_dent->d_activate) {
MARS_DBG("sync paused: symlink '%s' is deactivated\n", src);
status = 0;
goto done;
}
2011-02-25 11:46:38 +00:00
peer = connect_dent->new_link;
/* Start copy
*/
2011-03-01 09:34:36 +00:00
snprintf(src, sizeof(src), "%s/data-%s@%s", dent->d_parent->d_path, peer, peer);
2011-02-25 11:46:38 +00:00
snprintf(dst, sizeof(dst), "%s/data-%s", dent->d_parent->d_path, my_id());
MARS_DBG("starting initial sync '%s' => '%s'\n", src, dst);
2011-03-01 09:34:36 +00:00
status = __make_copy(global, dent->d_parent, dent, dent->d_path, argv, start_pos, &copy);
2011-02-23 20:48:06 +00:00
2011-02-25 11:46:38 +00:00
/* Update syncstatus symlink
*/
if (status >= 0 && copy && copy->power.button && copy->power.led_on) {
snprintf(src, sizeof(src), "%lld", copy->copy_last);
snprintf(dst, sizeof(dst), "%s/syncstatus-%s", dent->d_parent->d_path, my_id());
2011-02-27 14:17:58 +00:00
status = mars_symlink(src, dst, NULL, 0);
2011-02-25 11:46:38 +00:00
if (status >= 0 && copy->copy_last == copy->copy_end) {
2011-02-28 18:00:32 +00:00
status = mars_power_button((void*)copy, false);
2011-02-25 11:46:38 +00:00
MARS_DBG("copy switch status = %d\n", status);
}
}
2011-02-23 20:48:06 +00:00
done:
MARS_DBG("status = %d\n", status);
return status;
}
///////////////////////////////////////////////////////////////////////
// the order is important!
enum {
2011-02-25 11:46:38 +00:00
// root element: this must have index 0
CL_ROOT,
// replacement for DNS in kernelspace
2011-02-23 20:48:06 +00:00
CL_IPS,
CL_PEERS,
2011-02-25 11:46:38 +00:00
// resource definitions
2011-02-23 20:48:06 +00:00
CL_RESOURCE,
2011-02-25 11:46:38 +00:00
CL_CONNECT,
2011-02-23 20:48:06 +00:00
CL_DATA,
CL_PRIMARY,
CL__FILE,
CL_SYNC,
CL__COPY,
CL__REMOTE,
CL__DIRECT,
CL_REPLAYSTATUS,
CL_LOG,
CL_DEVICE,
};
/* Please keep the order the same as in the enum.
*/
static const struct light_class light_classes[] = {
/* Placeholder for root node /mars/
*/
[CL_ROOT] = {
},
/* Directory containing the addresses of all peers
*/
[CL_IPS] = {
.cl_name = "ips",
.cl_len = 3,
.cl_type = 'd',
.cl_father = CL_ROOT,
2011-02-24 16:37:32 +00:00
#if 0
2011-02-23 20:48:06 +00:00
.cl_forward = make_scan,
.cl_backward = kill_scan,
#endif
},
/* Anyone participating in a MARS cluster must
* be named here (symlink pointing to the IP address).
* We have no DNS in kernel space.
*/
[CL_PEERS] = {
.cl_name = "ip-",
.cl_len = 3,
.cl_type = 'l',
.cl_father = CL_IPS,
2011-02-24 16:37:32 +00:00
#if 1
.cl_forward = make_scan,
.cl_backward = kill_scan,
#endif
2011-02-23 20:48:06 +00:00
},
/* Directory containing all items of a resource
*/
[CL_RESOURCE] = {
.cl_name = "resource-",
.cl_len = 9,
.cl_type = 'd',
.cl_father = CL_ROOT,
.cl_forward = make_log_init,
.cl_backward = NULL,
},
2011-02-25 11:46:38 +00:00
/* Symlink indicating the current peer
*/
[CL_CONNECT] = {
.cl_name = "connect-",
.cl_len = 8,
.cl_type = 'l',
.cl_hostcontext = true,
.cl_father = CL_RESOURCE,
.cl_forward = NULL,
.cl_backward = NULL,
},
2011-02-23 20:48:06 +00:00
/* File or symlink to the real device / real (sparse) file
* when hostcontext is missing, the corresponding peer will
* not participate in that resource.
*/
[CL_DATA] = {
.cl_name = "data-",
.cl_len = 5,
.cl_type = 'F',
.cl_hostcontext = true,
.cl_father = CL_RESOURCE,
.cl_forward = make_aio,
2011-02-28 18:00:32 +00:00
.cl_backward = kill_all,
2011-02-23 20:48:06 +00:00
},
/* Symlink pointing to the name of the primary node
*/
[CL_PRIMARY] = {
.cl_name = "primary",
.cl_len = 7,
.cl_type = 'l',
.cl_hostcontext = false,
.cl_father = CL_RESOURCE,
.cl_forward = make_primary,
.cl_backward = NULL,
},
/* Only for testing: open local file
*/
[CL__FILE] = {
.cl_name = "_file-",
.cl_len = 6,
.cl_type = 'F',
.cl_serial = true,
.cl_hostcontext = true,
.cl_father = CL_RESOURCE,
.cl_forward = make_aio,
2011-02-28 18:00:32 +00:00
.cl_backward = kill_all,
2011-02-23 20:48:06 +00:00
},
/* symlink indicating the current status / end
* of initial data sync.
*/
[CL_SYNC] = {
.cl_name = "syncstatus-",
.cl_len = 11,
.cl_type = 'l',
.cl_hostcontext = true,
.cl_father = CL_RESOURCE,
2011-02-25 11:46:38 +00:00
#if 1
2011-02-23 20:48:06 +00:00
.cl_forward = make_sync,
2011-02-28 18:00:32 +00:00
.cl_backward = kill_all,
2011-02-23 20:48:06 +00:00
#endif
},
/* Only for testing: make a copy instance
*/
[CL__COPY] = {
.cl_name = "_copy-",
.cl_len = 6,
.cl_type = 'l',
.cl_serial = true,
.cl_hostcontext = true,
.cl_father = CL_RESOURCE,
.cl_forward = _make_copy,
.cl_backward = kill_all,
},
/* Only for testing: access remote data directly
*/
[CL__REMOTE] = {
.cl_name = "_remote-",
.cl_len = 8,
.cl_type = 'l',
.cl_serial = true,
.cl_hostcontext = true,
.cl_father = CL_RESOURCE,
.cl_forward = _make_remote,
.cl_backward = _kill_remote,
},
/* Only for testing: access local data
*/
[CL__DIRECT] = {
.cl_name = "_direct-",
.cl_len = 8,
.cl_type = 'l',
.cl_serial = true,
.cl_hostcontext = true,
.cl_father = CL_RESOURCE,
.cl_forward = _make_direct,
.cl_backward = kill_all,
},
/* Passive symlink indicating the last state of
* transaction log replay.
*/
[CL_REPLAYSTATUS] = {
.cl_name = "replay-",
.cl_len = 7,
.cl_type = 'l',
.cl_hostcontext = true,
.cl_father = CL_RESOURCE,
2011-02-27 14:17:58 +00:00
#if 0
.cl_forward = make_replay,
.cl_backward = kill_all,
#endif
2011-02-23 20:48:06 +00:00
},
/* Logfiles for transaction logger
*/
[CL_LOG] = {
.cl_name = "log-",
.cl_len = 4,
.cl_type = 'F',
.cl_serial = true,
.cl_hostcontext = true,
.cl_father = CL_RESOURCE,
#if 1
.cl_forward = make_log,
.cl_backward = kill_all,
#endif
},
/* Name of the device appearing at the primary
*/
[CL_DEVICE] = {
.cl_name = "device-",
.cl_len = 7,
.cl_type = 'l',
.cl_hostcontext = true,
.cl_father = CL_RESOURCE,
.cl_forward = make_dev,
2011-02-28 18:00:32 +00:00
.cl_backward = kill_all,
2011-02-23 20:48:06 +00:00
},
{}
};
/* Helper routine to pre-determine the relevance of a name from the filesystem.
*/
static int light_checker(const char *path, const char *_name, int namlen, unsigned int d_type, int *prefix, int *serial)
{
char name[namlen+1];
int class;
memcpy(name, _name, namlen);
name[namlen] = '\0';
//MARS_DBG("trying '%s' '%s'\n", path, name);
for (class = CL_ROOT + 1; ; class++) {
const struct light_class *test = &light_classes[class];
int len = test->cl_len;
if (!len || !test->cl_name)
break;
//MARS_DBG(" testing class '%s'\n", test->cl_name);
#if 0
if (len != strlen(test->cl_name)) {
MARS_ERR("internal table '%s': %d != %d\n", test->cl_name, len, (int)strlen(test->cl_name));
len = strlen(test->cl_name);
}
#endif
if (namlen >= len && !memcmp(name, test->cl_name, len)) {
//MARS_DBG("path '%s/%s' matches class %d '%s'\n", path, name, class, test->cl_name);
// special contexts
if (test->cl_serial) {
int plus = 0;
int count;
count = sscanf(name+len, "%d%n", serial, &plus);
if (count < 1) {
//MARS_DBG("'%s' serial number mismatch at '%s'\n", name, name+len);
return -1;
}
len += plus;
if (name[len] == '-')
len++;
}
*prefix = len;
if (test->cl_hostcontext) {
if (memcmp(name+len, my_id(), namlen-len)) {
//MARS_DBG("context mismatch '%s' at '%s'\n", name, name+len);
return -1;
}
}
return class;
}
}
//MARS_DBG("no match for '%s' '%s'\n", path, name);
return -2;
}
/* Do some syntactic checks, then delegate work to the real worker functions
* from the light_classes[] table.
*/
static int light_worker(struct mars_global *global, struct mars_dent *dent, bool direction)
{
light_worker_fn worker;
int class = dent->d_class;
if (class < 0 || class >= sizeof(light_classes)/sizeof(struct light_class)) {
MARS_ERR_ONCE(dent, "bad internal class %d of '%s'\n", class, dent->d_path);
return -EINVAL;
}
switch (light_classes[class].cl_type) {
case 'd':
if (!S_ISDIR(dent->new_stat.mode)) {
MARS_ERR_ONCE(dent, "'%s' should be a directory, but is something else\n", dent->d_path);
return -EINVAL;
}
break;
case 'f':
if (!S_ISREG(dent->new_stat.mode)) {
MARS_ERR_ONCE(dent, "'%s' should be a regular file, but is something else\n", dent->d_path);
return -EINVAL;
}
break;
case 'F':
if (!S_ISREG(dent->new_stat.mode) && !S_ISLNK(dent->new_stat.mode)) {
MARS_ERR_ONCE(dent, "'%s' should be a regular file or a symlink, but is something else\n", dent->d_path);
return -EINVAL;
}
break;
case 'l':
if (!S_ISLNK(dent->new_stat.mode)) {
MARS_ERR_ONCE(dent, "'%s' should be a symlink, but is something else\n", dent->d_path);
return -EINVAL;
}
break;
}
if (likely(class > CL_ROOT)) {
int father = light_classes[class].cl_father;
if (father == CL_ROOT) {
if (unlikely(dent->d_parent)) {
MARS_ERR_ONCE(dent, "'%s' is not at the root of the hierarchy\n", dent->d_path);
return -EINVAL;
}
} else if (unlikely(!dent->d_parent || dent->d_parent->d_class != father)) {
MARS_ERR_ONCE(dent, "last component '%s' from '%s' is at the wrong position in the hierarchy (class = %d, parent_class = %d, parent = '%s')\n", dent->d_name, dent->d_path, father, dent->d_parent ? dent->d_parent->d_class : -9999, dent->d_parent ? dent->d_parent->d_path : "");
return -EINVAL;
}
}
if (direction) {
worker = light_classes[class].cl_backward;
} else {
worker = light_classes[class].cl_forward;
}
if (worker) {
int status;
//MARS_DBG("working %s on '%s' rest='%s'\n", direction ? "backward" : "forward", dent->d_path, dent->d_rest);
status = worker(global, (void*)dent);
MARS_DBG("worked %s on '%s', status = %d\n", direction ? "backward" : "forward", dent->d_path, status);
return status;
}
return 0;
}
static int light_thread(void *data)
{
char *id = my_id();
int status = 0;
struct mars_global global = {
.dent_anchor = LIST_HEAD_INIT(global.dent_anchor),
.brick_anchor = LIST_HEAD_INIT(global.brick_anchor),
.global_power = {
.button = true,
},
.mutex = __SEMAPHORE_INITIALIZER(global.mutex, 1),
.main_event = __WAIT_QUEUE_HEAD_INITIALIZER(global.main_event),
};
mars_global = &global; // TODO: cleanup, avoid stack
if (!id || strlen(id) < 2) {
MARS_ERR("invalid hostname\n");
status = -EFAULT;
goto done;
}
fake_mm();
MARS_INF("-------- starting as host '%s' ----------\n", id);
while (global.global_power.button || !list_empty(&global.brick_anchor)) {
int status;
global.global_power.button = !kthread_should_stop();
2011-02-28 18:00:32 +00:00
status = mars_dent_work(&global, "/mars", sizeof(struct mars_dent), light_checker, light_worker, &global, 3);
2011-02-23 20:48:06 +00:00
MARS_DBG("worker status = %d\n", status);
2011-02-27 14:17:58 +00:00
{
struct list_head *tmp;
down(&global.mutex);
for (tmp = global.brick_anchor.next; tmp != &global.brick_anchor; tmp = tmp->next) {
struct mars_brick *test;
const char *path;
int pos;
char *src;
char dst[MARS_PATH_MAX];
2011-03-01 09:34:36 +00:00
test = container_of(tmp, struct mars_brick, global_brick_link);
2011-02-27 14:17:58 +00:00
if (test->log_level <= 0)
continue;
path = test->brick_path;
if (!path || *path != '/')
continue;
pos = strlen(path);
while (pos > 0 && path[pos] != '/') pos--;
memcpy(dst, path, pos);
snprintf(dst + pos, sizeof(dst) - pos, "/actual.%s", path + pos + 1);
src = test->power.led_on ? "1" : "0";
status = mars_symlink(src, dst, NULL, 0);
MARS_DBG("status symlink '%s' -> '%s' status = %d\n", dst, src, status);
if (test->log_level > 1) {
char perc[8];
pos = strlen(dst);
strncpy(dst + pos, ".percent", sizeof(dst) - pos);
snprintf(perc, sizeof(perc), "%d", test->power.percent_done);
status = mars_symlink(perc, dst, NULL, 0);
MARS_DBG("percent symlink '%s' -> '%s' status = %d\n", dst, src, status);
}
}
up(&global.mutex);
}
2011-02-23 20:48:06 +00:00
wait_event_interruptible_timeout(global.main_event, global.main_trigger, 30 * HZ);
global.main_trigger = false;
#ifdef MARS_DEBUGGING
{
struct list_head *tmp;
int dent_count = 0;
int brick_count = 0;
down(&global.mutex);
MARS_IO("----------- lists:\n");
for (tmp = global.dent_anchor.next; tmp != &global.dent_anchor; tmp = tmp->next) {
struct mars_dent *dent;
2011-03-01 09:34:36 +00:00
dent = container_of(tmp, struct mars_dent, dent_link);
2011-02-23 20:48:06 +00:00
MARS_IO("dent '%s'\n", dent->d_path);
dent_count++;
}
for (tmp = global.brick_anchor.next; tmp != &global.brick_anchor; tmp = tmp->next) {
struct mars_brick *test;
2011-03-01 09:34:36 +00:00
test = container_of(tmp, struct mars_brick, global_brick_link);
2011-02-27 14:17:58 +00:00
MARS_IO("brick type = %s path = '%s' name = '%s' button = %d on = %d off = %d\n", test->type->type_name, test->brick_path, test->brick_name, test->power.button, test->power.led_on, test->power.led_off);
2011-02-23 20:48:06 +00:00
brick_count++;
}
up(&global.mutex);
MARS_INF("----------- STATISTICS: %d dents, %d bricks\n", dent_count, brick_count);
}
msleep(500);
#endif
}
done:
MARS_INF("-------- cleaning up ----------\n");
2011-03-01 09:34:36 +00:00
mars_free_dent_all(&global.dent_anchor);
2011-02-23 20:48:06 +00:00
cleanup_mm();
mars_global = NULL;
main_thread = NULL;
MARS_INF("-------- done status = %d ----------\n", status);
return status;
}
static void __exit exit_light(void)
{
// TODO: make this thread-safe.
struct task_struct *thread = main_thread;
if (thread) {
main_thread = NULL;
MARS_DBG("====================== stopping everything...\n");
kthread_stop_nowait(thread);
mars_trigger();
kthread_stop(thread);
put_task_struct(thread);
MARS_DBG("====================== stopped everything.\n");
}
}
static int __init init_light(void)
{
struct task_struct *thread;
thread = kthread_create(light_thread, NULL, "mars_light");
if (IS_ERR(thread)) {
return PTR_ERR(thread);
}
get_task_struct(thread);
main_thread = thread;
wake_up_process(thread);
return 0;
}
MODULE_DESCRIPTION("MARS Light");
MODULE_AUTHOR("Thomas Schoebel-Theuer <tst@1und1.de>");
MODULE_LICENSE("GPL");
module_init(init_light);
module_exit(exit_light);