mars/kernel/mars_copy.c

1283 lines
33 KiB
C
Raw Normal View History

2014-11-21 10:51:34 +00:00
/*
* MARS Long Distance Replication Software
*
* This file is part of MARS project: http://schoebel.github.io/mars/
*
* Copyright (C) 2010-2014 Thomas Schoebel-Theuer
* Copyright (C) 2011-2014 1&1 Internet AG
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License along
* with this program; if not, write to the Free Software Foundation, Inc.,
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
*/
2011-02-23 20:48:06 +00:00
// Copy brick (just for demonstration)
//#define BRICK_DEBUGGING
//#define MARS_DEBUGGING
//#define IO_DEBUGGING
#include <linux/kernel.h>
#include <linux/module.h>
#include <linux/string.h>
#include "mars.h"
#include "lib_limiter.h"
2011-02-23 20:48:06 +00:00
2012-02-22 13:34:04 +00:00
/* Fallback definitions of the IO direction constants, only taking
 * effect when READ has not been defined before this point.
 */
#ifndef READ
#define READ 0
#define WRITE 1
#endif
/* Granularity of a single copy request: one page. */
#define COPY_CHUNK (PAGE_SIZE)
2017-04-03 10:24:18 +00:00
/* Number of slots in the state table: as many chunks as fit into 128 MiB. */
#define NR_COPY_REQUESTS (128 * 1024 * 1024 / COPY_CHUNK)
/* Number of struct copy_state entries fitting into one page-sized sub-table. */
#define STATES_PER_PAGE (PAGE_SIZE / sizeof(struct copy_state))
/* Number of sub-tables needed for NR_COPY_REQUESTS entries, rounded up. */
#define MAX_SUB_TABLES (NR_COPY_REQUESTS / STATES_PER_PAGE + (NR_COPY_REQUESTS % STATES_PER_PAGE ? 1 : 0))
/* Access the struct copy_state of a slot through the two-level table
 * brick->st[sub_table][entry]. The index is not range-checked here.
 */
#define GET_STATE(brick,index) \
2021-04-16 08:17:01 +00:00
((brick)->st[(unsigned)(index) / STATES_PER_PAGE][(unsigned)(index) % STATES_PER_PAGE])
2011-02-23 20:48:06 +00:00
///////////////////////// own type definitions ////////////////////////
#include "mars_copy.h"
/* When non-zero, a slot is marked as written out as soon as its write
 * request has been submitted (see the COPY_STATE_WRITE handling),
 * instead of only after the write has completed.
 */
int mars_copy_overlap = 1;
EXPORT_SYMBOL_GPL(mars_copy_overlap);
2017-05-18 12:18:54 +00:00
/* Always leave at 1, disable only for throughput _testing_ */
int mars_copy_strict_write_order = 1;
/* Subtracted from the seconds of the current time when checking for
 * missing progress in the copy thread: after that many seconds without
 * progress, the copy is aborted.
 */
int mars_copy_timeout = 180;
/* Priorities assigned to newly created read / write requests.
 * Values outside of [MARS_PRIO_HIGH, MARS_PRIO_LOW] are replaced by
 * brick->io_prio in _make_mref().
 */
int mars_copy_read_prio = MARS_PRIO_NORMAL;
EXPORT_SYMBOL_GPL(mars_copy_read_prio);
int mars_copy_write_prio = MARS_PRIO_NORMAL;
EXPORT_SYMBOL_GPL(mars_copy_write_prio);
2017-04-11 06:31:56 +00:00
/* Upper bounds for the global number of read / write requests in
 * flight. A value <= 0 disables the respective limit.
 */
int mars_copy_read_max_fly = 32768;
2013-07-22 07:15:53 +00:00
EXPORT_SYMBOL_GPL(mars_copy_read_max_fly);
2017-04-11 06:31:56 +00:00
int mars_copy_write_max_fly = 32768;
2013-07-22 07:15:53 +00:00
EXPORT_SYMBOL_GPL(mars_copy_write_max_fly);
2017-04-11 06:27:24 +00:00
/* Global counters of requests in flight: incremented in _make_mref()
 * and decremented in copy_endio().
 */
atomic_t global_copy_read_flight;
atomic_t global_copy_write_flight;
2013-07-22 07:15:53 +00:00
/* True when the global read limit is enabled and reached.
 * The brick argument is not used.
 */
#define is_read_limited(brick) \
2017-04-11 06:27:24 +00:00
(mars_copy_read_max_fly > 0 && atomic_read(&global_copy_read_flight) >= mars_copy_read_max_fly)
2013-07-22 07:15:53 +00:00
/* True when the global write limit is enabled and reached.
 * The brick argument is not used.
 */
#define is_write_limited(brick) \
2017-04-11 06:27:24 +00:00
(mars_copy_write_max_fly > 0 && atomic_read(&global_copy_write_flight) >= mars_copy_write_max_fly)
2013-07-22 07:15:53 +00:00
2011-02-23 20:48:06 +00:00
///////////////////////// own helper functions ////////////////////////
/* TODO:
* The clash logic is untested / alpha stage (Feb. 2011).
*
* For now, the output is never used, so this cannot do harm.
*
* In order to get the output really working / enterprise grade,
* some larger test effort should be invested.
*/
/* Flag a clash on the brick and wake up whoever waits on brick->event.
 *
 * Sets bit 0 of brick->clash, increments the clash statistics counter,
 * raises brick->trigger, and finally issues the wakeup.
 */
static inline
void _clash(struct copy_brick *brick)
{
	set_bit(0, &brick->clash);
	atomic_inc(&brick->total_clash_count);

	WRITE_ONCE(brick->trigger, true);
	wake_up_interruptible(&brick->event);
}
/* Atomically clear the clash flag (bit 0 of brick->clash).
 *
 * Returns the previous value of the flag: non-zero when a clash
 * had been pending, 0 otherwise.
 */
static inline
int _clear_clash(struct copy_brick *brick)
{
	return test_and_clear_bit(0, &brick->clash);
}
2021-07-12 08:29:40 +00:00
/* Current semantics (NOT REALLY IMPLEMENTED because OUTPUT IS NOT IN USE)
2011-02-23 20:48:06 +00:00
*
2021-07-12 08:29:40 +00:00
* All writes from the OUTPUT are always going to the original input A. They are _not_
2011-02-23 20:48:06 +00:00
* replicated to B.
*
* In order to get B really up to date, you have to replay the right
* transaction logs there (at the right time).
* [If you had no writes on A at all during the copy, of course
* this is not necessary]
*
2011-05-26 14:32:32 +00:00
* When utilize_mode is on, reads can utilize the already copied
2011-02-23 20:48:06 +00:00
* region from B, but only as long as this region has not been
* invalidated by writes (indicated by low_dirty).
*
* TODO: implement replicated writes, together with some transaction
* replay logic applying the transaction logs _only_ after
* crashes during inconsistency caused by partial replication of writes.
*/
2011-02-23 20:48:06 +00:00
static
struct copy_input *_determine_input(struct copy_brick *brick, struct mref_object *mref)
2011-02-23 20:48:06 +00:00
{
struct copy_mref_aspect *mref_a;
2011-02-23 20:48:06 +00:00
mref_a = copy_mref_get_aspect(brick, mref);
if (unlikely(!mref_a)) {
MARS_FAT("cannot get own aspect from %p %p\n",
brick, mref);
return NULL;
}
/* TODO: implement the new logic, for the envisioned
* new use cases.
*/
return mref_a->input;
2011-02-23 20:48:06 +00:00
}
2021-04-16 08:33:51 +00:00
/* Map a byte position to its slot number in the state table: the chunk
 * number of the position, wrapped around modulo NR_COPY_REQUESTS.
 */
#define GET_INDEX(pos) (((unsigned long)(pos) / COPY_CHUNK) % NR_COPY_REQUESTS)
/* Byte offset of a position inside its chunk. */
#define GET_OFFSET(pos) ((unsigned long)(pos) % COPY_CHUNK)
2011-02-23 20:48:06 +00:00
2012-01-23 12:39:08 +00:00
static
2021-04-16 08:24:31 +00:00
void __clear_mref(struct copy_brick *brick, struct mref_object *mref, unsigned queue)
2012-01-23 12:39:08 +00:00
{
struct copy_input *input;
2021-04-16 08:24:31 +00:00
2021-07-12 08:29:40 +00:00
input = queue ? brick->inputs[INPUT_B] : brick->inputs[INPUT_A];
2021-06-29 08:52:11 +00:00
GENERIC_INPUT_CALL_VOID(input, mref_put, mref);
2012-01-23 12:39:08 +00:00
}
static
2021-04-16 08:40:47 +00:00
void _clear_mref(struct copy_brick *brick, unsigned index, unsigned queue)
2012-01-23 12:39:08 +00:00
{
struct copy_state *st = &GET_STATE(brick, index);
struct mref_object *mref = READ_ONCE(st->table[queue]);
2012-01-23 12:39:08 +00:00
if (mref) {
/* This should never happen */
if (unlikely(READ_ONCE(st->active[queue]))) {
WRITE_ONCE(st->active[queue], false);
2021-04-16 08:40:47 +00:00
MARS_ERR("clearing active mref, index = %u queue = %u\n",
2021-04-16 08:24:31 +00:00
index, queue);
2012-12-20 16:54:22 +00:00
}
2012-01-23 12:39:08 +00:00
__clear_mref(brick, mref, queue);
WRITE_ONCE(st->table[queue], NULL);
2012-01-23 12:39:08 +00:00
}
}
static
void _clear_all_mref(struct copy_brick *brick)
{
2021-04-16 08:40:47 +00:00
unsigned i;
for (i = 0; i < NR_COPY_REQUESTS; i++) {
GET_STATE(brick, i).state = COPY_STATE_START;
2012-01-23 12:39:08 +00:00
_clear_mref(brick, i, 0);
_clear_mref(brick, i, 1);
}
}
static
void _clear_state_table(struct copy_brick *brick)
{
2021-04-16 08:17:01 +00:00
unsigned i;
for (i = 0; i < MAX_SUB_TABLES; i++) {
struct copy_state *sub_table = brick->st[i];
2021-04-16 08:17:01 +00:00
memset(sub_table, 0, PAGE_SIZE);
}
2022-05-19 20:32:08 +00:00
mb();
}
2011-02-23 20:48:06 +00:00
static
void copy_endio(struct generic_callback *cb)
{
struct copy_mref_aspect *mref_a;
struct mref_object *mref;
2017-04-07 05:56:28 +00:00
struct copy_input *input;
2011-02-23 20:48:06 +00:00
struct copy_brick *brick;
2011-06-10 13:57:52 +00:00
struct copy_state *st;
2022-05-19 20:32:08 +00:00
struct mref_object *old_mref;
2021-04-16 08:40:47 +00:00
unsigned index;
2022-05-19 21:56:57 +00:00
unsigned check_index;
2021-04-16 08:24:31 +00:00
unsigned queue;
2011-06-10 13:57:52 +00:00
int error = 0;
2011-02-23 20:48:06 +00:00
LAST_CALLBACK(cb);
2011-02-23 20:48:06 +00:00
mref_a = cb->cb_private;
CHECK_PTR(mref_a, err);
mref = mref_a->object;
CHECK_PTR(mref, err);
brick = mref_a->brick;
CHECK_PTR(brick, err);
2017-03-01 07:49:10 +00:00
/* This is racy, but affects only a _hint_ for
* performance optimization.
*/
2017-04-07 05:56:28 +00:00
input = mref_a->input;
if (input &&
(!input->check_hint || mref->ref_pos < input->check_hint))
input->check_hint = mref->ref_pos;
2017-02-25 16:42:37 +00:00
2022-05-19 21:56:57 +00:00
queue = mref_a->saved_queue;
index = mref_a->saved_index;
/* index paranoia */
check_index = GET_INDEX(mref_a->orig_ref_pos);
if (unlikely(check_index != index)) {
/* This should not happen */
MARS_ERR("index slippery %u != %u on queue=%u: mref=%p mref_a=%p cb=%p err=%d\n",
index, check_index,
queue,
mref, mref_a,
cb, cb->cb_error);
error = -EEXIST;
goto exit;
}
st = &GET_STATE(brick, index);
2011-06-10 13:57:52 +00:00
2022-05-19 20:32:08 +00:00
MARS_IO("queue=%u index=%u pos=%lld state=%d err=%d\n",
2021-04-16 08:24:31 +00:00
queue, index,
mref->ref_pos,
2022-05-19 20:32:08 +00:00
st->state,
2021-04-16 08:24:31 +00:00
cb->cb_error);
if (unlikely(queue >= 2)) {
2022-05-19 20:32:08 +00:00
MARS_ERR("bad queue %u at %p %p state=%d err=%d\n",
2021-04-16 08:24:31 +00:00
queue,
2022-05-19 20:32:08 +00:00
cb, mref_a,
st->state,
cb->cb_error);
2011-06-10 13:57:52 +00:00
error = -EINVAL;
2011-02-23 20:48:06 +00:00
goto exit;
}
2022-05-19 20:32:08 +00:00
old_mref = READ_ONCE(st->table[queue]);
if (unlikely(old_mref != mref)) {
2022-05-19 21:56:57 +00:00
MARS_ERR("table corruption at index=%u queue=%u: %p => %p state=%d err=%d\n",
2022-05-19 20:32:08 +00:00
index, queue,
old_mref, mref,
st->state,
cb->cb_error);
2011-06-10 13:57:52 +00:00
error = -EEXIST;
2011-02-23 20:48:06 +00:00
goto exit;
}
if (unlikely(cb->cb_error < 0)) {
2011-06-10 13:57:52 +00:00
error = cb->cb_error;
2012-08-22 12:37:34 +00:00
/* This is racy, but does no harm.
* Worst case just produces more error output.
*/
if (!brick->copy_error_count++) {
2022-05-19 20:32:08 +00:00
MARS_WRN("IO error on index=%u state=%d err=%d\n",
2021-04-16 08:40:47 +00:00
index,
2022-05-19 20:32:08 +00:00
st->state,
cb->cb_error);
2012-08-22 12:37:34 +00:00
}
2011-02-23 20:48:06 +00:00
}
exit:
if (unlikely(error < 0)) {
WRITE_ONCE(st->error, error);
2011-06-10 13:57:52 +00:00
_clash(brick);
}
WRITE_ONCE(st->active[queue], false);
if (mref->ref_flags & MREF_WRITE) {
2013-07-22 07:15:53 +00:00
atomic_dec(&brick->copy_write_flight);
2017-04-11 06:27:24 +00:00
atomic_dec(&global_copy_write_flight);
2013-07-22 07:15:53 +00:00
} else {
atomic_dec(&brick->copy_read_flight);
2017-04-11 06:27:24 +00:00
atomic_dec(&global_copy_read_flight);
2013-07-22 07:15:53 +00:00
}
WRITE_ONCE(brick->trigger, true);
2011-02-23 20:48:06 +00:00
wake_up_interruptible(&brick->event);
return;
err:
MARS_FAT("cannot handle callback\n");
}
static
2021-04-16 08:24:31 +00:00
int _make_mref(struct copy_brick *brick,
2022-05-19 21:56:57 +00:00
const unsigned index,
/* let the compiler check for 0 <= queue <= 1 */
const bool _queue,
2021-04-16 08:24:31 +00:00
void *data,
2019-03-25 08:12:45 +00:00
loff_t pos, loff_t end_pos,
__u32 flags)
2011-02-23 20:48:06 +00:00
{
struct mref_object *mref;
struct copy_mref_aspect *mref_a;
struct copy_input *input;
struct copy_state *st;
2022-05-19 20:32:08 +00:00
struct mref_object *old_mref;
2022-05-19 21:56:57 +00:00
const unsigned queue = _queue;
unsigned input_index;
2021-04-16 09:04:52 +00:00
unsigned offset;
unsigned len;
2012-02-22 13:34:04 +00:00
int status = -EAGAIN;
2011-02-23 20:48:06 +00:00
2022-05-19 20:32:08 +00:00
/* Does it make sense to create a new mref right here? */
2021-04-16 08:07:55 +00:00
if (brick->clash || pos < 0 || end_pos <= 0 || pos >= end_pos)
2011-02-23 20:48:06 +00:00
goto done;
2022-05-19 20:32:08 +00:00
/* Some safeguards */
if (unlikely(queue < 0 || queue >= 2)) {
MARS_ERR("trying bad queue %d\n",
queue);
status = -EINVAL;
goto done;
}
if (unlikely(index > NR_COPY_REQUESTS)) {
MARS_ERR("trying bad index=%u at queue=%d pos=%lld end_pos=%lld flags=%d\n",
index, queue, pos, end_pos, flags);
status = -EINVAL;
goto done;
}
st = &GET_STATE(brick, index);
old_mref = READ_ONCE(st->table[queue]);
if (unlikely(old_mref)) {
MARS_ERR("cannot overrride old_mref=%p at index=%u queue=%d pos=%lld end_pos=%lld flags=%d\n",
old_mref,
index, queue, pos, end_pos, flags);
status = -EEXIST;
goto done;
}
/* Now create the new mref and remember in st->table[] */
2012-02-02 15:25:43 +00:00
mref = copy_alloc_mref(brick);
2011-02-23 20:48:06 +00:00
status = -ENOMEM;
if (unlikely(!mref))
goto done;
mref_a = copy_mref_get_aspect(brick, mref);
2011-02-23 20:48:06 +00:00
if (unlikely(!mref_a)) {
2022-05-19 20:32:08 +00:00
MARS_FAT("cannot get aspect from %p %p\n",
brick, mref);
2011-02-23 20:48:06 +00:00
goto done;
}
2022-05-19 21:56:57 +00:00
/* Save some important values for the lifetime of
* of the mref object and the corresponding aspect instance.
*/
/*input = queue ? brick->inputs[INPUT_B] : brick->inputs[INPUT_A];*/
input_index = INPUT_A + (queue * (INPUT_B - INPUT_A));
input = brick->inputs[input_index];
mref_a->input = input;
2011-02-23 20:48:06 +00:00
mref_a->brick = brick;
2022-05-19 21:56:57 +00:00
mref_a->orig_ref_pos = pos;
mref_a->saved_queue = queue;
mref_a->saved_index = index;
/* Compute the start values for the new mref */
mref->ref_flags = flags;
2011-02-23 20:48:06 +00:00
mref->ref_data = data;
mref->ref_pos = pos;
2011-06-10 13:57:52 +00:00
offset = GET_OFFSET(pos);
len = COPY_CHUNK - offset;
2012-02-22 13:34:04 +00:00
if (pos + len > end_pos) {
2021-04-16 09:04:52 +00:00
unsigned new_len = end_pos - pos;
if (new_len < len)
len = new_len;
2011-02-23 20:48:06 +00:00
}
mref->ref_len = len;
mref->ref_prio = (flags & MREF_WRITE) ?
mars_copy_write_prio :
mars_copy_read_prio;
if (mref->ref_prio < MARS_PRIO_HIGH || mref->ref_prio > MARS_PRIO_LOW)
mref->ref_prio = brick->io_prio;
2021-03-01 10:01:37 +00:00
st->len = len;
WRITE_ONCE(st->table[queue], mref);
WRITE_ONCE(st->active[queue], true);
SETUP_CALLBACK(mref, copy_endio, mref_a);
2011-02-23 20:48:06 +00:00
status = GENERIC_INPUT_CALL(input, mref_get, mref);
if (unlikely(status < 0)) {
2021-04-16 09:04:52 +00:00
MARS_ERR("mref_get %u status = %d\n",
len, status);
2011-02-23 20:48:06 +00:00
mars_free_mref(mref);
goto done;
}
2021-04-16 09:04:52 +00:00
/* in general, mref_get() may deliver a shorter buffer */
2022-05-19 22:01:19 +00:00
if (mref->ref_len < len) {
2021-03-01 10:01:37 +00:00
st->len = mref->ref_len;
2022-05-19 22:01:19 +00:00
MARS_DBG("shorten len %d < %u at queue=%d index=%u\n",
mref->ref_len, len, queue, index);
2012-02-22 13:34:04 +00:00
}
2011-02-23 20:48:06 +00:00
if (flags & MREF_WRITE) {
2013-07-22 07:15:53 +00:00
atomic_inc(&brick->copy_write_flight);
2017-04-11 06:27:24 +00:00
atomic_inc(&global_copy_write_flight);
2013-07-22 07:15:53 +00:00
} else {
atomic_inc(&brick->copy_read_flight);
2017-04-11 06:27:24 +00:00
atomic_inc(&global_copy_read_flight);
2013-07-22 07:15:53 +00:00
}
2021-06-29 08:52:11 +00:00
GENERIC_INPUT_CALL_VOID(input, mref_io, mref);
2011-02-23 20:48:06 +00:00
done:
return status;
}
2011-03-07 05:55:10 +00:00
/* Publish the copy progress: copy_start, last_jiffies and
 * power.percent_done are updated, and an info message is logged.
 *
 * @force: when true, the update is always carried out.
 *
 * Without force, the update only happens when copy_last is more than
 * 8 MiB ahead of copy_start, or more than 5 * HZ jiffies have passed
 * since the last update, or copy_last has reached a positive copy_end.
 */
static
void _update_percent(struct copy_brick *brick, bool force)
{
	bool due = force;

	if (!due)
		due = brick->copy_last > brick->copy_start + 8 * 1024 * 1024;
	if (!due)
		due = (long long)jiffies > brick->last_jiffies + 5 * HZ;
	if (!due)
		due = brick->copy_last == brick->copy_end && brick->copy_end > 0;
	if (!due)
		return;

	brick->copy_start = brick->copy_last;
	brick->last_jiffies = jiffies;

	/* avoid division by zero when the end is not (yet) known */
	if (brick->copy_end > 0)
		brick->power.percent_done = brick->copy_start * 100 / brick->copy_end;
	else
		brick->power.percent_done = 0;

	MARS_INF("'%s' copied %lld / %lld bytes (%d%%)\n", brick->brick_path, brick->copy_last, brick->copy_end, brick->power.percent_done);
}
2019-03-25 08:12:45 +00:00
static inline
2019-03-26 09:57:33 +00:00
__u32 _make_flags(bool verify_mode, bool is_local)
2019-03-25 08:12:45 +00:00
{
if (!verify_mode)
return 0;
2019-03-26 09:57:33 +00:00
if (is_local)
return available_digest_mask | MREF_NODATA;
2019-07-23 07:41:42 +00:00
return (usable_digest_mask & ~disabled_net_digests) | MREF_NODATA;
2019-03-25 08:12:45 +00:00
}
2012-08-02 08:16:55 +00:00
/* The heart of this brick.
* State transition function of the finite automaton.
* In case no progress is possible (e.g. preconditions not
* yet true), the state is left as is (idempotence property:
* calling this too often does no harm, just costs performance).
*/
2011-02-23 20:48:06 +00:00
/* Advance the finite automaton of one slot of the state table.
 *
 * @brick: the copy brick owning the state table
 * @index: the slot to work on (see GET_STATE())
 * @pos:   position passed to _make_mref() for any request started here
 *
 * Whenever a case leaves the switch with a changed state, the switch
 * is re-entered with the new state (restart label). Cases which have
 * to wait jump to the idle label instead. The resulting state is
 * always stored in st->state before returning.
 *
 * Returns 1 when the stored state differs from the state found in the
 * slot, otherwise 0. Failures are not returned: they are recorded in
 * st->error (unless that already holds a negative value) and
 * reported via _clash().
 */
static
2021-04-16 08:40:47 +00:00
int _next_state(struct copy_brick *brick, unsigned index, loff_t pos)
2011-02-23 20:48:06 +00:00
{
2011-06-17 11:32:38 +00:00
struct mref_object *mref0;
2011-02-23 20:48:06 +00:00
struct mref_object *mref1;
2011-06-10 13:57:52 +00:00
struct copy_state *st;
enum _copy_state state;
enum _copy_state next_state;
2013-08-06 08:29:12 +00:00
bool do_restart = false;
2012-08-22 12:37:34 +00:00
int progress = 0;
2011-02-23 20:48:06 +00:00
int status;
st = &GET_STATE(brick, index);
2012-08-22 12:37:34 +00:00
next_state = st->state;
restart:
state = next_state;
2011-02-23 20:48:06 +00:00
2021-04-16 09:04:52 +00:00
MARS_IO("ENTER index=%u state=%d pos=%lld table[0]=%p table[1]=%p active[0]=%d active[1]=%d writeout=%d prev=%d len=%u error=%d do_restart=%d\n",
2013-08-06 08:29:12 +00:00
index,
state,
pos,
2022-05-19 20:32:08 +00:00
READ_ONCE(st->table[0]),
READ_ONCE(st->table[1]),
READ_ONCE(st->active[0]),
READ_ONCE(st->active[1]),
2013-08-06 08:29:12 +00:00
st->writeout,
st->prev,
st->len,
st->error,
do_restart);
/* Paths jumping to the idle label must not trigger a restart */
do_restart = false;
2011-02-23 20:48:06 +00:00
switch (state) {
case COPY_STATE_RESET:
/* This state is only entered after errors or
* in restarting situations.
*/
_clear_mref(brick, index, 1);
_clear_mref(brick, index, 0);
next_state = COPY_STATE_START;
/* fallthrough */
2011-02-23 20:48:06 +00:00
case COPY_STATE_START:
/* This is the regular starting state.
* It must be zero, automatically entered via memset()
*/
if ((unsigned long)READ_ONCE(st->table[0]) |
(unsigned long)READ_ONCE(st->table[1])) {
2021-04-16 08:40:47 +00:00
MARS_ERR("index %u not startable at pos=%lld\n",
index, pos);
2012-08-22 12:37:34 +00:00
progress = -EPROTO;
goto idle;
2011-02-23 20:48:06 +00:00
}
2012-02-22 13:34:04 +00:00
2012-12-20 16:54:22 +00:00
st->writeout = false;
WRITE_ONCE(st->error, 0);
2012-01-23 12:39:08 +00:00
2013-07-22 07:15:53 +00:00
/* Do not start new reads when aborting, or when
* the global read limit has been reached.
*/
if (brick->is_aborting ||
is_read_limited(brick))
goto idle;
2012-08-02 08:16:55 +00:00
2019-03-25 08:12:45 +00:00
/* Start the read on queue 0. In verify mode, the
* flags from _make_flags() include MREF_NODATA.
*/
status = _make_mref(brick, index, 0, NULL,
pos, brick->copy_end,
2019-03-26 09:57:33 +00:00
_make_flags(brick->verify_mode, false));
2012-02-22 13:34:04 +00:00
if (unlikely(status < 0)) {
2014-04-01 11:34:09 +00:00
MARS_DBG("status = %d\n", status);
2012-08-22 12:37:34 +00:00
progress = status;
break;
2012-02-22 13:34:04 +00:00
}
2011-02-23 20:48:06 +00:00
next_state = COPY_STATE_READ1;
2012-08-02 08:16:55 +00:00
if (!brick->verify_mode) {
break;
}
next_state = COPY_STATE_START2;
/* fallthrough */
case COPY_STATE_START2:
2019-03-25 08:12:45 +00:00
/* Verify mode: start a second read, on queue 1 */
status = _make_mref(brick, index, 1, NULL,
pos, brick->copy_end,
2019-03-26 09:57:33 +00:00
_make_flags(true, true));
2012-08-02 08:16:55 +00:00
if (unlikely(status < 0)) {
2014-04-01 11:34:09 +00:00
MARS_DBG("status = %d\n", status);
2012-08-22 12:37:34 +00:00
progress = status;
break;
2011-02-23 20:48:06 +00:00
}
next_state = COPY_STATE_READ2;
/* fallthrough */
2011-02-23 20:48:06 +00:00
case COPY_STATE_READ2:
if (READ_ONCE(st->active[1])) {
/* idempotence: wait by unchanged state */
goto idle;
2011-02-23 20:48:06 +00:00
}
2021-01-30 15:38:36 +00:00
/* wait for both mrefs to appear */
/* fallthrough */
2011-02-23 20:48:06 +00:00
case COPY_STATE_READ1:
2012-08-02 08:16:55 +00:00
case COPY_STATE_READ3:
if (READ_ONCE(st->active[0])) {
/* idempotence: wait by unchanged state */
goto idle;
2011-02-23 20:48:06 +00:00
}
mref0 = READ_ONCE(st->table[0]);
2013-07-15 10:12:54 +00:00
if (brick->copy_limiter) {
/* amount is the request length in KiB, rounded up */
int amount = (mref0->ref_len - 1) / 1024 + 1;
mars_limit_sleep(brick->copy_limiter, amount);
}
2011-06-17 11:32:38 +00:00
// on append mode: increase the end pointer dynamically
if (brick->append_mode > 0 && mref0->ref_total_size && mref0->ref_total_size > brick->copy_end) {
brick->copy_end = mref0->ref_total_size;
2011-05-26 14:32:32 +00:00
}
2011-06-17 11:32:38 +00:00
// do verify (when applicable)
mref1 = READ_ONCE(st->table[1]);
2012-08-02 08:16:55 +00:00
if (mref1 && state != COPY_STATE_READ3) {
2011-06-17 11:32:38 +00:00
int len = mref0->ref_len;
2012-08-02 08:16:55 +00:00
bool ok;
if (len != mref1->ref_len) {
ok = false;
2019-03-25 08:12:45 +00:00
} else if (mref0->ref_flags & MREF_CHKSUM_ANY) {
2012-08-02 08:16:55 +00:00
/* Compare checksums. An all-zero checksum
* does not count as a match.
*/
static unsigned char null[sizeof(mref0->ref_checksum)];
ok = !memcmp(mref0->ref_checksum, mref1->ref_checksum, sizeof(mref0->ref_checksum));
if (ok)
ok = memcmp(mref0->ref_checksum, null, sizeof(mref0->ref_checksum)) != 0;
} else if (!mref0->ref_data || !mref1->ref_data) {
ok = false;
} else {
ok = !memcmp(mref0->ref_data, mref1->ref_data, len);
}
2011-06-17 11:32:38 +00:00
_clear_mref(brick, index, 1);
2012-08-02 08:16:55 +00:00
if (ok)
brick->verify_ok_count++;
else
brick->verify_error_count++;
if (ok || !brick->repair_mode) {
2011-02-23 20:48:06 +00:00
/* skip start of writing, goto final treatment of writeout */
2012-08-02 08:16:55 +00:00
next_state = COPY_STATE_CLEANUP;
break;
2011-02-23 20:48:06 +00:00
}
}
2012-08-02 08:16:55 +00:00
2019-03-25 08:12:45 +00:00
if ((mref0->ref_flags & MREF_CHKSUM_ANY) && (mref0->ref_flags & MREF_NODATA)) {
/* re-read, this time with data */
2012-08-02 08:16:55 +00:00
_clear_mref(brick, index, 0);
2019-03-25 08:12:45 +00:00
status = _make_mref(brick, index, 0, NULL,
pos, brick->copy_end,
2019-03-26 09:57:33 +00:00
_make_flags(false, false));
2012-08-02 08:16:55 +00:00
if (unlikely(status < 0)) {
2014-04-01 11:34:09 +00:00
MARS_DBG("status = %d\n", status);
2012-08-22 12:37:34 +00:00
progress = status;
next_state = COPY_STATE_RESET;
break;
2012-08-02 08:16:55 +00:00
}
next_state = COPY_STATE_READ3;
break;
}
2011-02-23 20:48:06 +00:00
next_state = COPY_STATE_WRITE;
2011-06-17 11:32:38 +00:00
/* fallthrough */
2011-02-23 20:48:06 +00:00
case COPY_STATE_WRITE:
2013-07-22 07:15:53 +00:00
if (is_write_limited(brick))
goto idle;
2011-06-17 11:32:38 +00:00
/* Obey ordering to get a strict "append" behaviour.
* We assume that we don't need to wait for completion
* of the previous write to avoid a sparse result file
* under all circumstances, i.e. we only assure that
* _starting_ the writes is in order.
* This is only correct when all lower bricks obey the
* order of ref_io() operations.
* Currently, bio and aio are obeying this. Be careful when
* implementing new IO bricks!
*/
2017-05-18 12:18:54 +00:00
if (mars_copy_strict_write_order &&
st->prev >= 0 &&
!GET_STATE(brick, st->prev).writeout) {
goto idle;
2011-02-23 20:48:06 +00:00
}
mref0 = READ_ONCE(st->table[0]);
2012-08-02 08:16:55 +00:00
if (unlikely(!mref0 || !mref0->ref_data)) {
2021-04-16 08:40:47 +00:00
MARS_ERR("src buffer for write does not exist, state %d at index %u\n",
state, index);
2012-08-22 12:37:34 +00:00
progress = -EILSEQ;
break;
2011-06-17 11:32:38 +00:00
}
if (unlikely(READ_ONCE(st->active[0]))) {
2021-04-16 08:40:47 +00:00
MARS_ERR("src buffer for write is active, state %d at index %u\n",
state, index);
progress = -EILSEQ;
break;
}
2012-08-22 12:37:34 +00:00
if (unlikely(brick->is_aborting)) {
progress = -EINTR;
break;
2012-08-22 12:37:34 +00:00
}
2011-06-17 11:32:38 +00:00
/* start writeout */
2019-03-25 08:12:45 +00:00
status = _make_mref(brick, index, 1, mref0->ref_data,
pos, pos + mref0->ref_len,
MREF_WRITE | MREF_MAY_WRITE);
2012-08-22 12:37:34 +00:00
if (unlikely(status < 0)) {
2014-04-01 11:34:09 +00:00
MARS_DBG("status = %d\n", status);
2012-08-22 12:37:34 +00:00
progress = status;
next_state = COPY_STATE_RESET;
2012-08-22 12:37:34 +00:00
break;
}
/* Attention! overlapped IO behind EOF could
* lead to temporary inconsistent state of the
* file, because the write order may be different from
* strict O_APPEND behaviour.
*/
if (mars_copy_overlap)
st->writeout = true;
2011-06-17 11:32:38 +00:00
next_state = COPY_STATE_WRITTEN;
/* fallthrough */
2011-06-17 11:32:38 +00:00
case COPY_STATE_WRITTEN:
if (READ_ONCE(st->active[1])) {
/* idempotence: wait by unchanged state */
2011-06-17 11:32:38 +00:00
MARS_IO("irrelevant\n");
goto idle;
}
st->writeout = true;
/* rechecking means to start over again.
* ATTENTION! this may lead to infinite request
* submission loops, intentionally.
* TODO: implement some timeout means.
*/
if (brick->recheck_mode && brick->repair_mode) {
next_state = COPY_STATE_RESET;
break;
2011-02-23 20:48:06 +00:00
}
next_state = COPY_STATE_CLEANUP;
/* fallthrough */
case COPY_STATE_CLEANUP:
_clear_mref(brick, index, 1);
2011-06-17 11:32:38 +00:00
_clear_mref(brick, index, 0);
next_state = COPY_STATE_FINISHED;
/* fallthrough */
2011-06-17 11:32:38 +00:00
case COPY_STATE_FINISHED:
2012-08-02 08:16:55 +00:00
/* Indicate successful completion by remaining in this state.
* Restart of the finite automaton must be done externally.
*/
goto idle;
2011-02-23 20:48:06 +00:00
default:
2021-04-16 08:40:47 +00:00
MARS_ERR("illegal state %d at index %u\n",
state, index);
2011-02-23 20:48:06 +00:00
_clash(brick);
2012-08-22 12:37:34 +00:00
progress = -EILSEQ;
2011-02-23 20:48:06 +00:00
}
2012-08-22 12:37:34 +00:00
/* Only reached when leaving the switch via break or at its end */
do_restart = (state != next_state);
idle:
2012-08-22 12:37:34 +00:00
if (unlikely(progress < 0)) {
/* Record the failure, but keep an already stored negative error */
if (READ_ONCE(st->error) >= 0)
WRITE_ONCE(st->error, progress);
2014-04-01 11:34:09 +00:00
MARS_DBG("progress = %d\n", progress);
2012-08-22 12:37:34 +00:00
progress = 0;
2011-02-23 20:48:06 +00:00
_clash(brick);
} else if (do_restart) {
goto restart;
2012-08-22 12:37:34 +00:00
} else if (st->state != next_state) {
progress++;
2011-02-23 20:48:06 +00:00
}
2013-08-06 08:29:12 +00:00
2021-04-16 09:04:52 +00:00
MARS_IO("LEAVE index=%u state=%d next_state=%d table[0]=%p table[1]=%p active[0]=%d active[1]=%d writeout=%d prev=%d len=%u error=%d progress=%d\n",
2013-08-06 08:29:12 +00:00
index,
st->state,
next_state,
2022-05-19 20:32:08 +00:00
READ_ONCE(st->table[0]),
READ_ONCE(st->table[1]),
READ_ONCE(st->active[0]),
READ_ONCE(st->active[1]),
2013-08-06 08:29:12 +00:00
st->writeout,
st->prev,
st->len,
st->error,
progress);
2012-08-22 12:37:34 +00:00
// save the resulting state
st->state = next_state;
return progress;
2011-02-23 20:48:06 +00:00
}
/* Run one pass of the copy engine.
 *
 * @brick:      the copy brick
 * @this_start: position to start working at. Values below copy_last
 *              are replaced by copy_last; values above a non-zero
 *              copy_dirty are replaced by copy_dirty.
 *
 * A pending clash is handled first: as long as requests are in flight,
 * the clash is re-armed and 0 is returned after a short sleep;
 * afterwards all mrefs are released and the state table is zeroed.
 *
 * Then _next_state() is called for consecutive chunks, and finally
 * copy_last is advanced over the chunks which have reached
 * COPY_STATE_FINISHED (only when the pass started at copy_last).
 *
 * Returns the sum of the values returned by _next_state().
 */
static
2017-02-25 16:12:20 +00:00
int _run_copy(struct copy_brick *brick, loff_t this_start)
2011-02-23 20:48:06 +00:00
{
int all_max;
2011-02-23 20:48:06 +00:00
int max;
loff_t pos;
2011-06-17 11:32:38 +00:00
/* slot index of the previous chunk, or -1 when there is none */
short prev;
2012-08-22 12:37:34 +00:00
int progress;
2011-02-23 20:48:06 +00:00
2011-06-17 11:32:38 +00:00
if (unlikely(_clear_clash(brick))) {
2011-02-23 20:48:06 +00:00
MARS_DBG("clash\n");
2013-07-22 07:15:53 +00:00
if (atomic_read(&brick->copy_read_flight) + atomic_read(&brick->copy_write_flight) > 0) {
2011-02-23 20:48:06 +00:00
/* wait until all pending copy IO has finished
*/
_clash(brick);
MARS_DBG("re-clash\n");
brick_msleep(100);
return 0;
2011-02-23 20:48:06 +00:00
}
/* Nothing is in flight anymore: start over with a clean table */
_clear_all_mref(brick);
_clear_state_table(brick);
2011-02-23 20:48:06 +00:00
}
2017-02-25 16:12:20 +00:00
/* Clamp the start position (see the function comment) */
if (this_start < brick->copy_last)
this_start = brick->copy_last;
else if (this_start > brick->copy_dirty && brick->copy_dirty)
this_start = brick->copy_dirty;
2011-06-10 13:57:52 +00:00
/* Do at most max iterations in the below loop
*/
2017-05-16 13:07:04 +00:00
max = NR_COPY_REQUESTS - 1 - atomic_read(&brick->io_flight) * 2;
if (unlikely(max < 32))
max = 32;
all_max = max;
2011-02-23 20:48:06 +00:00
MARS_IO("max = %d\n", max);
2011-06-17 11:32:38 +00:00
prev = -1;
2017-02-25 16:12:20 +00:00
if (this_start > brick->copy_last) {
2021-04-16 09:23:17 +00:00
/* Starting in the middle: the predecessor is the chunk
* right before this_start, and the iteration budget is
* reduced by the number of chunks skipped.
*/
if (this_start >= COPY_CHUNK)
prev = GET_INDEX(this_start - COPY_CHUNK);
2017-02-25 16:12:20 +00:00
max -= (this_start - brick->copy_last) / COPY_CHUNK;
all_max = max;
}
2012-08-22 12:37:34 +00:00
progress = 0;
2017-02-25 16:12:20 +00:00
/* Walk chunk by chunk; after the first iteration, pos is always
* aligned to COPY_CHUNK.
*/
for (pos = this_start;
pos < brick->copy_end || brick->append_mode > 1;
pos = ((pos / COPY_CHUNK) + 1) * COPY_CHUNK) {
2021-04-16 08:40:47 +00:00
unsigned index = GET_INDEX(pos);
struct copy_state *st = &GET_STATE(brick, index);
int this_progress;
if (max-- <= 0) {
2011-02-23 20:48:06 +00:00
break;
2011-05-26 14:32:32 +00:00
}
2011-06-17 11:32:38 +00:00
/* Remember the predecessor slot, used by the write ordering
* check in _next_state().
*/
st->prev = prev;
prev = index;
/* Stop when both queues of this slot are busy */
if (READ_ONCE(st->active[0]) & READ_ONCE(st->active[1]))
break;
2011-06-17 11:32:38 +00:00
// call the finite state automaton
this_progress = _next_state(brick, index, pos);
2017-02-25 16:12:20 +00:00
if (this_progress <= 0)
break;
2017-03-01 06:23:36 +00:00
progress += this_progress;
2017-03-01 06:23:36 +00:00
/* copy_dirty tracks the highest position worked on */
if (pos > brick->copy_dirty)
brick->copy_dirty = pos;
2011-06-10 13:57:52 +00:00
}
2011-06-17 11:32:38 +00:00
// check the resulting state: can we advance the copy_last pointer?
2017-02-25 16:12:20 +00:00
if (this_start == brick->copy_last && progress && !brick->clash) {
2011-06-10 13:57:52 +00:00
/* number of bytes by which copy_last can be advanced */
int count = 0;
int error;
max = all_max;
for (pos = brick->copy_last;
pos < brick->copy_end;
pos = ((pos / COPY_CHUNK) + 1) * COPY_CHUNK) {
2021-04-16 09:04:52 +00:00
unsigned len;
2021-04-16 08:40:47 +00:00
unsigned index = GET_INDEX(pos);
struct copy_state *st = &GET_STATE(brick, index);
2017-02-25 16:12:20 +00:00
2011-06-17 11:32:38 +00:00
/* Only a contiguous run of finished chunks counts */
if (st->state != COPY_STATE_FINISHED) {
2011-06-10 13:57:52 +00:00
break;
2011-06-17 11:32:38 +00:00
}
if (max-- <= 0) {
break;
}
error = READ_ONCE(st->error);
if (unlikely(error < 0)) {
/* check for fatal consistency errors */
if (error == -EMEDIUMTYPE) {
brick->copy_error = error;
brick->abort_mode = true;
MARS_WRN("Consistency is violated\n");
}
2012-08-22 12:37:34 +00:00
/* Only the first error is remembered */
if (!brick->copy_error) {
brick->copy_error = error;
MARS_WRN("IO error = %d\n", error);
2012-08-22 12:37:34 +00:00
}
if (brick->abort_mode) {
brick->is_aborting = true;
}
2011-06-17 11:32:38 +00:00
break;
}
// rollover
st->state = COPY_STATE_START;
2021-04-16 09:04:52 +00:00
len = st->len;
count += len;
2011-06-17 11:32:38 +00:00
// check contiguity
2021-04-16 09:04:52 +00:00
if (unlikely(GET_OFFSET(pos) + len != COPY_CHUNK)) {
2020-04-04 21:09:49 +00:00
/* Short read detected: shorten the copy_end.
*/
2021-04-16 09:04:52 +00:00
brick->copy_end = pos + len;
2011-06-17 11:32:38 +00:00
break;
}
2011-06-10 13:57:52 +00:00
}
if (count > 0) {
2011-06-17 11:32:38 +00:00
brick->copy_last += count;
2017-04-15 06:21:21 +00:00
get_lamport(NULL, &brick->copy_last_stamp);
2011-06-17 11:32:38 +00:00
MARS_IO("new copy_last += %d => %lld\n", count, brick->copy_last);
_update_percent(brick, false);
2011-06-10 13:57:52 +00:00
}
2011-02-23 20:48:06 +00:00
}
2012-08-22 12:37:34 +00:00
return progress;
2011-02-23 20:48:06 +00:00
}
static
bool _is_done(struct copy_brick *brick)
{
2017-01-08 07:39:01 +00:00
if (!brick->power.led_on || brick_thread_should_stop())
2012-08-22 12:37:34 +00:00
brick->is_aborting = true;
return brick->is_aborting &&
2013-07-22 07:15:53 +00:00
atomic_read(&brick->copy_read_flight) + atomic_read(&brick->copy_write_flight) <= 0;
}
2011-02-23 20:48:06 +00:00
static int _copy_thread(void *data)
{
struct copy_brick *brick = data;
struct lamport_time last_progress;
2017-04-07 05:56:28 +00:00
int i;
2011-02-23 20:48:06 +00:00
MARS_DBG("--------------- copy_thread %p starting\n", brick);
brick->copy_error = 0;
2012-08-22 12:37:34 +00:00
brick->copy_error_count = 0;
2012-08-02 08:16:55 +00:00
brick->verify_ok_count = 0;
brick->verify_error_count = 0;
2017-04-07 05:56:28 +00:00
for (i = 0; i < COPY_INPUT_NR; i++)
brick->inputs[i]->check_hint = 0;
get_real_lamport(&last_progress);
2017-06-01 06:34:26 +00:00
if (brick->copy_limiter)
mars_limit_reset(brick->copy_limiter);
_update_percent(brick, true);
WRITE_ONCE(brick->trigger, true);
2011-02-23 20:48:06 +00:00
while (!_is_done(brick)) {
2011-02-23 20:48:06 +00:00
loff_t old_start = brick->copy_start;
loff_t old_end = brick->copy_end;
2012-08-22 12:37:34 +00:00
int progress = 0;
2017-02-25 16:42:37 +00:00
loff_t check_hint;
2011-06-10 13:57:52 +00:00
if (old_end > 0) {
2017-04-04 05:42:10 +00:00
loff_t old_last = brick->copy_last;
loff_t old_dirty = brick->copy_dirty;
2017-02-25 16:12:20 +00:00
progress = _run_copy(brick, -1);
2017-04-07 05:56:28 +00:00
2017-02-25 16:42:37 +00:00
/* This is racy, deliberately.
* Missing some events does no harm.
*/
2017-04-07 05:56:28 +00:00
for (i = 0; i < COPY_INPUT_NR; i++) {
check_hint = brick->inputs[i]->check_hint;
if (check_hint > 0) {
brick->inputs[i]->check_hint = 0;
progress += _run_copy(brick, check_hint);
}
2017-02-25 16:42:37 +00:00
}
2017-04-04 05:42:10 +00:00
/* earlier resume working at the tail */
if (brick->copy_last > old_last && old_dirty)
progress += _run_copy(brick, old_dirty);
/* abort when no progress is made for a longer time */
if (progress > 0) {
get_real_lamport(&last_progress);
} else {
struct lamport_time next_progress;
get_real_lamport(&next_progress);
next_progress.tv_sec -= mars_copy_timeout;
2019-02-19 09:18:29 +00:00
if (lamport_time_compare(&next_progress, &last_progress) > 0)
brick->is_aborting = true;
}
2011-06-10 13:57:52 +00:00
}
2011-02-23 20:48:06 +00:00
wait_event_interruptible_timeout(brick->event,
2012-08-22 12:37:34 +00:00
progress > 0 ||
READ_ONCE(brick->trigger) ||
2012-08-22 12:37:34 +00:00
brick->copy_start != old_start ||
brick->copy_end != old_end ||
_is_done(brick),
1 * HZ);
WRITE_ONCE(brick->trigger, false);
2011-02-23 20:48:06 +00:00
}
2017-06-01 06:34:26 +00:00
if (brick->copy_limiter)
mars_limit_reset(brick->copy_limiter);
/* check for fatal consistency errors */
if (brick->copy_error == -EMEDIUMTYPE) {
/* reset the whole area */
brick->copy_start = 0;
brick->copy_last = 0;
2017-03-01 06:23:36 +00:00
brick->copy_dirty = 0;
MARS_WRN("resetting the full copy area\n");
}
_update_percent(brick, true);
2013-07-22 07:15:53 +00:00
MARS_DBG("--------------- copy_thread terminating (%d read requests / %d write requests flying, copy_start = %lld copy_end = %lld)\n",
atomic_read(&brick->copy_read_flight),
atomic_read(&brick->copy_write_flight),
brick->copy_start,
brick->copy_end);
_clear_all_mref(brick);
2019-01-31 19:31:38 +00:00
brick->terminated = true;
2020-02-07 06:32:35 +00:00
mars_trigger();
2011-02-23 20:48:06 +00:00
MARS_DBG("--------------- copy_thread done.\n");
return 0;
}
////////////////// own brick / input / output operations //////////////////
static int copy_get_info(struct copy_output *output, struct mars_info *info)
{
2021-07-12 08:29:40 +00:00
struct copy_input *input = output->brick->inputs[INPUT_B];
2011-02-23 20:48:06 +00:00
return GENERIC_INPUT_CALL(input, mars_get_info, info);
}
static int copy_ref_get(struct copy_output *output, struct mref_object *mref)
{
struct copy_input *input;
int status;
2021-04-16 08:17:01 +00:00
input = _determine_input(output->brick, mref);
2011-02-23 20:48:06 +00:00
status = GENERIC_INPUT_CALL(input, mref_get, mref);
if (status >= 0) {
atomic_inc(&output->brick->io_flight);
}
return status;
}
static void copy_ref_put(struct copy_output *output, struct mref_object *mref)
{
struct copy_brick *brick = output->brick;
2011-02-23 20:48:06 +00:00
struct copy_input *input;
input = _determine_input(brick, mref);
2021-06-29 08:52:11 +00:00
GENERIC_INPUT_CALL_VOID(input, mref_put, mref);
if (atomic_dec_and_test(&brick->io_flight)) {
WRITE_ONCE(brick->trigger, true);
wake_up_interruptible(&brick->event);
2011-02-23 20:48:06 +00:00
}
}
static void copy_ref_io(struct copy_output *output, struct mref_object *mref)
{
struct copy_input *input;
2021-04-16 08:17:01 +00:00
input = _determine_input(output->brick, mref);
2021-06-29 08:52:11 +00:00
GENERIC_INPUT_CALL_VOID(input, mref_io, mref);
2011-02-23 20:48:06 +00:00
}
static int copy_switch(struct copy_brick *brick)
{
static int version = 0;
MARS_DBG("power.button = %d\n", brick->power.button);
2019-01-31 19:31:38 +00:00
if (brick->power.button && !brick->terminated) {
if (brick->power.led_on || brick->thread)
goto done;
2011-02-23 20:48:06 +00:00
mars_power_led_off((void*)brick, false);
brick->is_aborting = false;
2011-02-23 20:48:06 +00:00
if (!brick->thread) {
2011-02-25 11:46:38 +00:00
brick->copy_last = brick->copy_start;
2017-03-01 06:23:36 +00:00
brick->copy_dirty = 0;
2019-01-31 19:31:38 +00:00
brick->terminated = false;
mars_power_led_on((void*)brick, true);
2017-04-15 06:21:21 +00:00
get_lamport(NULL, &brick->copy_last_stamp);
brick->thread = brick_thread_create(_copy_thread, brick, "mars_copy%d", version++);
2011-02-23 20:48:06 +00:00
if (brick->thread) {
WRITE_ONCE(brick->trigger, true);
2011-02-23 20:48:06 +00:00
} else {
2019-01-31 19:31:38 +00:00
mars_power_led_on((void*)brick, false);
2011-02-23 20:48:06 +00:00
mars_power_led_off((void*)brick, true);
MARS_ERR("could not start copy thread\n");
}
}
} else {
2017-01-08 07:39:01 +00:00
/* Tell thread to stop asynchronously */
2011-02-23 20:48:06 +00:00
mars_power_led_on((void*)brick, false);
if (brick->thread) {
2017-01-08 07:39:01 +00:00
/* Notice: this will be reported by the thread */
2019-01-31 19:31:38 +00:00
if (!brick->terminated)
2017-01-08 07:39:01 +00:00
goto done;
2011-08-25 10:16:32 +00:00
MARS_INF("stopping thread...\n");
brick_thread_stop(brick->thread);
2011-02-23 20:48:06 +00:00
}
2017-04-20 15:31:42 +00:00
/* for safety, and when the thread was not started */
mars_power_led_off((void*)brick, true);
2019-01-31 19:31:38 +00:00
brick->terminated = false;
2011-02-23 20:48:06 +00:00
}
done:
2011-02-23 20:48:06 +00:00
return 0;
}
//////////////// informational / statistics ///////////////
static
char *copy_statistics(struct copy_brick *brick, int verbose)
{
char *res = brick_string_alloc(1024);
2011-06-17 11:32:38 +00:00
if (!res)
return NULL;
snprintf(res, 1024,
2012-02-12 11:19:57 +00:00
"copy_start = %lld "
"copy_last = %lld "
2017-03-01 06:23:36 +00:00
"copy_dirty = %lld "
2012-02-12 11:19:57 +00:00
"copy_end = %lld "
2017-04-07 05:56:28 +00:00
"check_hint[0] = %lld "
"check_hint[1] = %lld "
2012-02-12 11:19:57 +00:00
"copy_error = %d "
2012-08-22 12:37:34 +00:00
"copy_error_count = %d "
2012-08-02 08:16:55 +00:00
"verify_ok_count = %d "
"verify_error_count = %d "
2012-02-12 11:19:57 +00:00
"low_dirty = %d "
"is_aborting = %d "
"clash = %lu | "
2012-12-20 10:22:41 +00:00
"total clash_count = %d | "
2012-02-12 11:19:57 +00:00
"io_flight = %d "
2013-07-22 07:15:53 +00:00
"copy_read_flight = %d "
"copy_write_flight = %d\n",
2012-02-12 11:19:57 +00:00
brick->copy_start,
brick->copy_last,
2017-03-01 06:23:36 +00:00
brick->copy_dirty,
2012-02-12 11:19:57 +00:00
brick->copy_end,
2017-04-07 05:56:28 +00:00
brick->inputs[0]->check_hint,
brick->inputs[1]->check_hint,
2012-02-12 11:19:57 +00:00
brick->copy_error,
2012-08-22 12:37:34 +00:00
brick->copy_error_count,
2012-08-02 08:16:55 +00:00
brick->verify_ok_count,
brick->verify_error_count,
2012-02-12 11:19:57 +00:00
brick->low_dirty,
brick->is_aborting,
brick->clash,
2012-12-20 10:22:41 +00:00
atomic_read(&brick->total_clash_count),
2012-02-12 11:19:57 +00:00
atomic_read(&brick->io_flight),
2013-07-22 07:15:53 +00:00
atomic_read(&brick->copy_read_flight),
atomic_read(&brick->copy_write_flight));
2011-06-17 11:32:38 +00:00
return res;
}
static
void copy_reset_statistics(struct copy_brick *brick)
{
2012-12-20 10:22:41 +00:00
atomic_set(&brick->total_clash_count, 0);
2011-06-17 11:32:38 +00:00
}
//////////////// object / aspect constructors / destructors ///////////////
/*
 * Constructor hook for the copy mref aspect.
 * The aspect needs no initialization here; always returns 0.
 */
static int copy_mref_aspect_init_fn(struct generic_aspect *_ini)
{
	(void)_ini; /* intentionally unused */
	return 0;
}
/*
 * Destructor hook for the copy mref aspect.
 * Nothing was set up by the init hook, so nothing is torn down.
 */
static void copy_mref_aspect_exit_fn(struct generic_aspect *_ini)
{
	(void)_ini; /* intentionally unused */
}
/*
 * NOTE(review): presumably expands to the static boilerplate of the
 * "copy" brick family, e.g. copy_aspect_types and
 * copy_register_brick_type() / copy_unregister_brick_type(), which are
 * used further down but not defined in the visible part of this file.
 * Confirm against the macro definition.
 */
MARS_MAKE_STATICS(copy);
////////////////////// brick constructors / destructors ////////////////////
/*
 * Release the two-level copy state table of the brick: every allocated
 * sub table page first, then the directory page brick->st itself.
 *
 * Safe to call when the directory was never allocated or has already
 * been released: brick->st is checked before it is dereferenced and is
 * reset to NULL afterwards, so a repeated call (for example from
 * copy_brick_destruct() after a failed copy_brick_construct()) neither
 * dereferences nor frees a stale pointer.
 */
static
void _free_pages(struct copy_brick *brick)
{
	unsigned i;

	if (!brick->st)
		return;

	for (i = 0; i < MAX_SUB_TABLES; i++) {
		struct copy_state *sub_table = brick->st[i];

		/* slots behind a failed allocation are still zero */
		if (!sub_table)
			continue;

		brick_block_free(sub_table, PAGE_SIZE);
	}
	brick_block_free(brick->st, PAGE_SIZE);
	brick->st = NULL;
}
/*
 * Constructor of the copy brick.
 *
 * Allocates the directory page brick->st and MAX_SUB_TABLES zeroed sub
 * table pages, which together form the table accessed via GET_STATE(),
 * and initializes the brick's wait queue.
 *
 * Returns 0 on success, -ENOMEM when a page cannot be allocated, and
 * -EINVAL when the directory page is too small for MAX_SUB_TABLES
 * entries. On failure everything allocated so far is released again.
 */
static int copy_brick_construct(struct copy_brick *brick)
{
	unsigned i;

	brick->st = brick_block_alloc(0, PAGE_SIZE);
	if (unlikely(!brick->st)) {
		MARS_ERR("cannot allocate state directory table.\n");
		return -ENOMEM;
	}
	memset(brick->st, 0, PAGE_SIZE);

	for (i = 0; i < MAX_SUB_TABLES; i++) {
		struct copy_state *sub_table;

		/* The directory is exactly one page of pointers, so it must
		 * never be indexed beyond that capacity. Both sides are
		 * compile-time constants: this should be usually optimized
		 * away as dead code.
		 */
		if (unlikely(i >= PAGE_SIZE / sizeof(brick->st[0]))) {
			MARS_ERR("sorry, subtable index %u is too large.\n", i);
			_free_pages(brick);
			return -EINVAL;
		}

		sub_table = brick_block_alloc(0, PAGE_SIZE);
		/* store before checking: unfilled slots stay NULL for _free_pages() */
		brick->st[i] = sub_table;
		if (unlikely(!sub_table)) {
			MARS_ERR("cannot allocate state subtable %u\n", i);
			_free_pages(brick);
			return -ENOMEM;
		}
		memset(sub_table, 0, PAGE_SIZE);
	}

	init_waitqueue_head(&brick->event);
	return 0;
}
/*
 * Destructor of the copy brick: releases the copy state table that was
 * set up by copy_brick_construct(). Always returns 0.
 */
static int copy_brick_destruct(struct copy_brick *brick)
{
	_free_pages(brick);
	return 0;
}
/*
 * Constructor of a copy output.
 * A copy output carries no state that needs setting up; always returns 0.
 */
static int copy_output_construct(struct copy_output *output)
{
	(void)output; /* intentionally unused */
	return 0;
}
/*
 * Destructor of a copy output.
 * Mirrors copy_output_construct(): nothing to release; always returns 0.
 */
static int copy_output_destruct(struct copy_output *output)
{
	(void)output; /* intentionally unused */
	return 0;
}
///////////////////////// static structs ////////////////////////
static struct copy_brick_ops copy_brick_ops = {
.brick_switch = copy_switch,
2011-06-17 11:32:38 +00:00
.brick_statistics = copy_statistics,
.reset_statistics = copy_reset_statistics,
2011-02-23 20:48:06 +00:00
};
/*
 * Operations offered on the output of the copy brick.
 * Each of them forwards the request to one of the brick's inputs.
 */
static struct copy_output_ops copy_output_ops = {
	.mars_get_info	= copy_get_info,
	.mref_get	= copy_ref_get,
	.mref_put	= copy_ref_put,
	.mref_io	= copy_ref_io,
};
/* Type descriptor shared by all inputs of the copy brick. */
const struct copy_input_type copy_input_type = {
	.type_name	= "copy_input",
	.input_size	= sizeof(struct copy_input),
};
/*
 * Default type of each of the four input slots.
 * All slots use the same descriptor.
 */
static const struct copy_input_type *copy_input_types[] = {
	[0] = &copy_input_type,
	[1] = &copy_input_type,
	[2] = &copy_input_type,
	[3] = &copy_input_type,
};
/* Type descriptor of the single output of the copy brick. */
const struct copy_output_type copy_output_type = {
	.type_name		= "copy_output",
	.output_size		= sizeof(struct copy_output),
	.master_ops		= &copy_output_ops,
	.output_construct	= copy_output_construct,
	.output_destruct	= copy_output_destruct,
};
/* Default type of the one output slot. */
static const struct copy_output_type *copy_output_types[] = {
	[0] = &copy_output_type,
};
const struct copy_brick_type copy_brick_type = {
.type_name = "copy_brick",
.brick_size = sizeof(struct copy_brick),
.max_inputs = 4,
.max_outputs = 1,
.master_ops = &copy_brick_ops,
.aspect_types = copy_aspect_types,
2011-02-23 20:48:06 +00:00
.default_input_types = copy_input_types,
.default_output_types = copy_output_types,
.brick_construct = &copy_brick_construct,
.brick_destruct = &copy_brick_destruct,
};
EXPORT_SYMBOL_GPL(copy_brick_type);
////////////////// module init stuff /////////////////////////
/*
 * Module initialization of the copy brick: registers the brick type.
 * Returns the result of copy_register_brick_type().
 */
int __init init_mars_copy(void)
{
	MARS_INF("init_copy()\n");
	return copy_register_brick_type();
}
/*
 * Module cleanup of the copy brick: unregisters the brick type again.
 */
void exit_mars_copy(void)
{
	MARS_INF("exit_copy()\n");
	copy_unregister_brick_type();
}