2008-11-20 14:52:48 +00:00
|
|
|
/*
|
|
|
|
* Copyright (C) 2008 Oracle. All rights reserved.
|
|
|
|
*
|
|
|
|
* This program is free software; you can redistribute it and/or
|
|
|
|
* modify it under the terms of the GNU General Public
|
|
|
|
* License v2 as published by the Free Software Foundation.
|
|
|
|
*
|
|
|
|
* This program is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
|
|
* General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU General Public
|
|
|
|
* License along with this program; if not, write to the
|
|
|
|
* Free Software Foundation, Inc., 59 Temple Place - Suite 330,
|
|
|
|
* Boston, MA 02111-1307, USA.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include <pthread.h>
|
|
|
|
#include <stdio.h>
|
|
|
|
#include <stdlib.h>
|
|
|
|
#include <sys/types.h>
|
|
|
|
#include <sys/stat.h>
|
|
|
|
#include <fcntl.h>
|
|
|
|
#include <unistd.h>
|
|
|
|
#include <dirent.h>
|
|
|
|
#include <zlib.h>
|
2015-06-10 22:04:19 +00:00
|
|
|
#include <getopt.h>
|
|
|
|
|
2008-11-20 14:52:48 +00:00
|
|
|
#include "kerncompat.h"
|
2019-09-25 13:37:27 +00:00
|
|
|
#include "crypto/crc32c.h"
|
2008-11-20 14:52:48 +00:00
|
|
|
#include "ctree.h"
|
|
|
|
#include "disk-io.h"
|
|
|
|
#include "transaction.h"
|
2019-06-19 23:46:21 +00:00
|
|
|
#include "common/utils.h"
|
2013-03-19 13:43:13 +00:00
|
|
|
#include "volumes.h"
|
2020-08-18 13:56:04 +00:00
|
|
|
#include "kernel-shared/extent_io.h"
|
2020-08-18 09:12:28 +00:00
|
|
|
#include "common/extent-cache.h"
|
2019-06-19 23:46:21 +00:00
|
|
|
#include "common/help.h"
|
2019-07-01 22:42:23 +00:00
|
|
|
#include "common/device-utils.h"
|
2017-10-19 22:24:13 +00:00
|
|
|
#include "image/metadump.h"
|
2017-10-19 22:48:30 +00:00
|
|
|
#include "image/sanitize.h"
|
2015-06-21 16:23:19 +00:00
|
|
|
#include "common/box.h"
|
2008-11-20 14:52:48 +00:00
|
|
|
|
2016-11-02 23:53:43 +00:00
|
|
|
#define MAX_WORKER_THREADS (32)
|
|
|
|
|
2008-11-20 14:52:48 +00:00
|
|
|
struct async_work {
|
|
|
|
struct list_head list;
|
|
|
|
struct list_head ordered;
|
|
|
|
u64 start;
|
|
|
|
u64 size;
|
|
|
|
u8 *buffer;
|
|
|
|
size_t bufsize;
|
2013-03-18 18:50:45 +00:00
|
|
|
int error;
|
2008-11-20 14:52:48 +00:00
|
|
|
};
|
|
|
|
|
|
|
|
struct metadump_struct {
|
|
|
|
struct btrfs_root *root;
|
|
|
|
FILE *out;
|
|
|
|
|
2016-11-03 00:23:18 +00:00
|
|
|
union {
|
|
|
|
struct meta_cluster cluster;
|
|
|
|
char meta_cluster_bytes[BLOCK_SIZE];
|
|
|
|
};
|
2008-11-20 14:52:48 +00:00
|
|
|
|
2016-11-02 23:57:43 +00:00
|
|
|
pthread_t threads[MAX_WORKER_THREADS];
|
2008-11-20 14:52:48 +00:00
|
|
|
size_t num_threads;
|
|
|
|
pthread_mutex_t mutex;
|
|
|
|
pthread_cond_t cond;
|
2013-03-22 14:52:07 +00:00
|
|
|
struct rb_root name_tree;
|
2008-11-20 14:52:48 +00:00
|
|
|
|
|
|
|
struct list_head list;
|
|
|
|
struct list_head ordered;
|
|
|
|
size_t num_items;
|
|
|
|
size_t num_ready;
|
|
|
|
|
|
|
|
u64 pending_start;
|
|
|
|
u64 pending_size;
|
|
|
|
|
|
|
|
int compress_level;
|
|
|
|
int done;
|
2013-03-19 13:43:13 +00:00
|
|
|
int data;
|
2017-10-19 23:01:43 +00:00
|
|
|
enum sanitize_mode sanitize_names;
|
2014-06-26 02:53:02 +00:00
|
|
|
|
|
|
|
int error;
|
2013-03-22 14:52:07 +00:00
|
|
|
};
|
|
|
|
|
2008-11-20 14:52:48 +00:00
|
|
|
struct mdrestore_struct {
|
|
|
|
FILE *in;
|
|
|
|
FILE *out;
|
|
|
|
|
2016-11-02 23:57:43 +00:00
|
|
|
pthread_t threads[MAX_WORKER_THREADS];
|
2008-11-20 14:52:48 +00:00
|
|
|
size_t num_threads;
|
|
|
|
pthread_mutex_t mutex;
|
|
|
|
pthread_cond_t cond;
|
|
|
|
|
2019-07-04 06:10:57 +00:00
|
|
|
/*
|
|
|
|
* Records system chunk ranges, so restore can use this to determine
|
|
|
|
* if an item is in chunk tree range.
|
|
|
|
*/
|
|
|
|
struct cache_tree sys_chunks;
|
2013-05-08 15:40:36 +00:00
|
|
|
struct rb_root chunk_tree;
|
2015-01-26 01:39:24 +00:00
|
|
|
struct rb_root physical_tree;
|
2008-11-20 14:52:48 +00:00
|
|
|
struct list_head list;
|
2015-01-26 01:39:24 +00:00
|
|
|
struct list_head overlapping_chunks;
|
2020-05-27 10:28:09 +00:00
|
|
|
struct btrfs_super_block *original_super;
|
2008-11-20 14:52:48 +00:00
|
|
|
size_t num_items;
|
2016-04-01 10:57:11 +00:00
|
|
|
u32 nodesize;
|
2013-03-27 20:55:41 +00:00
|
|
|
u64 devid;
|
2015-01-28 20:38:03 +00:00
|
|
|
u64 alloced_chunks;
|
2015-01-26 01:39:24 +00:00
|
|
|
u64 last_physical_offset;
|
2019-07-04 06:10:57 +00:00
|
|
|
/* An quicker checker for if a item is in sys chunk range */
|
|
|
|
u64 sys_chunk_end;
|
2013-03-27 20:55:41 +00:00
|
|
|
u8 uuid[BTRFS_UUID_SIZE];
|
|
|
|
u8 fsid[BTRFS_FSID_SIZE];
|
2008-11-20 14:52:48 +00:00
|
|
|
|
|
|
|
int compress_method;
|
|
|
|
int done;
|
2013-03-18 18:50:45 +00:00
|
|
|
int error;
|
2013-03-27 20:55:41 +00:00
|
|
|
int old_restore;
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
int fixup_offset;
|
|
|
|
int multi_devices;
|
2015-01-26 01:39:24 +00:00
|
|
|
int clear_space_cache;
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
struct btrfs_fs_info *info;
|
2008-11-20 14:52:48 +00:00
|
|
|
};
|
|
|
|
|
2013-03-22 14:52:07 +00:00
|
|
|
static struct extent_buffer *alloc_dummy_eb(u64 bytenr, u32 size);
|
|
|
|
|
2008-11-20 14:52:48 +00:00
|
|
|
/*
 * Checksum a block in place.
 *
 * The crc32c is computed over everything after the first BTRFS_CSUM_SIZE
 * bytes of @buf, inverted, and stored little-endian at the start of @buf.
 *
 * @buf: block to checksum
 * @len: total length of the block in bytes
 */
static void csum_block(u8 *buf, size_t len)
{
	const u16 csum_size = btrfs_csum_type_size(BTRFS_CSUM_TYPE_CRC32);
	u8 digest[csum_size];
	u32 crc;

	crc = crc32c(~(u32)0, buf + BTRFS_CSUM_SIZE, len - BTRFS_CSUM_SIZE);
	put_unaligned_le32(~crc, digest);
	memcpy(buf, digest, csum_size);
}
|
|
|
|
|
2013-03-22 14:52:07 +00:00
|
|
|
static int has_name(struct btrfs_key *key)
|
|
|
|
{
|
|
|
|
switch (key->type) {
|
|
|
|
case BTRFS_DIR_ITEM_KEY:
|
|
|
|
case BTRFS_DIR_INDEX_KEY:
|
|
|
|
case BTRFS_INODE_REF_KEY:
|
|
|
|
case BTRFS_INODE_EXTREF_KEY:
|
2013-07-31 14:23:58 +00:00
|
|
|
case BTRFS_XATTR_ITEM_KEY:
|
2013-03-22 14:52:07 +00:00
|
|
|
return 1;
|
|
|
|
default:
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2013-05-08 15:40:36 +00:00
|
|
|
static int chunk_cmp(struct rb_node *a, struct rb_node *b, int fuzz)
|
|
|
|
{
|
2015-01-26 01:39:24 +00:00
|
|
|
struct fs_chunk *entry = rb_entry(a, struct fs_chunk, l);
|
|
|
|
struct fs_chunk *ins = rb_entry(b, struct fs_chunk, l);
|
2013-05-08 15:40:36 +00:00
|
|
|
|
|
|
|
if (fuzz && ins->logical >= entry->logical &&
|
|
|
|
ins->logical < entry->logical + entry->bytes)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
if (ins->logical < entry->logical)
|
|
|
|
return -1;
|
|
|
|
else if (ins->logical > entry->logical)
|
|
|
|
return 1;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2015-01-26 01:39:24 +00:00
|
|
|
static int physical_cmp(struct rb_node *a, struct rb_node *b, int fuzz)
|
|
|
|
{
|
|
|
|
struct fs_chunk *entry = rb_entry(a, struct fs_chunk, p);
|
|
|
|
struct fs_chunk *ins = rb_entry(b, struct fs_chunk, p);
|
|
|
|
|
|
|
|
if (fuzz && ins->physical >= entry->physical &&
|
|
|
|
ins->physical < entry->physical + entry->bytes)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
if (fuzz && entry->physical >= ins->physical &&
|
|
|
|
entry->physical < ins->physical + ins->bytes)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
if (ins->physical < entry->physical)
|
|
|
|
return -1;
|
|
|
|
else if (ins->physical > entry->physical)
|
|
|
|
return 1;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2013-05-08 15:40:36 +00:00
|
|
|
static void tree_insert(struct rb_root *root, struct rb_node *ins,
|
|
|
|
int (*cmp)(struct rb_node *a, struct rb_node *b,
|
|
|
|
int fuzz))
|
2013-03-22 14:52:07 +00:00
|
|
|
{
|
|
|
|
struct rb_node ** p = &root->rb_node;
|
|
|
|
struct rb_node * parent = NULL;
|
|
|
|
int dir;
|
|
|
|
|
|
|
|
while(*p) {
|
|
|
|
parent = *p;
|
|
|
|
|
2015-01-26 01:39:24 +00:00
|
|
|
dir = cmp(*p, ins, 1);
|
2013-03-22 14:52:07 +00:00
|
|
|
if (dir < 0)
|
|
|
|
p = &(*p)->rb_left;
|
|
|
|
else if (dir > 0)
|
|
|
|
p = &(*p)->rb_right;
|
|
|
|
else
|
|
|
|
BUG();
|
|
|
|
}
|
|
|
|
|
2013-05-08 15:40:36 +00:00
|
|
|
rb_link_node(ins, parent, p);
|
|
|
|
rb_insert_color(ins, root);
|
2013-03-22 14:52:07 +00:00
|
|
|
}
|
|
|
|
|
2013-05-08 15:40:36 +00:00
|
|
|
static struct rb_node *tree_search(struct rb_root *root,
|
|
|
|
struct rb_node *search,
|
|
|
|
int (*cmp)(struct rb_node *a,
|
|
|
|
struct rb_node *b, int fuzz),
|
|
|
|
int fuzz)
|
2013-03-22 14:52:07 +00:00
|
|
|
{
|
|
|
|
struct rb_node *n = root->rb_node;
|
|
|
|
int dir;
|
|
|
|
|
|
|
|
while (n) {
|
2013-05-08 15:40:36 +00:00
|
|
|
dir = cmp(n, search, fuzz);
|
2013-03-22 14:52:07 +00:00
|
|
|
if (dir < 0)
|
|
|
|
n = n->rb_left;
|
|
|
|
else if (dir > 0)
|
|
|
|
n = n->rb_right;
|
|
|
|
else
|
2013-05-08 15:40:36 +00:00
|
|
|
return n;
|
2013-03-22 14:52:07 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2016-05-26 09:43:00 +00:00
|
|
|
/*
 * Translate a logical address into a physical one using mdres->chunk_tree.
 *
 * @mdres:        restore state holding the chunk tree
 * @logical:      logical address to translate
 * @size:         in/out; clamped so that the range does not run past the end
 *                of the chunk that contains @logical
 * @physical_dup: optional out parameter; receives the matching address in
 *                the chunk's second copy, or 0 when the chunk has none
 *
 * The super block offset, and any address for which no chunk is found, is
 * returned unchanged; in those cases @size and @physical_dup are left
 * untouched.
 */
static u64 logical_to_physical(struct mdrestore_struct *mdres, u64 logical,
			       u64 *size, u64 *physical_dup)
{
	struct fs_chunk key;
	struct fs_chunk *chunk;
	struct rb_node *node;
	u64 delta;

	if (logical == BTRFS_SUPER_INFO_OFFSET)
		return logical;

	/* Only ->logical of the search key is read by chunk_cmp(). */
	key.logical = logical;
	node = tree_search(&mdres->chunk_tree, &key.l, chunk_cmp, 1);
	if (!node) {
		if (mdres->in != stdin)
			warning("cannot find a chunk, using logical");
		return logical;
	}

	chunk = rb_entry(node, struct fs_chunk, l);
	if (logical < chunk->logical ||
	    logical > chunk->logical + chunk->bytes)
		BUG();
	delta = key.logical - chunk->logical;

	if (physical_dup) {
		/* Only in dup case, physical_dup is not equal to 0 */
		*physical_dup = chunk->physical_dup ?
				chunk->physical_dup + delta : 0;
	}

	*size = min(*size, chunk->bytes + chunk->logical - logical);
	return chunk->physical + delta;
}
|
|
|
|
|
2008-11-20 14:52:48 +00:00
|
|
|
/*
|
|
|
|
* zero inline extents and csum items
|
|
|
|
*/
|
2013-03-22 14:52:07 +00:00
|
|
|
static void zero_items(struct metadump_struct *md, u8 *dst,
|
|
|
|
struct extent_buffer *src)
|
2008-11-20 14:52:48 +00:00
|
|
|
{
|
|
|
|
struct btrfs_file_extent_item *fi;
|
|
|
|
struct btrfs_item *item;
|
|
|
|
struct btrfs_key key;
|
|
|
|
u32 nritems = btrfs_header_nritems(src);
|
|
|
|
size_t size;
|
|
|
|
unsigned long ptr;
|
|
|
|
int i, extent_type;
|
|
|
|
|
|
|
|
for (i = 0; i < nritems; i++) {
|
2013-09-20 09:55:26 +00:00
|
|
|
item = btrfs_item_nr(i);
|
2008-11-20 14:52:48 +00:00
|
|
|
btrfs_item_key_to_cpu(src, &key, i);
|
|
|
|
if (key.type == BTRFS_CSUM_ITEM_KEY) {
|
|
|
|
size = btrfs_item_size_nr(src, i);
|
|
|
|
memset(dst + btrfs_leaf_data(src) +
|
|
|
|
btrfs_item_offset_nr(src, i), 0, size);
|
|
|
|
continue;
|
|
|
|
}
|
2013-03-22 14:52:07 +00:00
|
|
|
|
|
|
|
if (md->sanitize_names && has_name(&key)) {
|
2017-10-19 23:11:11 +00:00
|
|
|
sanitize_name(md->sanitize_names, &md->name_tree, dst,
|
|
|
|
src, &key, i);
|
2013-03-22 14:52:07 +00:00
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
2008-11-20 14:52:48 +00:00
|
|
|
if (key.type != BTRFS_EXTENT_DATA_KEY)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
fi = btrfs_item_ptr(src, i, struct btrfs_file_extent_item);
|
|
|
|
extent_type = btrfs_file_extent_type(src, fi);
|
|
|
|
if (extent_type != BTRFS_FILE_EXTENT_INLINE)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
ptr = btrfs_file_extent_inline_start(fi);
|
|
|
|
size = btrfs_file_extent_inline_item_len(src, item);
|
|
|
|
memset(dst + ptr, 0, size);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* copy buffer and zero useless data in the buffer
|
|
|
|
*/
|
2013-03-22 14:52:07 +00:00
|
|
|
static void copy_buffer(struct metadump_struct *md, u8 *dst,
|
|
|
|
struct extent_buffer *src)
|
2008-11-20 14:52:48 +00:00
|
|
|
{
|
|
|
|
int level;
|
|
|
|
size_t size;
|
|
|
|
u32 nritems;
|
|
|
|
|
|
|
|
memcpy(dst, src->data, src->len);
|
|
|
|
if (src->start == BTRFS_SUPER_INFO_OFFSET)
|
|
|
|
return;
|
|
|
|
|
|
|
|
level = btrfs_header_level(src);
|
|
|
|
nritems = btrfs_header_nritems(src);
|
|
|
|
|
|
|
|
if (nritems == 0) {
|
|
|
|
size = sizeof(struct btrfs_header);
|
|
|
|
memset(dst + size, 0, src->len - size);
|
|
|
|
} else if (level == 0) {
|
|
|
|
size = btrfs_leaf_data(src) +
|
|
|
|
btrfs_item_offset_nr(src, nritems - 1) -
|
|
|
|
btrfs_item_nr_offset(nritems);
|
|
|
|
memset(dst + btrfs_item_nr_offset(nritems), 0, size);
|
2013-03-22 14:52:07 +00:00
|
|
|
zero_items(md, dst, src);
|
2008-11-20 14:52:48 +00:00
|
|
|
} else {
|
|
|
|
size = offsetof(struct btrfs_node, ptrs) +
|
|
|
|
sizeof(struct btrfs_key_ptr) * nritems;
|
|
|
|
memset(dst + size, 0, src->len - size);
|
|
|
|
}
|
|
|
|
csum_block(dst, src->len);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void *dump_worker(void *data)
|
|
|
|
{
|
|
|
|
struct metadump_struct *md = (struct metadump_struct *)data;
|
|
|
|
struct async_work *async;
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
while (1) {
|
|
|
|
pthread_mutex_lock(&md->mutex);
|
|
|
|
while (list_empty(&md->list)) {
|
|
|
|
if (md->done) {
|
|
|
|
pthread_mutex_unlock(&md->mutex);
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
pthread_cond_wait(&md->cond, &md->mutex);
|
|
|
|
}
|
|
|
|
async = list_entry(md->list.next, struct async_work, list);
|
|
|
|
list_del_init(&async->list);
|
|
|
|
pthread_mutex_unlock(&md->mutex);
|
|
|
|
|
|
|
|
if (md->compress_level > 0) {
|
|
|
|
u8 *orig = async->buffer;
|
|
|
|
|
|
|
|
async->bufsize = compressBound(async->size);
|
|
|
|
async->buffer = malloc(async->bufsize);
|
2014-06-26 02:53:02 +00:00
|
|
|
if (!async->buffer) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("not enough memory for async buffer");
|
2014-06-26 02:53:02 +00:00
|
|
|
pthread_mutex_lock(&md->mutex);
|
|
|
|
if (!md->error)
|
|
|
|
md->error = -ENOMEM;
|
|
|
|
pthread_mutex_unlock(&md->mutex);
|
|
|
|
pthread_exit(NULL);
|
|
|
|
}
|
2008-11-20 14:52:48 +00:00
|
|
|
|
2008-12-02 12:19:08 +00:00
|
|
|
ret = compress2(async->buffer,
|
|
|
|
(unsigned long *)&async->bufsize,
|
|
|
|
orig, async->size, md->compress_level);
|
2013-03-18 18:50:45 +00:00
|
|
|
|
|
|
|
if (ret != Z_OK)
|
|
|
|
async->error = 1;
|
2008-11-20 14:52:48 +00:00
|
|
|
|
|
|
|
free(orig);
|
|
|
|
}
|
|
|
|
|
|
|
|
pthread_mutex_lock(&md->mutex);
|
|
|
|
md->num_ready++;
|
|
|
|
pthread_mutex_unlock(&md->mutex);
|
|
|
|
}
|
|
|
|
out:
|
|
|
|
pthread_exit(NULL);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Start a new, empty cluster.
 *
 * Resets the per-cluster item counters and fills in the cluster header:
 * magic, the byte offset @start of the cluster, zero items, and the
 * compression type implied by md->compress_level.
 */
static void meta_cluster_init(struct metadump_struct *md, u64 start)
{
	struct meta_cluster_header *hdr = &md->cluster.header;

	md->num_items = 0;
	md->num_ready = 0;

	hdr->magic = cpu_to_le64(HEADER_MAGIC);
	hdr->bytenr = cpu_to_le64(start);
	hdr->nritems = cpu_to_le32(0);
	if (md->compress_level > 0)
		hdr->compress = COMPRESS_ZLIB;
	else
		hdr->compress = COMPRESS_NONE;
}
|
|
|
|
|
2014-03-21 01:06:23 +00:00
|
|
|
static void metadump_destroy(struct metadump_struct *md, int num_threads)
|
|
|
|
{
|
|
|
|
int i;
|
|
|
|
struct rb_node *n;
|
|
|
|
|
|
|
|
pthread_mutex_lock(&md->mutex);
|
|
|
|
md->done = 1;
|
|
|
|
pthread_cond_broadcast(&md->cond);
|
|
|
|
pthread_mutex_unlock(&md->mutex);
|
|
|
|
|
|
|
|
for (i = 0; i < num_threads; i++)
|
|
|
|
pthread_join(md->threads[i], NULL);
|
|
|
|
|
|
|
|
pthread_cond_destroy(&md->cond);
|
|
|
|
pthread_mutex_destroy(&md->mutex);
|
|
|
|
|
|
|
|
while ((n = rb_first(&md->name_tree))) {
|
|
|
|
struct name *name;
|
|
|
|
|
|
|
|
name = rb_entry(n, struct name, n);
|
|
|
|
rb_erase(n, &md->name_tree);
|
|
|
|
free(name->val);
|
|
|
|
free(name->sub);
|
|
|
|
free(name);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2008-11-20 14:52:48 +00:00
|
|
|
static int metadump_init(struct metadump_struct *md, struct btrfs_root *root,
|
2013-03-22 14:52:07 +00:00
|
|
|
FILE *out, int num_threads, int compress_level,
|
2017-10-19 23:01:43 +00:00
|
|
|
enum sanitize_mode sanitize_names)
|
2008-11-20 14:52:48 +00:00
|
|
|
{
|
2013-03-27 20:55:41 +00:00
|
|
|
int i, ret = 0;
|
2008-11-20 14:52:48 +00:00
|
|
|
|
|
|
|
memset(md, 0, sizeof(*md));
|
|
|
|
INIT_LIST_HEAD(&md->list);
|
|
|
|
INIT_LIST_HEAD(&md->ordered);
|
|
|
|
md->root = root;
|
|
|
|
md->out = out;
|
|
|
|
md->pending_start = (u64)-1;
|
|
|
|
md->compress_level = compress_level;
|
2013-03-22 14:52:07 +00:00
|
|
|
md->sanitize_names = sanitize_names;
|
2017-10-19 23:01:43 +00:00
|
|
|
if (sanitize_names == SANITIZE_COLLISIONS)
|
2013-03-22 14:52:07 +00:00
|
|
|
crc32c_optimization_init();
|
|
|
|
|
2015-11-06 17:31:27 +00:00
|
|
|
md->name_tree.rb_node = NULL;
|
|
|
|
md->num_threads = num_threads;
|
|
|
|
pthread_cond_init(&md->cond, NULL);
|
|
|
|
pthread_mutex_init(&md->mutex, NULL);
|
2008-11-20 14:52:48 +00:00
|
|
|
meta_cluster_init(md, 0);
|
2015-11-06 17:31:27 +00:00
|
|
|
|
2008-11-20 14:52:48 +00:00
|
|
|
if (!num_threads)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
for (i = 0; i < num_threads; i++) {
|
|
|
|
ret = pthread_create(md->threads + i, NULL, dump_worker, md);
|
|
|
|
if (ret)
|
|
|
|
break;
|
|
|
|
}
|
2013-03-18 18:50:45 +00:00
|
|
|
|
2014-03-21 01:06:23 +00:00
|
|
|
if (ret)
|
|
|
|
metadump_destroy(md, i + 1);
|
2013-03-18 18:50:45 +00:00
|
|
|
|
2008-11-20 14:52:48 +00:00
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int write_zero(FILE *out, size_t size)
|
|
|
|
{
|
|
|
|
static char zero[BLOCK_SIZE];
|
|
|
|
return fwrite(zero, size, 1, out);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Write out the current cluster: the index block followed by every queued
 * buffer, padded with zeroes up to the next BLOCK_SIZE boundary.
 *
 * The function unlocks and relocks md->mutex while it waits for the workers,
 * so it expects to be entered with that mutex held.
 *
 * @md:   dump state
 * @next: receives the byte offset at which the next cluster starts; it is
 *        set to 0 when nothing was queued or a worker reported an error, and
 *        is left untouched if writing the index block fails
 *
 * Returns 0 on success or a negative errno.  Once the index block has been
 * written, every queued item is removed from md->ordered and freed even if
 * a later write fails.
 */
static int write_buffers(struct metadump_struct *md, u64 *next)
{
	struct meta_cluster_header *header = &md->cluster.header;
	struct meta_cluster_item *item;
	struct async_work *async;
	u64 bytenr = 0;
	u32 nritems = 0;
	int ret;
	int err = 0;

	if (list_empty(&md->ordered))
		goto out;

	/* wait until all buffers are compressed */
	while (!err && md->num_items > md->num_ready) {
		struct timespec ts = {
			.tv_sec = 0,
			.tv_nsec = 10000000,
		};

		pthread_mutex_unlock(&md->mutex);
		nanosleep(&ts, NULL);
		pthread_mutex_lock(&md->mutex);
		err = md->error;
	}

	if (err) {
		errno = -err;
		error("one of the threads failed: %m");
		goto out;
	}

	/* setup and write index block */
	list_for_each_entry(async, &md->ordered, ordered) {
		item = &md->cluster.items[nritems];
		item->bytenr = cpu_to_le64(async->start);
		item->size = cpu_to_le32(async->bufsize);
		nritems++;
	}
	header->nritems = cpu_to_le32(nritems);

	ret = fwrite(&md->cluster, BLOCK_SIZE, 1, md->out);
	if (ret != 1) {
		/* Capture errno before error() gets a chance to change it. */
		err = errno ? -errno : -EIO;
		error("unable to write out cluster: %m");
		return err;
	}

	/* write buffers */
	bytenr += le64_to_cpu(header->bytenr) + BLOCK_SIZE;
	while (!list_empty(&md->ordered)) {
		async = list_entry(md->ordered.next, struct async_work,
				   ordered);
		list_del_init(&async->ordered);

		bytenr += async->bufsize;
		/*
		 * After the first failure the remaining buffers are only
		 * freed: no further writes, no repeated error messages and
		 * no overwriting of the recorded error.
		 */
		if (!err) {
			ret = fwrite(async->buffer, async->bufsize, 1,
				     md->out);
			if (ret != 1) {
				err = errno ? -errno : -EIO;
				error("unable to write out cluster: %m");
			}
		}

		free(async->buffer);
		free(async);
	}

	/* zero unused space in the last block */
	if (!err && bytenr & BLOCK_MASK) {
		size_t size = BLOCK_SIZE - (bytenr & BLOCK_MASK);

		bytenr += size;
		ret = write_zero(md->out, size);
		if (ret != 1) {
			err = errno ? -errno : -EIO;
			error("unable to zero out buffer: %m");
		}
	}
out:
	*next = bytenr;
	return err;
}
|
|
|
|
|
2013-03-19 13:43:13 +00:00
|
|
|
static int read_data_extent(struct metadump_struct *md,
|
|
|
|
struct async_work *async)
|
|
|
|
{
|
2015-08-21 03:21:27 +00:00
|
|
|
struct btrfs_root *root = md->root;
|
2017-06-13 09:19:24 +00:00
|
|
|
struct btrfs_fs_info *fs_info = root->fs_info;
|
2013-03-19 13:43:13 +00:00
|
|
|
u64 bytes_left = async->size;
|
|
|
|
u64 logical = async->start;
|
|
|
|
u64 offset = 0;
|
|
|
|
u64 read_len;
|
2015-08-21 03:21:27 +00:00
|
|
|
int num_copies;
|
|
|
|
int cur_mirror;
|
2013-03-19 13:43:13 +00:00
|
|
|
int ret;
|
|
|
|
|
2017-06-13 09:19:18 +00:00
|
|
|
num_copies = btrfs_num_copies(root->fs_info, logical, bytes_left);
|
2015-08-21 03:21:27 +00:00
|
|
|
|
|
|
|
/* Try our best to read data, just like read_tree_block() */
|
2018-03-30 07:35:27 +00:00
|
|
|
for (cur_mirror = 1; cur_mirror <= num_copies; cur_mirror++) {
|
2015-08-21 03:21:27 +00:00
|
|
|
while (bytes_left) {
|
|
|
|
read_len = bytes_left;
|
2017-06-13 09:19:24 +00:00
|
|
|
ret = read_extent_data(fs_info,
|
2015-08-21 03:21:27 +00:00
|
|
|
(char *)(async->buffer + offset),
|
|
|
|
logical, &read_len, cur_mirror);
|
|
|
|
if (ret < 0)
|
|
|
|
break;
|
|
|
|
offset += read_len;
|
|
|
|
logical += read_len;
|
|
|
|
bytes_left -= read_len;
|
2013-03-19 13:43:13 +00:00
|
|
|
}
|
|
|
|
}
|
2015-08-21 03:21:27 +00:00
|
|
|
if (bytes_left)
|
|
|
|
return -EIO;
|
2013-03-19 13:43:13 +00:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2015-01-14 19:40:21 +00:00
|
|
|
static int get_dev_fd(struct btrfs_root *root)
|
|
|
|
{
|
|
|
|
struct btrfs_device *dev;
|
|
|
|
|
|
|
|
dev = list_first_entry(&root->fs_info->fs_devices->devices,
|
|
|
|
struct btrfs_device, dev_list);
|
|
|
|
return dev->fd;
|
|
|
|
}
|
|
|
|
|
2008-11-20 14:52:48 +00:00
|
|
|
static int flush_pending(struct metadump_struct *md, int done)
|
|
|
|
{
|
|
|
|
struct async_work *async = NULL;
|
|
|
|
struct extent_buffer *eb;
|
2016-10-05 08:07:48 +00:00
|
|
|
u64 start = 0;
|
2008-11-20 14:52:48 +00:00
|
|
|
u64 size;
|
|
|
|
size_t offset;
|
2013-03-18 18:50:45 +00:00
|
|
|
int ret = 0;
|
2008-11-20 14:52:48 +00:00
|
|
|
|
|
|
|
if (md->pending_size) {
|
|
|
|
async = calloc(1, sizeof(*async));
|
|
|
|
if (!async)
|
|
|
|
return -ENOMEM;
|
|
|
|
|
|
|
|
async->start = md->pending_start;
|
|
|
|
async->size = md->pending_size;
|
|
|
|
async->bufsize = async->size;
|
|
|
|
async->buffer = malloc(async->bufsize);
|
2013-03-18 18:50:45 +00:00
|
|
|
if (!async->buffer) {
|
|
|
|
free(async);
|
|
|
|
return -ENOMEM;
|
|
|
|
}
|
2008-11-20 14:52:48 +00:00
|
|
|
offset = 0;
|
|
|
|
start = async->start;
|
|
|
|
size = async->size;
|
2013-03-19 13:43:13 +00:00
|
|
|
|
|
|
|
if (md->data) {
|
|
|
|
ret = read_data_extent(md, async);
|
|
|
|
if (ret) {
|
|
|
|
free(async->buffer);
|
|
|
|
free(async);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2015-01-14 19:40:21 +00:00
|
|
|
/*
|
|
|
|
* Balance can make the mapping not cover the super block, so
|
|
|
|
* just copy directly from one of the devices.
|
|
|
|
*/
|
|
|
|
if (start == BTRFS_SUPER_INFO_OFFSET) {
|
|
|
|
int fd = get_dev_fd(md->root);
|
|
|
|
|
|
|
|
ret = pread64(fd, async->buffer, size, start);
|
|
|
|
if (ret < size) {
|
|
|
|
free(async->buffer);
|
|
|
|
free(async);
|
2018-01-07 21:54:21 +00:00
|
|
|
error("unable to read superblock at %llu: %m",
|
|
|
|
(unsigned long long)start);
|
2016-09-08 13:57:42 +00:00
|
|
|
return -errno;
|
2015-01-14 19:40:21 +00:00
|
|
|
}
|
|
|
|
size = 0;
|
|
|
|
ret = 0;
|
|
|
|
}
|
|
|
|
|
2013-03-19 13:43:13 +00:00
|
|
|
while (!md->data && size > 0) {
|
2017-08-25 14:20:16 +00:00
|
|
|
u64 this_read = min((u64)md->root->fs_info->nodesize,
|
|
|
|
size);
|
|
|
|
|
2017-08-25 14:54:16 +00:00
|
|
|
eb = read_tree_block(md->root->fs_info, start, 0);
|
2015-01-28 02:12:55 +00:00
|
|
|
if (!extent_buffer_uptodate(eb)) {
|
2013-03-18 18:50:45 +00:00
|
|
|
free(async->buffer);
|
|
|
|
free(async);
|
2016-09-08 13:57:42 +00:00
|
|
|
error("unable to read metadata block %llu",
|
|
|
|
(unsigned long long)start);
|
2013-03-18 18:50:45 +00:00
|
|
|
return -EIO;
|
|
|
|
}
|
2013-03-22 14:52:07 +00:00
|
|
|
copy_buffer(md, async->buffer + offset, eb);
|
2008-11-20 14:52:48 +00:00
|
|
|
free_extent_buffer(eb);
|
2013-05-03 20:18:46 +00:00
|
|
|
start += this_read;
|
|
|
|
offset += this_read;
|
|
|
|
size -= this_read;
|
2008-11-20 14:52:48 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
md->pending_start = (u64)-1;
|
|
|
|
md->pending_size = 0;
|
|
|
|
} else if (!done) {
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
pthread_mutex_lock(&md->mutex);
|
|
|
|
if (async) {
|
|
|
|
list_add_tail(&async->ordered, &md->ordered);
|
|
|
|
md->num_items++;
|
|
|
|
if (md->compress_level > 0) {
|
|
|
|
list_add_tail(&async->list, &md->list);
|
|
|
|
pthread_cond_signal(&md->cond);
|
|
|
|
} else {
|
|
|
|
md->num_ready++;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (md->num_items >= ITEMS_PER_CLUSTER || done) {
|
|
|
|
ret = write_buffers(md, &start);
|
2018-10-25 12:10:54 +00:00
|
|
|
if (ret) {
|
|
|
|
errno = -ret;
|
|
|
|
error("unable to write buffers: %m");
|
|
|
|
} else {
|
2013-03-18 18:50:45 +00:00
|
|
|
meta_cluster_init(md, start);
|
2018-10-25 12:10:54 +00:00
|
|
|
}
|
2008-11-20 14:52:48 +00:00
|
|
|
}
|
|
|
|
pthread_mutex_unlock(&md->mutex);
|
2013-03-18 18:50:45 +00:00
|
|
|
return ret;
|
2008-11-20 14:52:48 +00:00
|
|
|
}
|
|
|
|
|
2013-03-19 13:43:13 +00:00
|
|
|
/*
 * Add the range [@start, @start + @size) to the pending range.
 *
 * The pending range is flushed first, and restarted at @start, when the new
 * range is of a different kind (data or metadata), would grow the pending
 * range beyond MAX_PENDING_SIZE, or does not directly follow it.
 *
 * @data: non-zero if the range is file data rather than metadata
 *
 * Returns 0 on success or the error returned by flush_pending().
 */
static int add_extent(u64 start, u64 size, struct metadump_struct *md,
		      int data)
{
	const int same_kind = md->data == data;
	const int fits = md->pending_size + size <= MAX_PENDING_SIZE;
	const int contiguous = md->pending_start + md->pending_size == start;

	if (!same_kind || !fits || !contiguous) {
		int ret = flush_pending(md, 0);

		if (ret)
			return ret;
		md->pending_start = start;
	}

	readahead_tree_block(md->root->fs_info, start, 0);
	md->pending_size += size;
	md->data = data;
	return 0;
}
|
|
|
|
|
2013-03-28 14:26:09 +00:00
|
|
|
static int copy_tree_blocks(struct btrfs_root *root, struct extent_buffer *eb,
|
|
|
|
struct metadump_struct *metadump, int root_tree)
|
2013-03-18 20:03:44 +00:00
|
|
|
{
|
|
|
|
struct extent_buffer *tmp;
|
|
|
|
struct btrfs_root_item *ri;
|
|
|
|
struct btrfs_key key;
|
2017-05-18 02:51:08 +00:00
|
|
|
struct btrfs_fs_info *fs_info = root->fs_info;
|
2013-03-18 20:03:44 +00:00
|
|
|
u64 bytenr;
|
|
|
|
int level;
|
|
|
|
int nritems = 0;
|
|
|
|
int i = 0;
|
|
|
|
int ret;
|
|
|
|
|
2017-05-18 02:51:08 +00:00
|
|
|
ret = add_extent(btrfs_header_bytenr(eb), fs_info->nodesize,
|
2017-05-18 01:29:54 +00:00
|
|
|
metadump, 0);
|
2013-03-18 20:03:44 +00:00
|
|
|
if (ret) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("unable to add metadata block %llu: %d",
|
|
|
|
btrfs_header_bytenr(eb), ret);
|
2013-03-18 20:03:44 +00:00
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2013-03-28 14:26:09 +00:00
|
|
|
if (btrfs_header_level(eb) == 0 && !root_tree)
|
2013-03-18 20:03:44 +00:00
|
|
|
return 0;
|
|
|
|
|
|
|
|
level = btrfs_header_level(eb);
|
|
|
|
nritems = btrfs_header_nritems(eb);
|
|
|
|
for (i = 0; i < nritems; i++) {
|
|
|
|
if (level == 0) {
|
|
|
|
btrfs_item_key_to_cpu(eb, &key, i);
|
|
|
|
if (key.type != BTRFS_ROOT_ITEM_KEY)
|
|
|
|
continue;
|
|
|
|
ri = btrfs_item_ptr(eb, i, struct btrfs_root_item);
|
|
|
|
bytenr = btrfs_disk_root_bytenr(eb, ri);
|
2017-08-25 14:54:16 +00:00
|
|
|
tmp = read_tree_block(fs_info, bytenr, 0);
|
2015-01-28 02:12:55 +00:00
|
|
|
if (!extent_buffer_uptodate(tmp)) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("unable to read log root block");
|
2013-03-18 20:03:44 +00:00
|
|
|
return -EIO;
|
|
|
|
}
|
2013-03-28 14:26:09 +00:00
|
|
|
ret = copy_tree_blocks(root, tmp, metadump, 0);
|
2013-03-18 20:03:44 +00:00
|
|
|
free_extent_buffer(tmp);
|
|
|
|
if (ret)
|
|
|
|
return ret;
|
|
|
|
} else {
|
|
|
|
bytenr = btrfs_node_blockptr(eb, i);
|
2017-08-25 14:54:16 +00:00
|
|
|
tmp = read_tree_block(fs_info, bytenr, 0);
|
2015-01-28 02:12:55 +00:00
|
|
|
if (!extent_buffer_uptodate(tmp)) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("unable to read log root block");
|
2013-03-18 20:03:44 +00:00
|
|
|
return -EIO;
|
|
|
|
}
|
2013-03-28 14:26:09 +00:00
|
|
|
ret = copy_tree_blocks(root, tmp, metadump, root_tree);
|
2013-03-18 20:03:44 +00:00
|
|
|
free_extent_buffer(tmp);
|
|
|
|
if (ret)
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int copy_log_trees(struct btrfs_root *root,
|
2017-02-09 16:42:02 +00:00
|
|
|
struct metadump_struct *metadump)
|
2013-03-18 20:03:44 +00:00
|
|
|
{
|
|
|
|
u64 blocknr = btrfs_super_log_root(root->fs_info->super_copy);
|
|
|
|
|
|
|
|
if (blocknr == 0)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
if (!root->fs_info->log_root_tree ||
|
|
|
|
!root->fs_info->log_root_tree->node) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("unable to copy tree log, it has not been setup");
|
2013-03-18 20:03:44 +00:00
|
|
|
return -EIO;
|
|
|
|
}
|
|
|
|
|
2013-03-28 14:26:09 +00:00
|
|
|
return copy_tree_blocks(root, root->fs_info->log_root_tree->node,
|
|
|
|
metadump, 1);
|
2013-03-18 20:03:44 +00:00
|
|
|
}
|
|
|
|
|
2013-03-19 13:43:13 +00:00
|
|
|
static int copy_space_cache(struct btrfs_root *root,
|
|
|
|
struct metadump_struct *metadump,
|
|
|
|
struct btrfs_path *path)
|
|
|
|
{
|
|
|
|
struct extent_buffer *leaf;
|
|
|
|
struct btrfs_file_extent_item *fi;
|
|
|
|
struct btrfs_key key;
|
|
|
|
u64 bytenr, num_bytes;
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
root = root->fs_info->tree_root;
|
|
|
|
|
|
|
|
key.objectid = 0;
|
|
|
|
key.type = BTRFS_EXTENT_DATA_KEY;
|
|
|
|
key.offset = 0;
|
|
|
|
|
|
|
|
ret = btrfs_search_slot(NULL, root, &key, path, 0, 0);
|
|
|
|
if (ret < 0) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("free space inode not found: %d", ret);
|
2013-03-19 13:43:13 +00:00
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2014-06-19 01:46:00 +00:00
|
|
|
leaf = path->nodes[0];
|
|
|
|
|
2013-03-19 13:43:13 +00:00
|
|
|
while (1) {
|
|
|
|
if (path->slots[0] >= btrfs_header_nritems(leaf)) {
|
|
|
|
ret = btrfs_next_leaf(root, path);
|
|
|
|
if (ret < 0) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("cannot go to next leaf %d", ret);
|
2013-03-19 13:43:13 +00:00
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
if (ret > 0)
|
|
|
|
break;
|
|
|
|
leaf = path->nodes[0];
|
|
|
|
}
|
|
|
|
|
|
|
|
btrfs_item_key_to_cpu(leaf, &key, path->slots[0]);
|
|
|
|
if (key.type != BTRFS_EXTENT_DATA_KEY) {
|
|
|
|
path->slots[0]++;
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
fi = btrfs_item_ptr(leaf, path->slots[0],
|
|
|
|
struct btrfs_file_extent_item);
|
|
|
|
if (btrfs_file_extent_type(leaf, fi) !=
|
|
|
|
BTRFS_FILE_EXTENT_REG) {
|
|
|
|
path->slots[0]++;
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
bytenr = btrfs_file_extent_disk_bytenr(leaf, fi);
|
|
|
|
num_bytes = btrfs_file_extent_disk_num_bytes(leaf, fi);
|
|
|
|
ret = add_extent(bytenr, num_bytes, metadump, 1);
|
|
|
|
if (ret) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("unable to add space cache blocks %d", ret);
|
2013-08-03 00:52:43 +00:00
|
|
|
btrfs_release_path(path);
|
2013-03-19 13:43:13 +00:00
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
path->slots[0]++;
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2013-03-28 14:26:09 +00:00
|
|
|
static int copy_from_extent_tree(struct metadump_struct *metadump,
|
|
|
|
struct btrfs_path *path)
|
2008-11-20 14:52:48 +00:00
|
|
|
{
|
|
|
|
struct btrfs_root *extent_root;
|
|
|
|
struct extent_buffer *leaf;
|
2009-05-29 20:35:30 +00:00
|
|
|
struct btrfs_extent_item *ei;
|
2008-11-20 14:52:48 +00:00
|
|
|
struct btrfs_key key;
|
|
|
|
u64 bytenr;
|
|
|
|
u64 num_bytes;
|
|
|
|
int ret;
|
|
|
|
|
2013-03-28 14:26:09 +00:00
|
|
|
extent_root = metadump->root->fs_info->extent_root;
|
2014-06-26 02:53:06 +00:00
|
|
|
bytenr = BTRFS_SUPER_INFO_OFFSET + BTRFS_SUPER_INFO_SIZE;
|
2008-11-20 14:52:48 +00:00
|
|
|
key.objectid = bytenr;
|
|
|
|
key.type = BTRFS_EXTENT_ITEM_KEY;
|
|
|
|
key.offset = 0;
|
|
|
|
|
|
|
|
ret = btrfs_search_slot(NULL, extent_root, &key, path, 0, 0);
|
2013-03-18 18:50:45 +00:00
|
|
|
if (ret < 0) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("extent root not found: %d", ret);
|
2013-03-28 14:26:09 +00:00
|
|
|
return ret;
|
2013-03-18 18:50:45 +00:00
|
|
|
}
|
2013-03-28 14:26:09 +00:00
|
|
|
ret = 0;
|
2008-11-20 14:52:48 +00:00
|
|
|
|
2014-06-19 01:46:00 +00:00
|
|
|
leaf = path->nodes[0];
|
|
|
|
|
2008-11-20 14:52:48 +00:00
|
|
|
while (1) {
|
|
|
|
if (path->slots[0] >= btrfs_header_nritems(leaf)) {
|
|
|
|
ret = btrfs_next_leaf(extent_root, path);
|
2013-03-18 18:50:45 +00:00
|
|
|
if (ret < 0) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("cannot go to next leaf %d", ret);
|
2013-03-28 14:26:09 +00:00
|
|
|
break;
|
2013-03-18 18:50:45 +00:00
|
|
|
}
|
2013-03-28 14:26:09 +00:00
|
|
|
if (ret > 0) {
|
|
|
|
ret = 0;
|
2008-11-20 14:52:48 +00:00
|
|
|
break;
|
2013-03-28 14:26:09 +00:00
|
|
|
}
|
2008-11-20 14:52:48 +00:00
|
|
|
leaf = path->nodes[0];
|
|
|
|
}
|
|
|
|
|
|
|
|
btrfs_item_key_to_cpu(leaf, &key, path->slots[0]);
|
|
|
|
if (key.objectid < bytenr ||
|
2013-03-15 19:32:16 +00:00
|
|
|
(key.type != BTRFS_EXTENT_ITEM_KEY &&
|
|
|
|
key.type != BTRFS_METADATA_ITEM_KEY)) {
|
2008-11-20 14:52:48 +00:00
|
|
|
path->slots[0]++;
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
bytenr = key.objectid;
|
2016-10-03 12:52:30 +00:00
|
|
|
if (key.type == BTRFS_METADATA_ITEM_KEY) {
|
2017-05-18 01:29:54 +00:00
|
|
|
num_bytes = extent_root->fs_info->nodesize;
|
2016-10-03 12:52:30 +00:00
|
|
|
} else {
|
2013-06-22 05:32:41 +00:00
|
|
|
num_bytes = key.offset;
|
2016-10-03 12:52:30 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
if (num_bytes == 0) {
|
|
|
|
error("extent length 0 at bytenr %llu key type %d",
|
|
|
|
(unsigned long long)bytenr, key.type);
|
|
|
|
ret = -EIO;
|
|
|
|
break;
|
|
|
|
}
|
2009-05-29 20:35:30 +00:00
|
|
|
|
|
|
|
if (btrfs_item_size_nr(leaf, path->slots[0]) > sizeof(*ei)) {
|
|
|
|
ei = btrfs_item_ptr(leaf, path->slots[0],
|
|
|
|
struct btrfs_extent_item);
|
|
|
|
if (btrfs_extent_flags(leaf, ei) &
|
|
|
|
BTRFS_EXTENT_FLAG_TREE_BLOCK) {
|
2013-03-28 14:26:09 +00:00
|
|
|
ret = add_extent(bytenr, num_bytes, metadump,
|
2013-03-19 13:43:13 +00:00
|
|
|
0);
|
2013-03-18 18:50:45 +00:00
|
|
|
if (ret) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("unable to add block %llu: %d",
|
|
|
|
(unsigned long long)bytenr, ret);
|
2013-03-28 14:26:09 +00:00
|
|
|
break;
|
2013-03-18 18:50:45 +00:00
|
|
|
}
|
2008-11-20 14:52:48 +00:00
|
|
|
}
|
2009-05-29 20:35:30 +00:00
|
|
|
} else {
|
2016-09-08 13:57:42 +00:00
|
|
|
error(
|
2019-05-29 07:27:23 +00:00
|
|
|
"either extent tree is corrupted or deprecated extent ref format");
|
2013-03-28 14:26:09 +00:00
|
|
|
ret = -EIO;
|
|
|
|
break;
|
2008-11-20 14:52:48 +00:00
|
|
|
}
|
|
|
|
bytenr += num_bytes;
|
|
|
|
}
|
|
|
|
|
2013-08-03 00:52:43 +00:00
|
|
|
btrfs_release_path(path);
|
2013-03-28 14:26:09 +00:00
|
|
|
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int create_metadump(const char *input, FILE *out, int num_threads,
|
2017-10-19 23:01:43 +00:00
|
|
|
int compress_level, enum sanitize_mode sanitize,
|
|
|
|
int walk_trees)
|
2013-03-28 14:26:09 +00:00
|
|
|
{
|
|
|
|
struct btrfs_root *root;
|
2016-11-02 23:37:51 +00:00
|
|
|
struct btrfs_path path;
|
2013-03-28 14:26:09 +00:00
|
|
|
struct metadump_struct metadump;
|
|
|
|
int ret;
|
|
|
|
int err = 0;
|
|
|
|
|
|
|
|
root = open_ctree(input, 0, 0);
|
|
|
|
if (!root) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("open ctree failed");
|
2013-03-28 14:26:09 +00:00
|
|
|
return -EIO;
|
|
|
|
}
|
|
|
|
|
|
|
|
ret = metadump_init(&metadump, root, out, num_threads,
|
2013-03-22 14:52:07 +00:00
|
|
|
compress_level, sanitize);
|
2013-03-28 14:26:09 +00:00
|
|
|
if (ret) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("failed to initialize metadump: %d", ret);
|
2013-03-28 14:26:09 +00:00
|
|
|
close_ctree(root);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2014-06-26 02:53:06 +00:00
|
|
|
ret = add_extent(BTRFS_SUPER_INFO_OFFSET, BTRFS_SUPER_INFO_SIZE,
|
|
|
|
&metadump, 0);
|
2013-03-28 14:26:09 +00:00
|
|
|
if (ret) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("unable to add metadata: %d", ret);
|
2013-03-28 14:26:09 +00:00
|
|
|
err = ret;
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
|
2016-11-02 23:37:51 +00:00
|
|
|
btrfs_init_path(&path);
|
2013-03-28 14:26:09 +00:00
|
|
|
|
|
|
|
if (walk_trees) {
|
|
|
|
ret = copy_tree_blocks(root, root->fs_info->chunk_root->node,
|
|
|
|
&metadump, 1);
|
|
|
|
if (ret) {
|
|
|
|
err = ret;
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
|
|
|
|
ret = copy_tree_blocks(root, root->fs_info->tree_root->node,
|
|
|
|
&metadump, 1);
|
|
|
|
if (ret) {
|
|
|
|
err = ret;
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
} else {
|
2016-11-02 23:37:51 +00:00
|
|
|
ret = copy_from_extent_tree(&metadump, &path);
|
2013-03-28 14:26:09 +00:00
|
|
|
if (ret) {
|
|
|
|
err = ret;
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
}
|
2013-03-19 13:43:13 +00:00
|
|
|
|
2017-02-09 16:42:02 +00:00
|
|
|
ret = copy_log_trees(root, &metadump);
|
2013-03-19 13:43:13 +00:00
|
|
|
if (ret) {
|
2013-03-18 20:03:44 +00:00
|
|
|
err = ret;
|
2013-03-19 13:43:13 +00:00
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
|
2016-11-02 23:37:51 +00:00
|
|
|
ret = copy_space_cache(root, &metadump, &path);
|
2013-03-18 18:50:45 +00:00
|
|
|
out:
|
2008-11-20 14:52:48 +00:00
|
|
|
ret = flush_pending(&metadump, 1);
|
2013-03-18 18:50:45 +00:00
|
|
|
if (ret) {
|
|
|
|
if (!err)
|
2013-03-28 14:26:09 +00:00
|
|
|
err = ret;
|
2016-09-08 13:57:42 +00:00
|
|
|
error("failed to flush pending data: %d", ret);
|
2013-03-18 18:50:45 +00:00
|
|
|
}
|
2008-11-20 14:52:48 +00:00
|
|
|
|
2014-03-21 01:06:23 +00:00
|
|
|
metadump_destroy(&metadump, num_threads);
|
2008-11-20 14:52:48 +00:00
|
|
|
|
2016-11-02 23:37:51 +00:00
|
|
|
btrfs_release_path(&path);
|
2008-11-20 14:52:48 +00:00
|
|
|
ret = close_ctree(root);
|
2013-03-18 18:50:45 +00:00
|
|
|
return err ? err : ret;
|
2008-11-20 14:52:48 +00:00
|
|
|
}
|
|
|
|
|
2013-03-27 20:55:41 +00:00
|
|
|
/*
 * Rewrite the super block held in @buffer for the old restore format.
 *
 * BTRFS_SUPER_FLAG_METADUMP is set and the system chunk array is replaced by
 * one key/chunk pair: a SYSTEM chunk at logical offset 0 of length (u64)-1
 * with a single stripe at physical offset 0 on the device described by the
 * super block's own dev_item.  The checksum of the block is recomputed at
 * the end.
 */
static void update_super_old(u8 *buffer)
{
	struct btrfs_super_block *super = (struct btrfs_super_block *)buffer;
	struct btrfs_disk_key *disk_key;
	struct btrfs_chunk *chunk;
	u32 sectorsize = btrfs_super_sectorsize(super);

	btrfs_set_super_flags(super,
			      btrfs_super_flags(super) |
			      BTRFS_SUPER_FLAG_METADUMP);

	/* The array starts with the key, the chunk follows it directly */
	disk_key = (struct btrfs_disk_key *)(super->sys_chunk_array);
	chunk = (struct btrfs_chunk *)(disk_key + 1);

	btrfs_set_disk_key_objectid(disk_key, BTRFS_FIRST_CHUNK_TREE_OBJECTID);
	btrfs_set_disk_key_type(disk_key, BTRFS_CHUNK_ITEM_KEY);
	btrfs_set_disk_key_offset(disk_key, 0);

	btrfs_set_stack_chunk_length(chunk, (u64)-1);
	btrfs_set_stack_chunk_owner(chunk, BTRFS_EXTENT_TREE_OBJECTID);
	btrfs_set_stack_chunk_stripe_len(chunk, BTRFS_STRIPE_LEN);
	btrfs_set_stack_chunk_type(chunk, BTRFS_BLOCK_GROUP_SYSTEM);
	btrfs_set_stack_chunk_io_align(chunk, sectorsize);
	btrfs_set_stack_chunk_io_width(chunk, sectorsize);
	btrfs_set_stack_chunk_sector_size(chunk, sectorsize);
	btrfs_set_stack_chunk_num_stripes(chunk, 1);
	btrfs_set_stack_chunk_sub_stripes(chunk, 0);

	/* The only stripe points at the device the super block describes */
	chunk->stripe.devid = super->dev_item.devid;
	btrfs_set_stack_stripe_offset(&chunk->stripe, 0);
	memcpy(chunk->stripe.dev_uuid, super->dev_item.uuid, BTRFS_UUID_SIZE);

	btrfs_set_super_sys_array_size(super,
				       sizeof(struct btrfs_disk_key) +
				       sizeof(struct btrfs_chunk));
	csum_block(buffer, BTRFS_SUPER_INFO_SIZE);
}
|
|
|
|
|
2015-01-26 01:39:24 +00:00
|
|
|
/*
 * Rewrite the super block held in @buffer for a restore onto one device.
 *
 * If the original super block (mdres->original_super) already describes a
 * single device, the system chunk array is kept as is.  Otherwise the array
 * is compacted in place: every chunk item is reduced to the fixed
 * struct btrfs_chunk (plus room for one more stripe for DUP chunks) and its
 * first stripe is pointed at the device described by the super block's own
 * dev_item.
 *
 * In both cases the METADUMP_V2 flag is set, the device count is set to 1,
 * the cache generation is cleared when mdres->clear_space_cache is set, and
 * the checksum is recomputed.
 *
 * Returns 0 on success, -EIO if the array contains a key that is not a
 * chunk item key (the buffer may be partially rewritten at that point).
 */
static int update_super(struct mdrestore_struct *mdres, u8 *buffer)
{
	struct btrfs_super_block *super = (struct btrfs_super_block *)buffer;
	u64 flags = btrfs_super_flags(super);
	u32 new_array_size = 0;

	if (btrfs_super_num_devices(mdres->original_super) == 1) {
		/* No need to fix, use all data as is */
		new_array_size = btrfs_super_sys_array_size(super);
	} else {
		u32 array_size = btrfs_super_sys_array_size(super);
		u32 cur = 0;
		u8 *src = super->sys_chunk_array;
		u8 *dst = src;

		while (cur < array_size) {
			struct btrfs_chunk *chunk;
			struct btrfs_key key;
			u64 type, physical, physical_dup, size = 0;
			int old_num_stripes;

			/*
			 * Decode the key before moving it: source and
			 * destination may overlap once earlier items shrank.
			 */
			btrfs_disk_key_to_cpu(&key,
					      (struct btrfs_disk_key *)src);
			memmove(dst, src, sizeof(struct btrfs_disk_key));
			new_array_size += sizeof(struct btrfs_disk_key);

			dst += sizeof(struct btrfs_disk_key);
			src += sizeof(struct btrfs_disk_key);
			cur += sizeof(struct btrfs_disk_key);

			if (key.type != BTRFS_CHUNK_ITEM_KEY) {
				error("bogus key in the sys array %d", key.type);
				return -EIO;
			}

			/* Same ordering concern: read the count, then move */
			old_num_stripes = btrfs_stack_chunk_num_stripes(
					(struct btrfs_chunk *)src);
			chunk = (struct btrfs_chunk *)dst;
			memmove(dst, src, sizeof(*chunk));

			btrfs_set_stack_chunk_sub_stripes(chunk, 0);
			type = btrfs_stack_chunk_type(chunk);
			if (type & BTRFS_BLOCK_GROUP_DUP) {
				/*
				 * Keep room for the second stripe.
				 * NOTE(review): only sizeof(*chunk) bytes were
				 * moved above, so the second stripe's bytes are
				 * whatever already sits at that position --
				 * confirm this is intended.
				 */
				new_array_size += sizeof(struct btrfs_stripe);
				dst += sizeof(struct btrfs_stripe);
			} else {
				btrfs_set_stack_chunk_num_stripes(chunk, 1);
				btrfs_set_stack_chunk_type(chunk,
						BTRFS_BLOCK_GROUP_SYSTEM);
			}

			chunk->stripe.devid = super->dev_item.devid;
			physical = logical_to_physical(mdres, key.offset,
						       &size, &physical_dup);
			/*
			 * presumably (u64)-1 means no mapping was found and
			 * the stored offset must stay -- verify against
			 * logical_to_physical()
			 */
			if (size != (u64)-1)
				btrfs_set_stack_stripe_offset(&chunk->stripe,
							      physical);
			memcpy(chunk->stripe.dev_uuid, super->dev_item.uuid,
			       BTRFS_UUID_SIZE);
			new_array_size += sizeof(*chunk);

			/* Output advances by the new size, input by the old */
			dst += sizeof(*chunk);
			src += btrfs_chunk_item_size(old_num_stripes);
			cur += btrfs_chunk_item_size(old_num_stripes);
		}
	}

	if (mdres->clear_space_cache)
		btrfs_set_super_cache_generation(super, 0);

	flags |= BTRFS_SUPER_FLAG_METADUMP_V2;
	btrfs_set_super_flags(super, flags);
	btrfs_set_super_sys_array_size(super, new_array_size);
	btrfs_set_super_num_devices(super, 1);
	csum_block(buffer, BTRFS_SUPER_INFO_SIZE);

	return 0;
}
|
|
|
|
|
|
|
|
/*
 * Allocate a zero-filled extent buffer with @size bytes of storage directly
 * behind the structure, and record @bytenr and @size as its start and
 * length.
 *
 * Returns NULL if the allocation fails.  The buffer comes from calloc().
 */
static struct extent_buffer *alloc_dummy_eb(u64 bytenr, u32 size)
{
	struct extent_buffer *eb = calloc(1, sizeof(*eb) + size);

	if (eb) {
		eb->start = bytenr;
		eb->len = size;
	}

	return eb;
}
|
|
|
|
|
|
|
|
/*
 * Shrink the item in @slot of leaf @eb to @new_size bytes.
 *
 * The offsets of the items from @slot to the last one are raised by the
 * number of bytes removed, and the item data from the start of the leaf's
 * data area up to the kept @new_size bytes of this item is moved by the same
 * amount.  The item's size field is then updated.
 *
 * The function does nothing unless @new_size is smaller than the current
 * item size.  Growing is not supported: the unsigned size difference would
 * wrap and the data move would run far outside the buffer, which matters
 * because the leaf contents come from the image being restored.
 */
static void truncate_item(struct extent_buffer *eb, int slot, u32 new_size)
{
	struct btrfs_item *item;
	u32 nritems;
	u32 old_size;
	u32 old_data_start;
	u32 size_diff;
	u32 data_end;
	int i;

	old_size = btrfs_item_size_nr(eb, slot);
	/* Nothing to do for equal sizes; refuse to "truncate" upwards */
	if (old_size <= new_size)
		return;

	nritems = btrfs_header_nritems(eb);
	/* The last item's offset is the lowest used byte of the data area */
	data_end = btrfs_item_offset_nr(eb, nritems - 1);

	old_data_start = btrfs_item_offset_nr(eb, slot);
	size_diff = old_size - new_size;

	/* Items from @slot on have their data moved, so fix their offsets */
	for (i = slot; i < nritems; i++) {
		u32 ioff;

		item = btrfs_item_nr(i);
		ioff = btrfs_item_offset(eb, item);
		btrfs_set_item_offset(eb, item, ioff + size_diff);
	}

	/* Move everything below the dropped tail up by size_diff bytes */
	memmove_extent_buffer(eb, btrfs_leaf_data(eb) + data_end + size_diff,
			      btrfs_leaf_data(eb) + data_end,
			      old_data_start + new_size - data_end);
	item = btrfs_item_nr(slot);
	btrfs_set_item_size(eb, item, new_size);
}
|
|
|
|
|
|
|
|
/*
 * Rewrite the chunk tree leaves found in @buffer so that every chunk item
 * points at the single restore device.
 *
 * @buffer holds @size bytes starting at logical address async->start and is
 * processed in nodesize steps.  Nothing is done when the original super
 * block already describes one device or when @size is not a multiple of the
 * nodesize.  Processing stops at the first block whose header bytenr or
 * fsid does not match.  Blocks that are not level-0 chunk tree blocks are
 * skipped.  Each rewritten leaf is copied back into @buffer and its
 * checksum is recomputed.
 *
 * Returns 0, or -ENOMEM if the scratch extent buffer cannot be allocated.
 */
static int fixup_chunk_tree_block(struct mdrestore_struct *mdres,
				  struct async_work *async, u8 *buffer,
				  size_t size)
{
	struct extent_buffer *eb;
	u64 bytenr = async->start;
	size_t remaining = size;
	int i;

	if (btrfs_super_num_devices(mdres->original_super) == 1)
		return 0;
	if (remaining % mdres->nodesize)
		return 0;

	eb = alloc_dummy_eb(bytenr, mdres->nodesize);
	if (!eb)
		return -ENOMEM;

	/* "continue" advances to the next block, "break" ends the scan */
	for (; remaining;
	     remaining -= mdres->nodesize,
	     buffer += mdres->nodesize,
	     bytenr += mdres->nodesize) {
		eb->start = bytenr;
		memcpy(eb->data, buffer, mdres->nodesize);

		if (btrfs_header_bytenr(eb) != bytenr)
			break;
		if (memcmp(mdres->fsid,
			   eb->data + offsetof(struct btrfs_header, fsid),
			   BTRFS_FSID_SIZE))
			break;

		/* Only leaves of the chunk tree carry chunk items */
		if (btrfs_header_owner(eb) != BTRFS_CHUNK_TREE_OBJECTID ||
		    btrfs_header_level(eb) != 0)
			continue;

		for (i = 0; i < btrfs_header_nritems(eb); i++) {
			struct btrfs_chunk *chunk;
			struct btrfs_key key;
			u64 type, physical, physical_dup, chunk_size;

			btrfs_item_key_to_cpu(eb, &key, i);
			if (key.type != BTRFS_CHUNK_ITEM_KEY)
				continue;

			chunk_size = 0;
			physical = logical_to_physical(mdres, key.offset,
						       &chunk_size,
						       &physical_dup);

			/*
			 * Without a second copy only one stripe is kept.
			 * Shrink first: the item pointer is taken afterwards
			 * because truncating moves the item data.
			 */
			if (!physical_dup)
				truncate_item(eb, i, sizeof(*chunk));
			chunk = btrfs_item_ptr(eb, i, struct btrfs_chunk);

			/* Zero out the RAID profile */
			type = btrfs_chunk_type(eb, chunk);
			type &= (BTRFS_BLOCK_GROUP_DATA |
				 BTRFS_BLOCK_GROUP_SYSTEM |
				 BTRFS_BLOCK_GROUP_METADATA |
				 BTRFS_BLOCK_GROUP_DUP);
			btrfs_set_chunk_type(eb, chunk, type);

			if (!physical_dup)
				btrfs_set_chunk_num_stripes(eb, chunk, 1);
			btrfs_set_chunk_sub_stripes(eb, chunk, 0);
			btrfs_set_stripe_devid_nr(eb, chunk, 0, mdres->devid);
			if (chunk_size != (u64)-1)
				btrfs_set_stripe_offset_nr(eb, chunk, 0,
							   physical);
			/* update stripe 2 offset */
			if (physical_dup)
				btrfs_set_stripe_offset_nr(eb, chunk, 1,
							   physical_dup);

			write_extent_buffer(eb, mdres->uuid,
					(unsigned long)btrfs_stripe_dev_uuid_nr(
						chunk, 0),
					BTRFS_UUID_SIZE);
		}

		/* Hand the modified leaf back and refresh its checksum */
		memcpy(buffer, eb->data, eb->len);
		csum_block(buffer, eb->len);
	}

	free(eb);
	return 0;
}
|
|
|
|
|
|
|
|
/*
 * Write the backup copies of the super block in @buf to @fd.
 *
 * For every mirror index from 1 up to BTRFS_SUPER_MIRROR_MAX - 1 whose
 * location fits inside the target (size taken from btrfs_device_size()),
 * the super block's bytenr is set to that location, the checksum is
 * recomputed and the block is written there.  Writing stops at the first
 * mirror that does not fit or fails to be written completely.  Failures are
 * reported with error() only; nothing is returned to the caller.
 *
 * Note that @buf is modified: afterwards it holds the bytenr and checksum
 * of the last mirror that was prepared.
 */
static void write_backup_supers(int fd, u8 *buf)
{
	struct btrfs_super_block *super = (struct btrfs_super_block *)buf;
	struct stat st;
	u64 dev_size;
	int mirror;

	if (fstat(fd, &st)) {
		error(
"cannot stat restore point, won't be able to write backup supers: %m");
		return;
	}

	dev_size = btrfs_device_size(fd, &st);

	for (mirror = 1; mirror < BTRFS_SUPER_MIRROR_MAX; mirror++) {
		u64 bytenr = btrfs_sb_offset(mirror);
		int ret;

		/* This mirror does not fit on the target: stop here */
		if (bytenr + BTRFS_SUPER_INFO_SIZE > dev_size)
			return;

		btrfs_set_super_bytenr(super, bytenr);
		csum_block(buf, BTRFS_SUPER_INFO_SIZE);
		ret = pwrite64(fd, buf, BTRFS_SUPER_INFO_SIZE, bytenr);
		if (ret >= BTRFS_SUPER_INFO_SIZE)
			continue;

		/* Negative: the write failed; otherwise it was cut short */
		if (ret < 0)
			error(
"problem writing out backup super block %d: %m", mirror);
		else
			error("short write writing out backup super block");
		return;
	}
}
|
|
|
|
|
2008-11-20 14:52:48 +00:00
|
|
|
static void *restore_worker(void *data)
|
|
|
|
{
|
|
|
|
struct mdrestore_struct *mdres = (struct mdrestore_struct *)data;
|
|
|
|
struct async_work *async;
|
|
|
|
size_t size;
|
|
|
|
u8 *buffer;
|
|
|
|
u8 *outbuf;
|
|
|
|
int outfd;
|
|
|
|
int ret;
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
int compress_size = MAX_PENDING_SIZE * 4;
|
2008-11-20 14:52:48 +00:00
|
|
|
|
|
|
|
outfd = fileno(mdres->out);
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
buffer = malloc(compress_size);
|
2013-03-18 18:50:45 +00:00
|
|
|
if (!buffer) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("not enough memory for restore worker buffer");
|
2013-03-18 18:50:45 +00:00
|
|
|
pthread_mutex_lock(&mdres->mutex);
|
|
|
|
if (!mdres->error)
|
|
|
|
mdres->error = -ENOMEM;
|
|
|
|
pthread_mutex_unlock(&mdres->mutex);
|
2014-06-26 02:53:03 +00:00
|
|
|
pthread_exit(NULL);
|
2013-03-18 18:50:45 +00:00
|
|
|
}
|
2008-11-20 14:52:48 +00:00
|
|
|
|
|
|
|
while (1) {
|
2016-05-26 09:43:00 +00:00
|
|
|
u64 bytenr, physical_dup;
|
2013-05-08 15:40:36 +00:00
|
|
|
off_t offset = 0;
|
2013-03-18 18:50:45 +00:00
|
|
|
int err = 0;
|
|
|
|
|
2008-11-20 14:52:48 +00:00
|
|
|
pthread_mutex_lock(&mdres->mutex);
|
2016-04-01 10:57:11 +00:00
|
|
|
while (!mdres->nodesize || list_empty(&mdres->list)) {
|
2008-11-20 14:52:48 +00:00
|
|
|
if (mdres->done) {
|
|
|
|
pthread_mutex_unlock(&mdres->mutex);
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
pthread_cond_wait(&mdres->cond, &mdres->mutex);
|
|
|
|
}
|
|
|
|
async = list_entry(mdres->list.next, struct async_work, list);
|
|
|
|
list_del_init(&async->list);
|
|
|
|
|
|
|
|
if (mdres->compress_method == COMPRESS_ZLIB) {
|
2018-10-11 15:03:59 +00:00
|
|
|
size = compress_size;
|
2017-07-12 20:05:10 +00:00
|
|
|
pthread_mutex_unlock(&mdres->mutex);
|
2008-12-02 12:19:08 +00:00
|
|
|
ret = uncompress(buffer, (unsigned long *)&size,
|
|
|
|
async->buffer, async->bufsize);
|
2017-07-12 20:05:10 +00:00
|
|
|
pthread_mutex_lock(&mdres->mutex);
|
2013-03-18 18:50:45 +00:00
|
|
|
if (ret != Z_OK) {
|
2017-07-12 22:10:13 +00:00
|
|
|
error("decompression failed with %d", ret);
|
2013-03-18 18:50:45 +00:00
|
|
|
err = -EIO;
|
|
|
|
}
|
2008-11-20 14:52:48 +00:00
|
|
|
outbuf = buffer;
|
|
|
|
} else {
|
|
|
|
outbuf = async->buffer;
|
|
|
|
size = async->bufsize;
|
|
|
|
}
|
|
|
|
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
if (!mdres->multi_devices) {
|
|
|
|
if (async->start == BTRFS_SUPER_INFO_OFFSET) {
|
2020-05-27 10:28:09 +00:00
|
|
|
memcpy(mdres->original_super, outbuf,
|
|
|
|
BTRFS_SUPER_INFO_SIZE);
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
if (mdres->old_restore) {
|
|
|
|
update_super_old(outbuf);
|
|
|
|
} else {
|
2015-01-26 01:39:24 +00:00
|
|
|
ret = update_super(mdres, outbuf);
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
if (ret)
|
|
|
|
err = ret;
|
|
|
|
}
|
|
|
|
} else if (!mdres->old_restore) {
|
|
|
|
ret = fixup_chunk_tree_block(mdres, async, outbuf, size);
|
2013-03-27 20:55:41 +00:00
|
|
|
if (ret)
|
|
|
|
err = ret;
|
|
|
|
}
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
if (!mdres->fixup_offset) {
|
|
|
|
while (size) {
|
|
|
|
u64 chunk_size = size;
|
2016-05-26 09:43:00 +00:00
|
|
|
physical_dup = 0;
|
2014-06-26 02:53:01 +00:00
|
|
|
if (!mdres->multi_devices && !mdres->old_restore)
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
bytenr = logical_to_physical(mdres,
|
2016-05-26 09:43:00 +00:00
|
|
|
async->start + offset,
|
|
|
|
&chunk_size,
|
|
|
|
&physical_dup);
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
else
|
|
|
|
bytenr = async->start + offset;
|
|
|
|
|
|
|
|
ret = pwrite64(outfd, outbuf+offset, chunk_size,
|
|
|
|
bytenr);
|
2016-05-26 09:43:00 +00:00
|
|
|
if (ret != chunk_size)
|
|
|
|
goto error;
|
|
|
|
|
|
|
|
if (physical_dup)
|
|
|
|
ret = pwrite64(outfd, outbuf+offset,
|
|
|
|
chunk_size,
|
|
|
|
physical_dup);
|
|
|
|
if (ret != chunk_size)
|
|
|
|
goto error;
|
|
|
|
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
size -= chunk_size;
|
|
|
|
offset += chunk_size;
|
2016-05-26 09:43:00 +00:00
|
|
|
continue;
|
|
|
|
|
|
|
|
error:
|
|
|
|
if (ret < 0) {
|
2018-01-07 21:54:21 +00:00
|
|
|
error("unable to write to device: %m");
|
2016-05-26 09:43:00 +00:00
|
|
|
err = errno;
|
|
|
|
} else {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("short write");
|
2016-05-26 09:43:00 +00:00
|
|
|
err = -EIO;
|
|
|
|
}
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
}
|
|
|
|
} else if (async->start != BTRFS_SUPER_INFO_OFFSET) {
|
|
|
|
ret = write_data_to_disk(mdres->info, outbuf, async->start, size, 0);
|
|
|
|
if (ret) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("failed to write data");
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
exit(1);
|
2013-03-18 18:50:45 +00:00
|
|
|
}
|
|
|
|
}
|
2008-11-20 14:52:48 +00:00
|
|
|
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
|
|
|
|
/* backup super blocks are already there at fixup_offset stage */
|
|
|
|
if (!mdres->multi_devices && async->start == BTRFS_SUPER_INFO_OFFSET)
|
2013-03-27 20:55:41 +00:00
|
|
|
write_backup_supers(outfd, outbuf);
|
|
|
|
|
2013-03-18 18:50:45 +00:00
|
|
|
if (err && !mdres->error)
|
|
|
|
mdres->error = err;
|
2008-11-20 14:52:48 +00:00
|
|
|
mdres->num_items--;
|
|
|
|
pthread_mutex_unlock(&mdres->mutex);
|
|
|
|
|
|
|
|
free(async->buffer);
|
|
|
|
free(async);
|
|
|
|
}
|
|
|
|
out:
|
|
|
|
free(buffer);
|
|
|
|
pthread_exit(NULL);
|
|
|
|
}
|
|
|
|
|
2014-03-21 01:06:23 +00:00
|
|
|
static void mdrestore_destroy(struct mdrestore_struct *mdres, int num_threads)
|
2013-03-18 18:50:45 +00:00
|
|
|
{
|
2013-05-08 15:40:36 +00:00
|
|
|
struct rb_node *n;
|
2013-03-18 18:50:45 +00:00
|
|
|
int i;
|
2013-05-08 15:40:36 +00:00
|
|
|
|
|
|
|
while ((n = rb_first(&mdres->chunk_tree))) {
|
|
|
|
struct fs_chunk *entry;
|
|
|
|
|
2015-01-26 01:39:24 +00:00
|
|
|
entry = rb_entry(n, struct fs_chunk, l);
|
2013-05-08 15:40:36 +00:00
|
|
|
rb_erase(n, &mdres->chunk_tree);
|
2015-01-26 01:39:24 +00:00
|
|
|
rb_erase(&entry->p, &mdres->physical_tree);
|
2013-05-08 15:40:36 +00:00
|
|
|
free(entry);
|
|
|
|
}
|
2019-07-04 06:10:57 +00:00
|
|
|
free_extent_cache_tree(&mdres->sys_chunks);
|
2013-03-18 18:50:45 +00:00
|
|
|
pthread_mutex_lock(&mdres->mutex);
|
|
|
|
mdres->done = 1;
|
|
|
|
pthread_cond_broadcast(&mdres->cond);
|
|
|
|
pthread_mutex_unlock(&mdres->mutex);
|
|
|
|
|
2014-03-21 01:06:23 +00:00
|
|
|
for (i = 0; i < num_threads; i++)
|
2013-03-18 18:50:45 +00:00
|
|
|
pthread_join(mdres->threads[i], NULL);
|
|
|
|
|
|
|
|
pthread_cond_destroy(&mdres->cond);
|
|
|
|
pthread_mutex_destroy(&mdres->mutex);
|
2020-05-27 10:28:09 +00:00
|
|
|
free(mdres->original_super);
|
2013-03-18 18:50:45 +00:00
|
|
|
}
|
|
|
|
|
2013-01-25 00:18:53 +00:00
|
|
|
static int mdrestore_init(struct mdrestore_struct *mdres,
|
2013-03-27 20:55:41 +00:00
|
|
|
FILE *in, FILE *out, int old_restore,
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
int num_threads, int fixup_offset,
|
|
|
|
struct btrfs_fs_info *info, int multi_devices)
|
2008-11-20 14:52:48 +00:00
|
|
|
{
|
|
|
|
int i, ret = 0;
|
|
|
|
|
|
|
|
memset(mdres, 0, sizeof(*mdres));
|
|
|
|
pthread_cond_init(&mdres->cond, NULL);
|
|
|
|
pthread_mutex_init(&mdres->mutex, NULL);
|
|
|
|
INIT_LIST_HEAD(&mdres->list);
|
2015-01-26 01:39:24 +00:00
|
|
|
INIT_LIST_HEAD(&mdres->overlapping_chunks);
|
2019-07-04 06:10:57 +00:00
|
|
|
cache_tree_init(&mdres->sys_chunks);
|
2008-11-20 14:52:48 +00:00
|
|
|
mdres->in = in;
|
|
|
|
mdres->out = out;
|
2013-03-27 20:55:41 +00:00
|
|
|
mdres->old_restore = old_restore;
|
2013-05-08 15:40:36 +00:00
|
|
|
mdres->chunk_tree.rb_node = NULL;
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
mdres->fixup_offset = fixup_offset;
|
|
|
|
mdres->info = info;
|
|
|
|
mdres->multi_devices = multi_devices;
|
2015-01-26 01:39:24 +00:00
|
|
|
mdres->clear_space_cache = 0;
|
|
|
|
mdres->last_physical_offset = 0;
|
2015-01-28 20:38:03 +00:00
|
|
|
mdres->alloced_chunks = 0;
|
2008-11-20 14:52:48 +00:00
|
|
|
|
2020-05-27 10:28:09 +00:00
|
|
|
mdres->original_super = malloc(BTRFS_SUPER_INFO_SIZE);
|
|
|
|
if (!mdres->original_super)
|
|
|
|
return -ENOMEM;
|
|
|
|
|
2008-11-20 14:52:48 +00:00
|
|
|
if (!num_threads)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
mdres->num_threads = num_threads;
|
|
|
|
for (i = 0; i < num_threads; i++) {
|
2016-11-02 23:57:43 +00:00
|
|
|
ret = pthread_create(&mdres->threads[i], NULL, restore_worker,
|
2008-11-20 14:52:48 +00:00
|
|
|
mdres);
|
2016-10-03 13:11:13 +00:00
|
|
|
if (ret) {
|
|
|
|
/* pthread_create returns errno directly */
|
|
|
|
ret = -ret;
|
2008-11-20 14:52:48 +00:00
|
|
|
break;
|
2016-10-03 13:11:13 +00:00
|
|
|
}
|
2008-11-20 14:52:48 +00:00
|
|
|
}
|
2013-03-18 18:50:45 +00:00
|
|
|
if (ret)
|
2014-03-21 01:06:23 +00:00
|
|
|
mdrestore_destroy(mdres, i + 1);
|
2008-11-20 14:52:48 +00:00
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2013-03-27 20:55:41 +00:00
|
|
|
static int fill_mdres_info(struct mdrestore_struct *mdres,
|
|
|
|
struct async_work *async)
|
|
|
|
{
|
|
|
|
struct btrfs_super_block *super;
|
|
|
|
u8 *buffer = NULL;
|
|
|
|
u8 *outbuf;
|
|
|
|
int ret;
|
|
|
|
|
2013-05-08 15:40:36 +00:00
|
|
|
/* We've already been initialized */
|
2016-04-01 10:57:11 +00:00
|
|
|
if (mdres->nodesize)
|
2013-05-08 15:40:36 +00:00
|
|
|
return 0;
|
|
|
|
|
2013-03-27 20:55:41 +00:00
|
|
|
if (mdres->compress_method == COMPRESS_ZLIB) {
|
2019-07-04 06:10:56 +00:00
|
|
|
/*
|
|
|
|
* We know this item is superblock, its should only be 4K.
|
|
|
|
* Don't need to waste memory following max_pending_size as it
|
|
|
|
* can be as large as 256M.
|
|
|
|
*/
|
|
|
|
size_t size = BTRFS_SUPER_INFO_SIZE;
|
2013-03-27 20:55:41 +00:00
|
|
|
|
2019-07-04 06:10:56 +00:00
|
|
|
buffer = malloc(size);
|
2013-03-27 20:55:41 +00:00
|
|
|
if (!buffer)
|
|
|
|
return -ENOMEM;
|
|
|
|
ret = uncompress(buffer, (unsigned long *)&size,
|
|
|
|
async->buffer, async->bufsize);
|
|
|
|
if (ret != Z_OK) {
|
2017-07-12 22:10:13 +00:00
|
|
|
error("decompression failed with %d", ret);
|
2013-03-27 20:55:41 +00:00
|
|
|
free(buffer);
|
|
|
|
return -EIO;
|
|
|
|
}
|
|
|
|
outbuf = buffer;
|
|
|
|
} else {
|
|
|
|
outbuf = async->buffer;
|
|
|
|
}
|
|
|
|
|
|
|
|
super = (struct btrfs_super_block *)outbuf;
|
2016-04-01 10:57:11 +00:00
|
|
|
mdres->nodesize = btrfs_super_nodesize(super);
|
2018-10-11 15:03:59 +00:00
|
|
|
if (btrfs_super_incompat_flags(super) &
|
|
|
|
BTRFS_FEATURE_INCOMPAT_METADATA_UUID)
|
|
|
|
memcpy(mdres->fsid, super->metadata_uuid, BTRFS_FSID_SIZE);
|
|
|
|
else
|
|
|
|
memcpy(mdres->fsid, super->fsid, BTRFS_FSID_SIZE);
|
|
|
|
memcpy(mdres->uuid, super->dev_item.uuid, BTRFS_UUID_SIZE);
|
2013-03-27 20:55:41 +00:00
|
|
|
mdres->devid = le64_to_cpu(super->dev_item.devid);
|
|
|
|
free(buffer);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2008-11-20 14:52:48 +00:00
|
|
|
/*
 * Read the payload of every item described by @cluster from mdres->in and
 * queue each one on mdres->list for the restore workers.
 *
 * @cluster: cluster whose header and item table have already been read
 * @mdres:   restore state; its compress_method is set from the cluster header
 * @next:    on success, set to the offset just past this cluster's payload,
 *           rounded up to a BLOCK_SIZE boundary
 *
 * An item starting at BTRFS_SUPER_INFO_OFFSET is first handed to
 * fill_mdres_info() before being queued.
 *
 * Returns 0 on success, -ENOMEM or -EIO on allocation/read failure, or the
 * error returned by fill_mdres_info().
 */
static int add_cluster(struct meta_cluster *cluster,
		       struct mdrestore_struct *mdres, u64 *next)
{
	struct meta_cluster_header *hdr = &cluster->header;
	struct async_work *work;
	u64 pos;
	u32 idx, count;
	int ret;

	pthread_mutex_lock(&mdres->mutex);
	mdres->compress_method = hdr->compress;
	pthread_mutex_unlock(&mdres->mutex);

	/* Payload begins one block after the cluster start */
	pos = le64_to_cpu(hdr->bytenr) + BLOCK_SIZE;
	count = le32_to_cpu(hdr->nritems);

	for (idx = 0; idx < count; idx++) {
		struct meta_cluster_item *entry = &cluster->items[idx];

		work = calloc(1, sizeof(*work));
		if (!work) {
			error("not enough memory for async data");
			return -ENOMEM;
		}

		work->start = le64_to_cpu(entry->bytenr);
		work->bufsize = le32_to_cpu(entry->size);
		work->buffer = malloc(work->bufsize);
		if (!work->buffer) {
			error("not enough memory for async buffer");
			ret = -ENOMEM;
			goto drop_work;
		}

		if (fread(work->buffer, work->bufsize, 1, mdres->in) != 1) {
			error("unable to read buffer: %m");
			ret = -EIO;
			goto drop_work;
		}
		pos += work->bufsize;

		pthread_mutex_lock(&mdres->mutex);
		if (work->start == BTRFS_SUPER_INFO_OFFSET) {
			ret = fill_mdres_info(mdres, work);
			if (ret) {
				error("unable to set up restore state");
				pthread_mutex_unlock(&mdres->mutex);
				goto drop_work;
			}
		}
		/* Hand the item over to a worker */
		list_add_tail(&work->list, &mdres->list);
		mdres->num_items++;
		pthread_cond_signal(&mdres->cond);
		pthread_mutex_unlock(&mdres->mutex);
	}

	/* Consume the padding up to the next block boundary, if any */
	if (pos & BLOCK_MASK) {
		char pad[BLOCK_MASK];
		size_t pad_len = BLOCK_SIZE - (pos & BLOCK_MASK);

		pos += pad_len;
		if (fread(pad, pad_len, 1, mdres->in) != 1) {
			error("failed to read buffer: %m");
			return -EIO;
		}
	}

	*next = pos;
	return 0;

drop_work:
	/* The item was never queued, so it is still ours to release */
	free(work->buffer);
	free(work);
	return ret;
}
|
|
|
|
|
|
|
|
static int wait_for_worker(struct mdrestore_struct *mdres)
|
|
|
|
{
|
2013-03-18 18:50:45 +00:00
|
|
|
int ret = 0;
|
|
|
|
|
2008-11-20 14:52:48 +00:00
|
|
|
pthread_mutex_lock(&mdres->mutex);
|
2013-03-18 18:50:45 +00:00
|
|
|
ret = mdres->error;
|
|
|
|
while (!ret && mdres->num_items > 0) {
|
2008-11-20 14:52:48 +00:00
|
|
|
struct timespec ts = {
|
|
|
|
.tv_sec = 0,
|
|
|
|
.tv_nsec = 10000000,
|
|
|
|
};
|
|
|
|
pthread_mutex_unlock(&mdres->mutex);
|
|
|
|
nanosleep(&ts, NULL);
|
|
|
|
pthread_mutex_lock(&mdres->mutex);
|
2013-03-18 18:50:45 +00:00
|
|
|
ret = mdres->error;
|
2008-11-20 14:52:48 +00:00
|
|
|
}
|
|
|
|
pthread_mutex_unlock(&mdres->mutex);
|
2013-03-18 18:50:45 +00:00
|
|
|
return ret;
|
2008-11-20 14:52:48 +00:00
|
|
|
}
|
|
|
|
|
2019-07-04 06:10:58 +00:00
|
|
|
/*
|
|
|
|
* Check if a range [start, start + len] has ANY bytes covered by system chunk
|
|
|
|
* ranges.
|
|
|
|
*/
|
|
|
|
static bool is_in_sys_chunks(struct mdrestore_struct *mdres, u64 start, u64 len)
|
|
|
|
{
|
|
|
|
struct rb_node *node = mdres->sys_chunks.root.rb_node;
|
|
|
|
struct cache_extent *entry;
|
|
|
|
struct cache_extent *next;
|
|
|
|
struct cache_extent *prev;
|
|
|
|
|
|
|
|
if (start > mdres->sys_chunk_end)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
while (node) {
|
|
|
|
entry = rb_entry(node, struct cache_extent, rb_node);
|
|
|
|
if (start > entry->start) {
|
|
|
|
if (!node->rb_right)
|
|
|
|
break;
|
|
|
|
node = node->rb_right;
|
|
|
|
} else if (start < entry->start) {
|
|
|
|
if (!node->rb_left)
|
|
|
|
break;
|
|
|
|
node = node->rb_left;
|
|
|
|
} else {
|
|
|
|
/* Already in a system chunk */
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (!node)
|
|
|
|
return false;
|
|
|
|
entry = rb_entry(node, struct cache_extent, rb_node);
|
|
|
|
/* Now we have entry which is the nearst chunk around @start */
|
|
|
|
if (start > entry->start) {
|
|
|
|
prev = entry;
|
|
|
|
next = next_cache_extent(entry);
|
|
|
|
} else {
|
|
|
|
prev = prev_cache_extent(entry);
|
|
|
|
next = entry;
|
|
|
|
}
|
|
|
|
if (prev && prev->start + prev->size > start)
|
|
|
|
return true;
|
|
|
|
if (next && start + len > next->start)
|
|
|
|
return true;
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
btrfs-progs: image: Rework how we search chunk tree blocks
Before this patch, we were using a very inefficient way to search
chunks:
We iterate through all clusters to find the chunk root tree block first,
then re-iterate all clusters again to find every child tree block.
Each time we need to iterate all clusters just to find a chunk tree
block. This is obviously inefficient, especially when chunk tree gets
larger. So the original author leaves a comment on it:
/* If you have to ask you aren't worthy */
static int search_for_chunk_blocks()
This patch will change the behavior so that we will only iterate all
clusters once.
The idea behind the optimization is, since we have the superblock
restored first, we could use the CHUNK_ITEMs in
super_block::sys_chunk_array to build a SYSTEM chunk mapping.
Then, when we start to iterate through all items, we can easily skip
unrelated items at different level:
- At cluster level
If a cluster starts beyond last system chunk map, it must not contain
any chunk tree blocks (as chunk tree blocks only lives inside system
chunks)
- At item level
If one item has no intersection with any system chunk map, then it
must not contain any tree blocks.
By this, we can iterate through all clusters just once, and find out all
CHUNK_ITEMs.
Signed-off-by: Qu Wenruo <wqu@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
2019-07-04 06:10:59 +00:00
|
|
|
static int read_chunk_tree_block(struct mdrestore_struct *mdres,
|
|
|
|
struct extent_buffer *eb)
|
2013-05-08 15:40:36 +00:00
|
|
|
{
|
|
|
|
int i;
|
|
|
|
|
|
|
|
for (i = 0; i < btrfs_header_nritems(eb); i++) {
|
2016-05-26 09:43:00 +00:00
|
|
|
struct btrfs_chunk *chunk;
|
2013-05-08 15:40:36 +00:00
|
|
|
struct fs_chunk *fs_chunk;
|
|
|
|
struct btrfs_key key;
|
2016-05-26 09:43:00 +00:00
|
|
|
u64 type;
|
2013-05-08 15:40:36 +00:00
|
|
|
|
|
|
|
btrfs_item_key_to_cpu(eb, &key, i);
|
|
|
|
if (key.type != BTRFS_CHUNK_ITEM_KEY)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
fs_chunk = malloc(sizeof(struct fs_chunk));
|
|
|
|
if (!fs_chunk) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("not enough memory to allocate chunk");
|
btrfs-progs: image: Rework how we search chunk tree blocks
Before this patch, we were using a very inefficient way to search
chunks:
We iterate through all clusters to find the chunk root tree block first,
then re-iterate all clusters again to find every child tree block.
Each time we need to iterate all clusters just to find a chunk tree
block. This is obviously inefficient, especially when chunk tree gets
larger. So the original author leaves a comment on it:
/* If you have to ask you aren't worthy */
static int search_for_chunk_blocks()
This patch will change the behavior so that we will only iterate all
clusters once.
The idea behind the optimization is, since we have the superblock
restored first, we could use the CHUNK_ITEMs in
super_block::sys_chunk_array to build a SYSTEM chunk mapping.
Then, when we start to iterate through all items, we can easily skip
unrelated items at different level:
- At cluster level
If a cluster starts beyond last system chunk map, it must not contain
any chunk tree blocks (as chunk tree blocks only lives inside system
chunks)
- At item level
If one item has no intersection with any system chunk map, then it
must not contain any tree blocks.
By this, we can iterate through all clusters just once, and find out all
CHUNK_ITEMs.
Signed-off-by: Qu Wenruo <wqu@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
2019-07-04 06:10:59 +00:00
|
|
|
return -ENOMEM;
|
2013-05-08 15:40:36 +00:00
|
|
|
}
|
|
|
|
memset(fs_chunk, 0, sizeof(*fs_chunk));
|
2016-05-26 09:43:00 +00:00
|
|
|
chunk = btrfs_item_ptr(eb, i, struct btrfs_chunk);
|
2013-05-08 15:40:36 +00:00
|
|
|
|
|
|
|
fs_chunk->logical = key.offset;
|
2016-05-26 09:43:00 +00:00
|
|
|
fs_chunk->physical = btrfs_stripe_offset_nr(eb, chunk, 0);
|
|
|
|
fs_chunk->bytes = btrfs_chunk_length(eb, chunk);
|
2015-01-26 01:39:24 +00:00
|
|
|
INIT_LIST_HEAD(&fs_chunk->list);
|
btrfs-progs: image: Rework how we search chunk tree blocks
Before this patch, we were using a very inefficient way to search
chunks:
We iterate through all clusters to find the chunk root tree block first,
then re-iterate all clusters again to find every child tree block.
Each time we need to iterate all clusters just to find a chunk tree
block. This is obviously inefficient, especially when chunk tree gets
larger. So the original author leaves a comment on it:
/* If you have to ask you aren't worthy */
static int search_for_chunk_blocks()
This patch will change the behavior so that we will only iterate all
clusters once.
The idea behind the optimization is, since we have the superblock
restored first, we could use the CHUNK_ITEMs in
super_block::sys_chunk_array to build a SYSTEM chunk mapping.
Then, when we start to iterate through all items, we can easily skip
unrelated items at different level:
- At cluster level
If a cluster starts beyond last system chunk map, it must not contain
any chunk tree blocks (as chunk tree blocks only lives inside system
chunks)
- At item level
If one item has no intersection with any system chunk map, then it
must not contain any tree blocks.
By this, we can iterate through all clusters just once, and find out all
CHUNK_ITEMs.
Signed-off-by: Qu Wenruo <wqu@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
2019-07-04 06:10:59 +00:00
|
|
|
|
2015-01-26 01:39:24 +00:00
|
|
|
if (tree_search(&mdres->physical_tree, &fs_chunk->p,
|
|
|
|
physical_cmp, 1) != NULL)
|
|
|
|
list_add(&fs_chunk->list, &mdres->overlapping_chunks);
|
|
|
|
else
|
|
|
|
tree_insert(&mdres->physical_tree, &fs_chunk->p,
|
|
|
|
physical_cmp);
|
2016-05-26 09:43:00 +00:00
|
|
|
type = btrfs_chunk_type(eb, chunk);
|
|
|
|
if (type & BTRFS_BLOCK_GROUP_DUP) {
|
|
|
|
fs_chunk->physical_dup =
|
|
|
|
btrfs_stripe_offset_nr(eb, chunk, 1);
|
|
|
|
}
|
|
|
|
if (fs_chunk->physical_dup + fs_chunk->bytes >
|
|
|
|
mdres->last_physical_offset)
|
|
|
|
mdres->last_physical_offset = fs_chunk->physical_dup +
|
|
|
|
fs_chunk->bytes;
|
|
|
|
else if (fs_chunk->physical + fs_chunk->bytes >
|
2015-01-26 01:39:24 +00:00
|
|
|
mdres->last_physical_offset)
|
|
|
|
mdres->last_physical_offset = fs_chunk->physical +
|
|
|
|
fs_chunk->bytes;
|
2015-01-28 20:38:03 +00:00
|
|
|
mdres->alloced_chunks += fs_chunk->bytes;
|
2016-05-26 09:43:00 +00:00
|
|
|
/* in dup case, fs_chunk->bytes should add twice */
|
|
|
|
if (fs_chunk->physical_dup)
|
|
|
|
mdres->alloced_chunks += fs_chunk->bytes;
|
2015-01-26 01:39:24 +00:00
|
|
|
tree_insert(&mdres->chunk_tree, &fs_chunk->l, chunk_cmp);
|
2013-05-08 15:40:36 +00:00
|
|
|
}
|
btrfs-progs: image: Rework how we search chunk tree blocks
Before this patch, we were using a very inefficient way to search
chunks:
We iterate through all clusters to find the chunk root tree block first,
then re-iterate all clusters again to find every child tree block.
Each time we need to iterate all clusters just to find a chunk tree
block. This is obviously inefficient, especially when chunk tree gets
larger. So the original author leaves a comment on it:
/* If you have to ask you aren't worthy */
static int search_for_chunk_blocks()
This patch will change the behavior so that we will only iterate all
clusters once.
The idea behind the optimization is, since we have the superblock
restored first, we could use the CHUNK_ITEMs in
super_block::sys_chunk_array to build a SYSTEM chunk mapping.
Then, when we start to iterate through all items, we can easily skip
unrelated items at different level:
- At cluster level
If a cluster starts beyond last system chunk map, it must not contain
any chunk tree blocks (as chunk tree blocks only lives inside system
chunks)
- At item level
If one item has no intersection with any system chunk map, then it
must not contain any tree blocks.
By this, we can iterate through all clusters just once, and find out all
CHUNK_ITEMs.
Signed-off-by: Qu Wenruo <wqu@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
2019-07-04 06:10:59 +00:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int read_chunk_block(struct mdrestore_struct *mdres, u8 *buffer,
|
|
|
|
u64 item_bytenr, u32 bufsize,
|
|
|
|
u64 cluster_bytenr)
|
|
|
|
{
|
|
|
|
struct extent_buffer *eb;
|
|
|
|
u32 nodesize = mdres->nodesize;
|
|
|
|
u64 bytenr;
|
|
|
|
size_t cur_offset;
|
|
|
|
int ret = 0;
|
|
|
|
|
|
|
|
eb = alloc_dummy_eb(0, mdres->nodesize);
|
|
|
|
if (!eb)
|
|
|
|
return -ENOMEM;
|
|
|
|
|
|
|
|
for (cur_offset = 0; cur_offset < bufsize; cur_offset += nodesize) {
|
|
|
|
bytenr = item_bytenr + cur_offset;
|
|
|
|
if (!is_in_sys_chunks(mdres, bytenr, nodesize))
|
|
|
|
continue;
|
|
|
|
memcpy(eb->data, buffer + cur_offset, nodesize);
|
|
|
|
if (btrfs_header_bytenr(eb) != bytenr) {
|
|
|
|
error(
|
|
|
|
"eb bytenr does not match found bytenr: %llu != %llu",
|
|
|
|
(unsigned long long)btrfs_header_bytenr(eb),
|
|
|
|
(unsigned long long)bytenr);
|
|
|
|
ret = -EUCLEAN;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
if (memcmp(mdres->fsid, eb->data +
|
|
|
|
offsetof(struct btrfs_header, fsid),
|
|
|
|
BTRFS_FSID_SIZE)) {
|
|
|
|
error(
|
|
|
|
"filesystem metadata UUID of eb %llu does not match",
|
|
|
|
bytenr);
|
|
|
|
ret = -EUCLEAN;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
if (btrfs_header_owner(eb) != BTRFS_CHUNK_TREE_OBJECTID) {
|
|
|
|
error("wrong eb %llu owner %llu",
|
|
|
|
(unsigned long long)bytenr,
|
|
|
|
(unsigned long long)btrfs_header_owner(eb));
|
|
|
|
ret = -EUCLEAN;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
/*
|
|
|
|
* No need to search node, as we will iterate all tree blocks
|
|
|
|
* in chunk tree, only need to bother leaves.
|
|
|
|
*/
|
|
|
|
if (btrfs_header_level(eb))
|
|
|
|
continue;
|
|
|
|
ret = read_chunk_tree_block(mdres, eb);
|
|
|
|
if (ret < 0)
|
|
|
|
break;
|
|
|
|
}
|
2013-05-08 15:40:36 +00:00
|
|
|
free(eb);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
btrfs-progs: image: Rework how we search chunk tree blocks
Before this patch, we were using a very inefficient way to search
chunks:
We iterate through all clusters to find the chunk root tree block first,
then re-iterate all clusters again to find every child tree block.
Each time we need to iterate all clusters just to find a chunk tree
block. This is obviously inefficient, especially when chunk tree gets
larger. So the original author leaves a comment on it:
/* If you have to ask you aren't worthy */
static int search_for_chunk_blocks()
This patch will change the behavior so that we will only iterate all
clusters once.
The idea behind the optimization is, since we have the superblock
restored first, we could use the CHUNK_ITEMs in
super_block::sys_chunk_array to build a SYSTEM chunk mapping.
Then, when we start to iterate through all items, we can easily skip
unrelated items at different level:
- At cluster level
If a cluster starts beyond last system chunk map, it must not contain
any chunk tree blocks (as chunk tree blocks only lives inside system
chunks)
- At item level
If one item has no intersection with any system chunk map, then it
must not contain any tree blocks.
By this, we can iterate through all clusters just once, and find out all
CHUNK_ITEMs.
Signed-off-by: Qu Wenruo <wqu@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
2019-07-04 06:10:59 +00:00
|
|
|
/*
|
|
|
|
* This function will try to find all chunk items in the dump image.
|
|
|
|
*
|
|
|
|
* This function will iterate all clusters, and find any item inside system
|
|
|
|
* chunk ranges. For each such item, it will try to read it as tree blocks,
|
|
|
|
* find the CHUNK_ITEMs in them, and add those to @mdres.
|
|
|
|
*/
|
|
|
|
static int search_for_chunk_blocks(struct mdrestore_struct *mdres)
|
2013-05-08 15:40:36 +00:00
|
|
|
{
|
|
|
|
struct meta_cluster *cluster;
|
|
|
|
struct meta_cluster_header *header;
|
|
|
|
struct meta_cluster_item *item;
|
btrfs-progs: image: Rework how we search chunk tree blocks
Before this patch, we were using a very inefficient way to search
chunks:
We iterate through all clusters to find the chunk root tree block first,
then re-iterate all clusters again to find every child tree block.
Each time we need to iterate all clusters just to find a chunk tree
block. This is obviously inefficient, especially when chunk tree gets
larger. So the original author leaves a comment on it:
/* If you have to ask you aren't worthy */
static int search_for_chunk_blocks()
This patch will change the behavior so that we will only iterate all
clusters once.
The idea behind the optimization is, since we have the superblock
restored first, we could use the CHUNK_ITEMs in
super_block::sys_chunk_array to build a SYSTEM chunk mapping.
Then, when we start to iterate through all items, we can easily skip
unrelated items at different level:
- At cluster level
If a cluster starts beyond last system chunk map, it must not contain
any chunk tree blocks (as chunk tree blocks only lives inside system
chunks)
- At item level
If one item has no intersection with any system chunk map, then it
must not contain any tree blocks.
By this, we can iterate through all clusters just once, and find out all
CHUNK_ITEMs.
Signed-off-by: Qu Wenruo <wqu@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
2019-07-04 06:10:59 +00:00
|
|
|
u64 current_cluster = 0, bytenr;
|
2013-05-08 15:40:36 +00:00
|
|
|
u64 item_bytenr;
|
|
|
|
u32 bufsize, nritems, i;
|
2013-10-07 21:42:57 +00:00
|
|
|
u32 max_size = MAX_PENDING_SIZE * 2;
|
2013-05-08 15:40:36 +00:00
|
|
|
u8 *buffer, *tmp = NULL;
|
|
|
|
int ret = 0;
|
|
|
|
|
|
|
|
cluster = malloc(BLOCK_SIZE);
|
|
|
|
if (!cluster) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("not enough memory for cluster");
|
2013-05-08 15:40:36 +00:00
|
|
|
return -ENOMEM;
|
|
|
|
}
|
|
|
|
|
2013-10-07 21:42:57 +00:00
|
|
|
buffer = malloc(max_size);
|
2013-05-08 15:40:36 +00:00
|
|
|
if (!buffer) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("not enough memory for buffer");
|
2013-05-08 15:40:36 +00:00
|
|
|
free(cluster);
|
|
|
|
return -ENOMEM;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (mdres->compress_method == COMPRESS_ZLIB) {
|
2013-10-07 21:42:57 +00:00
|
|
|
tmp = malloc(max_size);
|
2013-05-08 15:40:36 +00:00
|
|
|
if (!tmp) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("not enough memory for buffer");
|
2013-05-08 15:40:36 +00:00
|
|
|
free(cluster);
|
|
|
|
free(buffer);
|
|
|
|
return -ENOMEM;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
bytenr = current_cluster;
|
btrfs-progs: image: Rework how we search chunk tree blocks
Before this patch, we were using a very inefficient way to search
chunks:
We iterate through all clusters to find the chunk root tree block first,
then re-iterate all clusters again to find every child tree block.
Each time we need to iterate all clusters just to find a chunk tree
block. This is obviously inefficient, especially when chunk tree gets
larger. So the original author leaves a comment on it:
/* If you have to ask you aren't worthy */
static int search_for_chunk_blocks()
This patch will change the behavior so that we will only iterate all
clusters once.
The idea behind the optimization is, since we have the superblock
restored first, we could use the CHUNK_ITEMs in
super_block::sys_chunk_array to build a SYSTEM chunk mapping.
Then, when we start to iterate through all items, we can easily skip
unrelated items at different level:
- At cluster level
If a cluster starts beyond last system chunk map, it must not contain
any chunk tree blocks (as chunk tree blocks only lives inside system
chunks)
- At item level
If one item has no intersection with any system chunk map, then it
must not contain any tree blocks.
By this, we can iterate through all clusters just once, and find out all
CHUNK_ITEMs.
Signed-off-by: Qu Wenruo <wqu@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
2019-07-04 06:10:59 +00:00
|
|
|
/* Main loop, iterating all clusters */
|
2013-05-08 15:40:36 +00:00
|
|
|
while (1) {
|
|
|
|
if (fseek(mdres->in, current_cluster, SEEK_SET)) {
|
2018-01-07 21:54:21 +00:00
|
|
|
error("seek failed: %m");
|
2013-05-08 15:40:36 +00:00
|
|
|
ret = -EIO;
|
btrfs-progs: image: Rework how we search chunk tree blocks
Before this patch, we were using a very inefficient way to search
chunks:
We iterate through all clusters to find the chunk root tree block first,
then re-iterate all clusters again to find every child tree block.
Each time we need to iterate all clusters just to find a chunk tree
block. This is obviously inefficient, especially when chunk tree gets
larger. So the original author leaves a comment on it:
/* If you have to ask you aren't worthy */
static int search_for_chunk_blocks()
This patch will change the behavior so that we will only iterate all
clusters once.
The idea behind the optimization is, since we have the superblock
restored first, we could use the CHUNK_ITEMs in
super_block::sys_chunk_array to build a SYSTEM chunk mapping.
Then, when we start to iterate through all items, we can easily skip
unrelated items at different level:
- At cluster level
If a cluster starts beyond last system chunk map, it must not contain
any chunk tree blocks (as chunk tree blocks only lives inside system
chunks)
- At item level
If one item has no intersection with any system chunk map, then it
must not contain any tree blocks.
By this, we can iterate through all clusters just once, and find out all
CHUNK_ITEMs.
Signed-off-by: Qu Wenruo <wqu@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
2019-07-04 06:10:59 +00:00
|
|
|
goto out;
|
2013-05-08 15:40:36 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
ret = fread(cluster, BLOCK_SIZE, 1, mdres->in);
|
|
|
|
if (ret == 0) {
|
btrfs-progs: image: Rework how we search chunk tree blocks
Before this patch, we were using a very inefficient way to search
chunks:
We iterate through all clusters to find the chunk root tree block first,
then re-iterate all clusters again to find every child tree block.
Each time we need to iterate all clusters just to find a chunk tree
block. This is obviously inefficient, especially when chunk tree gets
larger. So the original author leaves a comment on it:
/* If you have to ask you aren't worthy */
static int search_for_chunk_blocks()
This patch will change the behavior so that we will only iterate all
clusters once.
The idea behind the optimization is, since we have the superblock
restored first, we could use the CHUNK_ITEMs in
super_block::sys_chunk_array to build a SYSTEM chunk mapping.
Then, when we start to iterate through all items, we can easily skip
unrelated items at different level:
- At cluster level
If a cluster starts beyond last system chunk map, it must not contain
any chunk tree blocks (as chunk tree blocks only lives inside system
chunks)
- At item level
If one item has no intersection with any system chunk map, then it
must not contain any tree blocks.
By this, we can iterate through all clusters just once, and find out all
CHUNK_ITEMs.
Signed-off-by: Qu Wenruo <wqu@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
2019-07-04 06:10:59 +00:00
|
|
|
if (feof(mdres->in))
|
|
|
|
goto out;
|
2016-09-08 13:57:42 +00:00
|
|
|
error(
|
2017-07-12 22:10:13 +00:00
|
|
|
"unknown state after reading cluster at %llu, probably corrupted data",
|
btrfs-progs: image: Rework how we search chunk tree blocks
Before this patch, we were using a very inefficient way to search
chunks:
We iterate through all clusters to find the chunk root tree block first,
then re-iterate all clusters again to find every child tree block.
Each time we need to iterate all clusters just to find a chunk tree
block. This is obviously inefficient, especially when chunk tree gets
larger. So the original author leaves a comment on it:
/* If you have to ask you aren't worthy */
static int search_for_chunk_blocks()
This patch will change the behavior so that we will only iterate all
clusters once.
The idea behind the optimization is, since we have the superblock
restored first, we could use the CHUNK_ITEMs in
super_block::sys_chunk_array to build a SYSTEM chunk mapping.
Then, when we start to iterate through all items, we can easily skip
unrelated items at different level:
- At cluster level
If a cluster starts beyond last system chunk map, it must not contain
any chunk tree blocks (as chunk tree blocks only lives inside system
chunks)
- At item level
If one item has no intersection with any system chunk map, then it
must not contain any tree blocks.
By this, we can iterate through all clusters just once, and find out all
CHUNK_ITEMs.
Signed-off-by: Qu Wenruo <wqu@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
2019-07-04 06:10:59 +00:00
|
|
|
current_cluster);
|
2013-05-08 15:40:36 +00:00
|
|
|
ret = -EIO;
|
btrfs-progs: image: Rework how we search chunk tree blocks
Before this patch, we were using a very inefficient way to search
chunks:
We iterate through all clusters to find the chunk root tree block first,
then re-iterate all clusters again to find every child tree block.
Each time we need to iterate all clusters just to find a chunk tree
block. This is obviously inefficient, especially when chunk tree gets
larger. So the original author leaves a comment on it:
/* If you have to ask you aren't worthy */
static int search_for_chunk_blocks()
This patch will change the behavior so that we will only iterate all
clusters once.
The idea behind the optimization is, since we have the superblock
restored first, we could use the CHUNK_ITEMs in
super_block::sys_chunk_array to build a SYSTEM chunk mapping.
Then, when we start to iterate through all items, we can easily skip
unrelated items at different level:
- At cluster level
If a cluster starts beyond last system chunk map, it must not contain
any chunk tree blocks (as chunk tree blocks only lives inside system
chunks)
- At item level
If one item has no intersection with any system chunk map, then it
must not contain any tree blocks.
By this, we can iterate through all clusters just once, and find out all
CHUNK_ITEMs.
Signed-off-by: Qu Wenruo <wqu@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
2019-07-04 06:10:59 +00:00
|
|
|
goto out;
|
2013-05-08 15:40:36 +00:00
|
|
|
} else if (ret < 0) {
|
2018-01-07 21:54:21 +00:00
|
|
|
error("unable to read image at %llu: %m",
|
btrfs-progs: image: Rework how we search chunk tree blocks
Before this patch, we were using a very inefficient way to search
chunks:
We iterate through all clusters to find the chunk root tree block first,
then re-iterate all clusters again to find every child tree block.
Each time we need to iterate all clusters just to find a chunk tree
block. This is obviously inefficient, especially when chunk tree gets
larger. So the original author leaves a comment on it:
/* If you have to ask you aren't worthy */
static int search_for_chunk_blocks()
This patch will change the behavior so that we will only iterate all
clusters once.
The idea behind the optimization is, since we have the superblock
restored first, we could use the CHUNK_ITEMs in
super_block::sys_chunk_array to build a SYSTEM chunk mapping.
Then, when we start to iterate through all items, we can easily skip
unrelated items at different level:
- At cluster level
If a cluster starts beyond last system chunk map, it must not contain
any chunk tree blocks (as chunk tree blocks only lives inside system
chunks)
- At item level
If one item has no intersection with any system chunk map, then it
must not contain any tree blocks.
By this, we can iterate through all clusters just once, and find out all
CHUNK_ITEMs.
Signed-off-by: Qu Wenruo <wqu@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
2019-07-04 06:10:59 +00:00
|
|
|
current_cluster);
|
|
|
|
goto out;
|
2013-05-08 15:40:36 +00:00
|
|
|
}
|
|
|
|
ret = 0;
|
|
|
|
|
|
|
|
header = &cluster->header;
|
|
|
|
if (le64_to_cpu(header->magic) != HEADER_MAGIC ||
|
|
|
|
le64_to_cpu(header->bytenr) != current_cluster) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("bad header in metadump image");
|
2013-05-08 15:40:36 +00:00
|
|
|
ret = -EIO;
|
btrfs-progs: image: Rework how we search chunk tree blocks
Before this patch, we were using a very inefficient way to search
chunks:
We iterate through all clusters to find the chunk root tree block first,
then re-iterate all clusters again to find every child tree block.
Each time we need to iterate all clusters just to find a chunk tree
block. This is obviously inefficient, especially when chunk tree gets
larger. So the original author leaves a comment on it:
/* If you have to ask you aren't worthy */
static int search_for_chunk_blocks()
This patch will change the behavior so that we will only iterate all
clusters once.
The idea behind the optimization is, since we have the superblock
restored first, we could use the CHUNK_ITEMs in
super_block::sys_chunk_array to build a SYSTEM chunk mapping.
Then, when we start to iterate through all items, we can easily skip
unrelated items at different level:
- At cluster level
If a cluster starts beyond last system chunk map, it must not contain
any chunk tree blocks (as chunk tree blocks only lives inside system
chunks)
- At item level
If one item has no intersection with any system chunk map, then it
must not contain any tree blocks.
By this, we can iterate through all clusters just once, and find out all
CHUNK_ITEMs.
Signed-off-by: Qu Wenruo <wqu@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
2019-07-04 06:10:59 +00:00
|
|
|
goto out;
|
2013-05-08 15:40:36 +00:00
|
|
|
}
|
|
|
|
|
btrfs-progs: image: Rework how we search chunk tree blocks
Before this patch, we were using a very inefficient way to search
chunks:
We iterate through all clusters to find the chunk root tree block first,
then re-iterate all clusters again to find every child tree block.
Each time we need to iterate all clusters just to find a chunk tree
block. This is obviously inefficient, especially when chunk tree gets
larger. So the original author leaves a comment on it:
/* If you have to ask you aren't worthy */
static int search_for_chunk_blocks()
This patch will change the behavior so that we will only iterate all
clusters once.
The idea behind the optimization is, since we have the superblock
restored first, we could use the CHUNK_ITEMs in
super_block::sys_chunk_array to build a SYSTEM chunk mapping.
Then, when we start to iterate through all items, we can easily skip
unrelated items at different level:
- At cluster level
If a cluster starts beyond last system chunk map, it must not contain
any chunk tree blocks (as chunk tree blocks only lives inside system
chunks)
- At item level
If one item has no intersection with any system chunk map, then it
must not contain any tree blocks.
By this, we can iterate through all clusters just once, and find out all
CHUNK_ITEMs.
Signed-off-by: Qu Wenruo <wqu@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
2019-07-04 06:10:59 +00:00
|
|
|
/* We're already over the system chunk end, no need to search*/
|
|
|
|
if (current_cluster > mdres->sys_chunk_end)
|
|
|
|
goto out;
|
|
|
|
|
2013-05-08 15:40:36 +00:00
|
|
|
bytenr += BLOCK_SIZE;
|
|
|
|
nritems = le32_to_cpu(header->nritems);
|
btrfs-progs: image: Rework how we search chunk tree blocks
Before this patch, we were using a very inefficient way to search
chunks:
We iterate through all clusters to find the chunk root tree block first,
then re-iterate all clusters again to find every child tree block.
Each time we need to iterate all clusters just to find a chunk tree
block. This is obviously inefficient, especially when chunk tree gets
larger. So the original author leaves a comment on it:
/* If you have to ask you aren't worthy */
static int search_for_chunk_blocks()
This patch will change the behavior so that we will only iterate all
clusters once.
The idea behind the optimization is, since we have the superblock
restored first, we could use the CHUNK_ITEMs in
super_block::sys_chunk_array to build a SYSTEM chunk mapping.
Then, when we start to iterate through all items, we can easily skip
unrelated items at different level:
- At cluster level
If a cluster starts beyond last system chunk map, it must not contain
any chunk tree blocks (as chunk tree blocks only lives inside system
chunks)
- At item level
If one item has no intersection with any system chunk map, then it
must not contain any tree blocks.
By this, we can iterate through all clusters just once, and find out all
CHUNK_ITEMs.
Signed-off-by: Qu Wenruo <wqu@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
2019-07-04 06:10:59 +00:00
|
|
|
|
|
|
|
/* Search items for tree blocks in sys chunks */
|
2013-05-08 15:40:36 +00:00
|
|
|
for (i = 0; i < nritems; i++) {
|
|
|
|
size_t size;
|
|
|
|
|
|
|
|
item = &cluster->items[i];
|
|
|
|
bufsize = le32_to_cpu(item->size);
|
|
|
|
item_bytenr = le64_to_cpu(item->bytenr);
|
|
|
|
|
btrfs-progs: image: Rework how we search chunk tree blocks
Before this patch, we were using a very inefficient way to search
chunks:
We iterate through all clusters to find the chunk root tree block first,
then re-iterate all clusters again to find every child tree block.
Each time we need to iterate all clusters just to find a chunk tree
block. This is obviously inefficient, especially when chunk tree gets
larger. So the original author leaves a comment on it:
/* If you have to ask you aren't worthy */
static int search_for_chunk_blocks()
This patch will change the behavior so that we will only iterate all
clusters once.
The idea behind the optimization is, since we have the superblock
restored first, we could use the CHUNK_ITEMs in
super_block::sys_chunk_array to build a SYSTEM chunk mapping.
Then, when we start to iterate through all items, we can easily skip
unrelated items at different level:
- At cluster level
If a cluster starts beyond last system chunk map, it must not contain
any chunk tree blocks (as chunk tree blocks only lives inside system
chunks)
- At item level
If one item has no intersection with any system chunk map, then it
must not contain any tree blocks.
By this, we can iterate through all clusters just once, and find out all
CHUNK_ITEMs.
Signed-off-by: Qu Wenruo <wqu@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
2019-07-04 06:10:59 +00:00
|
|
|
/*
|
|
|
|
* Only data extent/free space cache can be that big,
|
|
|
|
* adjacent tree blocks won't be able to be merged
|
|
|
|
* beyond max_size. Also, we can skip super block.
|
|
|
|
*/
|
|
|
|
if (bufsize > max_size ||
|
|
|
|
!is_in_sys_chunks(mdres, item_bytenr, bufsize) ||
|
|
|
|
item_bytenr == BTRFS_SUPER_INFO_OFFSET) {
|
|
|
|
ret = fseek(mdres->in, bufsize, SEEK_CUR);
|
|
|
|
if (ret < 0) {
|
|
|
|
error("failed to seek: %m");
|
|
|
|
ret = -errno;
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
bytenr += bufsize;
|
|
|
|
continue;
|
2013-10-07 21:42:57 +00:00
|
|
|
}
|
|
|
|
|
2013-05-08 15:40:36 +00:00
|
|
|
if (mdres->compress_method == COMPRESS_ZLIB) {
|
|
|
|
ret = fread(tmp, bufsize, 1, mdres->in);
|
|
|
|
if (ret != 1) {
|
2018-01-07 21:54:21 +00:00
|
|
|
error("read error: %m");
|
2013-05-08 15:40:36 +00:00
|
|
|
ret = -EIO;
|
btrfs-progs: image: Rework how we search chunk tree blocks
Before this patch, we were using a very inefficient way to search
chunks:
We iterate through all clusters to find the chunk root tree block first,
then re-iterate all clusters again to find every child tree block.
Each time we need to iterate all clusters just to find a chunk tree
block. This is obviously inefficient, especially when chunk tree gets
larger. So the original author leaves a comment on it:
/* If you have to ask you aren't worthy */
static int search_for_chunk_blocks()
This patch will change the behavior so that we will only iterate all
clusters once.
The idea behind the optimization is, since we have the superblock
restored first, we could use the CHUNK_ITEMs in
super_block::sys_chunk_array to build a SYSTEM chunk mapping.
Then, when we start to iterate through all items, we can easily skip
unrelated items at different level:
- At cluster level
If a cluster starts beyond last system chunk map, it must not contain
any chunk tree blocks (as chunk tree blocks only lives inside system
chunks)
- At item level
If one item has no intersection with any system chunk map, then it
must not contain any tree blocks.
By this, we can iterate through all clusters just once, and find out all
CHUNK_ITEMs.
Signed-off-by: Qu Wenruo <wqu@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
2019-07-04 06:10:59 +00:00
|
|
|
goto out;
|
2013-05-08 15:40:36 +00:00
|
|
|
}
|
|
|
|
|
2013-10-07 21:42:57 +00:00
|
|
|
size = max_size;
|
2013-05-08 15:40:36 +00:00
|
|
|
ret = uncompress(buffer,
|
|
|
|
(unsigned long *)&size, tmp,
|
|
|
|
bufsize);
|
|
|
|
if (ret != Z_OK) {
|
2017-07-12 22:10:13 +00:00
|
|
|
error("decompression failed with %d",
|
2016-09-08 13:57:42 +00:00
|
|
|
ret);
|
2013-05-08 15:40:36 +00:00
|
|
|
ret = -EIO;
|
btrfs-progs: image: Rework how we search chunk tree blocks
Before this patch, we were using a very inefficient way to search
chunks:
We iterate through all clusters to find the chunk root tree block first,
then re-iterate all clusters again to find every child tree block.
Each time we need to iterate all clusters just to find a chunk tree
block. This is obviously inefficient, especially when chunk tree gets
larger. So the original author leaves a comment on it:
/* If you have to ask you aren't worthy */
static int search_for_chunk_blocks()
This patch will change the behavior so that we will only iterate all
clusters once.
The idea behind the optimization is, since we have the superblock
restored first, we could use the CHUNK_ITEMs in
super_block::sys_chunk_array to build a SYSTEM chunk mapping.
Then, when we start to iterate through all items, we can easily skip
unrelated items at different level:
- At cluster level
If a cluster starts beyond last system chunk map, it must not contain
any chunk tree blocks (as chunk tree blocks only lives inside system
chunks)
- At item level
If one item has no intersection with any system chunk map, then it
must not contain any tree blocks.
By this, we can iterate through all clusters just once, and find out all
CHUNK_ITEMs.
Signed-off-by: Qu Wenruo <wqu@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
2019-07-04 06:10:59 +00:00
|
|
|
goto out;
|
2013-05-08 15:40:36 +00:00
|
|
|
}
|
|
|
|
} else {
|
|
|
|
ret = fread(buffer, bufsize, 1, mdres->in);
|
|
|
|
if (ret != 1) {
|
2018-01-07 21:54:21 +00:00
|
|
|
error("read error: %m");
|
2013-05-08 15:40:36 +00:00
|
|
|
ret = -EIO;
|
btrfs-progs: image: Rework how we search chunk tree blocks
Before this patch, we were using a very inefficient way to search
chunks:
We iterate through all clusters to find the chunk root tree block first,
then re-iterate all clusters again to find every child tree block.
Each time we need to iterate all clusters just to find a chunk tree
block. This is obviously inefficient, especially when chunk tree gets
larger. So the original author leaves a comment on it:
/* If you have to ask you aren't worthy */
static int search_for_chunk_blocks()
This patch will change the behavior so that we will only iterate all
clusters once.
The idea behind the optimization is, since we have the superblock
restored first, we could use the CHUNK_ITEMs in
super_block::sys_chunk_array to build a SYSTEM chunk mapping.
Then, when we start to iterate through all items, we can easily skip
unrelated items at different level:
- At cluster level
If a cluster starts beyond last system chunk map, it must not contain
any chunk tree blocks (as chunk tree blocks only lives inside system
chunks)
- At item level
If one item has no intersection with any system chunk map, then it
must not contain any tree blocks.
By this, we can iterate through all clusters just once, and find out all
CHUNK_ITEMs.
Signed-off-by: Qu Wenruo <wqu@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
2019-07-04 06:10:59 +00:00
|
|
|
goto out;
|
2013-05-08 15:40:36 +00:00
|
|
|
}
|
|
|
|
size = bufsize;
|
|
|
|
}
|
|
|
|
ret = 0;
|
|
|
|
|
btrfs-progs: image: Rework how we search chunk tree blocks
Before this patch, we were using a very inefficient way to search
chunks:
We iterate through all clusters to find the chunk root tree block first,
then re-iterate all clusters again to find every child tree block.
Each time we need to iterate all clusters just to find a chunk tree
block. This is obviously inefficient, especially when chunk tree gets
larger. So the original author leaves a comment on it:
/* If you have to ask you aren't worthy */
static int search_for_chunk_blocks()
This patch will change the behavior so that we will only iterate all
clusters once.
The idea behind the optimization is, since we have the superblock
restored first, we could use the CHUNK_ITEMs in
super_block::sys_chunk_array to build a SYSTEM chunk mapping.
Then, when we start to iterate through all items, we can easily skip
unrelated items at different level:
- At cluster level
If a cluster starts beyond last system chunk map, it must not contain
any chunk tree blocks (as chunk tree blocks only lives inside system
chunks)
- At item level
If one item has no intersection with any system chunk map, then it
must not contain any tree blocks.
By this, we can iterate through all clusters just once, and find out all
CHUNK_ITEMs.
Signed-off-by: Qu Wenruo <wqu@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
2019-07-04 06:10:59 +00:00
|
|
|
ret = read_chunk_block(mdres, buffer, item_bytenr, size,
|
|
|
|
current_cluster);
|
|
|
|
if (ret < 0) {
|
|
|
|
error(
|
|
|
|
"failed to search tree blocks in item bytenr %llu size %lu",
|
|
|
|
item_bytenr, size);
|
|
|
|
goto out;
|
2013-05-08 15:40:36 +00:00
|
|
|
}
|
|
|
|
bytenr += bufsize;
|
|
|
|
}
|
|
|
|
if (bytenr & BLOCK_MASK)
|
|
|
|
bytenr += BLOCK_SIZE - (bytenr & BLOCK_MASK);
|
|
|
|
current_cluster = bytenr;
|
|
|
|
}
|
|
|
|
|
btrfs-progs: image: Rework how we search chunk tree blocks
Before this patch, we were using a very inefficient way to search
chunks:
We iterate through all clusters to find the chunk root tree block first,
then re-iterate all clusters again to find every child tree block.
Each time we need to iterate all clusters just to find a chunk tree
block. This is obviously inefficient, especially when chunk tree gets
larger. So the original author leaves a comment on it:
/* If you have to ask you aren't worthy */
static int search_for_chunk_blocks()
This patch will change the behavior so that we will only iterate all
clusters once.
The idea behind the optimization is, since we have the superblock
restored first, we could use the CHUNK_ITEMs in
super_block::sys_chunk_array to build a SYSTEM chunk mapping.
Then, when we start to iterate through all items, we can easily skip
unrelated items at different level:
- At cluster level
If a cluster starts beyond last system chunk map, it must not contain
any chunk tree blocks (as chunk tree blocks only lives inside system
chunks)
- At item level
If one item has no intersection with any system chunk map, then it
must not contain any tree blocks.
By this, we can iterate through all clusters just once, and find out all
CHUNK_ITEMs.
Signed-off-by: Qu Wenruo <wqu@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
2019-07-04 06:10:59 +00:00
|
|
|
out:
|
2013-05-08 15:40:36 +00:00
|
|
|
free(tmp);
|
|
|
|
free(buffer);
|
|
|
|
free(cluster);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2019-07-04 06:10:57 +00:00
|
|
|
/*
|
|
|
|
* Add system chunks in super blocks into mdres->sys_chunks, so later we can
|
|
|
|
* determine if an item is a chunk tree block.
|
|
|
|
*/
|
|
|
|
static int add_sys_array(struct mdrestore_struct *mdres,
|
|
|
|
struct btrfs_super_block *sb)
|
|
|
|
{
|
|
|
|
struct btrfs_disk_key *disk_key;
|
|
|
|
struct btrfs_key key;
|
|
|
|
struct btrfs_chunk *chunk;
|
|
|
|
struct cache_extent *cache;
|
|
|
|
u32 cur_offset;
|
|
|
|
u32 len = 0;
|
|
|
|
u32 array_size;
|
|
|
|
u8 *array_ptr;
|
|
|
|
int ret = 0;
|
|
|
|
|
|
|
|
array_size = btrfs_super_sys_array_size(sb);
|
|
|
|
array_ptr = sb->sys_chunk_array;
|
|
|
|
cur_offset = 0;
|
|
|
|
|
|
|
|
while (cur_offset < array_size) {
|
|
|
|
u32 num_stripes;
|
|
|
|
|
|
|
|
disk_key = (struct btrfs_disk_key *)array_ptr;
|
|
|
|
len = sizeof(*disk_key);
|
|
|
|
if (cur_offset + len > array_size)
|
|
|
|
goto out_short_read;
|
|
|
|
btrfs_disk_key_to_cpu(&key, disk_key);
|
|
|
|
|
|
|
|
array_ptr += len;
|
|
|
|
cur_offset += len;
|
|
|
|
|
|
|
|
if (key.type != BTRFS_CHUNK_ITEM_KEY) {
|
|
|
|
error("unexpected item type %u in sys_array offset %u",
|
|
|
|
key.type, cur_offset);
|
|
|
|
ret = -EUCLEAN;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
chunk = (struct btrfs_chunk *)array_ptr;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* At least one btrfs_chunk with one stripe must be present,
|
|
|
|
* exact stripe count check comes afterwards
|
|
|
|
*/
|
|
|
|
len = btrfs_chunk_item_size(1);
|
|
|
|
if (cur_offset + len > array_size)
|
|
|
|
goto out_short_read;
|
|
|
|
num_stripes = btrfs_stack_chunk_num_stripes(chunk);
|
|
|
|
if (!num_stripes) {
|
|
|
|
error(
|
|
|
|
"invalid number of stripes %u in sys_array at offset %u",
|
|
|
|
num_stripes, cur_offset);
|
|
|
|
ret = -EIO;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
len = btrfs_chunk_item_size(num_stripes);
|
|
|
|
if (cur_offset + len > array_size)
|
|
|
|
goto out_short_read;
|
|
|
|
if (btrfs_stack_chunk_type(chunk) &
|
|
|
|
BTRFS_BLOCK_GROUP_SYSTEM) {
|
|
|
|
ret = add_merge_cache_extent(&mdres->sys_chunks,
|
|
|
|
key.offset,
|
|
|
|
btrfs_stack_chunk_length(chunk));
|
|
|
|
if (ret < 0)
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
array_ptr += len;
|
|
|
|
cur_offset += len;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Get the last system chunk end as a quicker check */
|
|
|
|
cache = last_cache_extent(&mdres->sys_chunks);
|
|
|
|
if (!cache) {
|
|
|
|
error("no system chunk found in super block");
|
|
|
|
return -EUCLEAN;
|
|
|
|
}
|
|
|
|
mdres->sys_chunk_end = cache->start + cache->size - 1;
|
|
|
|
return ret;
|
|
|
|
out_short_read:
|
|
|
|
error("sys_array too short to read %u bytes at offset %u",
|
|
|
|
len, cur_offset);
|
|
|
|
return -EUCLEAN;
|
|
|
|
}
|
|
|
|
|
2013-05-08 15:40:36 +00:00
|
|
|
static int build_chunk_tree(struct mdrestore_struct *mdres,
|
|
|
|
struct meta_cluster *cluster)
|
|
|
|
{
|
|
|
|
struct btrfs_super_block *super;
|
|
|
|
struct meta_cluster_header *header;
|
|
|
|
struct meta_cluster_item *item = NULL;
|
|
|
|
u32 i, nritems;
|
|
|
|
u64 bytenr = 0;
|
|
|
|
u8 *buffer;
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
/* We can't seek with stdin so don't bother doing this */
|
|
|
|
if (mdres->in == stdin)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
ret = fread(cluster, BLOCK_SIZE, 1, mdres->in);
|
|
|
|
if (ret <= 0) {
|
2018-01-07 21:54:21 +00:00
|
|
|
error("unable to read cluster: %m");
|
2013-05-08 15:40:36 +00:00
|
|
|
return -EIO;
|
|
|
|
}
|
|
|
|
ret = 0;
|
|
|
|
|
|
|
|
header = &cluster->header;
|
|
|
|
if (le64_to_cpu(header->magic) != HEADER_MAGIC ||
|
|
|
|
le64_to_cpu(header->bytenr) != 0) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("bad header in metadump image");
|
2013-05-08 15:40:36 +00:00
|
|
|
return -EIO;
|
|
|
|
}
|
|
|
|
|
|
|
|
bytenr += BLOCK_SIZE;
|
|
|
|
mdres->compress_method = header->compress;
|
|
|
|
nritems = le32_to_cpu(header->nritems);
|
|
|
|
for (i = 0; i < nritems; i++) {
|
|
|
|
item = &cluster->items[i];
|
|
|
|
|
|
|
|
if (le64_to_cpu(item->bytenr) == BTRFS_SUPER_INFO_OFFSET)
|
|
|
|
break;
|
|
|
|
bytenr += le32_to_cpu(item->size);
|
|
|
|
if (fseek(mdres->in, le32_to_cpu(item->size), SEEK_CUR)) {
|
2018-01-07 21:54:21 +00:00
|
|
|
error("seek failed: %m");
|
2013-05-08 15:40:36 +00:00
|
|
|
return -EIO;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!item || le64_to_cpu(item->bytenr) != BTRFS_SUPER_INFO_OFFSET) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("did not find superblock at %llu",
|
|
|
|
le64_to_cpu(item->bytenr));
|
2013-05-08 15:40:36 +00:00
|
|
|
return -EINVAL;
|
|
|
|
}
|
|
|
|
|
|
|
|
buffer = malloc(le32_to_cpu(item->size));
|
|
|
|
if (!buffer) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("not enough memory to allocate buffer");
|
2013-05-08 15:40:36 +00:00
|
|
|
return -ENOMEM;
|
|
|
|
}
|
|
|
|
|
|
|
|
ret = fread(buffer, le32_to_cpu(item->size), 1, mdres->in);
|
|
|
|
if (ret != 1) {
|
2018-01-07 21:54:21 +00:00
|
|
|
error("unable to read buffer: %m");
|
2013-05-08 15:40:36 +00:00
|
|
|
free(buffer);
|
|
|
|
return -EIO;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (mdres->compress_method == COMPRESS_ZLIB) {
|
2019-07-04 06:10:56 +00:00
|
|
|
size_t size = BTRFS_SUPER_INFO_SIZE;
|
2013-05-08 15:40:36 +00:00
|
|
|
u8 *tmp;
|
|
|
|
|
2019-07-04 06:10:56 +00:00
|
|
|
tmp = malloc(size);
|
2013-05-08 15:40:36 +00:00
|
|
|
if (!tmp) {
|
|
|
|
free(buffer);
|
|
|
|
return -ENOMEM;
|
|
|
|
}
|
|
|
|
ret = uncompress(tmp, (unsigned long *)&size,
|
|
|
|
buffer, le32_to_cpu(item->size));
|
|
|
|
if (ret != Z_OK) {
|
2017-07-12 22:10:13 +00:00
|
|
|
error("decompression failed with %d", ret);
|
2013-05-08 15:40:36 +00:00
|
|
|
free(buffer);
|
|
|
|
free(tmp);
|
|
|
|
return -EIO;
|
|
|
|
}
|
|
|
|
free(buffer);
|
|
|
|
buffer = tmp;
|
|
|
|
}
|
|
|
|
|
2014-05-19 05:40:42 +00:00
|
|
|
pthread_mutex_lock(&mdres->mutex);
|
2013-05-08 15:40:36 +00:00
|
|
|
super = (struct btrfs_super_block *)buffer;
|
2019-06-06 11:06:06 +00:00
|
|
|
ret = btrfs_check_super(super, 0);
|
|
|
|
if (ret < 0) {
|
|
|
|
error("invalid superblock");
|
|
|
|
return ret;
|
|
|
|
}
|
2019-07-04 06:10:57 +00:00
|
|
|
ret = add_sys_array(mdres, super);
|
|
|
|
if (ret < 0) {
|
|
|
|
error("failed to read system chunk array");
|
|
|
|
free(buffer);
|
|
|
|
pthread_mutex_unlock(&mdres->mutex);
|
|
|
|
return ret;
|
|
|
|
}
|
2016-04-01 10:57:11 +00:00
|
|
|
mdres->nodesize = btrfs_super_nodesize(super);
|
2018-10-11 15:03:59 +00:00
|
|
|
if (btrfs_super_incompat_flags(super) &
|
|
|
|
BTRFS_FEATURE_INCOMPAT_METADATA_UUID)
|
|
|
|
memcpy(mdres->fsid, super->metadata_uuid, BTRFS_FSID_SIZE);
|
|
|
|
else
|
|
|
|
memcpy(mdres->fsid, super->fsid, BTRFS_FSID_SIZE);
|
|
|
|
|
|
|
|
memcpy(mdres->uuid, super->dev_item.uuid, BTRFS_UUID_SIZE);
|
2013-05-08 15:40:36 +00:00
|
|
|
mdres->devid = le64_to_cpu(super->dev_item.devid);
|
|
|
|
free(buffer);
|
2014-05-19 05:40:42 +00:00
|
|
|
pthread_mutex_unlock(&mdres->mutex);
|
2013-05-08 15:40:36 +00:00
|
|
|
|
btrfs-progs: image: Rework how we search chunk tree blocks
Before this patch, we were using a very inefficient way to search
chunks:
We iterate through all clusters to find the chunk root tree block first,
then re-iterate all clusters again to find every child tree block.
Each time we need to iterate all clusters just to find a chunk tree
block. This is obviously inefficient, especially when chunk tree gets
larger. So the original author leaves a comment on it:
/* If you have to ask you aren't worthy */
static int search_for_chunk_blocks()
This patch will change the behavior so that we will only iterate all
clusters once.
The idea behind the optimization is, since we have the superblock
restored first, we could use the CHUNK_ITEMs in
super_block::sys_chunk_array to build a SYSTEM chunk mapping.
Then, when we start to iterate through all items, we can easily skip
unrelated items at different level:
- At cluster level
If a cluster starts beyond last system chunk map, it must not contain
any chunk tree blocks (as chunk tree blocks only lives inside system
chunks)
- At item level
If one item has no intersection with any system chunk map, then it
must not contain any tree blocks.
By this, we can iterate through all clusters just once, and find out all
CHUNK_ITEMs.
Signed-off-by: Qu Wenruo <wqu@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
2019-07-04 06:10:59 +00:00
|
|
|
return search_for_chunk_blocks(mdres);
|
2013-05-08 15:40:36 +00:00
|
|
|
}
|
|
|
|
|
2015-01-26 01:39:24 +00:00
|
|
|
/*
 * Tell whether any super block mirror starts inside the byte range
 * [physical, physical + bytes).
 *
 * Returns 1 if at least one mirror offset falls in the range, 0 otherwise.
 */
static int range_contains_super(u64 physical, u64 bytes)
{
	int mirror = 0;

	while (mirror < BTRFS_SUPER_MIRROR_MAX) {
		u64 sb_start = btrfs_sb_offset(mirror);

		if (physical <= sb_start && sb_start < physical + bytes)
			return 1;
		mirror++;
	}

	return 0;
}
|
|
|
|
|
|
|
|
static void remap_overlapping_chunks(struct mdrestore_struct *mdres)
|
|
|
|
{
|
|
|
|
struct fs_chunk *fs_chunk;
|
|
|
|
|
|
|
|
while (!list_empty(&mdres->overlapping_chunks)) {
|
|
|
|
fs_chunk = list_first_entry(&mdres->overlapping_chunks,
|
|
|
|
struct fs_chunk, list);
|
|
|
|
list_del_init(&fs_chunk->list);
|
|
|
|
if (range_contains_super(fs_chunk->physical,
|
|
|
|
fs_chunk->bytes)) {
|
2016-09-30 11:00:24 +00:00
|
|
|
warning(
|
|
|
|
"remapping a chunk that had a super mirror inside of it, clearing space cache so we don't end up with corruption");
|
2015-01-26 01:39:24 +00:00
|
|
|
mdres->clear_space_cache = 1;
|
|
|
|
}
|
|
|
|
fs_chunk->physical = mdres->last_physical_offset;
|
|
|
|
tree_insert(&mdres->physical_tree, &fs_chunk->p, physical_cmp);
|
|
|
|
mdres->last_physical_offset += fs_chunk->bytes;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-11-27 08:38:24 +00:00
|
|
|
static int fixup_device_size(struct btrfs_trans_handle *trans,
|
2018-10-08 12:18:35 +00:00
|
|
|
struct mdrestore_struct *mdres, int out_fd)
|
2015-01-28 20:38:03 +00:00
|
|
|
{
|
2018-11-27 08:38:24 +00:00
|
|
|
struct btrfs_fs_info *fs_info = trans->fs_info;
|
2015-01-28 20:38:03 +00:00
|
|
|
struct btrfs_dev_item *dev_item;
|
2018-10-08 12:18:35 +00:00
|
|
|
struct btrfs_dev_extent *dev_ext;
|
2016-11-02 23:37:51 +00:00
|
|
|
struct btrfs_path path;
|
2015-01-28 20:38:03 +00:00
|
|
|
struct extent_buffer *leaf;
|
|
|
|
struct btrfs_root *root = fs_info->chunk_root;
|
|
|
|
struct btrfs_key key;
|
2018-12-18 07:57:40 +00:00
|
|
|
struct stat buf;
|
2015-01-28 20:38:03 +00:00
|
|
|
u64 devid, cur_devid;
|
2018-10-08 12:18:35 +00:00
|
|
|
u64 dev_size; /* Get from last dev extents */
|
2015-01-28 20:38:03 +00:00
|
|
|
int ret;
|
|
|
|
|
|
|
|
dev_item = &fs_info->super_copy->dev_item;
|
|
|
|
|
2018-10-08 12:18:35 +00:00
|
|
|
btrfs_init_path(&path);
|
2015-01-28 20:38:03 +00:00
|
|
|
devid = btrfs_stack_device_id(dev_item);
|
|
|
|
|
2018-10-08 12:18:35 +00:00
|
|
|
key.objectid = devid;
|
|
|
|
key.type = BTRFS_DEV_EXTENT_KEY;
|
|
|
|
key.offset = (u64)-1;
|
|
|
|
|
|
|
|
ret = btrfs_search_slot(NULL, fs_info->dev_root, &key, &path, 0, 0);
|
|
|
|
if (ret < 0) {
|
|
|
|
errno = -ret;
|
|
|
|
error("failed to locate last dev extent of devid %llu: %m",
|
|
|
|
devid);
|
|
|
|
btrfs_release_path(&path);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
if (ret == 0) {
|
|
|
|
error("found invalid dev extent devid %llu offset -1", devid);
|
|
|
|
btrfs_release_path(&path);
|
|
|
|
return -EUCLEAN;
|
|
|
|
}
|
|
|
|
ret = btrfs_previous_item(fs_info->dev_root, &path, devid,
|
|
|
|
BTRFS_DEV_EXTENT_KEY);
|
|
|
|
if (ret > 0)
|
|
|
|
ret = -ENOENT;
|
|
|
|
if (ret < 0) {
|
|
|
|
errno = -ret;
|
|
|
|
error("failed to locate last dev extent of devid %llu: %m",
|
|
|
|
devid);
|
|
|
|
btrfs_release_path(&path);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
btrfs_item_key_to_cpu(path.nodes[0], &key, path.slots[0]);
|
|
|
|
dev_ext = btrfs_item_ptr(path.nodes[0], path.slots[0],
|
|
|
|
struct btrfs_dev_extent);
|
|
|
|
dev_size = key.offset + btrfs_dev_extent_length(path.nodes[0], dev_ext);
|
|
|
|
btrfs_release_path(&path);
|
|
|
|
|
2015-01-28 20:38:03 +00:00
|
|
|
btrfs_set_stack_device_total_bytes(dev_item, dev_size);
|
|
|
|
btrfs_set_stack_device_bytes_used(dev_item, mdres->alloced_chunks);
|
2018-12-18 07:57:40 +00:00
|
|
|
ret = fstat(out_fd, &buf);
|
2018-10-08 12:18:35 +00:00
|
|
|
if (ret < 0) {
|
2018-12-18 07:57:40 +00:00
|
|
|
error("failed to stat result image: %m");
|
2018-10-08 12:18:35 +00:00
|
|
|
return -errno;
|
|
|
|
}
|
2018-12-18 07:57:40 +00:00
|
|
|
if (S_ISREG(buf.st_mode)) {
|
|
|
|
/* Don't forget to enlarge the real file */
|
|
|
|
ret = ftruncate64(out_fd, dev_size);
|
|
|
|
if (ret < 0) {
|
|
|
|
error("failed to enlarge result image: %m");
|
|
|
|
return -errno;
|
|
|
|
}
|
|
|
|
}
|
2015-01-28 20:38:03 +00:00
|
|
|
|
|
|
|
key.objectid = BTRFS_DEV_ITEMS_OBJECTID;
|
|
|
|
key.type = BTRFS_DEV_ITEM_KEY;
|
|
|
|
key.offset = 0;
|
|
|
|
|
|
|
|
again:
|
2016-11-02 23:37:51 +00:00
|
|
|
ret = btrfs_search_slot(trans, root, &key, &path, -1, 1);
|
2015-01-28 20:38:03 +00:00
|
|
|
if (ret < 0) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("search failed: %d", ret);
|
2018-11-27 08:38:24 +00:00
|
|
|
return ret;
|
2015-01-28 20:38:03 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
while (1) {
|
2016-11-02 23:37:51 +00:00
|
|
|
leaf = path.nodes[0];
|
|
|
|
if (path.slots[0] >= btrfs_header_nritems(leaf)) {
|
|
|
|
ret = btrfs_next_leaf(root, &path);
|
2015-01-28 20:38:03 +00:00
|
|
|
if (ret < 0) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("cannot go to next leaf %d", ret);
|
2015-01-28 20:38:03 +00:00
|
|
|
exit(1);
|
|
|
|
}
|
|
|
|
if (ret > 0) {
|
|
|
|
ret = 0;
|
|
|
|
break;
|
|
|
|
}
|
2016-11-02 23:37:51 +00:00
|
|
|
leaf = path.nodes[0];
|
2015-01-28 20:38:03 +00:00
|
|
|
}
|
|
|
|
|
2016-11-02 23:37:51 +00:00
|
|
|
btrfs_item_key_to_cpu(leaf, &key, path.slots[0]);
|
2015-01-28 20:38:03 +00:00
|
|
|
if (key.type > BTRFS_DEV_ITEM_KEY)
|
|
|
|
break;
|
|
|
|
if (key.type != BTRFS_DEV_ITEM_KEY) {
|
2016-11-02 23:37:51 +00:00
|
|
|
path.slots[0]++;
|
2015-01-28 20:38:03 +00:00
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
2016-11-02 23:37:51 +00:00
|
|
|
dev_item = btrfs_item_ptr(leaf, path.slots[0],
|
2015-01-28 20:38:03 +00:00
|
|
|
struct btrfs_dev_item);
|
|
|
|
cur_devid = btrfs_device_id(leaf, dev_item);
|
|
|
|
if (devid != cur_devid) {
|
2016-11-02 23:37:51 +00:00
|
|
|
ret = btrfs_del_item(trans, root, &path);
|
2015-01-28 20:38:03 +00:00
|
|
|
if (ret) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("cannot delete item: %d", ret);
|
2015-01-28 20:38:03 +00:00
|
|
|
exit(1);
|
|
|
|
}
|
2016-11-02 23:37:51 +00:00
|
|
|
btrfs_release_path(&path);
|
2015-01-28 20:38:03 +00:00
|
|
|
goto again;
|
|
|
|
}
|
|
|
|
|
|
|
|
btrfs_set_device_total_bytes(leaf, dev_item, dev_size);
|
|
|
|
btrfs_set_device_bytes_used(leaf, dev_item,
|
|
|
|
mdres->alloced_chunks);
|
|
|
|
btrfs_mark_buffer_dirty(leaf);
|
2016-11-02 23:37:51 +00:00
|
|
|
path.slots[0]++;
|
2015-01-28 20:38:03 +00:00
|
|
|
}
|
|
|
|
|
2016-11-02 23:37:51 +00:00
|
|
|
btrfs_release_path(&path);
|
2018-11-27 08:38:24 +00:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2019-12-18 05:18:47 +00:00
|
|
|
static void fixup_block_groups(struct btrfs_trans_handle *trans)
|
btrfs-progs: image: Fix block group item flags when restoring multi-device image to single device
Since btrfs-image is just restoring tree blocks without really checking
if that tree block contents makes sense, for multi-device image, block
group items will keep the incorrect block group flags.
For example, for a metadata RAID1 data RAID0 btrfs recovered to a single
disk, its chunk tree will look like:
item 1 key (FIRST_CHUNK_TREE CHUNK_ITEM 22020096)
length 8388608 owner 2 stripe_len 65536 type SYSTEM
item 2 key (FIRST_CHUNK_TREE CHUNK_ITEM 30408704)
length 1073741824 owner 2 stripe_len 65536 type METADATA
item 3 key (FIRST_CHUNK_TREE CHUNK_ITEM 1104150528)
length 1073741824 owner 2 stripe_len 65536 type DATA
All chunks have correct type (SINGLE).
While its block group items will look like:
item 1 key (22020096 BLOCK_GROUP_ITEM 8388608)
block group used 16384 chunk_objectid 256 flags SYSTEM|RAID1
item 3 key (30408704 BLOCK_GROUP_ITEM 1073741824)
block group used 114688 chunk_objectid 256 flags METADATA|RAID1
item 11 key (1104150528 BLOCK_GROUP_ITEM 1073741824)
block group used 1572864 chunk_objectid 256 flags DATA|RAID0
All block group items still have the wrong profiles.
And btrfs check (lowmem mode for better output) will report error for
such image:
ERROR: chunk[22020096 30408704) related block group item flags mismatch, wanted: 2, have: 18
ERROR: chunk[30408704 1104150528) related block group item flags mismatch, wanted: 4, have: 20
ERROR: chunk[1104150528 2177892352) related block group item flags mismatch, wanted: 1, have: 9
This patch will do an extra repair for block group items to fix the
profile of them.
Signed-off-by: Qu Wenruo <wqu@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
2018-11-27 08:38:25 +00:00
|
|
|
{
|
2019-12-18 05:18:47 +00:00
|
|
|
struct btrfs_fs_info *fs_info = trans->fs_info;
|
2020-05-01 06:52:19 +00:00
|
|
|
struct btrfs_block_group *bg;
|
btrfs-progs: image: Fix block group item flags when restoring multi-device image to single device
Since btrfs-image is just restoring tree blocks without really checking
if that tree block contents makes sense, for multi-device image, block
group items will keep the incorrect block group flags.
For example, for a metadata RAID1 data RAID0 btrfs recovered to a single
disk, its chunk tree will look like:
item 1 key (FIRST_CHUNK_TREE CHUNK_ITEM 22020096)
length 8388608 owner 2 stripe_len 65536 type SYSTEM
item 2 key (FIRST_CHUNK_TREE CHUNK_ITEM 30408704)
length 1073741824 owner 2 stripe_len 65536 type METADATA
item 3 key (FIRST_CHUNK_TREE CHUNK_ITEM 1104150528)
length 1073741824 owner 2 stripe_len 65536 type DATA
All chunks have correct type (SINGLE).
While its block group items will look like:
item 1 key (22020096 BLOCK_GROUP_ITEM 8388608)
block group used 16384 chunk_objectid 256 flags SYSTEM|RAID1
item 3 key (30408704 BLOCK_GROUP_ITEM 1073741824)
block group used 114688 chunk_objectid 256 flags METADATA|RAID1
item 11 key (1104150528 BLOCK_GROUP_ITEM 1073741824)
block group used 1572864 chunk_objectid 256 flags DATA|RAID0
All block group items still have the wrong profiles.
And btrfs check (lowmem mode for better output) will report error for
such image:
ERROR: chunk[22020096 30408704) related block group item flags mismatch, wanted: 2, have: 18
ERROR: chunk[30408704 1104150528) related block group item flags mismatch, wanted: 4, have: 20
ERROR: chunk[1104150528 2177892352) related block group item flags mismatch, wanted: 1, have: 9
This patch will do an extra repair for block group items to fix the
profile of them.
Signed-off-by: Qu Wenruo <wqu@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
2018-11-27 08:38:25 +00:00
|
|
|
struct btrfs_mapping_tree *map_tree = &fs_info->mapping_tree;
|
|
|
|
struct cache_extent *ce;
|
|
|
|
struct map_lookup *map;
|
|
|
|
u64 extra_flags;
|
|
|
|
|
|
|
|
for (ce = search_cache_extent(&map_tree->cache_tree, 0); ce;
|
|
|
|
ce = next_cache_extent(ce)) {
|
|
|
|
map = container_of(ce, struct map_lookup, ce);
|
|
|
|
|
|
|
|
bg = btrfs_lookup_block_group(fs_info, ce->start);
|
|
|
|
if (!bg) {
|
|
|
|
warning(
|
|
|
|
"cannot find block group %llu, filesystem may not be mountable",
|
|
|
|
ce->start);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
extra_flags = map->type & BTRFS_BLOCK_GROUP_PROFILE_MASK;
|
|
|
|
|
|
|
|
if (bg->flags == map->type)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
/* Update the block group item and mark the bg dirty */
|
|
|
|
bg->flags = map->type;
|
2019-12-18 05:18:48 +00:00
|
|
|
if (list_empty(&bg->dirty_list))
|
|
|
|
list_add_tail(&bg->dirty_list, &trans->dirty_bgs);
|
btrfs-progs: image: Fix block group item flags when restoring multi-device image to single device
Since btrfs-image is just restoring tree blocks without really checking
if that tree block contents makes sense, for multi-device image, block
group items will keep the incorrect block group flags.
For example, for a metadata RAID1 data RAID0 btrfs recovered to a single
disk, its chunk tree will look like:
item 1 key (FIRST_CHUNK_TREE CHUNK_ITEM 22020096)
length 8388608 owner 2 stripe_len 65536 type SYSTEM
item 2 key (FIRST_CHUNK_TREE CHUNK_ITEM 30408704)
length 1073741824 owner 2 stripe_len 65536 type METADATA
item 3 key (FIRST_CHUNK_TREE CHUNK_ITEM 1104150528)
length 1073741824 owner 2 stripe_len 65536 type DATA
All chunks have correct type (SINGLE).
While its block group items will look like:
item 1 key (22020096 BLOCK_GROUP_ITEM 8388608)
block group used 16384 chunk_objectid 256 flags SYSTEM|RAID1
item 3 key (30408704 BLOCK_GROUP_ITEM 1073741824)
block group used 114688 chunk_objectid 256 flags METADATA|RAID1
item 11 key (1104150528 BLOCK_GROUP_ITEM 1073741824)
block group used 1572864 chunk_objectid 256 flags DATA|RAID0
All block group items still have the wrong profiles.
And btrfs check (lowmem mode for better output) will report error for
such image:
ERROR: chunk[22020096 30408704) related block group item flags mismatch, wanted: 2, have: 18
ERROR: chunk[30408704 1104150528) related block group item flags mismatch, wanted: 4, have: 20
ERROR: chunk[1104150528 2177892352) related block group item flags mismatch, wanted: 1, have: 9
This patch will do an extra repair for block group items to fix the
profile of them.
Signed-off-by: Qu Wenruo <wqu@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
2018-11-27 08:38:25 +00:00
|
|
|
/*
|
|
|
|
* Chunk and bg flags can be different, changing bg flags
|
|
|
|
* without update avail_data/meta_alloc_bits will lead to
|
|
|
|
* ENOSPC.
|
|
|
|
* So here we set avail_*_alloc_bits to match chunk types.
|
|
|
|
*/
|
|
|
|
if (map->type & BTRFS_BLOCK_GROUP_DATA)
|
|
|
|
fs_info->avail_data_alloc_bits = extra_flags;
|
|
|
|
if (map->type & BTRFS_BLOCK_GROUP_METADATA)
|
|
|
|
fs_info->avail_metadata_alloc_bits = extra_flags;
|
|
|
|
if (map->type & BTRFS_BLOCK_GROUP_SYSTEM)
|
|
|
|
fs_info->avail_system_alloc_bits = extra_flags;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-11-27 08:38:27 +00:00
|
|
|
static int remove_all_dev_extents(struct btrfs_trans_handle *trans)
|
|
|
|
{
|
|
|
|
struct btrfs_fs_info *fs_info = trans->fs_info;
|
|
|
|
struct btrfs_root *root = fs_info->dev_root;
|
|
|
|
struct btrfs_path path;
|
|
|
|
struct btrfs_key key;
|
|
|
|
struct extent_buffer *leaf;
|
|
|
|
int slot;
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
key.objectid = 1;
|
|
|
|
key.type = BTRFS_DEV_EXTENT_KEY;
|
|
|
|
key.offset = 0;
|
|
|
|
btrfs_init_path(&path);
|
|
|
|
|
|
|
|
ret = btrfs_search_slot(trans, root, &key, &path, -1, 1);
|
|
|
|
if (ret < 0) {
|
|
|
|
errno = -ret;
|
|
|
|
error("failed to search dev tree: %m");
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
while (1) {
|
|
|
|
slot = path.slots[0];
|
|
|
|
leaf = path.nodes[0];
|
|
|
|
if (slot >= btrfs_header_nritems(leaf)) {
|
|
|
|
ret = btrfs_next_leaf(root, &path);
|
|
|
|
if (ret < 0) {
|
|
|
|
errno = -ret;
|
|
|
|
error("failed to search dev tree: %m");
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
if (ret > 0) {
|
|
|
|
ret = 0;
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
btrfs_item_key_to_cpu(leaf, &key, slot);
|
|
|
|
if (key.type != BTRFS_DEV_EXTENT_KEY)
|
|
|
|
break;
|
|
|
|
ret = btrfs_del_item(trans, root, &path);
|
|
|
|
if (ret < 0) {
|
|
|
|
errno = -ret;
|
|
|
|
error("failed to delete dev extent %llu, %llu: %m",
|
|
|
|
key.objectid, key.offset);
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
out:
|
|
|
|
btrfs_release_path(&path);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int fixup_dev_extents(struct btrfs_trans_handle *trans)
|
|
|
|
{
|
|
|
|
struct btrfs_fs_info *fs_info = trans->fs_info;
|
|
|
|
struct btrfs_mapping_tree *map_tree = &fs_info->mapping_tree;
|
|
|
|
struct btrfs_device *dev;
|
|
|
|
struct cache_extent *ce;
|
|
|
|
struct map_lookup *map;
|
|
|
|
u64 devid = btrfs_stack_device_id(&fs_info->super_copy->dev_item);
|
|
|
|
int i;
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
ret = remove_all_dev_extents(trans);
|
|
|
|
if (ret < 0) {
|
|
|
|
errno = -ret;
|
|
|
|
error("failed to remove all existing dev extents: %m");
|
|
|
|
}
|
|
|
|
|
|
|
|
dev = btrfs_find_device(fs_info, devid, NULL, NULL);
|
|
|
|
if (!dev) {
|
2020-03-27 20:36:52 +00:00
|
|
|
error("failed to find devid %llu", devid);
|
2018-11-27 08:38:27 +00:00
|
|
|
return -ENODEV;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Rebuild all dev extents using chunk maps */
|
|
|
|
for (ce = search_cache_extent(&map_tree->cache_tree, 0); ce;
|
|
|
|
ce = next_cache_extent(ce)) {
|
|
|
|
u64 stripe_len;
|
|
|
|
|
|
|
|
map = container_of(ce, struct map_lookup, ce);
|
|
|
|
stripe_len = calc_stripe_length(map->type, ce->size,
|
|
|
|
map->num_stripes);
|
|
|
|
for (i = 0; i < map->num_stripes; i++) {
|
|
|
|
ret = btrfs_insert_dev_extent(trans, dev, ce->start,
|
|
|
|
stripe_len, map->stripes[i].physical);
|
|
|
|
if (ret < 0) {
|
|
|
|
errno = -ret;
|
|
|
|
error(
|
|
|
|
"failed to insert dev extent %llu %llu: %m",
|
|
|
|
devid, map->stripes[i].physical);
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
out:
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2020-05-27 10:28:10 +00:00
|
|
|
static int iter_tree_blocks(struct btrfs_fs_info *fs_info,
|
|
|
|
struct extent_buffer *eb, bool pin)
|
|
|
|
{
|
|
|
|
void (*func)(struct btrfs_fs_info *fs_info, u64 bytenr, u64 num_bytes);
|
|
|
|
int nritems;
|
|
|
|
int level;
|
|
|
|
int i;
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
if (pin)
|
|
|
|
func = btrfs_pin_extent;
|
|
|
|
else
|
|
|
|
func = btrfs_unpin_extent;
|
|
|
|
|
|
|
|
func(fs_info, eb->start, eb->len);
|
|
|
|
|
|
|
|
level = btrfs_header_level(eb);
|
|
|
|
nritems = btrfs_header_nritems(eb);
|
|
|
|
if (level == 0)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
for (i = 0; i < nritems; i++) {
|
|
|
|
u64 bytenr;
|
|
|
|
struct extent_buffer *tmp;
|
|
|
|
|
|
|
|
if (level == 0) {
|
|
|
|
struct btrfs_root_item *ri;
|
|
|
|
struct btrfs_key key;
|
|
|
|
|
|
|
|
btrfs_item_key_to_cpu(eb, &key, i);
|
|
|
|
if (key.type != BTRFS_ROOT_ITEM_KEY)
|
|
|
|
continue;
|
|
|
|
ri = btrfs_item_ptr(eb, i, struct btrfs_root_item);
|
|
|
|
bytenr = btrfs_disk_root_bytenr(eb, ri);
|
|
|
|
tmp = read_tree_block(fs_info, bytenr, 0);
|
|
|
|
if (!extent_buffer_uptodate(tmp)) {
|
|
|
|
error("unable to read log root block");
|
|
|
|
return -EIO;
|
|
|
|
}
|
|
|
|
ret = iter_tree_blocks(fs_info, tmp, pin);
|
|
|
|
free_extent_buffer(tmp);
|
|
|
|
if (ret)
|
|
|
|
return ret;
|
|
|
|
} else {
|
|
|
|
bytenr = btrfs_node_blockptr(eb, i);
|
|
|
|
tmp = read_tree_block(fs_info, bytenr, 0);
|
|
|
|
if (!extent_buffer_uptodate(tmp)) {
|
|
|
|
error("unable to read log root block");
|
|
|
|
return -EIO;
|
|
|
|
}
|
|
|
|
ret = iter_tree_blocks(fs_info, tmp, pin);
|
|
|
|
free_extent_buffer(tmp);
|
|
|
|
if (ret)
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2018-11-27 08:38:24 +00:00
|
|
|
static int fixup_chunks_and_devices(struct btrfs_fs_info *fs_info,
|
2018-10-08 12:18:35 +00:00
|
|
|
struct mdrestore_struct *mdres, int out_fd)
|
2018-11-27 08:38:24 +00:00
|
|
|
{
|
|
|
|
struct btrfs_trans_handle *trans;
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
if (btrfs_super_log_root(fs_info->super_copy)) {
|
|
|
|
warning(
|
|
|
|
"log tree detected, its generation will not match superblock");
|
|
|
|
}
|
|
|
|
trans = btrfs_start_transaction(fs_info->tree_root, 1);
|
|
|
|
if (IS_ERR(trans)) {
|
|
|
|
error("cannot start transaction %ld", PTR_ERR(trans));
|
|
|
|
return PTR_ERR(trans);
|
|
|
|
}
|
|
|
|
|
2020-05-27 10:28:10 +00:00
|
|
|
if (btrfs_super_log_root(fs_info->super_copy) && fs_info->log_root_tree)
|
|
|
|
iter_tree_blocks(fs_info, fs_info->log_root_tree->node, true);
|
2019-12-18 05:18:47 +00:00
|
|
|
fixup_block_groups(trans);
|
2018-11-27 08:38:27 +00:00
|
|
|
ret = fixup_dev_extents(trans);
|
|
|
|
if (ret < 0)
|
|
|
|
goto error;
|
|
|
|
|
2018-10-08 12:18:35 +00:00
|
|
|
ret = fixup_device_size(trans, mdres, out_fd);
|
2018-11-27 08:38:24 +00:00
|
|
|
if (ret < 0)
|
|
|
|
goto error;
|
|
|
|
|
2015-01-28 20:38:03 +00:00
|
|
|
ret = btrfs_commit_transaction(trans, fs_info->tree_root);
|
|
|
|
if (ret) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("unable to commit transaction: %d", ret);
|
2015-01-28 20:38:03 +00:00
|
|
|
return ret;
|
|
|
|
}
|
2020-05-27 10:28:10 +00:00
|
|
|
if (btrfs_super_log_root(fs_info->super_copy) && fs_info->log_root_tree)
|
|
|
|
iter_tree_blocks(fs_info, fs_info->log_root_tree->node, false);
|
2015-01-28 20:38:03 +00:00
|
|
|
return 0;
|
2018-11-27 08:38:24 +00:00
|
|
|
error:
|
|
|
|
errno = -ret;
|
|
|
|
error(
|
|
|
|
"failed to fix chunks and devices mapping, the fs may not be mountable: %m");
|
|
|
|
btrfs_abort_transaction(trans, ret);
|
|
|
|
return ret;
|
2015-01-28 20:38:03 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
static int restore_metadump(const char *input, FILE *out, int old_restore,
|
|
|
|
int num_threads, int fixup_offset,
|
|
|
|
const char *target, int multi_devices)
|
2008-11-20 14:52:48 +00:00
|
|
|
{
|
2013-03-04 22:39:55 +00:00
|
|
|
struct meta_cluster *cluster = NULL;
|
2008-11-20 14:52:48 +00:00
|
|
|
struct meta_cluster_header *header;
|
|
|
|
struct mdrestore_struct mdrestore;
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
struct btrfs_fs_info *info = NULL;
|
2008-11-20 14:52:48 +00:00
|
|
|
u64 bytenr = 0;
|
2013-03-04 22:39:55 +00:00
|
|
|
FILE *in = NULL;
|
2013-03-18 18:50:45 +00:00
|
|
|
int ret = 0;
|
2008-11-20 14:52:48 +00:00
|
|
|
|
|
|
|
if (!strcmp(input, "-")) {
|
|
|
|
in = stdin;
|
|
|
|
} else {
|
|
|
|
in = fopen(input, "r");
|
|
|
|
if (!in) {
|
2018-01-07 21:54:21 +00:00
|
|
|
error("unable to open metadump image: %m");
|
2009-01-21 18:22:49 +00:00
|
|
|
return 1;
|
2008-11-20 14:52:48 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
/* NOTE: open with write mode */
|
|
|
|
if (fixup_offset) {
|
2016-03-07 04:57:41 +00:00
|
|
|
info = open_ctree_fs_info(target, 0, 0, 0,
|
2013-10-28 18:28:43 +00:00
|
|
|
OPEN_CTREE_WRITES |
|
|
|
|
OPEN_CTREE_RESTORE |
|
|
|
|
OPEN_CTREE_PARTIAL);
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
if (!info) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("open ctree failed");
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
ret = -EIO;
|
|
|
|
goto failed_open;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2008-11-20 14:52:48 +00:00
|
|
|
cluster = malloc(BLOCK_SIZE);
|
2013-03-18 18:50:45 +00:00
|
|
|
if (!cluster) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("not enough memory for cluster");
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
ret = -ENOMEM;
|
|
|
|
goto failed_info;
|
2013-03-18 18:50:45 +00:00
|
|
|
}
|
2008-11-20 14:52:48 +00:00
|
|
|
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
ret = mdrestore_init(&mdrestore, in, out, old_restore, num_threads,
|
|
|
|
fixup_offset, info, multi_devices);
|
2013-03-18 18:50:45 +00:00
|
|
|
if (ret) {
|
2017-01-06 03:40:47 +00:00
|
|
|
error("failed to initialize metadata restore state: %d", ret);
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
goto failed_cluster;
|
2013-03-18 18:50:45 +00:00
|
|
|
}
|
2008-11-20 14:52:48 +00:00
|
|
|
|
2014-06-26 02:53:01 +00:00
|
|
|
if (!multi_devices && !old_restore) {
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
ret = build_chunk_tree(&mdrestore, cluster);
|
2019-07-04 06:10:54 +00:00
|
|
|
if (ret) {
|
|
|
|
error("failed to build chunk tree");
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
goto out;
|
2019-07-04 06:10:54 +00:00
|
|
|
}
|
2015-01-26 01:39:24 +00:00
|
|
|
if (!list_empty(&mdrestore.overlapping_chunks))
|
|
|
|
remap_overlapping_chunks(&mdrestore);
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
}
|
2013-05-08 15:40:36 +00:00
|
|
|
|
|
|
|
if (in != stdin && fseek(in, 0, SEEK_SET)) {
|
2018-01-07 21:54:21 +00:00
|
|
|
error("seek failed: %m");
|
2013-05-08 15:40:36 +00:00
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
|
2015-02-06 19:40:45 +00:00
|
|
|
while (!mdrestore.error) {
|
2008-11-20 14:52:48 +00:00
|
|
|
ret = fread(cluster, BLOCK_SIZE, 1, in);
|
|
|
|
if (!ret)
|
|
|
|
break;
|
|
|
|
|
|
|
|
header = &cluster->header;
|
|
|
|
if (le64_to_cpu(header->magic) != HEADER_MAGIC ||
|
|
|
|
le64_to_cpu(header->bytenr) != bytenr) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("bad header in metadump image");
|
2013-03-18 18:50:45 +00:00
|
|
|
ret = -EIO;
|
|
|
|
break;
|
2008-11-20 14:52:48 +00:00
|
|
|
}
|
|
|
|
ret = add_cluster(cluster, &mdrestore, &bytenr);
|
2013-03-18 18:50:45 +00:00
|
|
|
if (ret) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("failed to add cluster: %d", ret);
|
2013-03-18 18:50:45 +00:00
|
|
|
break;
|
|
|
|
}
|
2008-11-20 14:52:48 +00:00
|
|
|
}
|
2015-02-06 19:40:45 +00:00
|
|
|
ret = wait_for_worker(&mdrestore);
|
2015-01-28 20:38:03 +00:00
|
|
|
|
2020-05-27 10:28:09 +00:00
|
|
|
if (!ret && !multi_devices && !old_restore &&
|
|
|
|
btrfs_super_num_devices(mdrestore.original_super) != 1) {
|
2015-02-03 14:48:57 +00:00
|
|
|
struct btrfs_root *root;
|
2015-01-28 20:38:03 +00:00
|
|
|
struct stat st;
|
|
|
|
|
2015-02-03 14:48:57 +00:00
|
|
|
root = open_ctree_fd(fileno(out), target, 0,
|
2015-01-28 20:38:03 +00:00
|
|
|
OPEN_CTREE_PARTIAL |
|
2015-02-03 14:48:57 +00:00
|
|
|
OPEN_CTREE_WRITES |
|
|
|
|
OPEN_CTREE_NO_DEVICES);
|
|
|
|
if (!root) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("open ctree failed in %s", target);
|
2015-01-28 20:38:03 +00:00
|
|
|
ret = -EIO;
|
|
|
|
goto out;
|
|
|
|
}
|
2015-02-03 14:48:57 +00:00
|
|
|
info = root->fs_info;
|
2015-01-28 20:38:03 +00:00
|
|
|
|
|
|
|
if (stat(target, &st)) {
|
2018-01-07 21:54:21 +00:00
|
|
|
error("stat %s failed: %m", target);
|
2015-01-28 20:38:03 +00:00
|
|
|
close_ctree(info->chunk_root);
|
2016-07-15 14:27:06 +00:00
|
|
|
free(cluster);
|
2015-01-28 20:38:03 +00:00
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
|
2018-10-08 12:18:35 +00:00
|
|
|
ret = fixup_chunks_and_devices(info, &mdrestore, fileno(out));
|
2015-01-28 20:38:03 +00:00
|
|
|
close_ctree(info->chunk_root);
|
|
|
|
if (ret)
|
|
|
|
goto out;
|
|
|
|
}
|
2013-05-08 15:40:36 +00:00
|
|
|
out:
|
2014-03-21 01:06:23 +00:00
|
|
|
mdrestore_destroy(&mdrestore, num_threads);
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
failed_cluster:
|
2008-11-20 14:52:48 +00:00
|
|
|
free(cluster);
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
failed_info:
|
|
|
|
if (fixup_offset && info)
|
|
|
|
close_ctree(info->chunk_root);
|
|
|
|
failed_open:
|
2008-11-20 14:52:48 +00:00
|
|
|
if (in != stdin)
|
|
|
|
fclose(in);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
/*
 * Write a superblock for device @cur_devid to @other_dev.
 *
 * The device item with key (BTRFS_DEV_ITEMS_OBJECTID, BTRFS_DEV_ITEM_KEY,
 * @cur_devid) is looked up in info->chunk_root.  A copy of info->super_copy
 * gets its embedded dev_item filled from that item, is checksummed with
 * csum_block() and written at BTRFS_SUPER_INFO_OFFSET of @other_dev, followed
 * by write_backup_supers().
 *
 * @info:      filesystem whose chunk root and super copy are used
 * @other_dev: path of the device/file to write to (created if missing)
 * @cur_devid: devid of the device item to look up
 *
 * Returns 0 on success, -EIO on any failure.
 */
static int update_disk_super_on_device(struct btrfs_fs_info *info,
				       const char *other_dev, u64 cur_devid)
{
	struct btrfs_key key;
	struct extent_buffer *leaf;
	struct btrfs_path path;
	struct btrfs_dev_item *dev_item;
	struct btrfs_super_block *disk_super;
	char dev_uuid[BTRFS_UUID_SIZE];
	char fs_uuid[BTRFS_UUID_SIZE];
	u64 devid, type, io_align, io_width;
	u64 sector_size, total_bytes, bytes_used;
	char buf[BTRFS_SUPER_INFO_SIZE];
	int fp = -1;
	int ret;

	key.objectid = BTRFS_DEV_ITEMS_OBJECTID;
	key.type = BTRFS_DEV_ITEM_KEY;
	key.offset = cur_devid;

	btrfs_init_path(&path);
	ret = btrfs_search_slot(NULL, info->chunk_root, &key, &path, 0, 0);
	if (ret) {
		error("search key failed: %d", ret);
		/* Do not leave the path populated on the error exit */
		btrfs_release_path(&path);
		ret = -EIO;
		goto out;
	}

	leaf = path.nodes[0];
	dev_item = btrfs_item_ptr(leaf, path.slots[0],
				  struct btrfs_dev_item);

	devid = btrfs_device_id(leaf, dev_item);
	if (devid != cur_devid) {
		error("devid mismatch: %llu != %llu",
		      (unsigned long long)devid,
		      (unsigned long long)cur_devid);
		btrfs_release_path(&path);
		ret = -EIO;
		goto out;
	}

	/* Copy everything needed out of the leaf before the path is released */
	type = btrfs_device_type(leaf, dev_item);
	io_align = btrfs_device_io_align(leaf, dev_item);
	io_width = btrfs_device_io_width(leaf, dev_item);
	sector_size = btrfs_device_sector_size(leaf, dev_item);
	total_bytes = btrfs_device_total_bytes(leaf, dev_item);
	bytes_used = btrfs_device_bytes_used(leaf, dev_item);
	read_extent_buffer(leaf, dev_uuid,
			   (unsigned long)btrfs_device_uuid(dev_item),
			   BTRFS_UUID_SIZE);
	read_extent_buffer(leaf, fs_uuid,
			   (unsigned long)btrfs_device_fsid(dev_item),
			   BTRFS_UUID_SIZE);

	btrfs_release_path(&path);

	printf("update disk super on %s devid=%llu\n", other_dev,
	       (unsigned long long)devid);

	/* update other devices' super block */
	fp = open(other_dev, O_CREAT | O_RDWR, 0600);
	if (fp < 0) {
		error("could not open %s: %m", other_dev);
		ret = -EIO;
		goto out;
	}

	memcpy(buf, info->super_copy, BTRFS_SUPER_INFO_SIZE);

	disk_super = (struct btrfs_super_block *)buf;
	dev_item = &disk_super->dev_item;

	btrfs_set_stack_device_type(dev_item, type);
	btrfs_set_stack_device_id(dev_item, devid);
	btrfs_set_stack_device_total_bytes(dev_item, total_bytes);
	btrfs_set_stack_device_bytes_used(dev_item, bytes_used);
	btrfs_set_stack_device_io_align(dev_item, io_align);
	btrfs_set_stack_device_io_width(dev_item, io_width);
	btrfs_set_stack_device_sector_size(dev_item, sector_size);
	memcpy(dev_item->uuid, dev_uuid, BTRFS_UUID_SIZE);
	memcpy(dev_item->fsid, fs_uuid, BTRFS_UUID_SIZE);
	csum_block((u8 *)buf, BTRFS_SUPER_INFO_SIZE);

	ret = pwrite64(fp, buf, BTRFS_SUPER_INFO_SIZE, BTRFS_SUPER_INFO_OFFSET);
	if (ret != BTRFS_SUPER_INFO_SIZE) {
		/*
		 * On failure the write call returns -1 and leaves the reason
		 * in errno, so errno is printed as is; a short write has no
		 * errno to report.
		 */
		if (ret < 0)
			error("cannot write superblock: %m");
		else
			error("cannot write superblock");
		ret = -EIO;
		goto out;
	}

	write_backup_supers(fp, (u8 *)buf);

	/* ret still holds the byte count of the write; report plain success */
	ret = 0;
out:
	if (fp != -1)
		close(fp);
	return ret;
}
|
|
|
|
|
2015-06-10 22:04:19 +00:00
|
|
|
/*
 * Print the btrfs-image command line help to stdout and terminate the
 * process.
 *
 * @ret: status handed to exit(); this function never returns.
 */
static void print_usage(int ret)
{
	/* One entry per output line, emitted in order. */
	static const char * const usage_lines[] = {
		"usage: btrfs-image [options] source target\n",
		"\t-r \trestore metadump image\n",
		"\t-c value\tcompression level (0 ~ 9)\n",
		"\t-t value\tnumber of threads (1 ~ 32)\n",
		"\t-o \tdon't mess with the chunk tree when restoring\n",
		"\t-s \tsanitize file names, use once to just use garbage, use twice if you want crc collisions\n",
		"\t-w \twalk all trees instead of using extent tree, do this if your extent tree is broken\n",
		"\t-m \trestore for multiple devices\n",
		"\n",
		"\tIn the dump mode, source is the btrfs device and target is the output file (use '-' for stdout).\n",
		"\tIn the restore mode, source is the dumped image and target is the btrfs device/file.\n",
	};
	size_t idx;

	for (idx = 0; idx < sizeof(usage_lines) / sizeof(usage_lines[0]); idx++)
		fputs(usage_lines[idx], stdout);

	exit(ret);
}
|
|
|
|
|
2015-06-21 16:23:19 +00:00
|
|
|
int BOX_MAIN(image)(int argc, char *argv[])
|
2008-11-20 14:52:48 +00:00
|
|
|
{
|
|
|
|
char *source;
|
|
|
|
char *target;
|
2015-09-09 13:32:21 +00:00
|
|
|
u64 num_threads = 0;
|
2014-02-20 01:30:51 +00:00
|
|
|
u64 compress_level = 0;
|
2008-11-20 14:52:48 +00:00
|
|
|
int create = 1;
|
2013-03-27 20:55:41 +00:00
|
|
|
int old_restore = 0;
|
2013-03-28 14:26:09 +00:00
|
|
|
int walk_trees = 0;
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
int multi_devices = 0;
|
2008-11-20 14:52:48 +00:00
|
|
|
int ret;
|
2017-10-19 23:01:43 +00:00
|
|
|
enum sanitize_mode sanitize = SANITIZE_NONE;
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
int dev_cnt = 0;
|
2014-06-24 03:16:12 +00:00
|
|
|
int usage_error = 0;
|
2008-11-20 14:52:48 +00:00
|
|
|
FILE *out;
|
|
|
|
|
|
|
|
while (1) {
|
2015-06-10 22:04:19 +00:00
|
|
|
static const struct option long_options[] = {
|
|
|
|
{ "help", no_argument, NULL, GETOPT_VAL_HELP},
|
|
|
|
{ NULL, 0, NULL, 0 }
|
|
|
|
};
|
|
|
|
int c = getopt_long(argc, argv, "rc:t:oswm", long_options, NULL);
|
2008-11-20 14:52:48 +00:00
|
|
|
if (c < 0)
|
|
|
|
break;
|
|
|
|
switch (c) {
|
|
|
|
case 'r':
|
|
|
|
create = 0;
|
|
|
|
break;
|
|
|
|
case 't':
|
2014-02-20 01:30:51 +00:00
|
|
|
num_threads = arg_strtou64(optarg);
|
2016-11-02 23:53:43 +00:00
|
|
|
if (num_threads > MAX_WORKER_THREADS) {
|
|
|
|
error("number of threads out of range: %llu > %d",
|
|
|
|
(unsigned long long)num_threads,
|
|
|
|
MAX_WORKER_THREADS);
|
2016-09-03 18:34:47 +00:00
|
|
|
return 1;
|
|
|
|
}
|
2008-11-20 14:52:48 +00:00
|
|
|
break;
|
|
|
|
case 'c':
|
2014-02-20 01:30:51 +00:00
|
|
|
compress_level = arg_strtou64(optarg);
|
2016-09-03 18:34:47 +00:00
|
|
|
if (compress_level > 9) {
|
|
|
|
error("compression level out of range: %llu",
|
|
|
|
(unsigned long long)compress_level);
|
|
|
|
return 1;
|
|
|
|
}
|
2008-11-20 14:52:48 +00:00
|
|
|
break;
|
2013-03-27 20:55:41 +00:00
|
|
|
case 'o':
|
|
|
|
old_restore = 1;
|
|
|
|
break;
|
2013-03-22 14:52:07 +00:00
|
|
|
case 's':
|
2017-10-19 23:01:43 +00:00
|
|
|
if (sanitize == SANITIZE_NONE)
|
|
|
|
sanitize = SANITIZE_NAMES;
|
|
|
|
else if (sanitize == SANITIZE_NAMES)
|
|
|
|
sanitize = SANITIZE_COLLISIONS;
|
2013-03-22 14:52:07 +00:00
|
|
|
break;
|
2013-03-28 14:26:09 +00:00
|
|
|
case 'w':
|
|
|
|
walk_trees = 1;
|
|
|
|
break;
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
case 'm':
|
|
|
|
create = 0;
|
|
|
|
multi_devices = 1;
|
|
|
|
break;
|
2019-06-06 11:06:04 +00:00
|
|
|
case GETOPT_VAL_HELP:
|
2008-11-20 14:52:48 +00:00
|
|
|
default:
|
2015-06-10 22:04:19 +00:00
|
|
|
print_usage(c != GETOPT_VAL_HELP);
|
2008-11-20 14:52:48 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-06-30 03:54:12 +00:00
|
|
|
set_argv0(argv);
|
2016-03-01 15:29:16 +00:00
|
|
|
if (check_argc_min(argc - optind, 2))
|
2015-06-10 22:04:19 +00:00
|
|
|
print_usage(1);
|
2014-06-30 03:54:12 +00:00
|
|
|
|
2016-03-01 15:29:16 +00:00
|
|
|
dev_cnt = argc - optind - 1;
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
|
2014-06-24 03:16:12 +00:00
|
|
|
if (create) {
|
|
|
|
if (old_restore) {
|
2016-09-30 11:00:24 +00:00
|
|
|
error(
|
|
|
|
"create and restore cannot be used at the same time");
|
2014-06-24 03:16:12 +00:00
|
|
|
usage_error++;
|
|
|
|
}
|
|
|
|
} else {
|
2017-10-19 23:01:43 +00:00
|
|
|
if (walk_trees || sanitize != SANITIZE_NONE || compress_level) {
|
2016-09-30 11:00:24 +00:00
|
|
|
error(
|
2018-11-26 17:08:21 +00:00
|
|
|
"using -w, -s, -c options for restore makes no sense");
|
2014-06-24 03:16:12 +00:00
|
|
|
usage_error++;
|
|
|
|
}
|
|
|
|
if (multi_devices && dev_cnt < 2) {
|
2016-09-30 11:00:24 +00:00
|
|
|
error("not enough devices specified for -m option");
|
2014-06-24 03:16:12 +00:00
|
|
|
usage_error++;
|
|
|
|
}
|
|
|
|
if (!multi_devices && dev_cnt != 1) {
|
2016-09-30 11:00:24 +00:00
|
|
|
error("accepts only 1 device without -m option");
|
2014-06-24 03:16:12 +00:00
|
|
|
usage_error++;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (usage_error)
|
2015-06-10 22:04:19 +00:00
|
|
|
print_usage(1);
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
|
2008-11-20 14:52:48 +00:00
|
|
|
source = argv[optind];
|
|
|
|
target = argv[optind + 1];
|
|
|
|
|
|
|
|
if (create && !strcmp(target, "-")) {
|
|
|
|
out = stdout;
|
|
|
|
} else {
|
|
|
|
out = fopen(target, "w+");
|
|
|
|
if (!out) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("unable to create target file %s", target);
|
2008-11-20 14:52:48 +00:00
|
|
|
exit(1);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2015-09-09 13:32:22 +00:00
|
|
|
if (compress_level > 0 || create == 0) {
|
|
|
|
if (num_threads == 0) {
|
2015-10-30 14:34:55 +00:00
|
|
|
long tmp = sysconf(_SC_NPROCESSORS_ONLN);
|
|
|
|
|
|
|
|
if (tmp <= 0)
|
|
|
|
tmp = 1;
|
btrfs-progs: image: Fix a access-beyond-boundary bug when there are 32 online CPUs
[BUG]
When there are over 32 (in my example, 35) online CPUs, btrfs-image -c9
will just hang.
[CAUSE]
Btrfs-image has a hard coded limit (32) on how many threads we can use.
For the "-t" option we do the up limit check.
But when we don't specify "-t" option and speicified "-c" option, then
btrfs-image will try to auto detect the number of online CPUs, and use
it without checking if it's over the up limit.
And for num_threads larger than the up limit, we will over write the
adjust members of metadump_struct/mdrestore_struct, corrupting
pthread_mutex_t and pthread_cond_t, causing synchronising problem.
Nowadays, with SMT/HT and higher cpu core counts, it's not hard to go
beyond 32 threads, and hit the bug.
[FIX]
Just do extra num_threads check before using the number from sysconf().
Reviewed-by: Su Yue <Damenly_Su@gmx.com>
Signed-off-by: Qu Wenruo <wqu@suse.com>
Signed-off-by: David Sterba <dsterba@suse.com>
2019-06-06 11:06:05 +00:00
|
|
|
tmp = min_t(long, tmp, MAX_WORKER_THREADS);
|
2015-10-30 14:34:55 +00:00
|
|
|
num_threads = tmp;
|
2015-09-09 13:32:22 +00:00
|
|
|
}
|
|
|
|
} else {
|
|
|
|
num_threads = 0;
|
2008-11-20 14:52:48 +00:00
|
|
|
}
|
|
|
|
|
2014-07-07 01:56:51 +00:00
|
|
|
if (create) {
|
|
|
|
ret = check_mounted(source);
|
|
|
|
if (ret < 0) {
|
2018-10-25 12:10:54 +00:00
|
|
|
errno = -ret;
|
|
|
|
warning("unable to check mount status of: %m");
|
2016-09-08 13:57:42 +00:00
|
|
|
} else if (ret) {
|
|
|
|
warning("%s already mounted, results may be inaccurate",
|
|
|
|
source);
|
|
|
|
}
|
2014-07-07 01:56:51 +00:00
|
|
|
|
2008-11-20 14:52:48 +00:00
|
|
|
ret = create_metadump(source, out, num_threads,
|
2013-03-22 14:52:07 +00:00
|
|
|
compress_level, sanitize, walk_trees);
|
2014-07-07 01:56:51 +00:00
|
|
|
} else {
|
2015-02-06 19:40:45 +00:00
|
|
|
ret = restore_metadump(source, out, old_restore, num_threads,
|
2015-01-28 20:38:03 +00:00
|
|
|
0, target, multi_devices);
|
2014-07-07 01:56:51 +00:00
|
|
|
}
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
if (ret) {
|
2019-07-04 06:10:55 +00:00
|
|
|
error("%s failed: %d", (create) ? "create" : "restore", ret);
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* extended support for multiple devices */
|
|
|
|
if (!create && multi_devices) {
|
|
|
|
struct btrfs_fs_info *info;
|
|
|
|
u64 total_devs;
|
|
|
|
int i;
|
|
|
|
|
2016-03-07 04:57:41 +00:00
|
|
|
info = open_ctree_fs_info(target, 0, 0, 0,
|
2013-10-28 18:28:43 +00:00
|
|
|
OPEN_CTREE_PARTIAL |
|
|
|
|
OPEN_CTREE_RESTORE);
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
if (!info) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("open ctree failed at %s", target);
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
total_devs = btrfs_super_num_devices(info->super_copy);
|
|
|
|
if (total_devs != dev_cnt) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("it needs %llu devices but has only %d",
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
total_devs, dev_cnt);
|
|
|
|
close_ctree(info->chunk_root);
|
|
|
|
goto out;
|
|
|
|
}
|
2008-11-20 14:52:48 +00:00
|
|
|
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
/* update super block on other disks */
|
|
|
|
for (i = 2; i <= dev_cnt; i++) {
|
|
|
|
ret = update_disk_super_on_device(info,
|
|
|
|
argv[optind + i], (u64)i);
|
|
|
|
if (ret) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("update disk superblock failed devid %d: %d",
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
i, ret);
|
|
|
|
close_ctree(info->chunk_root);
|
|
|
|
exit(1);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
close_ctree(info->chunk_root);
|
|
|
|
|
|
|
|
/* fix metadata block to map correct chunk */
|
2015-01-28 20:38:03 +00:00
|
|
|
ret = restore_metadump(source, out, 0, num_threads, 1,
|
|
|
|
target, 1);
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
if (ret) {
|
2016-09-08 13:57:42 +00:00
|
|
|
error("unable to fixup metadump: %d", ret);
|
Btrfs-progs: enhance btrfs-image to restore image onto multiple disks
This adds a 'btrfs-image -m' option, which let us restore an image that
is built from a btrfs of multiple disks onto several disks altogether.
This aims to address the following case,
$ mkfs.btrfs -m raid0 sda sdb
$ btrfs-image sda image.file
$ btrfs-image -r image.file sdc
---------
so we can only restore metadata onto sdc, and another thing is we can
only mount sdc with degraded mode as we don't provide informations of
another disk. And, it's built as RAID0 and we have only one disk,
so after mount sdc we'll get into readonly mode.
This is just annoying for people(like me) who're trying to restore image
but turn to find they cannot make it work.
So this'll make your life easier, just tap
$ btrfs-image -m image.file sdc sdd
---------
then you get everything about metadata done, the same offset with that of
the originals(of course, you need offer enough disk size, at least the disk
size of the original disks).
Besides, this also works with raid5 and raid6 metadata image.
Signed-off-by: Liu Bo <bo.li.liu@oracle.com>
Signed-off-by: Chris Mason <chris.mason@fusionio.com>
2013-06-22 05:32:45 +00:00
|
|
|
exit(1);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
out:
|
2014-06-24 03:16:45 +00:00
|
|
|
if (out == stdout) {
|
2008-11-20 14:52:48 +00:00
|
|
|
fflush(out);
|
2014-06-24 03:16:45 +00:00
|
|
|
} else {
|
2008-11-20 14:52:48 +00:00
|
|
|
fclose(out);
|
2014-06-24 03:16:45 +00:00
|
|
|
if (ret && create) {
|
|
|
|
int unlink_ret;
|
|
|
|
|
|
|
|
unlink_ret = unlink(target);
|
|
|
|
if (unlink_ret)
|
2018-01-07 21:54:21 +00:00
|
|
|
error("unlink output file %s failed: %m",
|
|
|
|
target);
|
2014-06-24 03:16:45 +00:00
|
|
|
}
|
|
|
|
}
|
2008-11-20 14:52:48 +00:00
|
|
|
|
2015-09-09 13:32:23 +00:00
|
|
|
btrfs_close_all_devices();
|
|
|
|
|
2013-09-04 15:22:30 +00:00
|
|
|
return !!ret;
|
2008-11-20 14:52:48 +00:00
|
|
|
}
|