ceph/src/tools/osdmaptool.cc
Jan Fajerski d544dfb549 Merge PR #32777 into master
* refs/pull/32777/head:
	common,log,msg: Fix win32 compiler warnings
	win32,common: provide a default ceph.conf location
	common: add newline before parsing config on Windows
	common: verify unix sockets support on Windows
	common: fix md_config_t::get_cluster_name
	global, common: Print config parse errors
	common: accept config files containing whitespaces
	librbd: avoid broken mingw rng
	common: define DEV_NULL
	tools,common,msg: Use O_BINARY for win32 compatibility
	log: fix timestamps on Windows
	common,librbd: add portable ceph_memzero_s
	common,msg: Fix socket handling
	common: Extend win32 compatbility layer

Reviewed-by: Jason Dillaman <dillaman@redhat.com>
2020-11-09 14:10:36 +01:00

847 lines
29 KiB
C++

// -*- mode:C++; tab-width:8; c-basic-offset:2; indent-tabs-mode:t -*-
// vim: ts=8 sw=2 smarttab
/*
* Ceph - scalable distributed file system
*
* Copyright (C) 2004-2006 Sage Weil <sage@newdream.net>
*
* This is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License version 2.1, as published by the Free Software
* Foundation. See file COPYING.
*
*/
#include <string>
#include <sys/stat.h>
#include "common/ceph_argparse.h"
#include "common/errno.h"
#include "common/safe_io.h"
#include "include/random.h"
#include "mon/health_check.h"
#include <time.h>
#include <algorithm>
#include "global/global_init.h"
#include "osd/OSDMap.h"
// Print the command-line help text to stdout, one entry per line, and
// terminate the process with exit status 1.  This function never returns.
void usage()
{
  // Each entry is emitted verbatim followed by std::endl.
  static const char* const help_lines[] = {
    " usage: [--print] <mapfilename>",
    " --create-from-conf creates an osd map with default configurations",
    " --createsimple <numosd> [--clobber] [--pg-bits <bitsperosd>] [--pgp-bits <bits>] creates a relatively generic OSD map with <numosd> devices",
    " --pgp-bits <bits> pgp_num map attribute will be shifted by <bits>",
    " --pg-bits <bits> pg_num map attribute will be shifted by <bits>",
    " --clobber allows osdmaptool to overwrite <mapfilename> if it already exists",
    " --export-crush <file> write osdmap's crush map to <file>",
    " --import-crush <file> replace osdmap's crush map with <file>",
    " --health dump health checks",
    " --test-map-pgs [--pool <poolid>] [--pg_num <pg_num>] [--range-first <first> --range-last <last>] map all pgs",
    " --test-map-pgs-dump [--pool <poolid>] [--range-first <first> --range-last <last>] map all pgs",
    " --test-map-pgs-dump-all [--pool <poolid>] [--range-first <first> --range-last <last>] map all pgs to osds",
    " --mark-up-in mark osds up and in (but do not persist)",
    " --mark-out <osdid> mark an osd as out (but do not persist)",
    " --mark-up <osdid> mark an osd as up (but do not persist)",
    " --mark-in <osdid> mark an osd as in (but do not persist)",
    " --with-default-pool include default pool when creating map",
    " --clear-temp clear pg_temp and primary_temp",
    " --clean-temps clean pg_temps",
    " --test-random do random placements",
    " --test-map-pg <pgid> map a pgid to osds",
    " --test-map-object <objectname> [--pool <poolid>] map an object to osds",
    " --upmap-cleanup <file> clean up pg_upmap[_items] entries, writing",
    " commands to <file> [default: - for stdout]",
    " --upmap <file> calculate pg upmap entries to balance pg layout",
    " writing commands to <file> [default: - for stdout]",
    " --upmap-max <max-count> set max upmap entries to calculate [default: 10]",
    " --upmap-deviation <max-deviation>",
    " max deviation from target [default: 5]",
    " --upmap-pool <poolname> restrict upmap balancing to 1 or more pools",
    " --upmap-active Act like an active balancer, keep applying changes until balanced",
    " --dump <format> displays the map in plain text when <format> is 'plain', 'json' if specified format is not supported",
    " --tree displays a tree of the map",
    " --test-crush [--range-first <first> --range-last <last>] map pgs to acting osds",
    " --adjust-crush-weight <osdid:weight>[,<osdid:weight>,<...>] change <osdid> CRUSH <weight> (but do not persist)",
    " --save write modified osdmap with upmap or crush-adjust changes",
  };

  for (const char* text : help_lines) {
    std::cout << text << std::endl;
  }
  exit(1);
}
// Render the pg-upmap changes carried by `pending_inc` as a sequence of
// "ceph osd ..." command lines and write them to file descriptor `fd`.
//
// Output order: removals of pg_upmap entries, new pg_upmap entries,
// removals of pg_upmap_items entries, then new pg_upmap_items entries.
// If the write fails, an error is printed to stderr and the process exits
// with status 1.
void print_inc_upmaps(const OSDMap::Incremental& pending_inc, int fd)
{
  std::ostringstream commands;

  for (const auto& pgid : pending_inc.old_pg_upmap) {
    commands << "ceph osd rm-pg-upmap " << pgid << '\n';
  }

  for (const auto& entry : pending_inc.new_pg_upmap) {
    commands << "ceph osd pg-upmap " << entry.first;
    for (const auto& target : entry.second) {
      commands << " " << target;
    }
    commands << '\n';
  }

  for (const auto& pgid : pending_inc.old_pg_upmap_items) {
    commands << "ceph osd rm-pg-upmap-items " << pgid << '\n';
  }

  for (const auto& entry : pending_inc.new_pg_upmap_items) {
    commands << "ceph osd pg-upmap-items " << entry.first;
    for (const auto& mapping : entry.second) {
      commands << " " << mapping.first << " " << mapping.second;
    }
    commands << '\n';
  }

  const std::string text = commands.str();
  const int rc = safe_write(fd, text.c_str(), text.size());
  if (rc >= 0) {
    return;
  }
  std::cerr << "error writing output: " << cpp_strerror(rc) << std::endl;
  exit(1);
}
// osdmaptool entry point.
//
// Flow, in order:
//   1. parse command-line options; exactly one positional argument (the
//      osdmap file name) must remain afterwards
//   2. if both --range-first and --range-last are given, decode the maps
//      <mapfilename>/<first..last>, dedup them, and exit
//   3. read and decode the map from the file, or build a fresh one
//      (--createsimple / --create-from-conf)
//   4. apply the requested in-memory changes (mark up/in/out, crush weight
//      adjustment, temp clearing, upmap cleanup/calculation, crush import)
//   5. run the requested export / mapping tests / dumps
//   6. write the map back to the file if it was modified
//
// Returns 0 on success, -1 when the map cannot be read/decoded or already
// exists without --clobber, and 1 when writing the result fails.  Many
// error paths terminate directly through exit() or usage().
int main(int argc, const char **argv)
{
  vector<const char*> args;
  argv_to_vec(argc, argv, args);
  if (args.empty()) {
    cerr << argv[0] << ": -h or --help for usage" << std::endl;
    exit(1);
  }
  if (ceph_argparse_need_usage(args)) {
    usage();
    exit(0);
  }

  auto cct = global_init(NULL, args, CEPH_ENTITY_TYPE_CLIENT,
                         CODE_ENVIRONMENT_UTILITY,
                         CINIT_FLAG_NO_DEFAULT_CONFIG_FILE);
  common_init_finish(g_ceph_context);

  const char *me = argv[0];

  // ---- option state --------------------------------------------------
  std::string fn;
  bool print = false;
  boost::scoped_ptr<Formatter> print_formatter;
  bool tree = false;
  boost::scoped_ptr<Formatter> tree_formatter;
  bool createsimple = false;
  bool createpool = false;
  bool create_from_conf = false;
  int num_osd = 0;
  int pg_bits = 6;
  int pgp_bits = 6;
  bool clobber = false;
  bool modified = false;
  std::string export_crush, import_crush, test_map_pg, test_map_object, adjust_crush_weight;
  bool test_crush = false;
  int range_first = -1;
  int range_last = -1;
  int pool = -1;
  bool mark_up_in = false;
  int marked_out = -1;
  int marked_up = -1;
  int marked_in = -1;
  bool clear_temp = false;
  bool clean_temps = false;
  bool test_map_pgs = false;
  bool test_map_pgs_dump = false;
  bool test_random = false;
  bool upmap_cleanup = false;
  bool upmap = false;
  bool health = false;
  std::string upmap_file = "-";
  int upmap_max = 10;
  int upmap_deviation = 5;
  bool upmap_active = false;
  std::set<std::string> upmap_pools;
  int64_t pg_num = -1;
  bool test_map_pgs_dump_all = false;
  bool save = false;

  // ---- option parsing ------------------------------------------------
  // Unrecognized arguments are skipped (++i) and stay in `args`; after the
  // loop exactly one of them (the map file name) is expected to remain.
  std::string val;
  std::ostringstream err;
  for (std::vector<const char*>::iterator i = args.begin(); i != args.end(); ) {
    if (ceph_argparse_double_dash(args, i)) {
      break;
    } else if (ceph_argparse_flag(args, i, "-p", "--print", (char*)NULL)) {
      print = true;
    } else if (ceph_argparse_witharg(args, i, &val, err, "--dump", (char*)NULL)) {
      print = true;
      if (!val.empty() && val != "plain") {
        print_formatter.reset(Formatter::create(val, "", "json"));
      }
    } else if (ceph_argparse_witharg(args, i, &val, err, "--tree", (char*)NULL)) {
      tree = true;
      if (!val.empty() && val != "plain") {
        tree_formatter.reset(Formatter::create(val, "", "json"));
      }
    } else if (ceph_argparse_witharg(args, i, &pg_bits, err, "--osd-pg-bits", (char*)NULL)) {
    } else if (ceph_argparse_witharg(args, i, &pgp_bits, err, "--osd-pgp-bits", (char*)NULL)) {
    } else if (ceph_argparse_witharg(args, i, &upmap_file, "--upmap-cleanup", (char*)NULL)) {
      upmap_cleanup = true;
    } else if (ceph_argparse_witharg(args, i, &upmap_file, "--upmap", (char*)NULL)) {
      // --upmap also enables the cleanup pass that runs before balancing
      upmap_cleanup = true;
      upmap = true;
    } else if (ceph_argparse_witharg(args, i, &upmap_max, err, "--upmap-max", (char*)NULL)) {
    } else if (ceph_argparse_witharg(args, i, &upmap_deviation, err, "--upmap-deviation", (char*)NULL)) {
    } else if (ceph_argparse_witharg(args, i, &val, "--upmap-pool", (char*)NULL)) {
      upmap_pools.insert(val);
    } else if (ceph_argparse_witharg(args, i, &num_osd, err, "--createsimple", (char*)NULL)) {
      if (!err.str().empty()) {
        cerr << err.str() << std::endl;
        exit(EXIT_FAILURE);
      }
      createsimple = true;
    } else if (ceph_argparse_flag(args, i, "--upmap-active", (char*)NULL)) {
      upmap_active = true;
    } else if (ceph_argparse_flag(args, i, "--health", (char*)NULL)) {
      health = true;
    } else if (ceph_argparse_flag(args, i, "--with-default-pool", (char*)NULL)) {
      createpool = true;
    } else if (ceph_argparse_flag(args, i, "--create-from-conf", (char*)NULL)) {
      create_from_conf = true;
    } else if (ceph_argparse_flag(args, i, "--mark-up-in", (char*)NULL)) {
      mark_up_in = true;
    } else if (ceph_argparse_witharg(args, i, &val, "--mark-out", (char*)NULL)) {
      marked_out = std::stoi(val);
    } else if (ceph_argparse_witharg(args, i, &val, "--mark-up", (char*)NULL)) {
      // OSD ids are integers: parse like --mark-out rather than via stod
      marked_up = std::stoi(val);
    } else if (ceph_argparse_witharg(args, i, &val, "--mark-in", (char*)NULL)) {
      marked_in = std::stoi(val);
    } else if (ceph_argparse_flag(args, i, "--clear-temp", (char*)NULL)) {
      clear_temp = true;
    } else if (ceph_argparse_flag(args, i, "--clean-temps", (char*)NULL)) {
      clean_temps = true;
    } else if (ceph_argparse_flag(args, i, "--test-map-pgs", (char*)NULL)) {
      test_map_pgs = true;
    } else if (ceph_argparse_flag(args, i, "--test-map-pgs-dump", (char*)NULL)) {
      test_map_pgs_dump = true;
    } else if (ceph_argparse_flag(args, i, "--test-map-pgs-dump-all", (char*)NULL)) {
      test_map_pgs_dump_all = true;
    } else if (ceph_argparse_flag(args, i, "--test-random", (char*)NULL)) {
      test_random = true;
    } else if (ceph_argparse_flag(args, i, "--clobber", (char*)NULL)) {
      clobber = true;
    } else if (ceph_argparse_witharg(args, i, &pg_bits, err, "--pg_bits", (char*)NULL)) {
      if (!err.str().empty()) {
        cerr << err.str() << std::endl;
        exit(EXIT_FAILURE);
      }
    } else if (ceph_argparse_witharg(args, i, &pgp_bits, err, "--pgp_bits", (char*)NULL)) {
      if (!err.str().empty()) {
        cerr << err.str() << std::endl;
        exit(EXIT_FAILURE);
      }
    } else if (ceph_argparse_witharg(args, i, &val, "--export_crush", (char*)NULL)) {
      export_crush = val;
    } else if (ceph_argparse_witharg(args, i, &val, "--import_crush", (char*)NULL)) {
      import_crush = val;
    } else if (ceph_argparse_witharg(args, i, &val, "--test_map_pg", (char*)NULL)) {
      test_map_pg = val;
    } else if (ceph_argparse_witharg(args, i, &val, "--test_map_object", (char*)NULL)) {
      test_map_object = val;
    } else if (ceph_argparse_flag(args, i, "--test_crush", (char*)NULL)) {
      test_crush = true;
    } else if (ceph_argparse_witharg(args, i, &val, err, "--pg_num", (char*)NULL)) {
      string interr;
      pg_num = strict_strtoll(val.c_str(), 10, &interr);
      if (interr.length() > 0) {
        cerr << "error parsing integer value " << interr << std::endl;
        exit(EXIT_FAILURE);
      }
    } else if (ceph_argparse_witharg(args, i, &range_first, err, "--range_first", (char*)NULL)) {
    } else if (ceph_argparse_witharg(args, i, &range_last, err, "--range_last", (char*)NULL)) {
    } else if (ceph_argparse_witharg(args, i, &pool, err, "--pool", (char*)NULL)) {
      if (!err.str().empty()) {
        cerr << err.str() << std::endl;
        exit(EXIT_FAILURE);
      }
    } else if (ceph_argparse_witharg(args, i, &val, err, "--adjust-crush-weight", (char*)NULL)) {
      adjust_crush_weight = val;
    } else if (ceph_argparse_flag(args, i, "--save", (char*)NULL)) {
      save = true;
    } else {
      ++i;
    }
  }

  // ---- argument validation (usage() does not return) -----------------
  if (args.empty()) {
    cerr << me << ": must specify osdmap filename" << std::endl;
    usage();
  }
  else if (args.size() > 1) {
    cerr << me << ": too many arguments" << std::endl;
    usage();
  }
  if (upmap_deviation < 1) {
    cerr << me << ": upmap-deviation must be >= 1" << std::endl;
    usage();
  }
  fn = args[0];

  // ---- range mode: decode <fn>/<epoch> for each epoch and dedup ------
  if (range_first >= 0 && range_last >= 0) {
    set<OSDMap*> maps;
    OSDMap *prev = NULL;
    for (int i=range_first; i <= range_last; i++) {
      ostringstream f;
      f << fn << "/" << i;
      bufferlist bl;
      string error, s = f.str();
      int r = bl.read_file(s.c_str(), &error);
      if (r < 0) {
        cerr << "unable to read " << s << ": " << cpp_strerror(r) << std::endl;
        exit(1);
      }
      cout << s << " got " << bl.length() << " bytes" << std::endl;
      // the decoded maps are intentionally kept alive until exit(0) below
      OSDMap *o = new OSDMap;
      o->decode(bl);
      maps.insert(o);
      if (prev)
        OSDMap::dedup(prev, o);
      prev = o;
    }
    exit(0);
  }

  // ---- load the existing map, or make sure we may create one ---------
  OSDMap osdmap;
  bufferlist bl;
  cerr << me << ": osdmap file '" << fn << "'" << std::endl;
  int r = 0;
  struct stat st;
  if (!createsimple && !create_from_conf && !clobber) {
    std::string error;
    r = bl.read_file(fn.c_str(), &error);
    if (r == 0) {
      try {
        osdmap.decode(bl);
      }
      catch (const buffer::error &e) {
        cerr << me << ": error decoding osdmap '" << fn << "'" << std::endl;
        return -1;
      }
    }
    else {
      cerr << me << ": couldn't open " << fn << ": " << error << std::endl;
      return -1;
    }
  }
  else if ((createsimple || create_from_conf) && !clobber && ::stat(fn.c_str(), &st) == 0) {
    cerr << me << ": " << fn << " exists, --clobber to overwrite" << std::endl;
    return -1;
  }

  // ---- create a new map ----------------------------------------------
  if (createsimple || create_from_conf) {
    if (createsimple) {
      if (num_osd < 1) {
        cerr << me << ": osd count must be > 0" << std::endl;
        exit(1);
      }
    } else {
      // --create-from-conf passes -1 as the osd count to build_simple*()
      num_osd = -1;
    }
    uuid_d fsid;
    if (createpool) {
      osdmap.build_simple_with_pool(
        g_ceph_context, 0, fsid, num_osd, pg_bits, pgp_bits);
    } else {
      osdmap.build_simple(g_ceph_context, 0, fsid, num_osd);
    }
    modified = true;
  }

  // ---- in-memory state changes ---------------------------------------
  if (mark_up_in) {
    cout << "marking all OSDs up and in" << std::endl;
    int n = osdmap.get_max_osd();
    for (int i=0; i<n; i++) {
      osdmap.set_state(i, osdmap.get_state(i) | CEPH_OSD_UP);
      osdmap.set_weight(i, CEPH_OSD_IN);
      if (osdmap.crush->get_item_weight(i) == 0 ) {
        osdmap.crush->adjust_item_weightf(g_ceph_context, i, 1.0);
      }
    }
  }

  if (marked_out >=0 && marked_out < osdmap.get_max_osd()) {
    cout << "marking OSD@" << marked_out << " as out" << std::endl;
    int id = marked_out;
    osdmap.set_state(id, osdmap.get_state(id) | CEPH_OSD_UP);
    osdmap.set_weight(id, CEPH_OSD_OUT);
  }

  if (marked_up >=0 && marked_up < osdmap.get_max_osd()) {
    cout << "marking OSD@" << marked_up << " as up" << std::endl;
    int id = marked_up;
    osdmap.set_state(id, osdmap.get_state(id) | CEPH_OSD_UP);
  }

  if (marked_in >=0 && marked_in < osdmap.get_max_osd()) {
    // operate on (and report) the OSD given to --mark-in, not --mark-up
    cout << "marking OSD@" << marked_in << " as in" << std::endl;
    int id = marked_in;
    osdmap.set_weight(id, CEPH_OSD_IN);
  }

  // --adjust-crush-weight takes "<osdid>:<weight>" pairs separated by ','
  for_each_substr(adjust_crush_weight, ",", [&](auto osd_to_adjust) {
    std::string_view osd_to_weight_delimiter{":"};
    size_t pos = osd_to_adjust.find(osd_to_weight_delimiter);
    if (pos == osd_to_adjust.npos) {
      cerr << me << ": use ':' as separator of osd id and its weight"
           << std::endl;
      usage();
    }
    int osd_id = std::stoi(string(osd_to_adjust.substr(0, pos)));
    float new_weight = std::stof(string(osd_to_adjust.substr(pos + 1)));
    osdmap.crush->adjust_item_weightf(g_ceph_context, osd_id, new_weight);
    std::cout << "Adjusted osd." << osd_id << " CRUSH weight to " << new_weight
              << std::endl;
    if (save) {
      OSDMap::Incremental inc;
      inc.fsid = osdmap.get_fsid();
      inc.epoch = osdmap.get_epoch() + 1;
      osdmap.apply_incremental(inc);
      modified = true;
    }
  });

  if (clear_temp) {
    cout << "clearing pg/primary temp" << std::endl;
    osdmap.clear_temp();
  }
  if (clean_temps) {
    cout << "cleaning pg temps" << std::endl;
    OSDMap::Incremental pending_inc(osdmap.get_epoch()+1);
    OSDMap tmpmap;
    tmpmap.deepish_copy_from(osdmap);
    tmpmap.apply_incremental(pending_inc);
    OSDMap::clean_temps(g_ceph_context, osdmap, tmpmap, &pending_inc);
  }

  // ---- upmap cleanup / calculation -----------------------------------
  // Commands go to stdout unless a file other than "-" was given.
  int upmap_fd = STDOUT_FILENO;
  if (upmap || upmap_cleanup) {
    if (upmap_file != "-") {
      upmap_fd = ::open(upmap_file.c_str(), O_CREAT|O_WRONLY|O_TRUNC, 0644);
      if (upmap_fd < 0) {
        cerr << "error opening " << upmap_file << ": " << cpp_strerror(errno)
             << std::endl;
        exit(1);
      }
      cout << "writing upmap command output to: " << upmap_file << std::endl;
    }
  }
  if (upmap_cleanup) {
    cout << "checking for upmap cleanups" << std::endl;
    OSDMap::Incremental pending_inc(osdmap.get_epoch()+1);
    pending_inc.fsid = osdmap.get_fsid();
    int r = osdmap.clean_pg_upmaps(g_ceph_context, &pending_inc);
    if (r > 0) {
      print_inc_upmaps(pending_inc, upmap_fd);
      r = osdmap.apply_incremental(pending_inc);
      ceph_assert(r == 0);
    }
  }
  if (upmap) {
    cout << "upmap, max-count " << upmap_max
         << ", max deviation " << upmap_deviation
         << std::endl;
    vector<int64_t> pools;
    set<int64_t> upmap_pool_nums;
    for (auto& s : upmap_pools) {
      int64_t p = osdmap.lookup_pg_pool_name(s);
      if (p < 0) {
        cerr << " pool " << s << " does not exist" << std::endl;
        exit(1);
      }
      pools.push_back(p);
      upmap_pool_nums.insert(p);
    }
    if (!pools.empty()) {
      cout << " limiting to pools " << upmap_pools << " (" << pools << ")"
           << std::endl;
    } else {
      // no --upmap-pool given: consider every pool in the map
      mempool::osdmap::map<int64_t,pg_pool_t> opools = osdmap.get_pools();
      for (auto& i : opools) {
        pools.push_back(i.first);
      }
    }
    if (pools.empty()) {
      cout << "No pools available" << std::endl;
      goto skip_upmap;
    }
    int rounds = 0;
    struct timespec round_start;
    int r = clock_gettime(CLOCK_MONOTONIC, &round_start);
    ceph_assert(r == 0);
    // One round = one pass over the (shuffled) pools with a budget of
    // upmap_max changes.  Without --upmap-active only one round runs.
    do {
      random_device_t rd;
      std::shuffle(pools.begin(), pools.end(), std::mt19937{rd()});
      cout << "pools ";
      for (auto& i: pools)
        cout << osdmap.get_pool_name(i) << " ";
      cout << std::endl;
      OSDMap::Incremental pending_inc(osdmap.get_epoch()+1);
      pending_inc.fsid = osdmap.get_fsid();
      int total_did = 0;
      int left = upmap_max;
      struct timespec begin, end;
      r = clock_gettime(CLOCK_MONOTONIC, &begin);
      ceph_assert(r == 0);
      for (auto& i: pools) {
        set<int64_t> one_pool;
        one_pool.insert(i);
        int did = osdmap.calc_pg_upmaps(
          g_ceph_context, upmap_deviation,
          left, one_pool,
          &pending_inc);
        total_did += did;
        left -= did;
        if (left <= 0)
          break;
      }
      r = clock_gettime(CLOCK_MONOTONIC, &end);
      ceph_assert(r == 0);
      cout << "prepared " << total_did << "/" << upmap_max << " changes" << std::endl;
      float elapsed_time = (end.tv_sec - begin.tv_sec) + 1.0e-9*(end.tv_nsec - begin.tv_nsec);
      if (upmap_active)
        cout << "Time elapsed " << elapsed_time << " secs" << std::endl;
      if (total_did > 0) {
        print_inc_upmaps(pending_inc, upmap_fd);
        if (save || upmap_active) {
          int r = osdmap.apply_incremental(pending_inc);
          ceph_assert(r == 0);
          if (save)
            modified = true;
        }
      } else {
        cout << "Unable to find further optimization, "
             << "or distribution is already perfect"
             << std::endl;
        if (upmap_active) {
          // final report: number of pgs mapped to each osd
          map<int,set<pg_t>> pgs_by_osd;
          for (auto& i : osdmap.get_pools()) {
            if (!upmap_pool_nums.empty() && !upmap_pool_nums.count(i.first))
              continue;
            for (unsigned ps = 0; ps < i.second.get_pg_num(); ++ps) {
              pg_t pg(ps, i.first);
              vector<int> up;
              osdmap.pg_to_up_acting_osds(pg, &up, nullptr, nullptr, nullptr);
              //ldout(cct, 20) << __func__ << " " << pg << " up " << up << dendl;
              for (auto osd : up) {
                if (osd != CRUSH_ITEM_NONE)
                  pgs_by_osd[osd].insert(pg);
              }
            }
          }
          for (auto& i : pgs_by_osd)
            cout << "osd." << i.first << " pgs " << i.second.size() << std::endl;
          float elapsed_time = (end.tv_sec - round_start.tv_sec) + 1.0e-9*(end.tv_nsec - round_start.tv_nsec);
          cout << "Total time elapsed " << elapsed_time << " secs, " << rounds << " rounds" << std::endl;
        }
        break;
      }
      ++rounds;
    } while(upmap_active);
  }
skip_upmap:
  // upmap_file differs from "-" only when an upmap option opened it above
  if (upmap_file != "-") {
    ::close(upmap_fd);
  }

  // ---- crush import / export -----------------------------------------
  if (!import_crush.empty()) {
    bufferlist cbl;
    std::string error;
    r = cbl.read_file(import_crush.c_str(), &error);
    if (r) {
      cerr << me << ": error reading crush map from " << import_crush
           << ": " << error << std::endl;
      exit(1);
    }

    // validate
    CrushWrapper cw;
    auto p = cbl.cbegin();
    cw.decode(p);

    if (cw.get_max_devices() > osdmap.get_max_osd()) {
      cerr << me << ": crushmap max_devices " << cw.get_max_devices()
           << " > osdmap max_osd " << osdmap.get_max_osd() << std::endl;
      exit(1);
    }

    // apply
    OSDMap::Incremental inc;
    inc.fsid = osdmap.get_fsid();
    inc.epoch = osdmap.get_epoch()+1;
    inc.crush = cbl;
    osdmap.apply_incremental(inc);
    cout << me << ": imported " << cbl.length() << " byte crush map from " << import_crush << std::endl;
    modified = true;
  }

  if (!export_crush.empty()) {
    bufferlist cbl;
    osdmap.crush->encode(cbl, CEPH_FEATURES_SUPPORTED_DEFAULT);
    r = cbl.write_file(export_crush.c_str());
    if (r < 0) {
      // report the file we failed to write (the export target)
      cerr << me << ": error writing crush map to " << export_crush << std::endl;
      exit(1);
    }
    cout << me << ": exported crush map to " << export_crush << std::endl;
  }

  // ---- single object / pg mapping tests ------------------------------
  if (!test_map_object.empty()) {
    object_t oid(test_map_object);
    if (pool == -1) {
      cout << me << ": assuming pool 1 (use --pool to override)" << std::endl;
      pool = 1;
    }
    if (!osdmap.have_pg_pool(pool)) {
      cerr << "There is no pool " << pool << std::endl;
      exit(1);
    }
    object_locator_t loc(pool);
    pg_t raw_pgid = osdmap.object_locator_to_pg(oid, loc);
    pg_t pgid = osdmap.raw_pg_to_pg(raw_pgid);

    vector<int> acting;
    osdmap.pg_to_acting_osds(pgid, acting);
    cout << " object '" << oid
         << "' -> " << pgid
         << " -> " << acting
         << std::endl;
  }
  if (!test_map_pg.empty()) {
    pg_t pgid;
    if (!pgid.parse(test_map_pg.c_str())) {
      cerr << me << ": failed to parse pg '" << test_map_pg << "'" << std::endl;
      usage();
    }
    cout << " parsed '" << test_map_pg << "' -> " << pgid << std::endl;

    vector<int> raw, up, acting;
    int raw_primary, up_primary, acting_primary;
    osdmap.pg_to_raw_osds(pgid, &raw, &raw_primary);
    osdmap.pg_to_up_acting_osds(pgid, &up, &up_primary,
                                &acting, &acting_primary);
    cout << pgid << " raw (" << raw << ", p" << raw_primary
         << ") up (" << up << ", p" << up_primary
         << ") acting (" << acting << ", p" << acting_primary << ")"
         << std::endl;
  }

  // ---- map every pg and report the per-osd distribution --------------
  if (test_map_pgs || test_map_pgs_dump || test_map_pgs_dump_all) {
    if (pool != -1 && !osdmap.have_pg_pool(pool)) {
      cerr << "There is no pool " << pool << std::endl;
      exit(1);
    }
    int n = osdmap.get_max_osd();
    vector<int> count(n, 0);          // pgs per osd (any position)
    vector<int> first_count(n, 0);    // pgs where the osd is listed first
    vector<int> primary_count(n, 0);  // pgs where the osd is primary
    vector<int> size(30, 0);          // histogram of mapping sizes
    int max_size = 0;
    if (test_random)
      srand(getpid());
    auto& pools = osdmap.get_pools();
    for (auto p = pools.begin(); p != pools.end(); ++p) {
      if (pool != -1 && p->first != pool)
        continue;
      if (pg_num > 0)
        p->second.set_pg_num(pg_num);

      cout << "pool " << p->first
           << " pg_num " << p->second.get_pg_num() << std::endl;
      for (unsigned i = 0; i < p->second.get_pg_num(); ++i) {
        pg_t pgid = pg_t(i, p->first);

        vector<int> osds, raw, up, acting;
        int primary = -1, calced_primary = -1, up_primary = -1, acting_primary = -1;
        if (test_random) {
          osds.resize(p->second.size);
          for (unsigned j=0; j<osds.size(); ++j) {
            osds[j] = rand() % osdmap.get_max_osd();
          }
          primary = osds[0];
        } else if (test_map_pgs_dump_all) {
          osdmap.pg_to_raw_osds(pgid, &raw, &calced_primary);
          osdmap.pg_to_up_acting_osds(pgid, &up, &up_primary,
                                      &acting, &acting_primary);
          osds = acting;
          primary = acting_primary;
        } else {
          osdmap.pg_to_acting_osds(pgid, &osds, &primary);
        }
        // the histogram starts with 30 buckets; grow it instead of
        // indexing past the end for larger mappings
        if (osds.size() >= size.size())
          size.resize(osds.size() + 1, 0);
        size[osds.size()]++;
        if ((unsigned)max_size < osds.size())
          max_size = osds.size();

        if (test_map_pgs_dump) {
          cout << pgid << "\t" << osds << "\t" << primary << std::endl;
        } else if (test_map_pgs_dump_all) {
          cout << pgid << " raw (" << raw << ", p" << calced_primary
               << ") up (" << up << ", p" << up_primary
               << ") acting (" << acting << ", p" << acting_primary << ")"
               << std::endl;
        }

        // A mapping can hold CRUSH_ITEM_NONE placeholders (the upmap-active
        // tally above filters them too); they are not valid osd indexes.
        for (unsigned j=0; j<osds.size(); j++) {
          //cout << " rep " << j << " on " << osds[j] << std::endl;
          if (osds[j] != CRUSH_ITEM_NONE)
            count[osds[j]]++;
        }
        if (osds.size() && osds[0] != CRUSH_ITEM_NONE)
          first_count[osds[0]]++;
        if (primary >= 0)
          primary_count[primary]++;
      }
    }

    uint64_t total = 0;
    int in = 0;
    int min_osd = -1;
    int max_osd = -1;
    cout << "#osd\tcount\tfirst\tprimary\tc wt\twt\n";
    for (int i=0; i<n; i++) {
      // only osds that are "in" and carry crush weight are reported
      if (!osdmap.is_in(i))
        continue;
      if (osdmap.crush->get_item_weight(i) <= 0)
        continue;
      in++;
      cout << "osd." << i
           << "\t" << count[i]
           << "\t" << first_count[i]
           << "\t" << primary_count[i]
           << "\t" << osdmap.crush->get_item_weightf(i)
           << "\t" << osdmap.get_weightf(i)
           << std::endl;
      total += count[i];
      if (count[i] &&
          (min_osd < 0 ||
           count[i] < count[min_osd]))
        min_osd = i;
      if (count[i] &&
          (max_osd < 0 ||
           count[i] > count[max_osd]))
        max_osd = i;
    }
    uint64_t avg = in ? (total / in) : 0;
    double dev = 0;
    for (int i=0; i<n; i++) {
      if (!osdmap.is_in(i))
        continue;
      if (osdmap.crush->get_item_weight(i) <= 0)
        continue;
      dev += (avg - count[i]) * (avg - count[i]);
    }
    dev /= in;
    dev = sqrt(dev);

    //double edev = sqrt(pgavg) * (double)avg / pgavg;
    double edev = sqrt((double)total / (double)in * (1.0 - (1.0 / (double)in)));
    cout << " in " << in << std::endl;
    cout << " avg " << avg
         << " stddev " << dev
         << " (" << (dev/avg) << "x)"
         << " (expected " << edev << " " << (edev/avg) << "x))"
         << std::endl;

    if (min_osd >= 0)
      cout << " min osd." << min_osd << " " << count[min_osd] << std::endl;
    if (max_osd >= 0)
      cout << " max osd." << max_osd << " " << count[max_osd] << std::endl;

    for (int i=0; i<=max_size; i++) {
      if (size[i])
        cout << "size " << i << "\t" << size[i] << std::endl;
    }
  }

  // ---- crush stability test ------------------------------------------
  // Loops forever, re-mapping every pg 100 times per pass; aborts as soon
  // as a pg maps differently from the first result recorded in that pass.
  if (test_crush) {
    int pass = 0;
    while (1) {
      cout << "pass " << ++pass << std::endl;

      ceph::unordered_map<pg_t,vector<int> > m;
      for (map<int64_t,pg_pool_t>::const_iterator p = osdmap.get_pools().begin();
           p != osdmap.get_pools().end();
           ++p) {
        const pg_pool_t *pool = osdmap.get_pg_pool(p->first);
        for (ps_t ps = 0; ps < pool->get_pg_num(); ps++) {
          pg_t pgid(ps, p->first);
          for (int i=0; i<100; i++) {
            cout << pgid << " attempt " << i << std::endl;

            vector<int> r;
            osdmap.pg_to_acting_osds(pgid, r);
            //cout << pgid << " " << r << std::endl;
            if (m.count(pgid)) {
              if (m[pgid] != r) {
                cout << pgid << " had " << m[pgid] << " now " << r << std::endl;
                ceph_abort();
              }
            } else
              m[pgid] = r;
          }
        }
      }
    }
  }

  // ---- nothing requested? --------------------------------------------
  if (!print && !health && !tree && !modified &&
      export_crush.empty() && import_crush.empty() &&
      test_map_pg.empty() && test_map_object.empty() &&
      !test_map_pgs && !test_map_pgs_dump && !test_map_pgs_dump_all &&
      adjust_crush_weight.empty() && !upmap && !upmap_cleanup) {
    cerr << me << ": no action specified?" << std::endl;
    usage();
  }

  // ---- output --------------------------------------------------------
  if (modified)
    osdmap.inc_epoch();

  if (health) {
    health_check_map_t checks;
    osdmap.check_health(cct.get(), &checks);
    JSONFormatter jf(true);
    jf.dump_object("checks", checks);
    jf.flush(cout);
  }
  if (print) {
    if (print_formatter) {
      print_formatter->open_object_section("osdmap");
      osdmap.dump(print_formatter.get());
      print_formatter->close_section();
      print_formatter->flush(cout);
    } else {
      osdmap.print(cout);
    }
  }

  if (tree) {
    if (tree_formatter) {
      tree_formatter->open_object_section("tree");
      osdmap.print_tree(tree_formatter.get(), NULL);
      tree_formatter->close_section();
      tree_formatter->flush(cout);
      cout << std::endl;
    } else {
      osdmap.print_tree(NULL, &cout);
    }
  }

  // ---- persist the map if anything changed ---------------------------
  if (modified) {
    bl.clear();
    osdmap.encode(bl, CEPH_FEATURES_SUPPORTED_DEFAULT | CEPH_FEATURE_RESERVED);

    // write it out
    cout << me << ": writing epoch " << osdmap.get_epoch()
         << " to " << fn
         << std::endl;
    int r = bl.write_file(fn.c_str());
    if (r) {
      cerr << "osdmaptool: error writing to '" << fn << "': "
           << cpp_strerror(r) << std::endl;
      return 1;
    }
  }

  return 0;
}