2019-07-13 02:35:04 +00:00
|
|
|
#!/usr/bin/env bash
|
|
|
|
|
|
|
|
source $CEPH_ROOT/qa/standalone/ceph-helpers.sh
|
|
|
|
|
|
|
|
function run() {
|
|
|
|
local dir=$1
|
|
|
|
shift
|
|
|
|
|
|
|
|
export CEPH_MON="127.0.0.1:7146" # git grep '\<7146\>' : there must be only one
|
|
|
|
export CEPH_ARGS
|
|
|
|
CEPH_ARGS+="--fsid=$(uuidgen) --auth-supported=none "
|
|
|
|
CEPH_ARGS+="--mon-host=$CEPH_MON "
|
|
|
|
CEPH_ARGS+="--debug_disable_randomized_ping=true "
|
|
|
|
CEPH_ARGS+="--debug_heartbeat_testing_span=5 "
|
|
|
|
CEPH_ARGS+="--osd_heartbeat_interval=1 "
|
|
|
|
local funcs=${@:-$(set | sed -n -e 's/^\(TEST_[0-9a-z_]*\) .*/\1/p')}
|
|
|
|
for func in $funcs ; do
|
|
|
|
setup $dir || return 1
|
|
|
|
$func $dir || return 1
|
|
|
|
teardown $dir || return 1
|
|
|
|
done
|
|
|
|
}
|
|
|
|
|
|
|
|
function TEST_network_ping_test1() {
|
|
|
|
local dir=$1
|
|
|
|
|
|
|
|
run_mon $dir a || return 1
|
|
|
|
run_mgr $dir x || return 1
|
|
|
|
run_osd $dir 0 || return 1
|
|
|
|
run_osd $dir 1 || return 1
|
|
|
|
run_osd $dir 2 || return 1
|
|
|
|
|
|
|
|
sleep 5
|
|
|
|
|
|
|
|
create_pool foo 16
|
|
|
|
|
|
|
|
# write some objects
|
|
|
|
timeout 20 rados bench -p foo 10 write -b 4096 --no-cleanup || return 1
|
|
|
|
|
|
|
|
# Get 1 cycle worth of ping data "1 minute"
|
|
|
|
sleep 10
|
|
|
|
flush_pg_stats
|
|
|
|
|
|
|
|
CEPH_ARGS='' ceph daemon $(get_asok_path osd.0) dump_osd_network | tee $dir/json
|
|
|
|
test "$(cat $dir/json | jq '.entries | length')" = "0" || return 1
|
2019-09-04 17:13:32 +00:00
|
|
|
test "$(cat $dir/json | jq '.threshold')" = "1000" || return 1
|
2019-07-13 02:35:04 +00:00
|
|
|
|
|
|
|
CEPH_ARGS='' ceph daemon $(get_asok_path mgr.x) dump_osd_network | tee $dir/json
|
|
|
|
test "$(cat $dir/json | jq '.entries | length')" = "0" || return 1
|
2019-09-04 17:13:32 +00:00
|
|
|
test "$(cat $dir/json | jq '.threshold')" = "1000" || return 1
|
2019-07-13 02:35:04 +00:00
|
|
|
|
|
|
|
CEPH_ARGS='' ceph daemon $(get_asok_path osd.0) dump_osd_network 0 | tee $dir/json
|
|
|
|
test "$(cat $dir/json | jq '.entries | length')" = "4" || return 1
|
|
|
|
test "$(cat $dir/json | jq '.threshold')" = "0" || return 1
|
|
|
|
|
|
|
|
CEPH_ARGS='' ceph daemon $(get_asok_path mgr.x) dump_osd_network 0 | tee $dir/json
|
|
|
|
test "$(cat $dir/json | jq '.entries | length')" = "12" || return 1
|
|
|
|
test "$(cat $dir/json | jq '.threshold')" = "0" || return 1
|
|
|
|
|
|
|
|
# Wait another 4 cycles to get "5 minute interval"
|
|
|
|
sleep 20
|
|
|
|
flush_pg_stats
|
|
|
|
CEPH_ARGS='' ceph daemon $(get_asok_path osd.0) dump_osd_network | tee $dir/json
|
|
|
|
test "$(cat $dir/json | jq '.entries | length')" = "0" || return 1
|
2019-09-04 17:13:32 +00:00
|
|
|
test "$(cat $dir/json | jq '.threshold')" = "1000" || return 1
|
2019-07-13 02:35:04 +00:00
|
|
|
|
|
|
|
CEPH_ARGS='' ceph daemon $(get_asok_path mgr.x) dump_osd_network | tee $dir/json
|
|
|
|
test "$(cat $dir/json | jq '.entries | length')" = "0" || return 1
|
2019-09-04 17:13:32 +00:00
|
|
|
test "$(cat $dir/json | jq '.threshold')" = "1000" || return 1
|
2019-07-13 02:35:04 +00:00
|
|
|
|
|
|
|
CEPH_ARGS='' ceph daemon $(get_asok_path osd.0) dump_osd_network 0 | tee $dir/json
|
|
|
|
test "$(cat $dir/json | jq '.entries | length')" = "4" || return 1
|
|
|
|
test "$(cat $dir/json | jq '.threshold')" = "0" || return 1
|
|
|
|
|
|
|
|
CEPH_ARGS='' ceph daemon $(get_asok_path mgr.x) dump_osd_network 0 | tee $dir/json
|
|
|
|
test "$(cat $dir/json | jq '.entries | length')" = "12" || return 1
|
|
|
|
test "$(cat $dir/json | jq '.threshold')" = "0" || return 1
|
|
|
|
|
|
|
|
|
|
|
|
# Wait another 10 cycles to get "15 minute interval"
|
|
|
|
sleep 50
|
|
|
|
flush_pg_stats
|
|
|
|
CEPH_ARGS='' ceph daemon $(get_asok_path osd.0) dump_osd_network | tee $dir/json
|
|
|
|
test "$(cat $dir/json | jq '.entries | length')" = "0" || return 1
|
2019-09-04 17:13:32 +00:00
|
|
|
test "$(cat $dir/json | jq '.threshold')" = "1000" || return 1
|
2019-07-13 02:35:04 +00:00
|
|
|
|
|
|
|
CEPH_ARGS='' ceph daemon $(get_asok_path mgr.x) dump_osd_network | tee $dir/json
|
|
|
|
test "$(cat $dir/json | jq '.entries | length')" = "0" || return 1
|
2019-09-04 17:13:32 +00:00
|
|
|
test "$(cat $dir/json | jq '.threshold')" = "1000" || return 1
|
2019-07-13 02:35:04 +00:00
|
|
|
|
|
|
|
CEPH_ARGS='' ceph daemon $(get_asok_path osd.0) dump_osd_network 0 | tee $dir/json
|
|
|
|
test "$(cat $dir/json | jq '.entries | length')" = "4" || return 1
|
|
|
|
test "$(cat $dir/json | jq '.threshold')" = "0" || return 1
|
|
|
|
|
|
|
|
CEPH_ARGS='' ceph daemon $(get_asok_path mgr.x) dump_osd_network 0 | tee $dir/json
|
|
|
|
test "$(cat $dir/json | jq '.entries | length')" = "12" || return 1
|
|
|
|
test "$(cat $dir/json | jq '.threshold')" = "0" || return 1
|
|
|
|
|
2019-09-04 17:13:32 +00:00
|
|
|
# Just check the threshold output matches the input
|
|
|
|
CEPH_ARGS='' ceph daemon $(get_asok_path mgr.x) dump_osd_network 99 | tee $dir/json
|
|
|
|
test "$(cat $dir/json | jq '.threshold')" = "99" || return 1
|
|
|
|
CEPH_ARGS='' ceph daemon $(get_asok_path osd.0) dump_osd_network 98 | tee $dir/json
|
|
|
|
test "$(cat $dir/json | jq '.threshold')" = "98" || return 1
|
|
|
|
|
2019-07-13 02:35:04 +00:00
|
|
|
rm -f $dir/json
|
|
|
|
}
|
|
|
|
|
|
|
|
# Test setting of mon_warn_on_slow_ping_time very low to
|
|
|
|
# get health warning
|
|
|
|
function TEST_network_ping_test2() {
|
|
|
|
local dir=$1
|
|
|
|
|
|
|
|
export CEPH_ARGS
|
2019-09-06 18:20:10 +00:00
|
|
|
export EXTRA_OPTS=" --mon_warn_on_slow_ping_time=0.001"
|
2019-07-13 02:35:04 +00:00
|
|
|
run_mon $dir a || return 1
|
|
|
|
run_mgr $dir x || return 1
|
|
|
|
run_osd $dir 0 || return 1
|
|
|
|
run_osd $dir 1 || return 1
|
|
|
|
run_osd $dir 2 || return 1
|
|
|
|
|
|
|
|
sleep 5
|
|
|
|
|
|
|
|
create_pool foo 16
|
|
|
|
|
|
|
|
# write some objects
|
|
|
|
timeout 20 rados bench -p foo 10 write -b 4096 --no-cleanup || return 1
|
|
|
|
|
|
|
|
# Get at least 1 cycle of ping data (this test runs with 5 second cycles of 1 second pings)
|
|
|
|
sleep 10
|
|
|
|
flush_pg_stats
|
|
|
|
|
|
|
|
ceph health | tee $dir/health
|
|
|
|
grep -q "Long heartbeat" $dir/health || return 1
|
|
|
|
|
|
|
|
ceph health detail | tee $dir/health
|
|
|
|
grep -q "OSD_SLOW_PING_TIME_BACK" $dir/health || return 1
|
|
|
|
grep -q "OSD_SLOW_PING_TIME_FRONT" $dir/health || return 1
|
|
|
|
rm -f $dir/health
|
|
|
|
}
|
|
|
|
|
|
|
|
main network-ping "$@"
|
|
|
|
|
|
|
|
# Local Variables:
|
|
|
|
# compile-command: "cd ../.. ; make -j4 && ../qa/run-standalone.sh network-ping.sh"
|
|
|
|
# End:
|