- log_href:
http://qa-proxy.ceph.com/teuthology/gabrioux-2024-09-21_11:23:40-orch:cephadm-wip-guits-main-2024-09-21-0842-distro-default-smithi/7913922/teuthology.log
- archive_path:
/home/teuthworker/archive/gabrioux-2024-09-21_11:23:40-orch:cephadm-wip-guits-main-2024-09-21-0842-distro-default-smithi/7913922
- description:
orch:cephadm/workunits/{0-distro/centos_9.stream agent/on mon_election/connectivity task/test_host_drain}
- duration:
0:14:53
- email:
gabrioux@ibm.com
- failure_reason:
- flavor:
default
- job_id:
7913922
- kernel:
- last_in_suite:
False
- machine_type:
smithi
- name:
gabrioux-2024-09-21_11:23:40-orch:cephadm-wip-guits-main-2024-09-21-0842-distro-default-smithi
- nuke_on_error:
- os_type:
centos
- os_version:
9.stream
- overrides:
- admin_socket:
- branch:
wip-guits-main-2024-09-21-0842
- ceph:
- conf:
- global:
- mon election default strategy:
3
- mgr:
- debug mgr:
20
- debug ms:
1
- mgr/cephadm/use_agent:
True
- mon:
- debug mon:
20
- debug ms:
1
- debug paxos:
20
- osd:
- debug ms:
1
- debug osd:
20
- flavor:
default
- log-ignorelist:
-
\(MDS_ALL_DOWN\)
-
\(MDS_UP_LESS_THAN_MAX\)
-
MON_DOWN
-
mons down
-
mon down
-
out of quorum
-
CEPHADM_STRAY_HOST
-
CEPHADM_STRAY_DAEMON
-
CEPHADM_FAILED_DAEMON
- log-only-match:
- sha1:
441784946648ff53dd310293f9dd752afeeea72a
- ceph-deploy:
- conf:
- client:
- log file:
/var/log/ceph/ceph-$name.$pid.log
- mon:
- install:
- ceph:
- flavor:
default
- sha1:
441784946648ff53dd310293f9dd752afeeea72a
- selinux:
- allowlist:
-
scontext=system_u:system_r:logrotate_t:s0
-
scontext=system_u:system_r:getty_t:s0
- workunit:
- branch:
wip-guits-main-2024-09-21-0842
- sha1:
441784946648ff53dd310293f9dd752afeeea72a
- owner:
scheduled_gabrioux@teuthology
- pid:
- roles:
-
['host.a', 'mon.a', 'mgr.a', 'osd.0', 'osd.1']
-
['host.b', 'mon.b', 'mgr.b', 'osd.2', 'osd.3']
-
['host.c', 'mon.c', 'osd.4', 'osd.5']
- sentry_event:
- status:
pass
- success:
True
- branch:
wip-guits-main-2024-09-21-0842
- seed:
5896
- sha1:
441784946648ff53dd310293f9dd752afeeea72a
- subset:
1/8
- suite:
orch:cephadm
- suite_branch:
wip-guits-main-2024-09-21-0842
- suite_path:
/home/teuthworker/src/git.ceph.com_ceph-c_441784946648ff53dd310293f9dd752afeeea72a/qa
- suite_relpath:
qa
- suite_repo:
https://git.ceph.com/ceph-ci.git
- suite_sha1:
441784946648ff53dd310293f9dd752afeeea72a
- targets:
- smithi033.front.sepia.ceph.com:
ecdsa-sha2-nistp256 AAAAE2VjZHNhLXNoYTItbmlzdHAyNTYAAAAIbmlzdHAyNTYAAABBBB83zF4HYuataYnPnfWAK7XVXsuwrKiB7O9A15V3QMPyNrQIC4AhXBvSMP3DgzjyMFSMofo0gjPQj3viEuiEkcM=
- smithi050.front.sepia.ceph.com:
ecdsa-sha2-nistp256 AAAAE2VjZHNhLXNoYTItbmlzdHAyNTYAAAAIbmlzdHAyNTYAAABBBKD71dJyxBsbEn4yY8zL5qbUups1lbdvzxyZM8xJAQ6+tNsFswe31M6bJlIhGk/Lzs2SbtuCUMojjKrLAB3efHE=
- smithi121.front.sepia.ceph.com:
ecdsa-sha2-nistp256 AAAAE2VjZHNhLXNoYTItbmlzdHAyNTYAAAAIbmlzdHAyNTYAAABBBHZmqE2iFa4ktBn+PynKk95Ei4j81nxuLU3futFax6bVZZdOGyq4C5fT/smeUm+R31qVCfXFm2/B6qPNJs9ori0=
- tasks:
-
- internal.buildpackages_prep:
-
- internal.save_config:
-
- internal.check_lock:
-
- internal.add_remotes:
-
- console_log:
-
- internal.connect:
-
- internal.push_inventory:
-
- internal.serialize_remote_roles:
-
- internal.check_conflict:
-
- internal.check_ceph_data:
-
- internal.vm_setup:
-
- kernel:
-
- internal.base:
-
- internal.archive_upload:
-
- internal.archive:
-
- internal.coredump:
-
- internal.sudo:
-
- internal.syslog:
-
- internal.timer:
-
- pcp:
-
- selinux:
-
- ansible.cephlab:
-
- clock:
-
- pexec:
- all:
-
sudo dnf remove nvme-cli -y
-
sudo dnf install nvmetcli nvme-cli -y
-
- install:
-
- cephadm:
-
- cephadm.shell:
- host.a:
-
set -ex
HOSTNAMES=$(ceph orch host ls --format json | jq -r '.[] | .hostname')
for host in $HOSTNAMES; do
# find the hostname for "host.c" which will have no mgr
HAS_MGRS=$(ceph orch ps --hostname ${host} --format json | jq 'any(.daemon_type == "mgr")')
if [ "$HAS_MGRS" == "false" ]; then
HOST_C="${host}"
fi
done
# One last thing to worry about before draining the host
# is that the teuthology test tends to put the explicit
# hostnames in the placement for the mon service.
# We want to make sure we can drain without providing
# --force and there is a check for the host being removed
# being listed explicitly in the placements. Therefore,
# we should remove it from the mon placement.
ceph orch ls mon --export > mon.yaml
sed /"$HOST_C"/d mon.yaml > mon_adjusted.yaml
ceph orch apply -i mon_adjusted.yaml
# now drain that host
ceph orch host drain $HOST_C --zap-osd-devices
# wait for drain to complete
HOST_C_DAEMONS=$(ceph orch ps --hostname $HOST_C)
while [ "$HOST_C_DAEMONS" != "No daemons reported" ]; do
sleep 15
HOST_C_DAEMONS=$(ceph orch ps --hostname $HOST_C)
done
# we want to check the ability to remove the host from
# the CRUSH map, so we should first verify the host is in
# the CRUSH map.
ceph osd getcrushmap -o compiled-crushmap
crushtool -d compiled-crushmap -o crushmap.txt
CRUSH_MAP=$(cat crushmap.txt)
if ! grep -q "$HOST_C" <<< "$CRUSH_MAP"; then
printf "Expected to see $HOST_C in CRUSH map. Saw:\n\n$CRUSH_MAP"
exit 1
fi
# If the drain was successful, we should be able to remove the
# host without force with no issues. If there are still daemons
# we will get a response telling us to drain the host and a
# non-zero return code
ceph orch host rm $HOST_C --rm-crush-entry
# verify we've successfully removed the host from the CRUSH map
sleep 30
ceph osd getcrushmap -o compiled-crushmap
crushtool -d compiled-crushmap -o crushmap.txt
CRUSH_MAP=$(cat crushmap.txt)
if grep -q "$HOST_C" <<< "$CRUSH_MAP"; then
printf "Saw $HOST_C in CRUSH map after it should have been removed.\n\n$CRUSH_MAP"
exit 1
fi
teuthology_branch:
main
verbose:
True
pcp_grafana_url:
priority:
70
user:
gabrioux
queue:
posted:
2024-09-21 11:23:57
started:
2024-09-21 12:04:43
updated:
2024-09-21 12:29:44
status_class:
success
runtime:
0:25:01
wait_time:
0:10:08