Description: rados/cephadm/workunits/{0-distro/centos_8.stream_container_tools_crun agent/on mon_election/classic task/test_host_drain}

Log: http://qa-proxy.ceph.com/teuthology/lflores-2023-12-15_16:16:51-rados-wip-yuri10-testing-2023-12-12-1229-distro-default-smithi/7493320/teuthology.log

  • log_href: http://qa-proxy.ceph.com/teuthology/lflores-2023-12-15_16:16:51-rados-wip-yuri10-testing-2023-12-12-1229-distro-default-smithi/7493320/teuthology.log
  • archive_path: /home/teuthworker/archive/lflores-2023-12-15_16:16:51-rados-wip-yuri10-testing-2023-12-12-1229-distro-default-smithi/7493320
  • description: rados/cephadm/workunits/{0-distro/centos_8.stream_container_tools_crun agent/on mon_election/classic task/test_host_drain}
  • duration: 0:19:06
  • email:
  • failure_reason:
  • flavor: default
  • job_id: 7493320
  • kernel:
    • kdb: True
    • sha1: distro
  • last_in_suite: False
  • machine_type: smithi
  • name: lflores-2023-12-15_16:16:51-rados-wip-yuri10-testing-2023-12-12-1229-distro-default-smithi
  • nuke_on_error: True
  • os_type: centos
  • os_version: 8.stream
  • overrides:
    • admin_socket:
      • branch: wip-yuri10-testing-2023-12-12-1229
    • ceph:
      • conf:
        • global:
          • mon election default strategy: 1
        • mgr:
          • debug mgr: 20
          • debug ms: 1
          • mgr/cephadm/use_agent: True
        • mon:
          • debug mon: 20
          • debug ms: 1
          • debug paxos: 20
        • osd:
          • debug ms: 1
          • debug osd: 20
      • flavor: default
      • log-ignorelist:
        • \(MDS_ALL_DOWN\)
        • \(MDS_UP_LESS_THAN_MAX\)
      • sha1: 021ac1670a21c19759080c6da90baaeb42e7d175
    • ceph-deploy:
      • conf:
        • client:
          • log file: /var/log/ceph/ceph-$name.$pid.log
        • mon:
          • osd default pool size: 2
    • install:
      • ceph:
        • flavor: default
        • sha1: 021ac1670a21c19759080c6da90baaeb42e7d175
    • selinux:
      • whitelist:
        • scontext=system_u:system_r:logrotate_t:s0
    • workunit:
      • branch: wip-yuri10-testing-2023-12-12-1229
      • sha1: 021ac1670a21c19759080c6da90baaeb42e7d175
  • owner: scheduled_lflores@teuthology
  • pid:
  • roles:
    • ['host.a', 'mon.a', 'mgr.a', 'osd.0', 'osd.1']
    • ['host.b', 'mon.b', 'mgr.b', 'osd.2', 'osd.3']
    • ['host.c', 'mon.c', 'osd.4', 'osd.5']
  • sentry_event:
  • status: pass
  • success: True
  • branch: wip-yuri10-testing-2023-12-12-1229
  • seed:
  • sha1: 021ac1670a21c19759080c6da90baaeb42e7d175
  • subset:
  • suite:
  • suite_branch: wip-yuri10-testing-2023-12-12-1229
  • suite_path:
  • suite_relpath:
  • suite_repo:
  • suite_sha1: 021ac1670a21c19759080c6da90baaeb42e7d175
  • targets:
    • smithi008.front.sepia.ceph.com: ecdsa-sha2-nistp256 AAAAE2VjZHNhLXNoYTItbmlzdHAyNTYAAAAIbmlzdHAyNTYAAABBBHjzlt2+Ijp9amxW3GE0T6+CRJrexzjJzXYWZrIUwm24GLdHYJUnVtdK9qxOdbyKVYj1I7x3B6zOGu/yu+DLqLc=
    • smithi120.front.sepia.ceph.com: ecdsa-sha2-nistp256 AAAAE2VjZHNhLXNoYTItbmlzdHAyNTYAAAAIbmlzdHAyNTYAAABBBGuGH413hWPAri3S/PN+FYHFAQmexHNiLjJAdhkMIXFXZQAa2TzI9pDLQRtA0OWLrnVMX2h/r4FFxI2KigxE1A4=
    • smithi175.front.sepia.ceph.com: ecdsa-sha2-nistp256 AAAAE2VjZHNhLXNoYTItbmlzdHAyNTYAAAAIbmlzdHAyNTYAAABBBEXgk7P8bpxbKkN5QEl0aubmXg4eHnrtDy3MirTCnSuspk+QjtJlI/kMVvCbHfaQn14Z5RnVmuOwsUqMX3j3drg=
  • tasks:
    • internal.check_packages:
    • internal.buildpackages_prep:
    • internal.save_config:
    • internal.check_lock:
    • internal.add_remotes:
    • console_log:
    • internal.connect:
    • internal.push_inventory:
    • internal.serialize_remote_roles:
    • internal.check_conflict:
    • internal.check_ceph_data:
    • internal.vm_setup:
    • kernel:
      • kdb: True
      • sha1: distro
    • internal.base:
    • internal.archive_upload:
    • internal.archive:
    • internal.coredump:
    • internal.sudo:
    • internal.syslog:
    • internal.timer:
    • pcp:
    • selinux:
    • ansible.cephlab:
    • clock:
    • pexec:
      • all:
        • sudo cp /etc/containers/registries.conf /etc/containers/registries.conf.backup
        • sudo dnf -y module reset container-tools
        • sudo dnf -y module install container-tools --allowerasing --nobest
        • sudo cp /etc/containers/registries.conf.backup /etc/containers/registries.conf
        • sudo sed -i 's/runtime = "runc"/#runtime = "runc"/g' /usr/share/containers/containers.conf
        • sudo sed -i 's/#runtime = "crun"/runtime = "crun"/g' /usr/share/containers/containers.conf
    • install:
    • cephadm:
    • cephadm.shell:
      • host.a:
        • set -ex
          HOSTNAMES=$(ceph orch host ls --format json | jq -r '.[] | .hostname')
          for host in $HOSTNAMES; do
            # find the hostname for "host.c" which will have no mgr
            HAS_MGRS=$(ceph orch ps --hostname ${host} --format json | jq 'any(.daemon_type == "mgr")')
            if [ "$HAS_MGRS" == "false" ]; then
              HOST_C="${host}"
            fi
          done
          # One last thing to worry about before draining the host
          # is that the teuthology test tends to put the explicit
          # hostnames in the placement for the mon service.
          # We want to make sure we can drain without providing
          # --force and there is a check for the host being removed
          # being listed explicitly in the placements. Therefore,
          # we should remove it from the mon placement.
          ceph orch ls mon --export > mon.yaml
          sed /"$HOST_C"/d mon.yaml > mon_adjusted.yaml
          ceph orch apply -i mon_adjusted.yaml
          # now drain that host
          ceph orch host drain $HOST_C --zap-osd-devices
          # wait for drain to complete
          HOST_C_DAEMONS=$(ceph orch ps --hostname $HOST_C)
          while [ "$HOST_C_DAEMONS" != "No daemons reported" ]; do
            sleep 15
            HOST_C_DAEMONS=$(ceph orch ps --hostname $HOST_C)
          done
          # we want to check the ability to remove the host from
          # the CRUSH map, so we should first verify the host is in
          # the CRUSH map.
          ceph osd getcrushmap -o compiled-crushmap
          crushtool -d compiled-crushmap -o crushmap.txt
          CRUSH_MAP=$(cat crushmap.txt)
          if ! grep -q "$HOST_C" <<< "$CRUSH_MAP"; then
            printf "Expected to see $HOST_C in CRUSH map. Saw:\n\n$CRUSH_MAP"
            exit 1
          fi
          # If the drain was successful, we should be able to remove the
          # host without force with no issues. If there are still daemons
          # we will get a response telling us to drain the host and a
          # non-zero return code
          ceph orch host rm $HOST_C --rm-crush-entry
          # verify we've successfully removed the host from the CRUSH map
          sleep 30
          ceph osd getcrushmap -o compiled-crushmap
          crushtool -d compiled-crushmap -o crushmap.txt
          CRUSH_MAP=$(cat crushmap.txt)
          if grep -q "$HOST_C" <<< "$CRUSH_MAP"; then
            printf "Saw $HOST_C in CRUSH map after it should have been removed.\n\n$CRUSH_MAP"
            exit 1
          fi
  • teuthology_branch: main
  • verbose: True
  • pcp_grafana_url:
  • priority:
  • user:
  • queue:
  • posted: 2023-12-15 16:19:17
  • started: 2023-12-15 17:07:36
  • updated: 2023-12-15 17:37:22
  • status_class: success
  • runtime: 0:29:46
  • wait_time: 0:10:40