Description: rados/cephadm/osds/{0-distro/centos_9.stream_runc 0-nvme-loop 1-start 2-ops/rm-zap-wait}

Log: http://qa-proxy.ceph.com/teuthology/rzarzynski-2024-06-03_22:14:06-rados-wip-osd-ec-partial-reads-eio-distro-default-smithi/7740355/teuthology.log

Sentry event: https://sentry.ceph.com/organizations/ceph/?query=a13a3d4e31ed4986aeff4ad4b8d69182

Failure Reason:

"2024-06-03T23:15:57.728326+0000 mon.smithi043 (mon.0) 121 : cluster [WRN] Health check failed: failed to probe daemons or devices (CEPHADM_REFRESH_FAILED)" in cluster log

  • log_href: http://qa-proxy.ceph.com/teuthology/rzarzynski-2024-06-03_22:14:06-rados-wip-osd-ec-partial-reads-eio-distro-default-smithi/7740355/teuthology.log
  • archive_path: /home/teuthworker/archive/rzarzynski-2024-06-03_22:14:06-rados-wip-osd-ec-partial-reads-eio-distro-default-smithi/7740355
  • description: rados/cephadm/osds/{0-distro/centos_9.stream_runc 0-nvme-loop 1-start 2-ops/rm-zap-wait}
  • duration: 0:29:24
  • email:
  • failure_reason: "2024-06-03T23:15:57.728326+0000 mon.smithi043 (mon.0) 121 : cluster [WRN] Health check failed: failed to probe daemons or devices (CEPHADM_REFRESH_FAILED)" in cluster log
  • flavor:
  • job_id: 7740355
  • kernel:
    • kdb: 1
    • sha1: distro
  • last_in_suite: False
  • machine_type: smithi
  • name: rzarzynski-2024-06-03_22:14:06-rados-wip-osd-ec-partial-reads-eio-distro-default-smithi
  • nuke_on_error:
  • os_type: centos
  • os_version: 9.stream
  • overrides:
    • admin_socket:
      • branch: wip-osd-ec-partial-reads-eio
    • ceph:
      • conf:
        • mgr:
          • debug mgr: 20
          • debug ms: 1
        • mon:
          • debug mon: 20
          • debug ms: 1
          • debug paxos: 20
        • osd:
          • debug ms: 1
          • debug osd: 20
          • osd shutdown pgref assert: True
      • flavor: default
      • log-ignorelist:
        • \(MDS_ALL_DOWN\)
        • \(MDS_UP_LESS_THAN_MAX\)
        • OSD_DOWN
      • log-only-match:
        • CEPHADM_
      • sha1: 7d208bbce2efc11fb0dcecbb271cb2051d1daa58
    • ceph-deploy:
      • conf:
        • client:
          • log file: /var/log/ceph/ceph-$name.$pid.log
        • mon:
      • install:
        • ceph:
          • flavor: default
          • sha1: 7d208bbce2efc11fb0dcecbb271cb2051d1daa58
      • selinux:
        • allowlist:
          • scontext=system_u:system_r:logrotate_t:s0
      • workunit:
        • branch: wip-osd-ec-partial-reads-eio-fix66321
        • sha1: 5c821233d097eb6eb4287bbd1d0b6d01638e5f90
    • owner: scheduled_rzarzynski@teuthology
    • pid:
    • roles:
      • ['host.a', 'client.0']
      • ['host.b', 'client.1']
    • sentry_event: https://sentry.ceph.com/organizations/ceph/?query=a13a3d4e31ed4986aeff4ad4b8d69182
    • status: fail
    • success: False
    • branch: wip-osd-ec-partial-reads-eio
    • seed: 8148
    • sha1: 7d208bbce2efc11fb0dcecbb271cb2051d1daa58
    • subset: 111/120000
    • suite: rados
    • suite_branch: wip-osd-ec-partial-reads-eio-fix66321
    • suite_path: /home/teuthworker/src/git.ceph.com_ceph-c_5c821233d097eb6eb4287bbd1d0b6d01638e5f90/qa
    • suite_relpath: qa
    • suite_repo: https://git.ceph.com/ceph-ci.git
    • suite_sha1: 5c821233d097eb6eb4287bbd1d0b6d01638e5f90
    • targets:
      • smithi043.front.sepia.ceph.com: ecdsa-sha2-nistp256 AAAAE2VjZHNhLXNoYTItbmlzdHAyNTYAAAAIbmlzdHAyNTYAAABBBD4aHE//zXTUpi1Ekf6TlGpSxESziV00Elutkd9r1pjSIHWqq/aQM6yxvvvrKE4Fr5j9H1GHief9CsA31kWJb6A=
      • smithi053.front.sepia.ceph.com: ecdsa-sha2-nistp256 AAAAE2VjZHNhLXNoYTItbmlzdHAyNTYAAAAIbmlzdHAyNTYAAABBBEwzmncGj+Xor9hikraU3Xl0wuoQ/6RF4IsBNPbi+xMM3W4DqRUEUiItUtm5RVwEyj4XuGl+SLkrrQwTPpXEAbg=
    • tasks:
      • internal.check_packages:
      • internal.buildpackages_prep:
      • internal.save_config:
      • internal.check_lock:
      • internal.add_remotes:
      • console_log:
      • internal.connect:
      • internal.push_inventory:
      • internal.serialize_remote_roles:
      • internal.check_conflict:
      • internal.check_ceph_data:
      • internal.vm_setup:
      • kernel:
        • kdb: 1
        • sha1: distro
      • internal.base:
      • internal.archive_upload:
      • internal.archive:
      • internal.coredump:
      • internal.sudo:
      • internal.syslog:
      • internal.timer:
      • pcp:
      • selinux:
      • ansible.cephlab:
      • clock:
      • pexec:
        • all:
          • sudo dnf install runc -y
          • sudo sed -i 's/^#runtime = "crun"/runtime = "runc"/g' /usr/share/containers/containers.conf
          • sudo sed -i 's/runtime = "crun"/#runtime = "crun"/g' /usr/share/containers/containers.conf
      • nvme_loop:
      • cephadm:
        • roleless: True
        • conf:
          • mgr:
            • debug mgr: 20
            • debug ms: 1
          • mon:
            • debug mon: 20
            • debug ms: 1
            • debug paxos: 20
          • osd:
            • debug ms: 1
            • debug osd: 20
            • osd shutdown pgref assert: True
        • flavor: default
        • log-ignorelist:
          • \(MDS_ALL_DOWN\)
          • \(MDS_UP_LESS_THAN_MAX\)
          • OSD_DOWN
        • log-only-match:
          • CEPHADM_
        • sha1: 7d208bbce2efc11fb0dcecbb271cb2051d1daa58
        • cluster: ceph
        • cephadm_mode: root
      • cephadm.shell:
        • host.a:
          • ceph orch status
          • ceph orch ps
          • ceph orch ls
          • ceph orch host ls
          • ceph orch device ls
          • ceph orch ls | grep '^osd.all-available-devices '
      • cephadm.shell:
        • host.a:
          • set -e
            set -x
            ceph orch ps
            ceph orch device ls
            DEVID=$(ceph device ls | grep osd.1 | awk '{print $1}')
            HOST=$(ceph orch device ls | grep $DEVID | awk '{print $1}')
            DEV=$(ceph orch device ls | grep $DEVID | awk '{print $2}')
            echo "host $HOST, dev $DEV, devid $DEVID"
            ceph orch osd rm 1
            while ceph orch osd rm status | grep ^1 ; do sleep 5 ; done
            ceph orch device zap $HOST $DEV --force
            while ! ceph osd dump | grep osd.1 | grep up ; do sleep 5 ; done
    • teuthology_branch: main
    • verbose: False
    • pcp_grafana_url:
    • priority: 85
    • user: rzarzynski
    • queue:
    • posted: 2024-06-03 22:15:47
    • started: 2024-06-03 22:32:23
    • updated: 2024-06-03 23:26:01
    • status_class: danger
    • runtime: 0:53:38
    • wait_time: 0:24:14