Description: orch:cephadm/smoke-roleless/{0-distro/rhel_8.6_container_tools_rhel8 0-nvme-loop 1-start 2-services/nfs-ingress2 3-final}

Log: http://qa-proxy.ceph.com/teuthology/adking-2023-07-19_13:28:53-orch:cephadm-wip-adk4-testing-2023-07-18-1038-distro-default-smithi/7343326/teuthology.log

Failure Reason:

Error reimaging machines: Failed to power on smithi058

  • log_href: http://qa-proxy.ceph.com/teuthology/adking-2023-07-19_13:28:53-orch:cephadm-wip-adk4-testing-2023-07-18-1038-distro-default-smithi/7343326/teuthology.log
  • archive_path: /home/teuthworker/archive/adking-2023-07-19_13:28:53-orch:cephadm-wip-adk4-testing-2023-07-18-1038-distro-default-smithi/7343326
  • description: orch:cephadm/smoke-roleless/{0-distro/rhel_8.6_container_tools_rhel8 0-nvme-loop 1-start 2-services/nfs-ingress2 3-final}
  • duration:
  • email: adking@redhat.com
  • failure_reason: Error reimaging machines: Failed to power on smithi058
  • flavor:
  • job_id: 7343326
  • kernel:
    • kdb: True
    • sha1: distro
  • last_in_suite: False
  • machine_type: smithi
  • name: adking-2023-07-19_13:28:53-orch:cephadm-wip-adk4-testing-2023-07-18-1038-distro-default-smithi
  • nuke_on_error: True
  • os_type: rhel
  • os_version: 8.6
  • overrides:
    • admin_socket:
      • branch: wip-adk4-testing-2023-07-18-1038
    • ceph:
      • conf:
        • mgr:
          • debug mgr: 20
          • debug ms: 1
        • mon:
          • debug mon: 20
          • debug ms: 1
          • debug paxos: 20
        • osd:
          • debug ms: 1
          • debug osd: 20
          • osd shutdown pgref assert: True
      • flavor: default
      • log-ignorelist:
        • \(MDS_ALL_DOWN\)
        • \(MDS_UP_LESS_THAN_MAX\)
      • sha1: 4ae2a76aad461f2c9f6a1456c25df23ec97a5b2f
    • ceph-deploy:
      • conf:
        • client:
          • log file: /var/log/ceph/ceph-$name.$pid.log
        • mon:
          • osd default pool size: 2
    • install:
      • ceph:
        • flavor: default
        • sha1: 4ae2a76aad461f2c9f6a1456c25df23ec97a5b2f
    • selinux:
      • whitelist:
        • scontext=system_u:system_r:logrotate_t:s0
    • workunit:
      • branch: wip-adk4-testing-2023-07-18-1038
      • sha1: 4ae2a76aad461f2c9f6a1456c25df23ec97a5b2f
  • owner: scheduled_adking@teuthology
  • pid:
  • roles:
    • ['host.a', 'client.0']
    • ['host.b', 'client.1']
  • sentry_event:
  • status: dead
  • success:
  • branch: wip-adk4-testing-2023-07-18-1038
  • seed:
  • sha1: 4ae2a76aad461f2c9f6a1456c25df23ec97a5b2f
  • subset:
  • suite:
  • suite_branch: wip-adk4-testing-2023-07-18-1038
  • suite_path:
  • suite_relpath:
  • suite_repo:
  • suite_sha1: 4ae2a76aad461f2c9f6a1456c25df23ec97a5b2f
  • targets:
    • smithi058.front.sepia.ceph.com: ssh-rsa AAAAB3NzaC1yc2EAAAADAQABAAABgQDPeer/1mzRb807UMaXDp9LkHxwcCBg5bgfjf9lNbzWOn+IU6zIeru043mogJFkCghfuoX7Iwv3iDtIZA9WJrrb4s0cGfCNyZARH9h3YpfDv5gGFd+ZJHvNm0YREGx7uMdUEtKM6fRJm+X+A+pMLZENDDJKuoagmQbGqp+o5Il6LLx3GRtAZGYduk8dRRjlRcvZdq3kZ4z0X4u9i/bxJJqCDAHEPk9jhyK62f2QaKrFxAHqGLbxCsa/GtZeEP2knptfoiPjiYHbIbIbvbyXInQeoJKxL5B1s5D4RldF55VWyWCMdP57ddrjsfvy3eXINV6DNr854teil5C/Q+GqnusnHERxrqyCQejkBz1BSKsMkDf2FnmG3xLcFarcDcxhfrJ5Ts96cPbPZFBwKtcd5vaomPj1E64zfW9TH7wlNAztJGMJHYQfIGgHsCjhv8fjHmup22O9ZodM0jnbscIpY/bvBKXU0245yuWTvz7SSYeSWXHk967jHbQEYzSoqZajMf8=
    • smithi103.front.sepia.ceph.com: ssh-rsa AAAAB3NzaC1yc2EAAAADAQABAAABgQDZj7xWEbKqKonVy+gjWjt4GbKTPgY1eduVkpIc7bJNK1U/8cQj4wCuFRoB3bm/+/lYj3QHtWcdqQvVgJP8huhoURCpveM28ghZ3uYe5h8peoJ604HrqWjNujkKdNwyLcFkr9+EvFH7ghG1+Xp1NIl1wkk4tDWahOdMZWGIPj+OnSyW8CR1T8UdGFntZYAqmBz/AFizwdaYyjLAssGztqhVGEK1zylosVKnJvLesjloMoSydpu7xNizLQpPXYSUsPlwOR15bq/eJfZN9TRINjQTe9Eog7wggoO+xrYSCJWS+/v9QlScz8FmMPh9GZnB/Ig8FHB7I3fx8q67b9Hr1ARrduD6F5LMdX3bW6EJiKsLBgb3BjRHx2EcKVgTYWmDOOeRhPBVm4PNWjnES5ahIEcs8tXREkADYHMfh+KDehvh3YDm80/uj0KFBpigmQUGfbxR0sNIvLC9LVYX9Lzh5XtF/In8g8bynzdZUo5aE1OFE4M9Vdju5ZnEq78h9XoHRq0=
  • tasks:
    • pexec:
      • all:
        • sudo cp /etc/containers/registries.conf /etc/containers/registries.conf.backup
        • sudo dnf -y module reset container-tools
        • sudo dnf -y module install container-tools:rhel8 --allowerasing --nobest
        • sudo cp /etc/containers/registries.conf.backup /etc/containers/registries.conf
    • nvme_loop:
    • cephadm:
      • roleless: True
    • cephadm.shell:
      • host.a:
        • ceph orch status
        • ceph orch ps
        • ceph orch ls
        • ceph orch host ls
        • ceph orch device ls
    • vip:
    • cephadm.shell:
      • host.a:
        • ceph orch device ls --refresh
    • vip.exec:
      • all-hosts:
        • systemctl stop nfs-server
    • cephadm.shell:
      • host.a:
        • ceph fs volume create foofs
        • ceph nfs cluster create foo --ingress --virtual-ip {{VIP0}}/{{VIPPREFIXLEN}} --port 2999
        • ceph nfs export create cephfs --fsname foofs --cluster-id foo --pseudo-path /fake
    • cephadm.wait_for_service:
      • service: nfs.foo
    • cephadm.wait_for_service:
      • service: ingress.nfs.foo
    • vip.exec:
      • host.a:
        • mkdir /mnt/foo
        • sleep 5
        • mount -t nfs {{VIP0}}:/fake /mnt/foo -o port=2999
        • echo test > /mnt/foo/testfile
        • sync
    • cephadm.shell:
      • host.a:
        • echo "Check with each haproxy down in turn..."
          for haproxy in `ceph orch ps | grep ^haproxy.nfs.foo. | awk '{print $1}'`; do
            ceph orch daemon stop $haproxy
            while ! ceph orch ps | grep $haproxy | grep stopped; do sleep 1 ; done
            cat /mnt/foo/testfile
            echo $haproxy > /mnt/foo/testfile
            sync
            ceph orch daemon start $haproxy
            while ! ceph orch ps | grep $haproxy | grep running; do sleep 1 ; done
          done
      • volumes:
        • /mnt/foo:/mnt/foo
    • vip.exec:
      • all-hosts:
        • echo "Check with $(hostname) ganesha(s) down..."
          for c in `systemctl | grep ceph- | grep @nfs | awk '{print $1}'`; do
            cid=`echo $c | sed 's/@/-/'`
            id=`echo $c | cut -d @ -f 2 | sed 's/.service$//'`
            fsid=`echo $c | cut -d @ -f 1 | cut -d - -f 2-`
            echo "Removing daemon $id fsid $fsid..."
            sudo $TESTDIR/cephadm rm-daemon --fsid $fsid --name $id
            echo "Waking up cephadm..."
            sudo $TESTDIR/cephadm shell -- ceph orch ps --refresh
            while ! timeout 1 cat /mnt/foo/testfile ; do true ; done
            echo "Mount is back!"
          done
    • cephadm.shell:
      • host.a:
        • stat -c '%u %g' /var/log/ceph | grep '167 167'
        • ceph orch status
        • ceph orch ps
        • ceph orch ls
        • ceph orch host ls
        • ceph orch device ls
        • ceph orch ls | grep '^osd.all-available-devices '
  • teuthology_branch: main
  • verbose: False
  • pcp_grafana_url:
  • priority:
  • user:
  • queue:
  • posted: 2023-07-19 13:29:13
  • started: 2023-07-19 13:30:06
  • updated: 2023-07-19 13:31:05
  • status_class: danger
  • runtime: 0:00:59