Pulpito :: Results Dashboard

Posted	Started	Updated	Runtime	Duration	In Waiting	Machine	Teuthology Branch	OS Type	OS Version	Nodes	Status
2022-03-09 13:49:47	2022-03-09 13:54:57	2022-03-09 14:31:48	0:36:51	0:22:10	0:14:41	smithi	master	centos	8.stream	2	fail

Nodes: smithi110 smithi166

Description: fs:upgrade/mds_upgrade_sequence/{bluestore-bitmap centos_8.stream_container_tools conf/{client mds mon osd} overrides/{pg-warn syntax whitelist_health whitelist_wrongly_marked_down} roles tasks/{0-from/pacific 1-volume/{0-create 1-ranks/2 2-allow_standby_replay/yes 3-inline/yes 4-verify} 2-client 3-upgrade-with-workload 4-verify}}

Log: http://qa-proxy.ceph.com/teuthology/vshankar-2022-03-09_13:49:18-fs:upgrade-master-testing-default-smithi/6728203/teuthology.log

Sentry event: https://sentry.ceph.com/organizations/ceph/?query=4ee45dc565474981bb5bb5536740e2ce

Failure Reason:

Command failed (workunit test suites/fsstress.sh) on smithi166 with status 126: 'mkdir -p -- /home/ubuntu/cephtest/mnt.1/client.1/tmp && cd -- /home/ubuntu/cephtest/mnt.1/client.1/tmp && CEPH_CLI_TEST_DUP_COMMAND=1 CEPH_REF=27bad0cf8decf43ee4c77b0b76e8f0be5095a177 TESTDIR="/home/ubuntu/cephtest" CEPH_ARGS="--cluster ceph" CEPH_ID="1" PATH=$PATH:/usr/sbin CEPH_BASE=/home/ubuntu/cephtest/clone.client.1 CEPH_ROOT=/home/ubuntu/cephtest/clone.client.1 CEPH_MNT=/home/ubuntu/cephtest/mnt.1 adjust-ulimits ceph-coverage /home/ubuntu/cephtest/archive/coverage timeout 3h /home/ubuntu/cephtest/clone.client.1/qa/workunits/suites/fsstress.sh'

All Details...

log_href: http://qa-proxy.ceph.com/teuthology/vshankar-2022-03-09_13:49:18-fs:upgrade-master-testing-default-smithi/6728203/teuthology.log
archive_path: /home/teuthworker/archive/vshankar-2022-03-09_13:49:18-fs:upgrade-master-testing-default-smithi/6728203
description: fs:upgrade/mds_upgrade_sequence/{bluestore-bitmap centos_8.stream_container_tools conf/{client mds mon osd} overrides/{pg-warn syntax whitelist_health whitelist_wrongly_marked_down} roles tasks/{0-from/pacific 1-volume/{0-create 1-ranks/2 2-allow_standby_replay/yes 3-inline/yes 4-verify} 2-client 3-upgrade-with-workload 4-verify}}
duration: 0:22:10
email: vshankar@redhat.com
failure_reason: Command failed (workunit test suites/fsstress.sh) on smithi166 with status 126: 'mkdir -p -- /home/ubuntu/cephtest/mnt.1/client.1/tmp && cd -- /home/ubuntu/cephtest/mnt.1/client.1/tmp && CEPH_CLI_TEST_DUP_COMMAND=1 CEPH_REF=27bad0cf8decf43ee4c77b0b76e8f0be5095a177 TESTDIR="/home/ubuntu/cephtest" CEPH_ARGS="--cluster ceph" CEPH_ID="1" PATH=$PATH:/usr/sbin CEPH_BASE=/home/ubuntu/cephtest/clone.client.1 CEPH_ROOT=/home/ubuntu/cephtest/clone.client.1 CEPH_MNT=/home/ubuntu/cephtest/mnt.1 adjust-ulimits ceph-coverage /home/ubuntu/cephtest/archive/coverage timeout 3h /home/ubuntu/cephtest/clone.client.1/qa/workunits/suites/fsstress.sh'
flavor: default
job_id: 6728203
kernel:
- flavor: default
- kdb: True
- sha1: f54e082e2b2fd016bc6e204c242f596aafe74c91
last_in_suite: False
machine_type: smithi
name: vshankar-2022-03-09_13:49:18-fs:upgrade-master-testing-default-smithi
nuke_on_error: True
os_type: centos
os_version: 8.stream
overrides:
- admin_socket:
  - branch: master
- ceph:
  - conf:
    - client:
      - client mount timeout: 600
      - debug client: 20
      - debug ms: 1
      - rados mon op timeout: 900
      - rados osd op timeout: 900
    - global:
      - mon pg warn min per osd: 0
    - mds:
      - debug mds: 20
      - debug ms: 1
      - mds debug frag: True
      - mds debug scatterstat: True
      - mds op complaint time: 180
      - mds verify scatter: True
      - osd op complaint time: 180
      - rados mon op timeout: 900
      - rados osd op timeout: 900
    - mgr:
      - debug mgr: 20
      - debug ms: 1
    - mon:
      - debug mon: 20
      - debug ms: 1
      - debug paxos: 20
      - mon op complaint time: 120
    - osd:
      - bdev async discard: True
      - bdev enable discard: True
      - bluestore allocator: bitmap
      - bluestore block size: 96636764160
      - bluestore fsck on mount: True
      - debug bluefs: 1/20
      - debug bluestore: 1/20
      - debug ms: 1
      - debug osd: 20
      - debug rocksdb: 4/10
      - mon osd backfillfull_ratio: 0.85
      - mon osd full ratio: 0.9
      - mon osd nearfull ratio: 0.8
      - osd failsafe full ratio: 0.95
      - osd objectstore: bluestore
      - osd op complaint time: 180
  - flavor: default
  - fs: xfs
  - log-ignorelist:
    - $MDS_ALL_DOWN$
    - $MDS_UP_LESS_THAN_MAX$
    - overall HEALTH_
    - $FS_DEGRADED$
    - $MDS_FAILED$
    - $MDS_DEGRADED$
    - $FS_WITH_FAILED_MDS$
    - $MDS_DAMAGE$
    - $MDS_ALL_DOWN$
    - $MDS_UP_LESS_THAN_MAX$
    - $FS_INLINE_DATA_DEPRECATED$
    - overall HEALTH_
    - $OSD_DOWN$
    - $OSD_
    - but it is still running
    - is not responding
  - log-whitelist:
    - \(MDS_ALL_DOWN$
    - $MDS_UP_LESS_THAN_MAX$
  - sha1: e98697fdcb3b7b8eab3fc453719d4e18f0d62be4
- ceph-deploy:
  - bluestore: True
  - conf:
    - client:
      - log file: /var/log/ceph/ceph-$name.$pid.log
    - mon:
      - osd default pool size: 2
    - osd:
      - bdev async discard: True
      - bdev enable discard: True
      - bluestore block size: 96636764160
      - bluestore fsck on mount: True
      - debug bluefs: 1/20
      - debug bluestore: 1/20
      - debug rocksdb: 4/10
      - mon osd backfillfull_ratio: 0.85
      - mon osd full ratio: 0.9
      - mon osd nearfull ratio: 0.8
      - osd failsafe full ratio: 0.95
      - osd objectstore: bluestore
  - fs: xfs
- install:
  - ceph:
    - flavor: default
    - sha1: e98697fdcb3b7b8eab3fc453719d4e18f0d62be4
- kclient:
  - syntax: v1
- selinux:
  - whitelist:
    - scontext=system_u:system_r:logrotate_t:s0
- thrashosds:
  - bdev_inject_crash: 2
  - bdev_inject_crash_probability: 0.5
- workunit:
  - branch: master
  - sha1: 27bad0cf8decf43ee4c77b0b76e8f0be5095a177
owner: scheduled_vshankar@teuthology
pid:
roles:
- ['host.a', 'client.0', 'osd.0', 'osd.1', 'osd.2']
- ['host.b', 'client.1', 'osd.3', 'osd.4', 'osd.5']
sentry_event: https://sentry.ceph.com/organizations/ceph/?query=4ee45dc565474981bb5bb5536740e2ce
status: fail
success: False
branch: master
seed:
sha1: e98697fdcb3b7b8eab3fc453719d4e18f0d62be4
subset:
suite:
suite_branch: master
suite_path:
suite_relpath:
suite_repo:
suite_sha1: 27bad0cf8decf43ee4c77b0b76e8f0be5095a177
targets:
- smithi110.front.sepia.ceph.com: ssh-rsa AAAAB3NzaC1yc2EAAAADAQABAAABgQC0C16AQSfWpXfZOXRbBZE2hqtoRX7MO4it7xLxW1xCZG/SmOv2GBaFZrp1C2yR0/zddZ5G3rC13b2dfd46bfc+SQiBXS0qsaT9X9ZJNt2M6TcdqEG5pLplZZ11VBmBrcciZyOGQ1dMQKpE1ZMm0HIzyelc8rKwpf/zaTds/nqQpbwms7/23wGsKVoqNFJf9mSjxgUeDpvHQhUdQJNeGz5CYVu7kssItIPKL3bVFjlU7KWXaNMnvf1PiRJ5+87CJZs3wZcPenivVHxRPkWIGcf53QLAa/IFXk9H0fKp9SKDMisGWMaKMz+JSAs5yE5jLcOOiyq5H7q7LCynkHZ3AQgUKM0MHDxuINmFNfQCcMNhSl+KfKi/Fsf9O6Ap81atKhgB2FYeXjOLPfkHqzDMd/OqWcaTJCuT+KqSgia713sNWzt9YfW1oHiBTv4/SbkyfpQ+6mGA5IU+BMSHWgCcs97zztHc8PvtNiH/yd2GiIZVKZzJ/FJLL6DTLnL0uSBoWCU=
- smithi166.front.sepia.ceph.com: ssh-rsa AAAAB3NzaC1yc2EAAAADAQABAAABgQD19D+91iE99UtYYnFtxTa0URDJl5wYFa45AuBiwQH1mNV8PhMf6M6zdeMerE1t2QRX42PLBKl7UD+nFvXx7jGFdy5KOKvS7Udyv3pNbVqgqyijUSbb515OcoLAwKwwbdkjKGPolWUEpncU8+JGJBZSTfvtPppXuqnhl6Y5Cxp6uqbNABl9Uz+OwWEYmTakcLcR/D/ZLONjZcNPSxrU4sySxrfC1WZp3HwdLrAInnrBqcYsOhOxCWVurgJlo2+TAtujkUjx9GJVIUcd65zXMigKGx8tP4wzvjarVKhZAyp21MElOeOvYfqPzxGz+/S/tiH3P+FYd/Gbfq/TmBVA6gBLKf140erbBIO7zYAsN0+DVKU4rDruYfS7OSBCnL0jHCTUkU869mIkhNAqdXvBP388CRsXNB22fZLRXHjdrVReyUGI7mazcqAoXNnkITFMH/fZLWlqJybrExAlBGdEcsQMZwzQaOGgtdMsf4KI3Qnf2STNr/zBEtvpOD4BK7+cquE=
tasks:
- internal.check_packages:
- internal.buildpackages_prep:
- internal.save_config:
- internal.check_lock:
- internal.add_remotes:
- console_log:
- internal.connect:
- internal.push_inventory:
- internal.serialize_remote_roles:
- internal.check_conflict:
- internal.check_ceph_data:
- internal.vm_setup:
- kernel:
  - flavor: default
  - kdb: True
  - sha1: f54e082e2b2fd016bc6e204c242f596aafe74c91
- internal.base:
- internal.archive_upload:
- internal.archive:
- internal.coredump:
- internal.sudo:
- internal.syslog:
- internal.timer:
- pcp:
- selinux:
- ansible.cephlab:
- clock:
- pexec:
  - all:
    - sudo cp /etc/containers/registries.conf /etc/containers/registries.conf.backup
    - sudo dnf -y module reset container-tools
    - sudo dnf -y module install container-tools
    - sudo cp /etc/containers/registries.conf.backup /etc/containers/registries.conf
- install:
  - branch: pacific
  - exclude_packages:
    - ceph-volume
  - flavor: default
  - sha1: e98697fdcb3b7b8eab3fc453719d4e18f0d62be4
- print: **** done install task...
- cephadm:
  - cephadm_branch: pacific
  - cephadm_git_url: https://github.com/ceph/ceph
  - conf:
    - osd:
      - osd_class_default_list: *
      - osd_class_load_list: *
      - bdev async discard: True
      - bdev enable discard: True
      - bluestore allocator: bitmap
      - bluestore block size: 96636764160
      - bluestore fsck on mount: True
      - debug bluefs: 1/20
      - debug bluestore: 1/20
      - debug ms: 1
      - debug osd: 20
      - debug rocksdb: 4/10
      - mon osd backfillfull_ratio: 0.85
      - mon osd full ratio: 0.9
      - mon osd nearfull ratio: 0.8
      - osd failsafe full ratio: 0.95
      - osd objectstore: bluestore
      - osd op complaint time: 180
    - client:
      - client mount timeout: 600
      - debug client: 20
      - debug ms: 1
      - rados mon op timeout: 900
      - rados osd op timeout: 900
    - global:
      - mon pg warn min per osd: 0
    - mds:
      - debug mds: 20
      - debug ms: 1
      - mds debug frag: True
      - mds debug scatterstat: True
      - mds op complaint time: 180
      - mds verify scatter: True
      - osd op complaint time: 180
      - rados mon op timeout: 900
      - rados osd op timeout: 900
    - mgr:
      - debug mgr: 20
      - debug ms: 1
    - mon:
      - debug mon: 20
      - debug ms: 1
      - debug paxos: 20
      - mon op complaint time: 120
  - image: docker.io/ceph/daemon-base:latest-pacific
  - roleless: True
  - flavor: default
  - fs: xfs
  - log-ignorelist:
    - $MDS_ALL_DOWN$
    - $MDS_UP_LESS_THAN_MAX$
    - overall HEALTH_
    - $FS_DEGRADED$
    - $MDS_FAILED$
    - $MDS_DEGRADED$
    - $FS_WITH_FAILED_MDS$
    - $MDS_DAMAGE$
    - $MDS_ALL_DOWN$
    - $MDS_UP_LESS_THAN_MAX$
    - $FS_INLINE_DATA_DEPRECATED$
    - overall HEALTH_
    - $OSD_DOWN$
    - $OSD_
    - but it is still running
    - is not responding
  - log-whitelist:
    - \(MDS_ALL_DOWN$
    - $MDS_UP_LESS_THAN_MAX$
  - sha1: e98697fdcb3b7b8eab3fc453719d4e18f0d62be4
  - cluster: ceph
  - cephadm_mode: root
- print: **** done end installing pacific cephadm ...
- cephadm.shell:
  - host.a:
    - ceph config set mgr mgr/cephadm/use_repo_digest true --force
- print: **** done cephadm.shell ceph config set mgr...
- cephadm.shell:
  - host.a:
    - ceph orch status
    - ceph orch ps
    - ceph orch ls
    - ceph orch host ls
    - ceph orch device ls
- cephadm.shell:
  - host.a:
    - ceph fs volume create cephfs --placement=4
    - ceph fs dump
- cephadm.shell:
  - host.a:
    - ceph fs set cephfs max_mds 2
- cephadm.shell:
  - host.a:
    - ceph fs set cephfs allow_standby_replay true
- cephadm.shell:
  - host.a:
    - ceph fs set cephfs inline_data true --yes-i-really-really-mean-it
- cephadm.shell:
  - host.a:
    - ceph fs dump
    - ceph --format=json fs dump | jq -e ".filesystems | length == 1"
    - while ! ceph --format=json mds versions | jq -e ". | add == 4"; do sleep 1; done
- fs.pre_upgrade_save:
- kclient:
- print: **** done client
- parallel:
  - upgrade-tasks
  - workload-tasks
- cephadm.shell:
  - host.a:
    - ceph fs dump
- fs.post_upgrade_checks:
teuthology_branch: master
verbose: False
pcp_grafana_url:
priority:
user:
queue:
posted: 2022-03-09 13:49:47
started: 2022-03-09 13:54:57
updated: 2022-03-09 14:31:48
status_class: danger
runtime: 0:36:51
wait_time: 0:14:41