Description: rbd/librbd/{cache/none clusters/{fixed-3 openstack} config/permit-partial-discard min-compat-client/octopus msgr-failures/few objectstore/filestore-xfs pool/ec-data-pool supported-random-distro$/{centos_8} workloads/fsx}

Log: http://qa-proxy.ceph.com/teuthology/yuriw-2023-01-13_17:05:26-rbd-wip-yuri3-testing-2023-01-12-1538-quincy-distro-default-smithi/7141958/teuthology.log

Failure Reason:

"2023-01-14T10:46:42.968966+0000 mon.a (mon.0) 366 : cluster [WRN] Health check failed: 2 mgr modules have recently crashed (RECENT_MGR_MODULE_CRASH)" in cluster log

  • log_href: http://qa-proxy.ceph.com/teuthology/yuriw-2023-01-13_17:05:26-rbd-wip-yuri3-testing-2023-01-12-1538-quincy-distro-default-smithi/7141958/teuthology.log
  • archive_path: /home/teuthworker/archive/yuriw-2023-01-13_17:05:26-rbd-wip-yuri3-testing-2023-01-12-1538-quincy-distro-default-smithi/7141958
  • description: rbd/librbd/{cache/none clusters/{fixed-3 openstack} config/permit-partial-discard min-compat-client/octopus msgr-failures/few objectstore/filestore-xfs pool/ec-data-pool supported-random-distro$/{centos_8} workloads/fsx}
  • duration: 0:21:23
  • email: yweinstein@redhat.com
  • failure_reason: "2023-01-14T10:46:42.968966+0000 mon.a (mon.0) 366 : cluster [WRN] Health check failed: 2 mgr modules have recently crashed (RECENT_MGR_MODULE_CRASH)" in cluster log
  • flavor: default
  • job_id: 7141958
  • kernel:
    • kdb: True
    • sha1: distro
  • last_in_suite: False
  • machine_type: smithi
  • name: yuriw-2023-01-13_17:05:26-rbd-wip-yuri3-testing-2023-01-12-1538-quincy-distro-default-smithi
  • nuke_on_error: True
  • os_type: centos
  • os_version: 8.stream
  • overrides:
    • admin_socket:
      • branch: wip-yuri3-testing-2023-01-12-1538-quincy
    • ceph:
      • conf:
        • client:
          • rbd default data pool: datapool
          • rbd skip partial discard: False
        • global:
          • mon client directed command retry: 5
          • ms inject socket failures: 5000
        • mgr:
          • debug mgr: 20
          • debug ms: 1
        • mon:
          • debug mon: 20
          • debug ms: 1
          • debug paxos: 20
        • osd:
          • bluestore block size: 96636764160
          • debug ms: 1
          • debug osd: 20
          • enable experimental unrecoverable data corrupting features: *
          • osd debug randomize hobject sort order: False
          • osd objectstore: bluestore
          • osd shutdown pgref assert: True
          • osd sloppy crc: True
      • flavor: default
      • fs: xfs
      • log-ignorelist:
        • \(MDS_ALL_DOWN\)
        • \(MDS_UP_LESS_THAN_MAX\)
        • but it is still running
        • \(OSD_SLOW_PING_TIME
      • sha1: bfd3a6ed50faf52c25e13b78ed4e141204a3b665
    • ceph-deploy:
      • conf:
        • client:
          • log file: /var/log/ceph/ceph-$name.$pid.log
        • mon:
          • osd default pool size: 2
        • osd:
          • osd objectstore: filestore
          • osd sloppy crc: True
      • filestore: True
      • fs: xfs
    • install:
      • ceph:
        • flavor: default
        • sha1: bfd3a6ed50faf52c25e13b78ed4e141204a3b665
    • selinux:
      • whitelist:
        • scontext=system_u:system_r:logrotate_t:s0
    • thrashosds:
      • bdev_inject_crash: 2
      • bdev_inject_crash_probability: 0.5
    • workunit:
      • branch: wip-yuri3-testing-2023-01-12-1538-quincy
      • sha1: bfd3a6ed50faf52c25e13b78ed4e141204a3b665
  • owner: scheduled_yuriw@teuthology
  • pid:
  • roles:
    • ['mon.a', 'mon.c', 'mgr.x', 'osd.0', 'osd.1', 'osd.2', 'osd.3']
    • ['mon.b', 'mgr.y', 'osd.4', 'osd.5', 'osd.6', 'osd.7']
    • ['client.0']
  • sentry_event:
  • status: fail
  • success: False
  • branch: wip-yuri3-testing-2023-01-12-1538-quincy
  • seed:
  • sha1: bfd3a6ed50faf52c25e13b78ed4e141204a3b665
  • subset:
  • suite:
  • suite_branch: wip-yuri3-testing-2023-01-12-1538-quincy
  • suite_path:
  • suite_relpath:
  • suite_repo:
  • suite_sha1: bfd3a6ed50faf52c25e13b78ed4e141204a3b665
  • targets:
    • smithi006.front.sepia.ceph.com: ssh-rsa AAAAB3NzaC1yc2EAAAADAQABAAABgQDYb8fyzZF34ztDHfGbT0WQEuST3WjHPeaHLpr6H+kmtAQWa6P4Fsf6ZRv9u5kd4JFT8e0XnBICziAjSeOL+wD2w0umy7Tyt3PscmMX8yHnnsDSC3srqFPwt30mn8Ijl+lHOX+vVcuyMJQQ5Akq2v1G5tSDnnBiX4wRtyLL+/TFdiSTios3anSulEh6rCct++9EkF/ueaT5SdrLGrjUKRZ6RaM3Io5Xb7fqL5Ca08DMrKIs2PElonZVcEhlb/RhwDzMxkdqOAsN7FPzz+kRQc1lNSwAnBFJ4gTbSWjBkIiSyR1qeuBW7VH7qQZcv0Tx2up5YtZiEkT/HOYvc3qinxLSoktmh3/7vzZF1WzoRtgJhWIhnmSLeOKhac0cdEcyeNSZsvnJeiCbtL5zYz4GOPTU+jSUJCWZinI9jFSXYBP9uFuN7mbghmJtd21eimIuvu4kRi4qAhAcFVi8p55jN41+towLZjJqxe4IG021hkwUavx121zrtJANtM44/yArCNE=
    • smithi016.front.sepia.ceph.com: ssh-rsa AAAAB3NzaC1yc2EAAAADAQABAAABgQCunY9tI82go24CslQfKuIOFW8UUw6/odCXKkHl3/fHxuiYy2XLfeICxleKzy8QRGPMJH3xqIeKI7OKSC1Wzh/hYMYNveXREldxN8U8AW7mqNe6cGSmfVyNRLZph2I1KvCciPUqab+PLqRbTUvnxQLvpkCNuRjYj7UWMhjl6OamRZe62EFoOnGEj/+ddJgS2ZstUpbQBBnPa4av4/nUVb3Ivf3QxWG0Q0nl8ZKGJWx6pP8Kx0447E5q9dyF50piChLIQJWL96hYUSbVir/DLh/V9Wsllgb8wnzaM3t28N7Nl0sybGUf9KRxHx25rEWcZ42m/IZzwZcUSLG7NffbN4aue7Fd+eJ9aMIowALzBkkaIL1p6U0OBE89vKKWk6TsendH1BCv/RKJZn4rJV3Y0zwlsoetcyya8B/0gZ81xpbmdG+7+8W2XBhDIBcJLU/FcJoHr8UX4ukpdh8GJP1VX/ROTKstdOliMinU/mbRiw+Ba5cmUphG8h7AJK7Z+FKuul0=
    • smithi033.front.sepia.ceph.com: ssh-rsa AAAAB3NzaC1yc2EAAAADAQABAAABgQDNxtI7PGW5XHnuWswNCJUB2TXSo66r+gXQf+ssYh9vDnwZUIFblg6ZBVh7U8kyUcbaoZBKh3qeTWyxbUvSwm9SBQnXjVYlLk+sRbQx46jo55BCIsMpEUOBJadl2JfkAljY3S7DPDcioKUnSyOUetbbYUfr24SKLviEKXQzVTXVW6a7Ri9cjC9E3psdUutUQXKFT328oRbfaOz9lnA5T22utg2HRskgUzRGyAG31qOxlvnAtvDGCk6CkPIyhzWpQd8qeQwEPZ8+KF7fUYqQ/BdCZdPk2QesHdP6vld5v4BcSnOQmnVbSyNugIIug0/naKgmzm89wXPK7M7mns4OrIfzz3Qm+3qMdJMi7oXHTinsguk0AyLrGtTTOgImlqRPDgMGffyAXwjaG63i+4rCLu86nI1G1R1Tl1oKbZ3xv47MhIPxb0HhtYLOOUJOGQgbs3/abucKbMcHiXbOzRpXZVQTXfG4tEK6YMYIlp3bpG6koLSmI+y+tbDT9N0b3eOVm0E=
  • tasks:
    • internal.check_packages:
    • internal.buildpackages_prep:
    • internal.save_config:
    • internal.check_lock:
    • internal.add_remotes:
    • console_log:
    • internal.connect:
    • internal.push_inventory:
    • internal.serialize_remote_roles:
    • internal.check_conflict:
    • internal.check_ceph_data:
    • internal.vm_setup:
    • kernel:
      • kdb: True
      • sha1: distro
    • internal.base:
    • internal.archive_upload:
    • internal.archive:
    • internal.coredump:
    • internal.sudo:
    • internal.syslog:
    • internal.timer:
    • pcp:
    • selinux:
    • ansible.cephlab:
    • clock:
    • install:
    • ceph:
      • conf:
        • client:
          • rbd cache: False
          • rbd default data pool: datapool
          • rbd skip partial discard: False
        • global:
          • mon client directed command retry: 5
          • ms inject socket failures: 5000
        • mgr:
          • debug mgr: 20
          • debug ms: 1
        • mon:
          • debug mon: 20
          • debug ms: 1
          • debug paxos: 20
        • osd:
          • bluestore block size: 96636764160
          • debug ms: 1
          • debug osd: 20
          • enable experimental unrecoverable data corrupting features: *
          • osd debug randomize hobject sort order: False
          • osd objectstore: bluestore
          • osd shutdown pgref assert: True
          • osd sloppy crc: True
      • flavor: default
      • fs: xfs
      • log-ignorelist:
        • \(MDS_ALL_DOWN\)
        • \(MDS_UP_LESS_THAN_MAX\)
        • but it is still running
        • \(OSD_SLOW_PING_TIME
      • sha1: bfd3a6ed50faf52c25e13b78ed4e141204a3b665
      • cluster: ceph
    • exec:
      • client.0:
        • sudo ceph osd set-require-min-compat-client octopus
    • exec:
      • client.0:
        • sudo ceph osd erasure-code-profile set teuthologyprofile crush-failure-domain=osd m=1 k=2
        • sudo ceph osd pool create datapool 4 4 erasure teuthologyprofile
        • sudo ceph osd pool set datapool allow_ec_overwrites true
        • rbd pool init datapool
    • rbd_fsx:
      • clients:
        • client.0
      • ops: 20000
  • teuthology_branch: main
  • verbose: True
  • pcp_grafana_url:
  • priority:
  • user:
  • queue:
  • posted: 2023-01-13 17:08:29
  • started: 2023-01-14 10:20:58
  • updated: 2023-01-14 10:52:40
  • status_class: danger
  • runtime: 0:31:42
  • wait_time: 0:10:19