---
# Job configuration for a single QA run (job 6506511) of the "rados" suite:
# install v16.2.4 via cephadm, create a CephFS volume, then run an upgrade
# (`upgrade-tasks`) in parallel with a client workload (`workload-tasks`).
#
# NOTE(review): this file was reconstructed from a whitespace-collapsed copy.
# Nesting was inferred from key order (siblings are alphabetically sorted at
# every level); confirm against the original job file if one is available.

archive_path: /home/teuthworker/archive/yuriw-2021-11-16_13:07:14-rados-wip-yuri4-testing-2021-11-15-1306-distro-basic-smithi/6506511
branch: wip-yuri4-testing-2021-11-15-1306
# Folded scalar: the lines below are joined with single spaces into one string.
description: >-
  rados/cephadm/mds_upgrade_sequence/{bluestore-bitmap
  centos_8.stream_container_tools
  conf/{client mds mon osd}
  overrides/{pg-warn whitelist_health whitelist_wrongly_marked_down}
  roles
  tasks/{0-v16.2.4
  1-volume/{0-create 1-ranks/1 2-allow_standby_replay/no 3-verify}
  2-client 3-upgrade-with-workload 4-verify}}
email: null
first_in_suite: false
# Quoted so the all-digit id stays a string.
job_id: '6506511'
kernel:
  kdb: true
  sha1: distro
last_in_suite: false
machine_type: smithi
meta:
  # NOTE(review): the trailing space is kept exactly as found; it may have
  # been a trailing newline before the file's whitespace was collapsed.
  - desc: 'setup ceph/pacific v16.2.4 '
name: yuriw-2021-11-16_13:07:14-rados-wip-yuri4-testing-2021-11-15-1306-distro-basic-smithi
nuke-on-error: true
os_type: centos
os_version: '8.stream'

# Per-task setting overrides, keyed by task name.
overrides:
  admin_socket:
    branch: wip-yuri4-testing-2021-11-15-1306
  ceph:
    # Ceph configuration options, grouped by section name.
    conf:
      client:
        client mount timeout: 600
        debug client: 20
        debug ms: 1
        rados mon op timeout: 15m
        rados osd op timeout: 15m
      global:
        mon pg warn min per osd: 0
      mds:
        debug mds: 20
        debug ms: 1
        mds debug frag: true
        mds debug scatterstat: true
        mds op complaint time: 180
        mds verify scatter: true
        osd op complaint time: 180
        rados mon op timeout: 15m
        rados osd op timeout: 15m
      mgr:
        debug mgr: 20
        debug ms: 1
      mon:
        debug mon: 20
        debug ms: 1
        debug paxos: 20
        mon op complaint time: 120
      osd:
        bdev async discard: true
        bdev enable discard: true
        bluestore allocator: bitmap
        bluestore block size: 96636764160
        bluestore fsck on mount: true
        debug bluefs: 1/20
        debug bluestore: 1/20
        debug ms: 1
        debug osd: 20
        debug rocksdb: 4/10
        mon osd backfillfull_ratio: 0.85
        mon osd full ratio: 0.9
        mon osd nearfull ratio: 0.8
        osd failsafe full ratio: 0.95
        osd objectstore: bluestore
        osd op complaint time: 180
    fs: xfs
    # Single-quoted so the backslashes stay literal. Repeated entries are
    # preserved exactly as they appear in the source.
    log-ignorelist:
      - '\(MDS_ALL_DOWN\)'
      - '\(MDS_UP_LESS_THAN_MAX\)'
      - 'overall HEALTH_'
      - '\(FS_DEGRADED\)'
      - '\(MDS_FAILED\)'
      - '\(MDS_DEGRADED\)'
      - '\(FS_WITH_FAILED_MDS\)'
      - '\(MDS_DAMAGE\)'
      - '\(MDS_ALL_DOWN\)'
      - '\(MDS_UP_LESS_THAN_MAX\)'
      - '\(FS_INLINE_DATA_DEPRECATED\)'
      - 'overall HEALTH_'
      - '\(OSD_DOWN\)'
      - '\(OSD_'
      - 'but it is still running'
      - 'is not responding'
    log-whitelist:
      - '\(MDS_ALL_DOWN\)'
      - '\(MDS_UP_LESS_THAN_MAX\)'
    sha1: f188280b31ba4dafe6a9cbafd87bae7a4fc52a64
  ceph-deploy:
    bluestore: true
    conf:
      client:
        log file: /var/log/ceph/ceph-$name.$pid.log
      mon:
        osd default pool size: 2
      osd:
        bdev async discard: true
        bdev enable discard: true
        bluestore block size: 96636764160
        bluestore fsck on mount: true
        debug bluefs: 1/20
        debug bluestore: 1/20
        debug rocksdb: 4/10
        mon osd backfillfull_ratio: 0.85
        mon osd full ratio: 0.9
        mon osd nearfull ratio: 0.8
        osd failsafe full ratio: 0.95
        osd objectstore: bluestore
    fs: xfs
  install:
    ceph:
      sha1: f188280b31ba4dafe6a9cbafd87bae7a4fc52a64
  selinux:
    whitelist:
      - scontext=system_u:system_r:logrotate_t:s0
  thrashosds:
    bdev_inject_crash: 2
    bdev_inject_crash_probability: 0.5
  workunit:
    branch: wip-yuri4-testing-2021-11-15-1306
    sha1: f188280b31ba4dafe6a9cbafd87bae7a4fc52a64

owner: scheduled_yuriw@teuthology
priority: 71
repo: https://github.com/ceph/ceph-ci.git

# One inner list per host; each inner list names the roles on that host.
roles:
  - - host.a
    - client.0
    - osd.0
    - osd.1
    - osd.2
  - - host.b
    - client.1
    - osd.3
    - osd.4
    - osd.5

sha1: f188280b31ba4dafe6a9cbafd87bae7a4fc52a64
sleep_before_teardown: 0
suite: rados
suite_branch: wip-yuri4-testing-2021-11-15-1306
suite_path: /home/teuthworker/src/github.com_ceph_ceph-c_f188280b31ba4dafe6a9cbafd87bae7a4fc52a64/qa
suite_relpath: qa
suite_repo: https://github.com/ceph/ceph-ci.git
suite_sha1: f188280b31ba4dafe6a9cbafd87bae7a4fc52a64

# Target machines mapped to their SSH public host keys.
targets:
  smithi043.front.sepia.ceph.com: ssh-rsa AAAAB3NzaC1yc2EAAAADAQABAAABgQC82UDOitEEk3pCqw1PSc00ZhJ6RXZfLynqx5pdo+yafEEy7IOGXwUNZiEENVzhAM4PbWDvAyWMVbqhUtfIP+125XIyez5MYrX0JdeEX06BIJBefkh78Q+8ObnfDbztEOvfciOzbCgymSCL9tKp819FN9kL6YRcV2AZoOEbyB0Rcm+RvZih4YuSrW+NvzGZKGN9KK+/NqrGNB+NeJMmSv+KfVbFmgkUCC2AK+atWiYpi3pS9Pzc0CE3L83+i4aED2NSOzZMGCxhiWQHi2KYTrKqVmZ7ka9rjwIGLESCA0RP3OJhIvJT1v+oJtmTsnbjj+fmu4R1z18vdxrTiV2cb7+9j4opV7y5MOHWwIv5Qv/IXvapxYdfnBq7dO60fLkKd4KXdt97PWak41gPb79Aa5HEtyrgAQfn8eGj7QZbb1QnDuSYs0IiS+2Y5Q+BCZVfuKW98U5Y+GH37IZqRvzrfTFoKKXHfN+Q84GFz1NeTrGj0RqVy/6eTvqwrmdTSHUhmxE=
  smithi123.front.sepia.ceph.com: ssh-rsa AAAAB3NzaC1yc2EAAAADAQABAAABgQChQUEUDj1roPXj9OTEEsCwmQzjlXcBW36RyXknAfIk7R4VcqpKe7ixyrobwb9bngO+3nFm+UtzeUOiUeU3XQd+HFxCWdRDhElazuzj7Roptn6/VbL5SJx9eAUEZ+S8qr35Wi0EKk2o85h818xtREJhv7iTT9jvGGUS2sS6qwTXjRILHYE7aLpqd017KjUqR5bPN3o5GHd28IKdAbBDoEOut3DS2su2+z1ovcGq9aNlJuuC0XgyGw29WPUwQZsY1bwcYVwG/Gktp/ihSbRztkLi+w9mD2/RuIczFRJegS21lxCSNaGZuDnG4MubmS2O1Jpr4y3YoImj1G796nuRc2j5/Wq5qLRC7l1+VPnk45jPtRCJaFSTqIrapk8F/wyidyBI17Mj4rDACqHDZ5+xSx74qzzK2KQG/GJTVvJl7hyKHoVl/XJEfsrC4DFuFfDLFbPr6env/HYB+3GYkUeU5bcocOHS4scMZxcJ4prOBmVA6RcJ6fRpaLzB6J0fNUxA9s0=

# Ordered task list for the job.
tasks:
  # Reinstall the container-tools module; registries.conf is backed up
  # beforehand and copied back afterwards.
  - pexec:
      all:
        - sudo cp /etc/containers/registries.conf /etc/containers/registries.conf.backup
        - sudo dnf -y module reset container-tools
        - sudo dnf -y module install container-tools
        - sudo cp /etc/containers/registries.conf.backup /etc/containers/registries.conf
  - install:
      exclude_packages:
        - ceph-volume
      tag: v16.2.4
  - cephadm:
      avoid_pacific_features: true
      cephadm_branch: v16.2.4
      cephadm_git_url: https://github.com/ceph/ceph
      image: docker.io/ceph/ceph:v16.2.4
      roleless: true
  # Quoted because the value starts with `*` (the YAML alias indicator).
  - print: '**** done starting v16.2.4'
  - cephadm.shell:
      host.a:
        - ceph orch status
        - ceph orch ps
        - ceph orch ls
        - ceph orch host ls
        - ceph orch device ls
  - cephadm.shell:
      host.a:
        - ceph fs volume create cephfs --placement=4
        - ceph fs dump
  - cephadm.shell:
      host.a:
        - ceph fs set cephfs max_mds 1
  - cephadm.shell:
      host.a:
        - ceph fs set cephfs allow_standby_replay false
  # `jq -e` exits non-zero when its filter evaluates to false, so these two
  # commands act as assertions (one filesystem; versions add up to 4).
  - cephadm.shell:
      host.a:
        - ceph fs dump
        - ceph --format=json fs dump | jq -e ".filesystems | length == 1"
        - ceph --format=json mds versions | jq -e ". | add == 4"
  - fs.pre_upgrade_save: null
  - kclient: null
  - print: '**** done kclient client'
  # The names below refer to the top-level `upgrade-tasks` and
  # `workload-tasks` keys of this file.
  - parallel:
      - upgrade-tasks
      - workload-tasks
  - cephadm.shell:
      host.a:
        - ceph fs dump
  - fs.post_upgrade_checks: null

teuthology_branch: master
teuthology_sha1: 6cfddd5e1c7d5ede1367cf3087c21af44eb88356
timestamp: '2021-11-16_13:07:14'
tube: smithi

upgrade-tasks:
  sequential:
    # Start the upgrade to the image tagged with $sha1.
    - cephadm.shell:
        env:
          - sha1
        host.a:
          - ceph config set mon mon_warn_on_insecure_global_id_reclaim false --force
          - ceph config set mon mon_warn_on_insecure_global_id_reclaim_allowed false --force
          - ceph config set global log_to_journald false --force
          - ceph orch upgrade start --image quay.ceph.io/ceph-ci/ceph:$sha1
    # Poll every 30 s while the upgrade reports in_progress, then check that
    # exactly one overall version remains and that it contains $sha1.
    - cephadm.shell:
        env:
          - sha1
        host.a:
          # Folded scalar: joined with single spaces into one shell command.
          - >-
            while ceph orch upgrade status | jq '.in_progress' | grep true ;
            do ceph orch ps ; ceph versions ; ceph fs dump; sleep 30 ; done
          - ceph orch ps
          - ceph versions
          - echo "wait for servicemap items w/ changing names to refresh"
          - sleep 60
          - ceph orch ps
          - ceph versions
          - ceph versions | jq -e '.overall | length == 1'
          - ceph versions | jq -e '.overall | keys' | grep $sha1

user: yuriw
verbose: true
worker_log: /home/teuthworker/archive/worker_logs/dispatcher.smithi.20261

workload-tasks:
  sequential:
    - workunit:
        clients:
          all:
            - suites/fsstress.sh