archive_path: /home/teuthworker/archive/dparmar-2022-07-11_08:53:46-fs:upgrade-wip-dparmar-cephadm-55715-simple-distro-default-smithi/6923203 branch: wip-dparmar-cephadm-55715-simple description: fs:upgrade/upgrade_without_reducing_max_mds/{bluestore-bitmap centos_8.stream_container_tools conf/{client mds mon osd} overrides/{ignorelist_health ignorelist_wrongly_marked_down pg-warn syntax} roles tasks/{0-from/pacific 1-volume/{0-create 1-ranks/1 2-allow_standby_replay/no 3-inline/yes 4-verify} 2-client 3-upgrade-with-workload 4-verify}} email: null first_in_suite: false job_id: '6923203' kernel: &id001 kdb: true sha1: distro last_in_suite: false machine_type: smithi meta: - desc: 'setup ceph/pacific ' name: dparmar-2022-07-11_08:53:46-fs:upgrade-wip-dparmar-cephadm-55715-simple-distro-default-smithi no_nested_subset: false nuke-on-error: true os_type: centos os_version: 8.stream overrides: admin_socket: branch: wip-dparmar-cephadm-55715-simple ceph: conf: client: client mount timeout: 600 debug client: 20 debug ms: 1 rados mon op timeout: 900 rados osd op timeout: 900 global: mon pg warn min per osd: 0 mds: debug mds: 20 debug mds balancer: 20 debug ms: 1 mds debug frag: true mds debug scatterstat: true mds op complaint time: 180 mds verify scatter: true osd op complaint time: 180 rados mon op timeout: 900 rados osd op timeout: 900 mgr: debug mgr: 20 debug ms: 1 mon: debug mon: 20 debug ms: 1 debug paxos: 20 mon op complaint time: 120 osd: bdev async discard: true bdev enable discard: true bluestore allocator: bitmap bluestore block size: 96636764160 bluestore fsck on mount: true debug bluefs: 1/20 debug bluestore: 1/20 debug ms: 1 debug osd: 20 debug rocksdb: 4/10 mon osd backfillfull_ratio: 0.85 mon osd full ratio: 0.9 mon osd nearfull ratio: 0.8 osd failsafe full ratio: 0.95 osd objectstore: bluestore osd op complaint time: 180 flavor: default fs: xfs log-ignorelist: - \(MDS_ALL_DOWN\) - \(MDS_UP_LESS_THAN_MAX\) - overall HEALTH_ - \(FS_DEGRADED\) - \(MDS_FAILED\) - \(MDS_DEGRADED\) - \(FS_WITH_FAILED_MDS\) - \(MDS_DAMAGE\) - \(MDS_ALL_DOWN\) - \(MDS_UP_LESS_THAN_MAX\) - \(FS_INLINE_DATA_DEPRECATED\) - overall HEALTH_ - \(OSD_DOWN\) - \(OSD_ - but it is still running - is not responding sha1: 67c3088bbad2bb45fab809eb6d89e0b3248197b6 ceph-deploy: bluestore: true conf: client: log file: /var/log/ceph/ceph-$name.$pid.log mon: osd default pool size: 2 osd: bdev async discard: true bdev enable discard: true bluestore block size: 96636764160 bluestore fsck on mount: true debug bluefs: 1/20 debug bluestore: 1/20 debug rocksdb: 4/10 mon osd backfillfull_ratio: 0.85 mon osd full ratio: 0.9 mon osd nearfull ratio: 0.8 osd failsafe full ratio: 0.95 osd objectstore: bluestore fs: xfs install: ceph: flavor: default sha1: 67c3088bbad2bb45fab809eb6d89e0b3248197b6 kclient: syntax: v1 selinux: whitelist: - scontext=system_u:system_r:logrotate_t:s0 thrashosds: bdev_inject_crash: 2 bdev_inject_crash_probability: 0.5 workunit: branch: wip-dparmar-cephadm-55715-simple sha1: 67c3088bbad2bb45fab809eb6d89e0b3248197b6 owner: scheduled_dparmar@teuthology priority: 85 repo: git://git.ceph.com/ceph-ci.git roles: - - host.a - client.0 - osd.0 - osd.1 - osd.2 - - host.b - client.1 - osd.3 - osd.4 - osd.5 sha1: 67c3088bbad2bb45fab809eb6d89e0b3248197b6 sleep_before_teardown: 0 suite: fs:upgrade suite_branch: wip-dparmar-cephadm-55715-simple suite_path: /home/teuthworker/src/git.ceph.com_ceph-c_67c3088bbad2bb45fab809eb6d89e0b3248197b6/qa suite_relpath: qa suite_repo: git://git.ceph.com/ceph-ci.git suite_sha1: 67c3088bbad2bb45fab809eb6d89e0b3248197b6 targets: smithi075.front.sepia.ceph.com: ssh-rsa AAAAB3NzaC1yc2EAAAADAQABAAABgQCrnTHpr27sQVTzBXq5nfn3DhvNjlI50IEwe7FJRtps1Z8COALtB05jJShmU4BKyNXFScH5rDN+zi60RoazI8CbMCN28/gRNkIutLfIakPOx5TiExqPXh4q4om7chH8O0kDuLS0HGY3q6v2houQpY5KI5XQenSkk0KaMiccW6sAC5RsY4Eb/YC7+pf9CA0eMyZeD4jVsd86QwTRCJxJ3WIWfnTl/AMS5fNqzuoOTQmE9CChYUYv9RZT7JTsGklMIdD4O+O1q+nsaP0ny9b/g+JB7xvWiInSi9jZBodJ9rjqq+cBANtk7oUgzlBGUxpSj1namBD4XFC9c2tseF1LpOMQlSk4LB6TvsPPZNZ9kQ/SiS2EzQy/wzRhwsYASY52Wig9DSReVrzyOpHzKlxbNVUStDmDSqgWzs3znzng4mavaurtFMQri2ppuCw7ak1OKkdaR8ArLqZAZ11QZSINgMCnbiS0O2U0+cNJYJnV8TRnbKMQkHfP6duOU1k10YqvL20= smithi204.front.sepia.ceph.com: ssh-rsa AAAAB3NzaC1yc2EAAAADAQABAAABgQDMCw2F6fropmdYO3L8TIT9hNILRYeldUMrO0DdB+9SV73zjqtrjeMwuPi2+/rTq1/ArVmZI6l1H4HCsf3F55NHyT0OGDjjjrfv13PQpuXraqBHZMSgUJucU4Tl1WjTCiNL2eTbbZhxlBW9PBZZaPr2sd9SZaoQULMasnnpw2qYLlNLgKrNf7QfXEM7PJUJS3pXEN2Im1VrlifwA9rW/irG+7nlJtLWZUP9I36YvA39JVczI+hdpxJ5hyMjR05aaBNGPBPhi+3xFd/6PMrKEjbok1x8eHaAFSw5srBFv7hBFfs6bbF05a83fJ/EDb9eWG9z8azifEYFAOcaRj4ms3f09lwnkHWa6mL4mydcmGGdAWZZxF/zhaTQIyrLDokyhhverhjEAqTQZxAsq0NiTTOQGD4KzemZX4xrblgaIQJmVFP8Da+3vvKbiCHTUW+SrFBgoHQ1aYtOYBkjhhBTOR92s1ek1MhBjjK8VYXrW/XnDdzFkWj6OVl4S7nH6bKGWT0= tasks: - internal.check_packages: null - internal.buildpackages_prep: null - internal.save_config: null - internal.check_lock: null - internal.add_remotes: null - console_log: null - internal.connect: null - internal.push_inventory: null - internal.serialize_remote_roles: null - internal.check_conflict: null - internal.check_ceph_data: null - internal.vm_setup: null - kernel: *id001 - internal.base: null - internal.archive_upload: null - internal.archive: null - internal.coredump: null - internal.sudo: null - internal.syslog: null - internal.timer: null - pcp: null - selinux: null - ansible.cephlab: null - clock: null - pexec: all: - sudo cp /etc/containers/registries.conf /etc/containers/registries.conf.backup - sudo dnf -y module reset container-tools - sudo dnf -y module install container-tools - sudo cp /etc/containers/registries.conf.backup /etc/containers/registries.conf - install: branch: pacific exclude_packages: - ceph-volume - print: '**** done install task...' - cephadm: cephadm_branch: pacific cephadm_git_url: https://github.com/ceph/ceph conf: osd: osd_class_default_list: '*' osd_class_load_list: '*' image: quay.io/ceph/daemon-base:latest-pacific roleless: true - print: '**** done end installing pacific cephadm ...' - cephadm.shell: host.a: - ceph config set mgr mgr/cephadm/use_repo_digest true --force - print: '**** done cephadm.shell ceph config set mgr...' - cephadm.shell: host.a: - ceph orch status - ceph orch ps - ceph orch ls - ceph orch host ls - ceph orch device ls - cephadm.shell: host.a: - ceph fs volume create cephfs --placement=4 - ceph fs dump - cephadm.shell: host.a: - ceph fs set cephfs max_mds 2 - cephadm.shell: host.a: - ceph fs set cephfs allow_standby_replay false - cephadm.shell: host.a: - ceph fs set cephfs inline_data true --yes-i-really-really-mean-it - cephadm.shell: host.a: - ceph fs dump - ceph --format=json fs dump | jq -e ".filesystems | length == 1" - while ! ceph --format=json mds versions | jq -e ". | add == 4"; do sleep 1; done - fs.pre_upgrade_save: null - kclient: null - print: '**** done client' - parallel: - upgrade-tasks - workload-tasks - cephadm.shell: host.a: - ceph fs dump - fs.post_upgrade_checks: null teuthology_branch: main teuthology_sha1: 10062088f503b43eff3624326bda825b23438f9b timestamp: 2022-07-11_08:53:46 tube: smithi upgrade-tasks: sequential: - cephadm.shell: env: - sha1 host.a: - ceph config set mon mon_warn_on_insecure_global_id_reclaim false --force - ceph config set mon mon_warn_on_insecure_global_id_reclaim_allowed false --force - ceph config set global log_to_journald false --force - ceph orch ps - ceph versions - ceph -s - ceph orch ls - ceph orch daemon redeploy "mgr.$(ceph mgr dump -f json | jq .standbys | jq .[] | jq -r .name)" --image quay.ceph.io/ceph-ci/ceph:$sha1 - ceph orch ps --refresh - sleep 180 - ceph orch ps - ceph versions - ceph -s - ceph versions | jq -e '.mgr | length == 2' - ceph mgr fail - sleep 180 - ceph orch daemon redeploy "mgr.$(ceph mgr dump -f json | jq .standbys | jq .[] | jq -r .name)" --image quay.ceph.io/ceph-ci/ceph:$sha1 - ceph orch ps --refresh - sleep 180 - ceph orch ps - ceph versions - ceph -s - ceph mgr fail - sleep 180 - ceph orch ps - ceph versions - ceph -s - ceph versions | jq -e '.mgr | length == 1' - ceph mgr fail - sleep 180 - ceph orch ps - ceph versions - ceph orch upgrade start --image quay.ceph.io/ceph-ci/ceph:$sha1 --daemon-types mgr - while ceph orch upgrade status | jq '.in_progress' | grep true && ! ceph orch upgrade status | jq '.message' | grep Error ; do ceph orch ps ; ceph versions ; ceph orch upgrade status ; sleep 30 ; done - ceph versions | jq -e '.mgr | length == 1' - ceph versions | jq -e '.mgr | keys' | grep $sha1 - ceph versions | jq -e '.overall | length == 2' - ceph orch upgrade check quay.ceph.io/ceph-ci/ceph:$sha1 | jq -e '.up_to_date | length == 2' - ceph orch ps --refresh - sleep 180 - ceph config set mgr mgr/orchestrator/fail_fs true - ceph orch upgrade start --image quay.ceph.io/ceph-ci/ceph:$sha1 - cephadm.shell: env: - sha1 host.a: - while ceph orch upgrade status | jq '.in_progress' | grep true && ! ceph orch upgrade status | jq '.message' | grep Error ; do ceph orch ps ; ceph versions ; ceph fs dump; ceph orch upgrade status ; sleep 30 ; done - ceph orch ps - ceph versions - echo "wait for servicemap items w/ changing names to refresh" - sleep 60 - ceph orch ps - ceph health detail - ceph orch upgrade status - ceph versions - ceph versions | jq -e '.overall | length == 1' - ceph versions | jq -e '.overall | keys' | grep $sha1 user: dparmar verbose: true worker_log: /home/teuthworker/archive/worker_logs/dispatcher.smithi.1713 workload-tasks: sequential: - workunit: clients: all: - suites/fsstress.sh