---
# Job configuration for one run of the upgrade:pacific-x:stress-split suite
# (job 6925260). Top-level keys are kept in sorted order.

archive_path: /home/teuthworker/archive/pdhange-2022-07-12_01:40:45-upgrade:pacific-x:stress-split-wip-pdhange-testing-distro-default-smithi/6925260
branch: wip-pdhange-testing
# Folded scalar: the lines below are joined with single spaces into one string.
description: >-
  upgrade:pacific-x:stress-split/{0-distro/rhel_8.6_container_tools_3.0
  0-roles 1-start 2-first-half-tasks/prometheus-metrics
  3-stress-tasks/{radosbench rbd-cls rbd-import-export rbd_api readwrite
  snaps-few-objects} 4-second-half-tasks/prometheus-metrics
  mon_election/connectivity}
email: null

# Named task list; referenced by name from a `parallel` entry under `tasks`.
# Starts the upgrade to the image tagged $sha1 and pauses/resumes it at each
# stage, leaving the upgrade paused once the osd version check passes.
first-half-sequence:
- cephadm.shell:
    env:
    - sha1
    mon.a:
    - ceph config set mgr mgr/cephadm/daemon_cache_timeout 60
    - ceph config set global log_to_journald false --force
    - ceph orch upgrade start --image quay.ceph.io/ceph-ci/ceph:$sha1
    - ceph orch ps
    - echo wait for minority of mons to upgrade
    - while ! ceph mon versions | grep $sha1 ; do sleep 2 ; done
    - ceph orch ps
    - ceph orch upgrade pause
    - sleep 60
    - ceph orch upgrade resume
    - echo wait for majority of mons to upgrade
    # Quoted because the command contains ': '; '' is an escaped single quote.
    - 'while ! ceph mon versions | grep $sha1 | egrep '': [23]'' ; do sleep 2 ; done'
    - ceph orch ps
    - ceph orch upgrade pause
    - sleep 60
    - ceph orch upgrade resume
    - echo wait for all mons to upgrade
    - 'while ! ceph mon versions | grep $sha1 | grep '': 3'' ; do sleep 2 ; done'
    - ceph orch ps
    - ceph orch upgrade pause
    - sleep 60
    - ceph orch upgrade resume
    - echo wait for half of osds to upgrade
    - 'while ! ceph osd versions | grep $sha1 | egrep '': [45678]''; do sleep 2 ; done'
    - ceph orch upgrade pause
    - ceph orch ps
    - ceph orch ps
    - ceph versions

# Named task list; referenced by name from a `parallel` entry under `tasks`.
first-half-tasks:
- workunit:
    clients:
      client.0:
      - mgr/test_prometheus_metrics.sh
- print: '**** done end prometheus-metrics.yaml'

first_in_suite: false
# Quoted so the all-digit id stays a string.
job_id: '6925260'
# Anchored here and reused via *id001 by the `kernel` entry in `tasks`.
kernel: &id001
  kdb: true
  sha1: distro
last_in_suite: false
machine_type: smithi

# NOTE(review): each desc string ends with a space inside the quotes, exactly
# as found in the source; this may be a folded trailing newline - confirm.
meta:
- desc: 'run ceph mon daemon version check on prometheus metrics '
- desc: 'run randomized correctness test for rados operations generate write load with rados bench '
- desc: 'run basic cls tests for rbd '
- desc: 'run basic import/export cli tests for rbd '
- desc: 'librbd C and C++ api tests '
- desc: 'randomized correctness test for rados operations on a replicated pool, using only reads, writes, and deletes '
- desc: 'randomized correctness test for rados operations on a replicated pool with snapshot operations '
- desc: 'run ceph mon daemon version check on prometheus metrics '

name: pdhange-2022-07-12_01:40:45-upgrade:pacific-x:stress-split-wip-pdhange-testing-distro-default-smithi
no_nested_subset: false
nuke-on-error: true
openstack:
- volumes:
    count: 4
    size: 10
os_type: rhel
# Quoted so the version stays a string rather than a float.
os_version: '8.6'

overrides:
  admin_socket:
    branch: wip-pdhange-testing
  ceph:
    conf:
      global:
        mon election default strategy: 3
      mgr:
        debug mgr: 20
        debug ms: 1
      mon:
        debug mon: 20
        debug ms: 1
        debug paxos: 20
      osd:
        debug ms: 1
        debug osd: 20
        osd shutdown pgref assert: true
    create_rbd_pool: true
    flavor: default
    log-ignorelist:
    - \(MDS_ALL_DOWN\)
    - \(MDS_UP_LESS_THAN_MAX\)
    sha1: 17f56d5b7a767112ff48cb9978ded24411c31ded
  ceph-deploy:
    conf:
      client:
        log file: /var/log/ceph/ceph-$name.$pid.log
      mon:
        osd default pool size: 2
  install:
    ceph:
      flavor: default
      sha1: 17f56d5b7a767112ff48cb9978ded24411c31ded
  selinux:
    whitelist:
    - scontext=system_u:system_r:logrotate_t:s0
  workunit:
    branch: wip-mgr-upgrade-test
    sha1: ac5ec6e9fdae229e12ef2011c799f53a49eb27e3

owner: scheduled_pdhange@teuthology
priority: 90
repo: git://git.ceph.com/ceph-ci.git

# One inner list of role names per entry; two entries here, matching the two
# hosts listed under `targets`.
roles:
- - mon.a
  - mon.c
  - mgr.y
  - osd.0
  - osd.1
  - osd.2
  - osd.3
  - client.0
  - node-exporter.a
  - alertmanager.a
- - mon.b
  - mgr.x
  - osd.4
  - osd.5
  - osd.6
  - osd.7
  - client.1
  - prometheus.a
  - grafana.a
  - node-exporter.b

# Named task list; referenced by name from a `parallel` entry under `tasks`.
# Resumes the paused upgrade, waits until it is no longer in progress, then
# checks that `ceph versions` reports a single overall version matching $sha1.
second-half-sequence:
  sequential:
  - cephadm.shell:
      env:
      - sha1
      mon.a:
      - ceph orch upgrade resume
      - sleep 60
      - echo wait for upgrade to complete
      - while ceph orch upgrade status | jq '.in_progress' | grep true ; do ceph orch ps ; ceph versions ; sleep 30 ; done
      - echo upgrade complete
      - ceph orch ps
      - ceph versions
      - ceph versions | jq -e '.overall | length == 1'
      - ceph versions | jq -e '.overall | keys' | grep $sha1

# Named task list; referenced by name from a `parallel` entry under `tasks`.
second-half-tasks:
- workunit:
    clients:
      client.0:
      - mgr/test_prometheus_metrics.sh
- print: '**** done end prometheus-metrics.yaml'

sha1: 17f56d5b7a767112ff48cb9978ded24411c31ded
sleep_before_teardown: 0

# Named task list; referenced by name from a `parallel` entry under `tasks`.
stress-tasks:
- thrashosds:
    aggressive_pg_num_changes: false
    chance_force_recovery: 0
    chance_pgnum_grow: 1
    chance_pgpnum_fix: 1
    chance_thrash_cluster_full: 0
    chance_thrash_pg_upmap: 0
    chance_thrash_pg_upmap_items: 0
    disable_objectstore_tool_tests: true
    timeout: 1200
# Six identical radosbench entries (time: 90 each) for client.0.
- full_sequential:
  - radosbench:
      clients:
      - client.0
      time: 90
  - radosbench:
      clients:
      - client.0
      time: 90
  - radosbench:
      clients:
      - client.0
      time: 90
  - radosbench:
      clients:
      - client.0
      time: 90
  - radosbench:
      clients:
      - client.0
      time: 90
  - radosbench:
      clients:
      - client.0
      time: 90
- print: '**** done end radosbench.yaml'
- workunit:
    branch: octopus
    clients:
      client.0:
      - cls/test_cls_rbd.sh
- print: '**** done cls/test_cls_rbd.sh 5-workload'
- workunit:
    branch: octopus
    clients:
      client.0:
      - rbd/import_export.sh
    env:
      RBD_CREATE_ARGS: --new-format
- print: '**** done rbd/import_export.sh 5-workload'
- workunit:
    branch: octopus
    clients:
      client.0:
      - rbd/test_librbd.sh
- print: '**** done rbd/test_librbd.sh 7-workload'
- full_sequential:
  - rados:
      clients:
      - client.0
      objects: 500
      op_weights:
        delete: 10
        read: 45
        write: 45
      ops: 4000
      write_append_excl: false
- print: '**** done rados/readwrite 5-workload'
- full_sequential:
  - rados:
      clients:
      - client.0
      objects: 50
      op_weights:
        delete: 50
        read: 100
        rollback: 50
        snap_create: 50
        snap_remove: 50
        write: 100
      ops: 4000
      write_append_excl: false
- print: '**** done rados/snaps-few-objects 5-workload'

suite: upgrade:pacific-x:stress-split
suite_branch: wip-mgr-upgrade-test
suite_path: /home/teuthworker/src/github.com_pdvian_ceph_ac5ec6e9fdae229e12ef2011c799f53a49eb27e3/qa
suite_relpath: qa
suite_repo: https://github.com/pdvian/ceph
suite_sha1: ac5ec6e9fdae229e12ef2011c799f53a49eb27e3

# Maps each target hostname to an ssh-rsa public key string.
targets:
  smithi005.front.sepia.ceph.com: ssh-rsa AAAAB3NzaC1yc2EAAAADAQABAAABgQChuNDYztl3WpzYyy4lvxDdToajScnjlgX4KZOyt/JWPABStRM9eGu//9MuT/5fnpJ9ImlJs2SViOOUg84aeFJ4VAQAhZJ2i+QVH/VYViLI1CjCFjC/XmeyrE+4qUPlFZOBrGwbHp5trjBrkU+H9M1e06wmwPmAoMWYZYgAZu1AfcuVHpqP5d4qeRsvOwsaEzr8jYN8zyetxhq6wE7/KXPqMmsFcu6Eb92CABseKN10UQQHumivFPEPKvf+4DZ2LuydZ4NSZ0mvKXuSSkHMSX40QiQk32HzsHj8wYuKUL1SsG3ca6gAaQZ0UIq/bYonkK+Ob5Hxb+TaLdhC+VjkgsRabaHILrB+EQK4EGRdq2RY4SPNECYETS+/s8z61yZl6ivtMJ/I0m8R0SQLvWgnrzhAkjcFTSkl3b03/t2Po9M0R3DbKq/NVCFrvqVtVdq2QRglP5K2tpmIUS9K4MS/vCz/1MWXRF7LnUgLS+b8EjXaihvpviWXiBzR2zKppQKJnpc=
  smithi131.front.sepia.ceph.com: ssh-rsa AAAAB3NzaC1yc2EAAAADAQABAAABgQC6IRYZ83xE6Qzw1N4AIztpf6nqgZAm888J+mTFMLeUpnSBOWb9f2cIc2hWAmWVLBdqI9I5CZQUkhB3gEEbPZ2G6fgVAi2FIAdzM6ZQRaSGWFo/u8XdEGsu3jz6oAstFfj0pXgbctCo4JugcA7GXvVRtFg7+lJXImLdM3B6m0oPXOGAXHdehTQWu7bkXou0zzpI3gCWHzNKa15mul9HkCLqAbA0CaA7E5J11xoreA2Q7cdpCnINiumxfImzhk9eDXltaFpc7+Uh8lm5o7Sg++p48my1vKsVgzaH47/yXYFGWMuyLiYggrUKJrHTzSUjgq+BmbGjSzNqU6zD7ephrXdvIkHEoWaAb9ajTwVaV6dD/Ndda2acc4nYbkTSqr7IruYeRVwCFsmiHvDjJrshgBM2eB5VxIRP1bwmxuwnxhe1vww1T3f0b7D0dXh8pE5L49L1kRFGf/9TxVaN5A046YIy5jaXfHXZRFayhE8vkxJyA2Xl/ajQ5lNES2qNZFKX2os=

# Ordered task list for the job. The `parallel` entries name the top-level
# task lists defined in this file (first-half-*, stress-tasks, second-half-*).
tasks:
- internal.check_packages: null
- internal.buildpackages_prep: null
- internal.save_config: null
- internal.check_lock: null
- internal.add_remotes: null
- console_log: null
- internal.connect: null
- internal.push_inventory: null
- internal.serialize_remote_roles: null
- internal.check_conflict: null
- internal.check_ceph_data: null
- internal.vm_setup: null
# Alias of the top-level `kernel` mapping (anchor &id001).
- kernel: *id001
- internal.base: null
- internal.archive_upload: null
- internal.archive: null
- internal.coredump: null
- internal.sudo: null
- internal.syslog: null
- internal.timer: null
- pcp: null
- selinux: null
- ansible.cephlab: null
- clock: null
# Backs up registries.conf, switches the container-tools module stream to 3.0,
# then restores the backed-up registries.conf.
- pexec:
    all:
    - sudo cp /etc/containers/registries.conf /etc/containers/registries.conf.backup
    - sudo dnf -y module reset container-tools
    - sudo dnf -y module install container-tools:3.0
    - sudo cp /etc/containers/registries.conf.backup /etc/containers/registries.conf
- install:
    branch: pacific
    exclude_packages:
    - ceph-volume
- cephadm:
    cephadm_branch: pacific
    cephadm_git_url: https://github.com/ceph/ceph
    conf:
      osd:
        # '*' must stay quoted: a bare * would be read as a YAML alias.
        osd_class_default_list: '*'
        osd_class_load_list: '*'
    image: quay.io/ceph/daemon-base:latest-pacific
- cephadm.shell:
    mon.a:
    - ceph fs volume create foo
    - ceph config set mon mon_warn_on_insecure_global_id_reclaim false --force
    - ceph config set mon mon_warn_on_insecure_global_id_reclaim_allowed false --force
- ceph.healthy: null
- print: '**** upgrading first half of cluster, with stress ****'
- parallel:
  - first-half-tasks
  - first-half-sequence
- print: '**** done upgrading first half of cluster ****'
- ceph.healthy: null
- print: '**** applying stress + thrashing to mixed-version cluster ****'
- parallel:
  - stress-tasks
- ceph.healthy: null
- print: '**** finishing upgrade ****'
- parallel:
  - second-half-tasks
  - second-half-sequence
- ceph.healthy: null

teuthology_branch: main
teuthology_sha1: 10062088f503b43eff3624326bda825b23438f9b
timestamp: 2022-07-12_01:40:45
tube: smithi
user: pdhange
verbose: true
worker_log: /home/teuthworker/archive/worker_logs/dispatcher.smithi.1713