---
# Job configuration for job 6666511 of the run named in `name` (suite: rados).
# Block structure restored from a whitespace-collapsed copy; every scalar
# value is unchanged.

# --- Job identity and scheduling metadata ---
archive_path: /home/teuthworker/archive/benhanokh-2022-02-07_14:20:29-rados-WIP_GBH_safe_shutdown_v2A-distro-basic-smithi/6666511
branch: WIP_GBH_safe_shutdown_v2A
# Folded scalar: the lines below join with single spaces into one string.
description: >-
  rados/thrash/{0-size-min-size-overrides/2-size-2-min-size
  1-pg-log-overrides/normal_pg_log
  2-recovery-overrides/{more-async-partial-recovery}
  3-scrub-overrides/{max-simultaneous-scrubs-3}
  backoff/normal
  ceph
  clusters/{fixed-2 openstack}
  crc-failures/bad_map_crc_failure
  d-balancer/crush-compat
  mon_election/classic
  msgr-failures/few
  msgr/async-v1only
  objectstore/bluestore-comp-zlib
  rados
  supported-random-distro$/{ubuntu_latest}
  thrashers/careful
  thrashosds-health
  workloads/cache-agent-big}
email: null
first_in_suite: false
# Quoted so the all-digit id stays a string.
job_id: '6666511'
# Anchored as id001; the `kernel` entry under `tasks` aliases this mapping.
kernel: &id001
  kdb: true
  sha1: distro
last_in_suite: false
machine_type: smithi
name: benhanokh-2022-02-07_14:20:29-rados-WIP_GBH_safe_shutdown_v2A-distro-basic-smithi
nuke-on-error: true
openstack:
  - volumes:
      count: 4
      size: 10
  - volumes:
      count: 4
      size: 30
os_type: ubuntu
# Quoted so the version is not parsed as the float 20.04.
os_version: '20.04'

# --- Per-task overrides ---
overrides:
  admin_socket:
    branch: WIP_GBH_safe_shutdown_v2A
  ceph:
    conf:
      global:
        mon client directed command retry: 5
        mon election default strategy: 1
        ms bind msgr2: false
        ms inject socket failures: 5000
        ms type: async
        osd_async_recovery_min_cost: 1
        osd_object_clean_region_max_num_intervals: 1000
        osd_pool_default_min_size: 2
        osd_pool_default_size: 2
      mgr:
        debug mgr: 20
        debug ms: 1
      mon:
        debug mon: 20
        debug ms: 1
        debug paxos: 20
        mon min osdmap epochs: 50
        mon osdmap full prune interval: 2
        mon osdmap full prune min: 15
        mon osdmap full prune txsize: 2
        mon scrub interval: 300
        paxos service trim min: 10
      osd:
        bluestore block size: 96636764160
        bluestore compression algorithm: zlib
        bluestore compression mode: aggressive
        bluestore fsck on mount: true
        debug bluefs: 20
        debug bluestore: 20
        debug ms: 1
        debug osd: 20
        debug rocksdb: 10
        mon osd backfillfull_ratio: 0.85
        mon osd full ratio: 0.9
        mon osd nearfull ratio: 0.8
        osd debug reject backfill probability: 0.3
        osd debug verify cached snaps: true
        osd debug verify missing on start: true
        osd failsafe full ratio: 0.95
        osd heartbeat use min delay socket: true
        osd inject bad map crc probability: 0.1
        osd max backfills: 3
        osd max markdown count: 1000
        osd max scrubs: 3
        osd objectstore: bluestore
        osd op queue: debug_random
        osd op queue cut off: debug_random
        osd scrub max interval: 120
        osd scrub min interval: 60
        osd shutdown pgref assert: true
        osd snap trim sleep: 2
        osd_max_pg_log_entries: 3000
        osd_min_pg_log_entries: 3000
    fs: xfs
    # Entries are kept verbatim, including backslashes and the unclosed
    # "\(OSD_SLOW_PING_TIME" pattern.
    log-ignorelist:
      - \(MDS_ALL_DOWN\)
      - \(MDS_UP_LESS_THAN_MAX\)
      - \(REQUEST_STUCK\)
      - failed to encode map
      - \(OSD_SLOW_PING_TIME
      - but it is still running
      - objects unfound and apparently lost
      - overall HEALTH_
      - \(OSDMAP_FLAGS\)
      - \(OSD_
      - \(PG_
      - \(POOL_
      - \(CACHE_POOL_
      - \(SMALLER_PGP_NUM\)
      - \(OBJECT_
      - \(SLOW_OPS\)
      - \(REQUEST_SLOW\)
      - \(TOO_FEW_PGS\)
      - slow request
      - must scrub before tier agent can activate
    log-whitelist:
      - \(MDS_ALL_DOWN\)
      - \(MDS_UP_LESS_THAN_MAX\)
    mon_bind_msgr2: false
    sha1: 8a074fcf8834e0bf886be04d53b6ac80280d9574
  ceph-deploy:
    conf:
      client:
        log file: /var/log/ceph/ceph-$name.$pid.log
      mon:
        osd default pool size: 2
  install:
    ceph:
      sha1: 8a074fcf8834e0bf886be04d53b6ac80280d9574
  thrashosds:
    bdev_inject_crash: 2
    bdev_inject_crash_probability: 0.5
  workunit:
    branch: WIP_GBH_safe_shutdown_v2A
    sha1: 8a074fcf8834e0bf886be04d53b6ac80280d9574

owner: scheduled_benhanokh@teuthology
priority: 75
repo: https://github.com/ceph/ceph-ci.git

# --- Role lists: a sequence of two sequences ---
roles:
  - - mon.a
    - mon.c
    - mgr.y
    - osd.0
    - osd.1
    - osd.2
    - osd.3
    - client.0
    - node-exporter.a
  - - mon.b
    - mgr.x
    - osd.4
    - osd.5
    - osd.6
    - osd.7
    - client.1
    - prometheus.a
    - node-exporter.b

sha1: 8a074fcf8834e0bf886be04d53b6ac80280d9574
sleep_before_teardown: 0
suite: rados
suite_branch: WIP_GBH_safe_shutdown_v2A
suite_path: /home/teuthworker/src/git.ceph.com_ceph-c_8a074fcf8834e0bf886be04d53b6ac80280d9574/qa
suite_relpath: qa
suite_repo: git://git.ceph.com/ceph-ci.git
suite_sha1: 8a074fcf8834e0bf886be04d53b6ac80280d9574

# --- Target hosts mapped to their ssh-rsa key strings ---
targets:
  smithi134.front.sepia.ceph.com: ssh-rsa AAAAB3NzaC1yc2EAAAADAQABAAABgQC5oRSYe53a7qAdFZaqeFAXF7bS7SUXtopp5wUFv1hpabgm26NpbyxUBhjxkHL66eJqJ+S/0HqrFH532Hr+JNtAgiyLIB2HF0K/qweucX95pb3OSG5sZ1EV/Pl5NRKS/lAoUGNv62EIVvz09/QqYNNck00ory+MKHB+UeNgU89pQSpYegTx4z67Sn3Cyop2J3L4vOhMw+BY1pQGyqApaKGHPCEWeFmMy28Vn3Hr30Mo0KyC0XgY2Bs9i1JQZKn+aCyG0sDqsC9X67FDR/zMAk41hE9ubZwS8tjN930mupdZlXY/VqGb47V5Zhhg0AKO1eXtd84mkQ/QifcarCr1kszG/jBYa872adnuKQL0pLofAs3PrEyTUgB482vxawDDnkeG0PgYAHLAYKskd/SzpNrq2akgl1hHfRPg48ywqxeWILu6FQbPonFfy259uR2PxFpiAOqwqmzQnj4CxeMSNUwIYLV6IaXfx7yR88lnGdEK97LyPb4RVzO8IfpajNQnXh8=
  smithi185.front.sepia.ceph.com: ssh-rsa AAAAB3NzaC1yc2EAAAADAQABAAABgQC2TUKe66sKwVI3PR/L1ulpjM8MJo1t/KmI/leImsAKBkb6Z3zSSTjIO+dis4Uch7dAr5fv/vnvG+5yJG5x8qC7xrb9JEt/aa7PkUEILZXnJ27l5OErKyKy/+BvsUkxtAYb0VqRpo4iD2TrBxfHUayZl+CqeEI9exGzTCoPvJ6gVmWpYcztuOaQVoFK9h6Bw6034yEdFhQC7iLjsbZgBDm+pUQ4ijxoo3Z+L3rKi7/kQcs+llcppAPQ85e5ItvbhtOfMJcz6IGKRQeZl99seHj+t88uwtIRPCUV5GXG06sXVPrDp1lQ5MfRyv8kRUPMXIeiLpCShTD2Ns6i826rhUZOLjS5SIJxm5KEkLuWttEKSmL5CF+bRv3JmuFYMLXoupjc0QDgNWoRhbhSfnjg1qlaNXMxsmFufGS8shIHSoTq8f7Kz/3FQ7ian8RpJ/58N9apcYUpTqxwHgUXaTwft4OXvytrAJVYBQwDREHQwwIaHPXTxx//YoV4RL0oljIE/a0=

# --- Task list; entry order is preserved from the original ---
tasks:
  - internal.check_packages: null
  - internal.buildpackages_prep: null
  - internal.save_config: null
  - internal.check_lock: null
  - internal.add_remotes: null
  - console_log: null
  - internal.connect: null
  - internal.push_inventory: null
  - internal.serialize_remote_roles: null
  - internal.check_conflict: null
  - internal.check_ceph_data: null
  - internal.vm_setup: null
  # Alias of the top-level `kernel` mapping (anchor id001).
  - kernel: *id001
  - internal.base: null
  - internal.archive_upload: null
  - internal.archive: null
  - internal.coredump: null
  - internal.sudo: null
  - internal.syslog: null
  - internal.timer: null
  - pcp: null
  - selinux: null
  - ansible.cephlab: null
  - clock: null
  - install: null
  - ceph:
      conf:
        osd:
          debug monc: 20
  # Commands listed for mon.a: poll `ceph balancer status` until it succeeds,
  # then set crush-compat mode and turn the balancer on.
  - exec:
      mon.a:
        - while ! ceph balancer status ; do sleep 1 ; done
        - ceph balancer mode crush-compat
        - ceph balancer on
  - thrashosds:
      aggressive_pg_num_changes: false
      chance_pgnum_grow: 1
      chance_pgnum_shrink: 1
      chance_pgpnum_fix: 1
      timeout: 1200
  # Commands listed for client.0: create an erasure-coded `base` pool and a
  # `cache` pool, then tier `cache` over `base` in writeback mode.
  - exec:
      client.0:
        - sudo ceph osd erasure-code-profile set myprofile crush-failure-domain=osd m=2 k=2
        - sudo ceph osd pool create base 4 4 erasure myprofile
        - sudo ceph osd pool application enable base rados
        - sudo ceph osd pool set base min_size 2
        - sudo ceph osd pool create cache 4
        - sudo ceph osd tier add base cache
        - sudo ceph osd tier cache-mode cache writeback
        - sudo ceph osd tier set-overlay base cache
        - sudo ceph osd pool set cache hit_set_type bloom
        - sudo ceph osd pool set cache hit_set_count 8
        - sudo ceph osd pool set cache hit_set_period 60
        - sudo ceph osd pool set cache target_max_objects 5000
  - rados:
      clients:
        - client.0
      max_seconds: 1200
      objects: 6600
      op_weights:
        copy_from: 50
        delete: 50
        read: 100
        write: 100
      ops: 10000
      pools:
        - base
      size: 1024

# --- Framework and run bookkeeping ---
teuthology_branch: master
teuthology_sha1: 3094160cc590b786a43d55faaf7c99d5de71ce56
timestamp: 2022-02-07_14:20:29
tube: smithi
user: benhanokh
verbose: true
worker_log: /home/teuthworker/archive/worker_logs/dispatcher.smithi.20261