# Configuration record for job 5783117 of an upgrade:nautilus-x suite run.
# Top-level keys in this file appear in alphabetical order.
archive_path: /home/teuthworker/archive/teuthology-2021-01-13_14:23:02-upgrade:nautilus-x-master-distro-basic-smithi/5783117
branch: master
# One plain scalar folded over five lines. It appears to name the suite
# fragments combined into this job (e.g. 1.1-pg-log-overrides/short_pg_log).
description: upgrade:nautilus-x/stress-split-erasure-code/{0-cluster/{openstack start}
  1-nautilus-install/nautilus 1.1-pg-log-overrides/short_pg_log 2-partial-upgrade/firsthalf
  3-thrash/default 3.1-objectstore/bluestore-bitmap 4-ec-workload/{rados-ec-workload
  rbd-ec-workload} 5-finish-upgrade 6-octopus 7-final-workload mon_election/classic
  thrashosds-health ubuntu_18.04}
email: ceph-qa@ceph.io
exclude_arch: armv7l
first_in_suite: false
# Quoted so the id stays a string rather than being parsed as an integer.
job_id: '5783117'
# &id001 anchors this mapping; the `kernel` entry in `tasks` reuses it via
# the alias *id001.
kernel: &id001
  kdb: true
  sha1: distro
last_in_suite: false
machine_type: smithi
# Free-text descriptions, one mapping per entry. Multi-line descriptions are
# written as literal block scalars: each text line is kept as-is and the value
# ends with exactly one newline. The single-line entry has no trailing newline.
meta:
- desc: |
    Run ceph on two nodes,
    with a separate client-only node.
    Use xfs beneath the osds.
- desc: install ceph/nautilus latest
- desc: |
    install upgrade ceph/-x on 2/3 of cluster
    restart : mons, osd.0-7
- desc: |
    randomly kill and revive osd
    small chance to increase the number of pgs
- desc: |
    randomized correctness test for rados operations on an erasure coded pool
- desc: |
    run rbd tests on EC pool
    overrides => force bluestore since it's required for ec-overwrite
    use an EC pool for rbd and run xfstests on top of it to verify correctness
- desc: |
    randomized correctness test for rados operations on an erasure coded pool
    using the jerasure plugin with k=3 and m=1
# Run name; identical to the parent directory component of archive_path.
name: teuthology-2021-01-13_14:23:02-upgrade:nautilus-x-master-distro-basic-smithi
nuke-on-error: true
# A two-entry list: a machine disk value of 100, and 4 volumes of size 30.
# Units are not stated in this file.
openstack:
- machine:
    disk: 100
- volumes:
    count: 4
    size: 30
os_type: ubuntu
# Quoted so the version stays the string '18.04' instead of the float 18.04.
os_version: '18.04'
# Settings grouped under keys that look like task names (admin_socket, ceph,
# ceph-deploy, install, thrashosds, workunit).
overrides:
  admin_socket:
    branch: master
  # Settings for the ceph task. `conf` is split into client, global, mgr, mon
  # and osd sub-mappings (presumably ceph.conf sections).
  ceph:
    conf:
      client:
        # Same pool name that the exec step in `tasks` creates (datapool).
        rbd default data pool: datapool
      global:
        # '*' is quoted; an unquoted leading * would be read as a YAML alias.
        enable experimental unrecoverable data corrupting features: '*'
        mon election default strategy: 1
        mon warn on msgr2 not enabled: false
      mgr:
        debug mgr: 20
        debug ms: 1
      mon:
        debug mon: 20
        debug ms: 1
        debug paxos: 20
        mon warn on osd down out interval zero: false
      osd:
        bdev async discard: true
        bdev enable discard: true
        bluestore allocator: bitmap
        # 96636764160 = 90 * 2^30.
        bluestore block size: 96636764160
        bluestore fsck on mount: true
        debug bluefs: 20
        debug bluestore: 20
        debug filestore: 20
        debug journal: 20
        # Note: 20 here, whereas the mgr and mon sections use debug ms: 1.
        debug ms: 20
        debug osd: 25
        debug rocksdb: 10
        mon osd backfillfull_ratio: 0.85
        mon osd full ratio: 0.9
        mon osd nearfull ratio: 0.8
        osd failsafe full ratio: 0.95
        osd max markdown count: 1000
        # Very small pg log bounds (max 2, min 1); the job description names
        # this fragment short_pg_log.
        osd max pg log entries: 2
        osd min pg log entries: 1
        osd objectstore: bluestore
    fs: xfs
    # Patterns to ignore (presumably regular expressions matched against
    # cluster log lines - confirm against the ceph task). Entries are plain
    # scalars, so the backslashes are kept literally. Several entries are
    # open-ended prefixes such as `\(OSD_`.
    # Each pattern is listed exactly once; a repeated pattern would match
    # nothing new.
    log-ignorelist:
    - \(MDS_ALL_DOWN\)
    - \(MDS_UP_LESS_THAN_MAX\)
    - overall HEALTH_
    - \(MON_DOWN\)
    - \(MGR_DOWN\)
    - slow request
    - \(MON_MSGR2_NOT_ENABLED\)
    - but it is still running
    - wrongly marked me down
    - objects unfound and apparently lost
    - log bound mismatch
    - \(OSDMAP_FLAGS\)
    - \(OSD_
    - \(PG_
    - \(POOL_
    - \(CACHE_POOL_
    - \(SMALLER_PGP_NUM\)
    - \(OBJECT_
    - \(SLOW_OPS\)
    - \(REQUEST_SLOW\)
    - \(TOO_FEW_PGS\)
    # NOTE(review): both patterns here are also present in log-ignorelist;
    # presumably this key is an older name kept for compatibility - confirm
    # before removing.
    log-whitelist:
    - \(MDS_ALL_DOWN\)
    - \(MDS_UP_LESS_THAN_MAX\)
    mon_bind_addrvec: false
    mon_bind_msgr2: false
    # Same commit hash as the top-level sha1 and suite_sha1 keys.
    sha1: 6c805c640527f9600fe04369ac4a5d8ec8583707
  # Settings under the ceph-deploy key. No ceph-deploy entry appears in the
  # `tasks` list of this file.
  ceph-deploy:
    bluestore: true
    conf:
      client:
        log file: /var/log/ceph/ceph-$name.$pid.log
      mon:
        osd default pool size: 2
      osd:
        # The osd values below repeat a subset of overrides.ceph.conf.osd with
        # the same values.
        bdev async discard: true
        bdev enable discard: true
        # 96636764160 = 90 * 2^30.
        bluestore block size: 96636764160
        bluestore fsck on mount: true
        debug bluefs: 20
        debug bluestore: 20
        debug rocksdb: 10
        mon osd backfillfull_ratio: 0.85
        mon osd full ratio: 0.9
        mon osd nearfull ratio: 0.8
        osd failsafe full ratio: 0.95
        osd objectstore: bluestore
    fs: xfs
  # install and workunit both carry the same commit hash as the top-level
  # sha1 key.
  install:
    ceph:
      sha1: 6c805c640527f9600fe04369ac4a5d8ec8583707
  # Crash-injection values for thrashosds: 2 and probability 0.5. The meaning
  # of the value 2 is not stated in this file.
  thrashosds:
    bdev_inject_crash: 2
    bdev_inject_crash_probability: 0.5
  workunit:
    branch: master
    sha1: 6c805c640527f9600fe04369ac4a5d8ec8583707
owner: scheduled_teuthology@teuthology
priority: 70
# Same URL as suite_repo.
repo: git://git.ceph.com/ceph.git
# A list of five role groups. The count matches the 5 passed to
# internal.lock_machines and the five entries under `targets`, so each group
# presumably maps to one machine.
# In total: mon.a-c, mgr.x, osd.0-11 and client.0.
roles:
- - mon.a
  - mgr.x
  - osd.0
  - osd.1
  - osd.2
  - osd.3
- - mon.b
  - osd.4
  - osd.5
  - osd.6
  - osd.7
# mon.c is alone in its group.
- - mon.c
- - osd.8
  - osd.9
  - osd.10
  - osd.11
- - client.0
# Same commit hash as suite_sha1 and the sha1 values under `overrides`.
sha1: 6c805c640527f9600fe04369ac4a5d8ec8583707
sleep_before_teardown: 0
# Named task list; the `parallel` entry in `tasks` refers to it by this name.
stress-tasks:
# thrashosds settings: the chance_* values are either 0 or 1 here.
- thrashosds:
    aggressive_pg_num_changes: false
    chance_force_recovery: 0
    chance_pgnum_grow: 1
    chance_pgpnum_fix: 1
    chance_thrash_cluster_full: 0
    chance_thrash_pg_upmap: 0
    chance_thrash_pg_upmap_items: 0
    disable_objectstore_tool_tests: true
    min_in: 4
    timeout: 1200
- print: '**** done thrashosds 3-thrash'
# rados workload on client.0 with ec_pool: true, 50 objects and 4000 ops.
- rados:
    clients:
    - client.0
    ec_pool: true
    objects: 50
    # Per-operation weights; `write` is 0 while `append` is 100.
    op_weights:
      append: 100
      copy_from: 50
      delete: 50
      read: 100
      rmattr: 25
      rollback: 50
      setattr: 25
      snap_create: 50
      snap_remove: 50
      write: 0
    ops: 4000
    write_append_excl: false
- print: '**** done rados ec task'
# Suite identification. suite_repo equals `repo`, and suite_sha1 equals the
# top-level `sha1`.
suite: upgrade:nautilus-x
suite_branch: master
suite_path: /home/teuthworker/src/git.ceph.com_ceph_master/qa
suite_relpath: qa
suite_repo: git://git.ceph.com/ceph.git
suite_sha1: 6c805c640527f9600fe04369ac4a5d8ec8583707
# Five hostnames, each mapped to an ssh-rsa public key string (presumably the
# host key used to verify the machine - confirm).
targets:
  smithi086.front.sepia.ceph.com: ssh-rsa AAAAB3NzaC1yc2EAAAADAQABAAABAQDOS4hCuB9UDNeVnv2LSfmFtJX3puyXEUccOQIiOMw3dczrYtYStPuamGxthSY6RwIKuAp3OWX4QGc6d2mvXhWq1ljSddMy+o8VYnOV8sN5ptdYfiSwSGH/969yr+X4k4pcrMnUWvSFRaOc1FUnwEIuMueb96pST/n1FEIs0cV7PFInNERlN3IdPL8HURSvXsiExoiR28IkkQZ9JRzKYKZHP2is0v/y2NDL5YU19KP3qQiGiu4lv7kdpyirqeIDMvkMcj6ObB+kLhcD+M7iT2sIoZuHC5Z8qt+rFrF5LQ8J9ZY2f++blkS/jd/oe35KLm5RQvIojekDjCvecM+ctboX
  smithi137.front.sepia.ceph.com: ssh-rsa AAAAB3NzaC1yc2EAAAADAQABAAABAQCm11Kt69ZP4b5iwdUi7KhohPXj1s/E7lfIxjM2QMbvGRNU3cJVc9xv36FZdSD8SwlTKILA4Tocsj6aT74O0nfA+OFK20X4GFvrISTOzQXMzf36ZKzXBN4U3KaxlrKtG3JwM2aCyF9nJ0slE5vr8FgzyE4fW8TAlenSh5oXQvM6dodoDR3TMVCDY317SoKMBs8fzeFdmUoPQkF28A2DCG3+Z4R26SYlF1j9okpmshwRxZ9IqhnQKb8ZOThrona+b3xUSe/lwuPNEFDGvtm3vGEFklqdt2+rQsQl1Hf/uYmoH8byvFcTtnlEGVt2QtDdB51KSu1tbTfz+or5RaqMnTyd
  smithi166.front.sepia.ceph.com: ssh-rsa AAAAB3NzaC1yc2EAAAADAQABAAABAQDR5viewA3Bdxja+12RkFB9Z8SwX/Vvmy0PMO+hNI/XvpkCKb2dVoVpruoP1t42qQTrgPxe0lIslELfqUPM5aG/dIUiCK2Uluuu/TeYv0QiLbgxjGZ1m9a0oF3syz8I7Kthx8C6uzYJp3oV2q0gO463wTqYb1PAjJuzbCd+Au3Qajmun5JySGDy3VdczjobbYwZ/SokL505qEAP4v2Qs1UKQBZK5xxjF8HNHBKtyL9Ymzc+QzCfMUl3rRZoFj2ppqpyLB3MdM9DxP9Cjp40NxssV33Yn0evVwtCg1SUENAqUN+irXPkf6UNI7MKSvaBEILOvipXrTOkvTPyWonyjGhf
  smithi201.front.sepia.ceph.com: ssh-rsa AAAAB3NzaC1yc2EAAAADAQABAAABAQDe0PHvV6kvDkL7InhWO+w88T87M/KPgwqhlxXa/9oqAkWEkLr21m6+qJhwXw0pZocbM7Mvy3wxn6a/4EyS0+5eULCWl9/pOfgk/MzobmWQK7DrsWT6FZ4oWm5R00Mi5o2VuV29ClV7jhJGJo+xuyvch9zyY9B4AmrXB7jjFYzDCBX6f1eLj0MrDD+mrxcJKkuv+PMd99Hfmm63r+mpM0Cw5Zz5Uj4e7W+vVIzM/desduJ288beTFKICNxkzqAUQx7vNIWDrLULqzJkUT/zWGb5Oco1DKgJQb9/rc0P9UyKpadYCGy4Xqb3i8z9xtSfXuj2aB3MSENJ318QRi4QBoPN
  smithi203.front.sepia.ceph.com: ssh-rsa AAAAB3NzaC1yc2EAAAADAQABAAABAQCbD2m+yVC94+a18Ph83WlbFq84sfjpeKJiuRev81Z1yQ9PC1CLdIItIxjXQH2KydeMbcYIsAjwnTb8TYz+/e1u9XN73PxklYq56j216AMPCYPp+IDWaI4SZpWHRsyRYyOA6DZaPqVyE8/VMs+ENJxpoy8zV30xCDy/WoXag9CvsEBJeWk7SUdiNkFfSRckaZ1/A18LWSChjZcXlcovZ5Bl4QP2doZ/qx7pHFapAnXYodcjnEauSZrlNL37kmUcNpql5Dx0xsfUo3TCD/il+oHxC/5MqnOqkNTOirjtmcl3ddkgRbmoVaJYGNkmwq7XkhN6bhugfEmXEDAFNjcaO9UR
# Ordered task list. Every entry from here through `clock` is configured as
# null, except internal.lock_machines and kernel.
tasks:
- internal.check_packages: null
- internal.buildpackages_prep: null
# Two positional values: the count 5 and the machine type smithi. The count
# equals the number of role groups and of targets.
- internal.lock_machines:
  - 5
  - smithi
- internal.save_config: null
- internal.check_lock: null
- internal.add_remotes: null
- console_log: null
- internal.connect: null
- internal.push_inventory: null
- internal.serialize_remote_roles: null
- internal.check_conflict: null
- internal.check_ceph_data: null
- internal.vm_setup: null
# Alias of the mapping anchored as &id001 under the top-level `kernel` key
# (kdb: true, sha1: distro).
- kernel: *id001
- internal.base: null
- internal.archive_upload: null
- internal.archive: null
- internal.coredump: null
- internal.sudo: null
- internal.syslog: null
- internal.timer: null
- pcp: null
- selinux: null
- ansible.cephlab: null
- clock: null
# Install from the nautilus branch, excluding the three listed packages.
- install:
    branch: nautilus
    exclude_packages:
    - ceph-mgr-cephadm
    - cephadm
    - libcephfs-dev
- print: '**** done install nautilus'
# ceph task with three extra [global] settings and two extra ignore patterns
# specific to this entry.
- ceph:
    conf:
      global:
        bluestore warn on no per pool omap: false
        bluestore_warn_on_legacy_statfs: false
        mon pg warn min per osd: 0
    log-ignorelist:
    - Not found or unloadable
    - evicting unresponsive client
# Commands listed under osd.0: set the required OSD release and the minimum
# compatible client to nautilus.
- exec:
    osd.0:
    - ceph osd require-osd-release nautilus
    - ceph osd set-require-min-compat-client nautilus
- print: '**** done ceph'
# rgw task with a single list entry, client.0.
- rgw:
  - client.0
- print: '**** done => started rgw client.0'
# Upgrade keyed by mon.a, mon.b and mon.c, which `roles` places in three
# different role groups.
- install.upgrade:
    mon.a: null
    mon.b: null
    mon.c: null
- print: '**** done install.upgrade of first 3 nodes'
# Restart list: mon.a, mon.b, mgr.x and osd.0 through osd.7.
# NOTE(review): the print message after this entry says "all mons", but mon.c
# is not in this daemon list; it appears in a later ceph.restart entry.
# Confirm whether the wording or the list is what was intended.
- ceph.restart:
    daemons:
    - mon.a
    - mon.b
    - mgr.x
    - osd.0
    - osd.1
    - osd.2
    - osd.3
    - osd.4
    - osd.5
    - osd.6
    - osd.7
    mon-health-to-clog: false
- print: '**** done ceph.restart of all mons and 2/3 of osds'
# Refers by name to the top-level `stress-tasks` list (thrashosds + rados).
- parallel:
  - stress-tasks
# Commands listed under client.0, in order: define the erasure-code profile
# teuthologyprofile (k=2, m=1, failure domain osd), create the erasure pool
# datapool with 4 4, enable EC overwrites on it, and run `rbd pool init`.
# The first command is a folded scalar (>-): its two lines are joined with a
# single space and no trailing newline is added.
- exec:
    client.0:
    - >-
      sudo ceph osd erasure-code-profile set teuthologyprofile
      crush-failure-domain=osd m=1 k=2
    - sudo ceph osd pool create datapool 4 4 erasure teuthologyprofile
    - sudo ceph osd pool set datapool allow_ec_overwrites true
    - rbd pool init datapool
# qemu task for all clients: 3 disks, block type, running the xfstests
# script named in `test`.
- qemu:
    all:
      clone: true
      disks: 3
      test: qa/run_xfstests_qemu.sh
      type: block
- print: '**** done rbd/qemu ec task'
# Second upgrade step, keyed by client.0 and osd.8. Note that extra_packages
# sits in the same mapping as the role keys.
- install.upgrade:
    client.0: null
    extra_packages:
    - python3-rados
    - python3-rgw
    - python3-rbd
    - python3-cephfs
    osd.8: null
# Restart mon.c, osd.8 through osd.11 and every daemon matching rgw.*.
# This entry waits for OSDs to come up but not for overall health.
- ceph.restart:
    daemons:
    - mon.c
    - osd.8
    - osd.9
    - osd.10
    - osd.11
    - rgw.*
    wait-for-healthy: false
    wait-for-osds-up: true
# The progress message lists the same daemons as the restart entry above it.
- print: '**** restarted/upgraded => mon.c, osd.8, osd.9, osd.10, osd.11, rgw.*'
# Commands listed under osd.0: set the pglog_hardlimit flag, show the "flags"
# lines of the OSD map dump, and set mon_warn_on_msgr2_not_enabled to false.
# The grep command is single-quoted because it contains double quotes.
- exec:
    osd.0:
    - ceph osd set pglog_hardlimit
    - 'ceph osd dump --format=json-pretty | grep "flags"'
    - ceph config set global mon_warn_on_msgr2_not_enabled false
- print: '**** try to set pglog_hardlimit again, should succeed'
# Commands listed under osd.0: set the required OSD release and the minimum
# compatible client to octopus, then set pg_autoscale_mode to off for every
# pool. The loop is a folded scalar (>-): its lines are joined with single
# spaces into one shell command with no trailing newline.
- exec:
    osd.0:
    - ceph osd require-osd-release octopus
    - ceph osd set-require-min-compat-client octopus
    - >-
      for f in `ceph osd pool ls` ;
      do ceph osd pool set $f pg_autoscale_mode off ;
      done
- ceph.healthy: null
# Final rados workload on client.0. It has the same objects, ops and
# op_weights as the rados entry in `stress-tasks`, plus an explicit
# erasure-code profile.
- rados:
    clients:
    - client.0
    ec_pool: true
    # jerasure plugin with k=3 and m=1, as described by the last `meta` entry.
    erasure_code_profile:
      crush-failure-domain: osd
      k: 3
      m: 1
      name: jerasure31profile
      plugin: jerasure
      technique: reed_sol_van
    objects: 50
    # Per-operation weights; `write` is 0 while `append` is 100.
    op_weights:
      append: 100
      copy_from: 50
      delete: 50
      read: 100
      rmattr: 25
      rollback: 50
      setattr: 25
      snap_create: 50
      snap_remove: 50
      write: 0
    ops: 4000
    write_append_excl: false
teuthology_branch: master
# The underscore keeps this a plain string; it is the same stamp that is
# embedded in `name`.
timestamp: 2021-01-13_14:23:02
# Same value as machine_type.
tube: smithi
user: teuthology
verbose: true
worker_log: /home/teuthworker/archive/worker_logs/worker.smithi.6154