Found 99 jobs
Missing teuthology log /home/teuthworker/mnt/teuthology/adking-2026-02-13_15:54:16-orch:cephadm-wip-adk3-testing-2026-02-12-2007-distro-default-trial/49483/teuthology.log
Found 15 distinct failure reasons
Failure: Command failed on trial040 with status 1: 'sudo /home/ubuntu/cephtest/cephadm --image quay.ceph.io/ceph-ci/ceph:042df16cd9ee8a8df553b188fef8a8c4a9e7ab01 shell -c /etc/ceph/ceph.conf -k /etc/ceph/ceph.client.admin.keyring --fsid 5998a032-0b90-11f1-a7ea-d404e6e7d460 -- bash -c \'set -ex\n\n# Function to wait for a service to be healthy and log response on error\nwait_for_service() {\n  local name="$1"\n  local url="$2"\n  local jq_filter="$3"\n\n  echo "Waiting for service $name to be healthy at $url..."\n  for i in {1..30}; do\n    local response\n    response=$(curl -k -s -u admin:admin "$url")\n    if echo "$response" | jq -e "$jq_filter" > /dev/null; then\n      echo "Service $name is healthy."\n      return 0\n    fi\n    echo "Attempt $i: service $name not ready yet"\n    sleep 10\n  done\n\n  echo "Timeout waiting for $name at $url"\n  echo "Last HTTP response:"\n  echo "$response"\n  echo "jq output:"\n  echo "$response" | jq "$jq_filter" || echo "(jq parse error or no match)"\n  return 1\n}\n\n# retrieve mgmt hostname and ip\nMGMT_GTW_HOST=$(ceph orch ps --daemon-type mgmt-gateway -f json | jq -e \'"\'"\'.[]\'"\'"\' | jq -r \'"\'"\'.hostname\'"\'"\')\nMGMT_GTW_IP=$(ceph orch host ls -f json | jq -r --arg MGMT_GTW_HOST "$MGMT_GTW_HOST" \'"\'"\'.[] | select(.hostname==$MGMT_GTW_HOST) | .addr\'"\'"\')\n\n# check mgmt-gateway health\ncurl -k -s https://${MGMT_GTW_IP}/health\ncurl -k -s https://${MGMT_GTW_IP}:29443/health\n\n# wait for monitoring services\nwait_for_service "Grafana" "https://${MGMT_GTW_IP}/grafana/api/health" \'"\'"\'.database == "ok"\'"\'"\' || exit 1\nwait_for_service "Prometheus" "https://${MGMT_GTW_IP}/prometheus/api/v1/status/config" \'"\'"\'.status == "success"\'"\'"\' || exit 1\nwait_for_service "Alertmanager" "https://${MGMT_GTW_IP}/alertmanager/api/v2/status" \'"\'"\'.cluster.status == "ready"\'"\'"\' || exit 1\n\''
1 jobs: ['49450']
suites: ['agent/off', 'mon_election/classic', 'orch:cephadm/workunits/{0-distro/ubuntu_22.04', 'task/test_mgmt_gateway}']

Failure: Command failed on trial028 with status 1: 'sudo TESTDIR=/home/ubuntu/cephtest bash -ex -c \'grep \'"\'"\'pnn:0 .*OK\'"\'"\' /tmp/ctdb_status\''
1 jobs: ['49489']
suites: ['orch:cephadm/smb/{0-distro/ubuntu_22.04', 'tasks/deploy_smb_mgr_ctdb_res_ips}']

Failure: Test failure: test_error (tasks.mgr.test_orchestrator_cli.TestOrchestratorCli.test_error)
2 jobs: ['49418', '49474']
suites intersection: ['2-node-mgr', 'orch:cephadm/orchestrator_cli/{0-random-distro$/{centos_9.stream_runc}', 'orchestrator_cli}']
suites union: ['2-node-mgr', 'agent/off', 'agent/on', 'orch:cephadm/orchestrator_cli/{0-random-distro$/{centos_9.stream_runc}', 'orchestrator_cli}']

Failure: Command failed on trial013 with status 1: 'test -s /home/ubuntu/cephtest/cephadm && test $(stat -c%s /home/ubuntu/cephtest/cephadm) -gt 1000 && chmod +x /home/ubuntu/cephtest/cephadm'
3 jobs: ['49500', '49449', '49415']
suites intersection: []
suites union: ['1-bootstrap/18.2.0', '1-start', '2-nfs', '2-repo_digest/defaut', '2-repo_digest/repo_digest', '3-upgrade-with-workload', '3-upgrade/simple', '3-upgrade/staggered', '4-final}', '4-wait', '5-upgrade-ls', 'agent/off', 'agent/on', 'mon_election/classic}', 'mon_election/connectivity}', 'orch:cephadm/mgr-nfs-upgrade/{0-centos_9.stream', 'orch:cephadm/upgrade/{1-start-distro/1-start-centos_9.stream-reef', 'orch:cephadm/upgrade/{1-start-distro/1-start-ubuntu_22.04-squid']

Failure: reached maximum tries (120) after waiting for 120 seconds
3 jobs: ['49457', '49470', '49462']
suites intersection: []
suites union: ['0-nvme-loop', '1-start', '2-ops/deploy-raw}', 'agent/off', 'agent/on', 'mon_election/classic', 'mon_election/connectivity', 'orch:cephadm/osds/{0-distro/centos_9.stream_runc', 'orch:cephadm/workunits/{0-distro/centos_9.stream_runc', 'orch:cephadm/workunits/{0-distro/ubuntu_22.04', 'task/test_nvmeof_basic_mtls_disabled}', 'task/test_nvmeof_mtls_enabled_cephadm_signed_certs}']

Failure: "2026-02-14T00:17:12.097606+0000 mon.a (mon.0) 525 : cluster [WRN] Health check failed: Degraded data redundancy: 2/6 objects degraded (33.333%), 1 pg degraded (PG_DEGRADED)" in cluster log
2 jobs: ['49420', '49473']
suites intersection: []
suites union: ['cluster/{fixed-3}', 'conf/{disable-pool-app}', 'mon_election/connectivity', 'orch:cephadm/no-agent-workunits/{0-distro/centos_9.stream', 'orch:cephadm/rbd_iscsi/{base/install', 'supported-container-hosts$/{centos_9.stream}', 'task/test_cephadm_timeout}', 'workloads/cephadm_iscsi}']

Failure: Command failed on trial036 with status 1: 'sudo /home/ubuntu/cephtest/cephadm --image quay.ceph.io/ceph-ci/ceph:squid shell -c /etc/ceph/ceph.conf -k /etc/ceph/ceph.client.admin.keyring --fsid f02426d3-0b90-11f1-be65-d404e6e7d460 -e sha1=042df16cd9ee8a8df553b188fef8a8c4a9e7ab01 -- bash -c \'ceph versions | jq -e \'"\'"\'.overall | length == 1\'"\'"\'\''
3 jobs: ['49463', '49429', '49499']
suites intersection: ['1-volume/{0-create', '3-inline/yes', '3-upgrade-mgr-staggered', '4-config-upgrade/{fail_fs}', '4-verify}', '5-upgrade-with-workload', '6-verify}}', 'centos_9.stream', 'conf/{client', 'fail_fs/yes', 'ignorelist_upgrade', 'ignorelist_wrongly_marked_down', 'kernel', 'mds', 'mgr', 'mon', 'orch:cephadm/mds_upgrade_sequence/{bluestore-bitmap', 'osd}', 'overrides/{ignorelist_health', 'pg-warn', 'pg_health', 'roles', 'syntax}', 'tasks/{0-from/squid']
suites union: ['1-ranks/1', '1-ranks/2', '1-volume/{0-create', '2-allow_standby_replay/no', '2-allow_standby_replay/yes', '2-client/fuse', '2-client/kclient', '3-inline/yes', '3-upgrade-mgr-staggered', '4-config-upgrade/{fail_fs}', '4-verify}', '5-upgrade-with-workload', '6-verify}}', 'centos_9.stream', 'conf/{client', 'fail_fs/yes', 'ignorelist_upgrade', 'ignorelist_wrongly_marked_down', 'kernel', 'mds', 'mgr', 'mon', 'orch:cephadm/mds_upgrade_sequence/{bluestore-bitmap', 'osd}', 'overrides/{ignorelist_health', 'pg-warn', 'pg_health', 'roles', 'syntax}', 'tasks/{0-from/squid']

Dead: None
2 jobs: ['49483', '49424']

Failure: Command failed on trial042 with status 4: 'sudo /home/ubuntu/cephtest/cephadm --image quay.ceph.io/ceph-ci/ceph:042df16cd9ee8a8df553b188fef8a8c4a9e7ab01 shell -c /etc/ceph/ceph.conf -k /etc/ceph/ceph.client.admin.keyring --fsid d709c9aa-0b90-11f1-947c-d404e6e7d460 -- bash -c \'set -e\nset -x\nceph orch apply node-exporter\nceph orch apply grafana\nceph orch apply alertmanager\nceph orch apply prometheus\nsleep 240\nceph orch ls\nceph orch ps\nceph orch host ls\nMON_DAEMON=$(ceph orch ps --daemon-type mon -f json | jq -r \'"\'"\'last | .daemon_name\'"\'"\')\nGRAFANA_HOST=$(ceph orch ps --daemon-type grafana -f json | jq -e \'"\'"\'.[]\'"\'"\' | jq -r \'"\'"\'.hostname\'"\'"\')\nPROM_HOST=$(ceph orch ps --daemon-type prometheus -f json | jq -e \'"\'"\'.[]\'"\'"\' | jq -r \'"\'"\'.hostname\'"\'"\')\nALERTM_HOST=$(ceph orch ps --daemon-type alertmanager -f json | jq -e \'"\'"\'.[]\'"\'"\' | jq -r \'"\'"\'.hostname\'"\'"\')\nGRAFANA_IP=$(ceph orch host ls -f json | jq -r --arg GRAFANA_HOST "$GRAFANA_HOST" \'"\'"\'.[] | select(.hostname==$GRAFANA_HOST) | .addr\'"\'"\')\nPROM_IP=$(ceph orch host ls -f json | jq -r --arg PROM_HOST "$PROM_HOST" \'"\'"\'.[] | select(.hostname==$PROM_HOST) | .addr\'"\'"\')\nALERTM_IP=$(ceph orch host ls -f json | jq -r --arg ALERTM_HOST "$ALERTM_HOST" \'"\'"\'.[] | select(.hostname==$ALERTM_HOST) | .addr\'"\'"\')\n# check each host node-exporter metrics endpoint is responsive\nALL_HOST_IPS=$(ceph orch host ls -f json | jq -r \'"\'"\'.[] | .addr\'"\'"\')\nfor ip in $ALL_HOST_IPS; do\n  curl -s http://${ip}:9100/metric\ndone\n# check grafana endpoints are responsive and database health is okay\ncurl -k -s https://${GRAFANA_IP}:3000/api/health\ncurl -k -s https://${GRAFANA_IP}:3000/api/health | jq -e \'"\'"\'.database == "ok"\'"\'"\'\n# stop mon daemon in order to trigger an alert\nceph orch daemon stop $MON_DAEMON\nsleep 120\n# check prometheus endpoints are responsive and mon down alert is firing\ncurl -s http://${PROM_IP}:9095/api/v1/status/config\ncurl -s http://${PROM_IP}:9095/api/v1/status/config | jq -e \'"\'"\'.status == "success"\'"\'"\'\ncurl -s http://${PROM_IP}:9095/api/v1/alerts\ncurl -s http://${PROM_IP}:9095/api/v1/alerts | jq -e \'"\'"\'.data | .alerts | .[] | select(.labels | .alertname == "CephMonDown") | .state == "firing"\'"\'"\'\n# check alertmanager endpoints are responsive and mon down alert is active\ncurl -s http://${ALERTM_IP}:9093/api/v2/status\ncurl -s http://${ALERTM_IP}:9093/api/v2/alerts\ncurl -s http://${ALERTM_IP}:9093/api/v2/alerts | jq -e \'"\'"\'.[] | select(.labels | .alertname == "CephMonDown") | .status | .state == "active"\'"\'"\'\n# check prometheus metrics endpoint is not empty and make sure we can get metrics\nMETRICS_URL=$(ceph mgr services | jq -r .prometheus)\n[ -n "$METRICS_URL" ] || exit 1\ncurl -s "${METRICS_URL}metrics" | grep -q \'"\'"\'^ceph_health_status\'"\'"\'\n\''
1 jobs: ['49455']
suites: ['agent/on', 'mon_election/connectivity', 'orch:cephadm/workunits/{0-distro/centos_9.stream', 'task/test_monitoring_stack_basic}']

Failure: Command failed on trial030 with status 1: 'sudo /home/ubuntu/cephtest/cephadm --image quay.ceph.io/ceph-ci/ceph:042df16cd9ee8a8df553b188fef8a8c4a9e7ab01 shell -c /etc/ceph/ceph.conf -k /etc/ceph/ceph.client.admin.keyring --fsid ccdf7b8c-0b90-11f1-a609-d404e6e7d460 -- bash -c \'set -ex\n# since we don\'"\'"\'t know the real hostnames before the test, the next\n# bit is in order to replace the fake hostnames "host.a/b/c" with\n# the actual names cephadm knows the host by within the mon spec\nceph orch host ls --format json | jq -r \'"\'"\'.[] | .hostname\'"\'"\' > realnames\necho $\'"\'"\'host.a\\nhost.b\\nhost.c\'"\'"\' > fakenames\necho $\'"\'"\'a\\nb\\nc\'"\'"\' > mon_ids\necho $\'"\'"\'{datacenter=a}\\n{datacenter=b,rack=2}\\n{datacenter=a,rack=3}\'"\'"\' > crush_locs\nceph orch ls --service-name mon --export > mon.yaml\nMONSPEC=`cat mon.yaml`\necho "$MONSPEC"\nwhile read realname <&3 && read fakename <&4; do\n  MONSPEC="${MONSPEC//$fakename/$realname}"\ndone 3<realnames 4<fakenames\necho "$MONSPEC" > mon.yaml\ncat mon.yaml\n# now the spec should have the real hostnames, so let\'"\'"\'s re-apply\nceph orch apply -i mon.yaml\nsleep 90\nceph orch ps --refresh\nceph orch ls --service-name mon --export > mon.yaml; ceph orch apply -i mon.yaml\nsleep 90\nceph mon dump\nceph mon dump --format json\n# verify all the crush locations got set from "ceph mon dump" output\nwhile read monid <&3 && read crushloc <&4; do\n  ceph mon dump --format json | jq --arg monid "$monid" --arg crushloc "$crushloc" -e \'"\'"\'.mons | .[] | select(.name == $monid) | .crush_location == $crushloc\'"\'"\'\ndone 3<mon_ids 4<crush_locs\n\''
1 jobs: ['49486']
suites: ['agent/on', 'mon_election/connectivity', 'orch:cephadm/workunits/{0-distro/centos_9.stream_runc', 'task/test_set_mon_crush_locations}']

Failure: Command failed on trial002 with status 1: 'sudo /home/ubuntu/cephtest/cephadm --image quay.ceph.io/ceph-ci/ceph:reef shell -c /etc/ceph/ceph.conf -k /etc/ceph/ceph.client.admin.keyring --fsid cbf9e8b1-0939-11f1-9661-d404e6e7d460 -e sha1=042df16cd9ee8a8df553b188fef8a8c4a9e7ab01 -- bash -c \'ceph versions | jq -e \'"\'"\'.overall | length == 1\'"\'"\'\''
1 jobs: ['49410']
suites: ['2-repo_digest/defaut', '3-upgrade/simple', '4-wait', '5-upgrade-ls', 'agent/off', 'mon_election/connectivity}', 'orch:cephadm/upgrade/{1-start-distro/1-start-ubuntu_22.04-reef']

Failure: Test failure: test_cluster_info (tasks.cephfs.test_nfs.TestNFS.test_cluster_info)
1 jobs: ['49416']
suites: ['conf/{client', 'ignorelist_health', 'mds', 'mgr', 'mon', 'nfs-version/{4.1}', 'orch:cephadm/nfs/{cluster/{1-node}', 'osd}', 'overrides/{ignore_mgr_down', 'pg_health}', 'supported-random-distros$/{centos_latest}', 'tasks/nfs}']

Failure: 502 Server Error: Bad Gateway for url: https://1.chacra.ceph.com/repos/ceph/reef/e6ab650721089ed287ed684011c35b550bf20fe7/centos/9/flavors/default/repo
1 jobs: ['49446']
suites: ['1-ranks/1', '1-volume/{0-create', '2-allow_standby_replay/no', '2-client/kclient', '3-inline/no', '3-upgrade-mgr-staggered', '4-config-upgrade/{fail_fs}', '4-verify}', '5-upgrade-with-workload', '6-verify}}', 'centos_9.stream', 'conf/{client', 'fail_fs/no', 'ignorelist_upgrade', 'ignorelist_wrongly_marked_down', 'kernel', 'mds', 'mgr', 'mon', 'orch:cephadm/mds_upgrade_sequence/{bluestore-bitmap', 'osd}', 'overrides/{ignorelist_health', 'pg-warn', 'pg_health', 'roles', 'syntax}', 'tasks/{0-from/reef/{reef}']

Dead: b'2026-02-17T05:30:48.229 DEBUG:teuthology.exit:Finished running handlers'
1 jobs: ['49440']
suites: ['agent/on', 'mon_election/connectivity', 'orch:cephadm/workunits/{0-distro/centos_9.stream_runc', 'task/test_iscsi_container/{centos_9.stream', 'test_iscsi_container}}']

Failure: Command failed (workunit test cephadm/test_cephadm.sh) on trial098 with status 1: 'mkdir -p -- /home/ubuntu/cephtest/mnt.0/client.0/tmp && cd -- /home/ubuntu/cephtest/mnt.0/client.0/tmp && CEPH_CLI_TEST_DUP_COMMAND=1 CEPH_REF=632a9804aab65871427145f015001eb516b59504 TESTDIR="/home/ubuntu/cephtest" CEPH_ARGS="--cluster ceph" CEPH_ID="0" PATH=$PATH:/usr/sbin CEPH_BASE=/home/ubuntu/cephtest/clone.client.0 CEPH_ROOT=/home/ubuntu/cephtest/clone.client.0 CEPH_MNT=/home/ubuntu/cephtest/mnt.0 adjust-ulimits ceph-coverage /home/ubuntu/cephtest/archive/coverage timeout 3h /home/ubuntu/cephtest/clone.client.0/qa/workunits/cephadm/test_cephadm.sh'
1 jobs: ['49502']
suites: ['agent/on', 'mon_election/connectivity', 'orch:cephadm/workunits/{0-distro/ubuntu_22.04', 'task/test_cephadm}']