|
2026-04-29
§
|
| 10:14 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Depooling db1194 (T419961)', diff saved to https://phabricator.wikimedia.org/P91878 and previous config saved to /var/cache/conftool/dbconfig/20260429-101426-fceratto.json |
[production] |
| 10:14 |
<fceratto@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on db1194.eqiad.wmnet with reason: Maintenance |
[production] |
| 10:14 |
<mvernon@cumin2002> |
START - Cookbook sre.swift.roll-restart-reboot-swift-ms-proxies rolling restart_daemons on A:swift-fe-codfw |
[production] |
| 10:13 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db1191 (T419961)', diff saved to https://phabricator.wikimedia.org/P91877 and previous config saved to /var/cache/conftool/dbconfig/20260429-101358-fceratto.json |
[production] |
| 10:13 |
<jmm@cumin2002> |
START - Cookbook sre.hosts.reimage for host ganeti5005.eqsin.wmnet with OS bookworm |
[production] |
| 10:12 |
<jmm@cumin2002> |
END (ERROR) - Cookbook sre.hosts.reimage (exit_code=97) for host ganeti5005.eqsin.wmnet with OS bookworm |
[production] |
| 10:12 |
<Emperor> |
disable puppet in apus/codfw rgws for TLS key rollover T424674 |
[production] |
| 10:09 |
<marostegui@cumin1003> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on db2190.codfw.wmnet with reason: host reimage |
[production] |
| 10:09 |
<brouberol@deploy1003> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s-services/airflow-test-k8s: apply |
[production] |
| 10:08 |
<brouberol@deploy1003> |
helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/airflow-test-k8s: apply |
[production] |
| 10:07 |
<marostegui@cumin1003> |
START - Cookbook sre.mysql.pool pool db1229: after reimage to trixie |
[production] |
| 10:04 |
<marostegui@cumin1003> |
END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host db1229.eqiad.wmnet with OS trixie |
[production] |
| 10:04 |
<marostegui@cumin1003> |
START - Cookbook sre.hosts.downtime for 2:00:00 on db2190.codfw.wmnet with reason: host reimage |
[production] |
| 10:03 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db1191', diff saved to https://phabricator.wikimedia.org/P91875 and previous config saved to /var/cache/conftool/dbconfig/20260429-100349-fceratto.json |
[production] |
| 10:00 |
<marostegui@cumin1003> |
START - Cookbook sre.hosts.reimage for host db2175.codfw.wmnet with OS trixie |
[production] |
| 09:57 |
<marostegui@cumin1003> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on db1166.eqiad.wmnet with reason: host reimage |
[production] |
| 09:54 |
<marostegui@cumin1003> |
END (ERROR) - Cookbook sre.hosts.reimage (exit_code=97) for host db2175.codfw.wmnet with OS trixie |
[production] |
| 09:53 |
<brouberol@deploy1003> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s-services/airflow-test-k8s: apply |
[production] |
| 09:53 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db1191', diff saved to https://phabricator.wikimedia.org/P91874 and previous config saved to /var/cache/conftool/dbconfig/20260429-095341-fceratto.json |
[production] |
| 09:52 |
<brouberol@deploy1003> |
helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/airflow-test-k8s: apply |
[production] |
| 09:51 |
<marostegui@cumin1003> |
START - Cookbook sre.hosts.downtime for 2:00:00 on db1166.eqiad.wmnet with reason: host reimage |
[production] |
| 09:45 |
<marostegui@cumin1003> |
START - Cookbook sre.hosts.reimage for host db2190.codfw.wmnet with OS trixie |
[production] |
| 09:44 |
<marostegui@cumin1003> |
END (FAIL) - Cookbook sre.mysql.depool (exit_code=99) depool db2190: Reimage to Trixie |
[production] |
| 09:44 |
<marostegui@cumin1003> |
START - Cookbook sre.mysql.depool depool db2190: Reimage to Trixie |
[production] |
| 09:44 |
<marostegui@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 5:00:00 on db2190.codfw.wmnet with reason: Reimage to Trixie |
[production] |
| 09:44 |
<jelto@cumin1003> |
END (PASS) - Cookbook sre.gitlab.upgrade (exit_code=0) on GitLab host gitlab1003.wikimedia.org with reason: Test noop upgrade on the replica |
[production] |
| 09:43 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db1191 (T419961)', diff saved to https://phabricator.wikimedia.org/P91873 and previous config saved to /var/cache/conftool/dbconfig/20260429-094333-fceratto.json |
[production] |
| 09:42 |
<marostegui@cumin1003> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on db1229.eqiad.wmnet with reason: host reimage |
[production] |
| 09:41 |
<marostegui@cumin1003> |
END (PASS) - Cookbook sre.mysql.depool (exit_code=0) depool db2190: Reimage to Trixie |
[production] |
| 09:41 |
<marostegui@cumin1003> |
START - Cookbook sre.mysql.depool depool db2190: Reimage to Trixie |
[production] |
| 09:41 |
<marostegui@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 5:00:00 on db2190.codfw.wmnet with reason: Reimage to Trixie |
[production] |
| 09:40 |
<jelto@cumin1003> |
START - Cookbook sre.gitlab.upgrade on GitLab host gitlab1003.wikimedia.org with reason: Test noop upgrade on the replica |
[production] |
| 09:39 |
<marostegui@cumin1003> |
END (PASS) - Cookbook sre.mysql.pool (exit_code=0) pool db2194: after reimage to trixie |
[production] |
| 09:37 |
<marostegui@cumin1003> |
START - Cookbook sre.hosts.downtime for 2:00:00 on db1229.eqiad.wmnet with reason: host reimage |
[production] |
| 09:36 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Depooling db1191 (T419961)', diff saved to https://phabricator.wikimedia.org/P91870 and previous config saved to /var/cache/conftool/dbconfig/20260429-093624-fceratto.json |
[production] |
| 09:36 |
<fceratto@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on db1191.eqiad.wmnet with reason: Maintenance |
[production] |
| 09:35 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db1174 (T419961)', diff saved to https://phabricator.wikimedia.org/P91869 and previous config saved to /var/cache/conftool/dbconfig/20260429-093557-fceratto.json |
[production] |
| 09:35 |
<marostegui@cumin1003> |
START - Cookbook sre.hosts.reimage for host db1166.eqiad.wmnet with OS trixie |
[production] |
| 09:34 |
<marostegui@cumin1003> |
END (PASS) - Cookbook sre.mysql.depool (exit_code=0) depool db1166: Reimage to Trixie |
[production] |
| 09:34 |
<marostegui@cumin1003> |
START - Cookbook sre.mysql.depool depool db1166: Reimage to Trixie |
[production] |
| 09:34 |
<marostegui@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 5:00:00 on db1166.eqiad.wmnet with reason: Reimage to Trixie |
[production] |
| 09:30 |
<marostegui@cumin1003> |
END (PASS) - Cookbook sre.mysql.pool (exit_code=0) pool db1175: after reimage to trixie |
[production] |
| 09:25 |
<ayounsi@cumin1003> |
END (PASS) - Cookbook sre.dns.admin (exit_code=0) DNS admin: pool ulsfo [reason: primary network link stable, no task ID specified] |
[production] |
| 09:25 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db1174', diff saved to https://phabricator.wikimedia.org/P91866 and previous config saved to /var/cache/conftool/dbconfig/20260429-092551-fceratto.json |
[production] |
| 09:25 |
<ayounsi@cumin1003> |
START - Cookbook sre.dns.admin DNS admin: pool ulsfo [reason: primary network link stable, no task ID specified] |
[production] |
| 09:22 |
<marostegui@cumin1003> |
START - Cookbook sre.hosts.reimage for host db1229.eqiad.wmnet with OS trixie |
[production] |
| 09:21 |
<marostegui@cumin1003> |
START - Cookbook sre.hosts.reimage for host db2175.codfw.wmnet with OS trixie |
[production] |
| 09:21 |
<marostegui@cumin1003> |
END (PASS) - Cookbook sre.mysql.depool (exit_code=0) depool db1229: Reimage to Trixie |
[production] |
| 09:20 |
<marostegui@cumin1003> |
END (PASS) - Cookbook sre.mysql.depool (exit_code=0) depool db2175: Reimage to Trixie |
[production] |
| 09:20 |
<marostegui@cumin1003> |
START - Cookbook sre.mysql.depool depool db1229: Reimage to Trixie |
[production] |