|
2026-04-27
§
|
| 15:35 |
<dpogorzelski@deploy1003> |
helmfile [ml-staging-codfw] START helmfile.d/admin 'sync'. |
[production] |
| 15:35 |
<jiji@deploy1003> |
Unlocked for deployment [ALL REPOSITORIES]: Upgrading mw-mcrouter - effie (duration: 37m 12s) |
[production] |
| 15:31 |
<bking@cumin2002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on cloudelastic1010.eqiad.wmnet with reason: host reimage |
[production] |
| 15:30 |
<btullis@deploy1003> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s-services/opensearch-ipoid-test: apply |
[production] |
| 15:30 |
<btullis@deploy1003> |
helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/opensearch-ipoid-test: apply |
[production] |
| 15:30 |
<btullis@deploy1003> |
helmfile [dse-k8s-codfw] DONE helmfile.d/dse-k8s-services/opensearch-ipoid-test: apply |
[production] |
| 15:30 |
<btullis@deploy1003> |
helmfile [dse-k8s-codfw] START helmfile.d/dse-k8s-services/opensearch-ipoid-test: apply |
[production] |
| 15:29 |
<mvernon@cumin2002> |
START - Cookbook sre.hosts.downtime for 2:00:00 on ms-be1092.eqiad.wmnet with reason: host reimage |
[production] |
| 15:27 |
<dpogorzelski@deploy1003> |
helmfile [ml-staging-codfw] DONE helmfile.d/admin 'sync'. |
[production] |
| 15:27 |
<btullis@deploy1003> |
helmfile [dse-k8s-codfw] DONE helmfile.d/dse-k8s-services/opensearch-test: apply |
[production] |
| 15:26 |
<btullis@deploy1003> |
helmfile [dse-k8s-codfw] START helmfile.d/dse-k8s-services/opensearch-test: apply |
[production] |
| 15:26 |
<btullis@deploy1003> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s-services/opensearch-test: apply |
[production] |
| 15:26 |
<btullis@deploy1003> |
helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/opensearch-test: apply |
[production] |
| 15:26 |
<bking@cumin2002> |
START - Cookbook sre.hosts.downtime for 2:00:00 on cloudelastic1010.eqiad.wmnet with reason: host reimage |
[production] |
| 15:25 |
<dpogorzelski@deploy1003> |
helmfile [ml-staging-codfw] START helmfile.d/admin 'sync'. |
[production] |
| 15:25 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db1252', diff saved to https://phabricator.wikimedia.org/P91632 and previous config saved to /var/cache/conftool/dbconfig/20260427-152536-fceratto.json |
[production] |
| 15:25 |
<dpogorzelski@deploy1003> |
helmfile [ml-staging-codfw] DONE helmfile.d/admin 'sync'. |
[production] |
| 15:23 |
<dpogorzelski@deploy1003> |
helmfile [ml-staging-codfw] START helmfile.d/admin 'sync'. |
[production] |
| 15:20 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Depooling db2171 (T419635)', diff saved to https://phabricator.wikimedia.org/P91631 and previous config saved to /var/cache/conftool/dbconfig/20260427-152038-fceratto.json |
[production] |
| 15:20 |
<fceratto@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 12:00:00 on db2171.codfw.wmnet with reason: Maintenance |
[production] |
| 15:20 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db2157 (T419635)', diff saved to https://phabricator.wikimedia.org/P91630 and previous config saved to /var/cache/conftool/dbconfig/20260427-152013-fceratto.json |
[production] |
| 15:15 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db1252 (T419961)', diff saved to https://phabricator.wikimedia.org/P91629 and previous config saved to /var/cache/conftool/dbconfig/20260427-151528-fceratto.json |
[production] |
| 15:12 |
<jiji@deploy1003> |
helmfile [eqiad] DONE helmfile.d/services/mw-mcrouter: apply |
[production] |
| 15:11 |
<jiji@deploy1003> |
helmfile [eqiad] START helmfile.d/services/mw-mcrouter: apply |
[production] |
| 15:10 |
<dpogorzelski@deploy1003> |
helmfile [ml-staging-codfw] Ran 'sync' command on namespace 'articletopic-outlink' for release 'main' . |
[production] |
| 15:10 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db2157', diff saved to https://phabricator.wikimedia.org/P91627 and previous config saved to /var/cache/conftool/dbconfig/20260427-151005-fceratto.json |
[production] |
| 15:09 |
<dpogorzelski@deploy1003> |
helmfile [ml-staging-codfw] DONE helmfile.d/admin 'sync'. |
[production] |
| 15:08 |
<jiji@deploy1003> |
helmfile [codfw] DONE helmfile.d/services/mw-mcrouter: apply |
[production] |
| 15:08 |
<herron@cumin1003> |
END (PASS) - Cookbook sre.kafka.roll-restart-reboot-brokers (exit_code=0) rolling restart_daemons on A:kafka-logging-codfw |
[production] |
| 15:07 |
<mvernon@cumin2002> |
END (PASS) - Cookbook sre.hosts.move-vlan (exit_code=0) for host ms-be1092 |
[production] |
| 15:07 |
<mvernon@cumin2002> |
END (PASS) - Cookbook sre.network.configure-switch-interfaces (exit_code=0) for host ms-be1092 |
[production] |
| 15:07 |
<bking@cumin2002> |
START - Cookbook sre.hosts.reimage for host cloudelastic1010.eqiad.wmnet with OS trixie |
[production] |
| 15:07 |
<dpogorzelski@deploy1003> |
helmfile [ml-staging-codfw] START helmfile.d/admin 'sync'. |
[production] |
| 15:07 |
<jiji@deploy1003> |
helmfile [codfw] START helmfile.d/services/mw-mcrouter: apply |
[production] |
| 15:07 |
<mvernon@cumin2002> |
START - Cookbook sre.network.configure-switch-interfaces for host ms-be1092 |
[production] |
| 15:07 |
<mvernon@cumin2002> |
END (PASS) - Cookbook sre.dns.wipe-cache (exit_code=0) ms-be1092.eqiad.wmnet 32.32.64.10.in-addr.arpa 2.3.0.0.2.3.0.0.4.6.0.0.0.1.0.0.3.0.1.0.1.6.8.0.0.0.0.0.0.2.6.2.ip6.arpa on all recursors |
[production] |
| 15:07 |
<mvernon@cumin2002> |
START - Cookbook sre.dns.wipe-cache ms-be1092.eqiad.wmnet 32.32.64.10.in-addr.arpa 2.3.0.0.2.3.0.0.4.6.0.0.0.1.0.0.3.0.1.0.1.6.8.0.0.0.0.0.0.2.6.2.ip6.arpa on all recursors |
[production] |
| 15:07 |
<mvernon@cumin2002> |
END (PASS) - Cookbook sre.dns.netbox (exit_code=0) |
[production] |
| 15:07 |
<mvernon@cumin2002> |
END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Update records for host ms-be1092 - mvernon@cumin2002" |
[production] |
| 15:07 |
<mvernon@cumin2002> |
START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Update records for host ms-be1092 - mvernon@cumin2002" |
[production] |
| 15:07 |
<dpogorzelski@deploy1003> |
helmfile [ml-staging-codfw] DONE helmfile.d/admin 'sync'. |
[production] |
| 15:06 |
<ladsgroup@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1:00:00 on ms-be1070.eqiad.wmnet with reason: vacuum overlarge container dbs |
[production] |
| 15:06 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Depooling db1252 (T419961)', diff saved to https://phabricator.wikimedia.org/P91626 and previous config saved to /var/cache/conftool/dbconfig/20260427-150616-fceratto.json |
[production] |
| 15:06 |
<fceratto@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on db1252.eqiad.wmnet with reason: Maintenance |
[production] |
| 15:05 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db1249 (T419961)', diff saved to https://phabricator.wikimedia.org/P91625 and previous config saved to /var/cache/conftool/dbconfig/20260427-150547-fceratto.json |
[production] |
| 15:05 |
<dpogorzelski@deploy1003> |
helmfile [ml-staging-codfw] START helmfile.d/admin 'sync'. |
[production] |
| 15:02 |
<mvernon@cumin2002> |
START - Cookbook sre.dns.netbox |
[production] |
| 15:00 |
<mvernon@cumin2002> |
START - Cookbook sre.hosts.move-vlan for host ms-be1092 |
[production] |
| 15:00 |
<mvernon@cumin2002> |
START - Cookbook sre.hosts.reimage for host ms-be1092.eqiad.wmnet with OS bullseye |
[production] |
| 14:59 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db2157', diff saved to https://phabricator.wikimedia.org/P91624 and previous config saved to /var/cache/conftool/dbconfig/20260427-145957-fceratto.json |
[production] |