2024-08-26
§
|
18:08 |
<swfrench@deploy1003> |
helmfile [eqiad] START helmfile.d/services/eventstreams: apply |
[production] |
17:53 |
<swfrench@deploy1003> |
helmfile [codfw] DONE helmfile.d/services/eventstreams-internal: apply |
[production] |
17:52 |
<swfrench@deploy1003> |
helmfile [codfw] START helmfile.d/services/eventstreams-internal: apply |
[production] |
17:52 |
<swfrench@deploy1003> |
helmfile [codfw] DONE helmfile.d/services/eventstreams: apply |
[production] |
17:51 |
<swfrench@deploy1003> |
helmfile [codfw] START helmfile.d/services/eventstreams: apply |
[production] |
17:43 |
<ryankemper@cumin2002> |
conftool action : set/pooled=yes:weight=10; selector: cluster=wdqs-main |
[production] |
17:43 |
<ryankemper@cumin2002> |
conftool action : set/pooled=yes:weight=10; selector: cluster=wdqs-scholarly |
[production] |
17:41 |
<swfrench@deploy1003> |
helmfile [staging] DONE helmfile.d/services/eventstreams-internal: apply |
[production] |
17:41 |
<swfrench@deploy1003> |
helmfile [staging] START helmfile.d/services/eventstreams-internal: apply |
[production] |
17:40 |
<kamila@cumin1002> |
END (PASS) - Cookbook sre.k8s.pool-depool-node (exit_code=0) depool for host kubernetes2018.codfw.wmnet |
[production] |
17:40 |
<swfrench@deploy1003> |
helmfile [staging] DONE helmfile.d/services/eventstreams: apply |
[production] |
17:39 |
<kamila@cumin1002> |
START - Cookbook sre.k8s.pool-depool-node depool for host kubernetes2018.codfw.wmnet |
[production] |
17:39 |
<swfrench@deploy1003> |
helmfile [staging] START helmfile.d/services/eventstreams: apply |
[production] |
17:39 |
<ryankemper> |
T364364 Created PTR & A records for new graph split services `wdqs-main` and `wdqs-scholarly` (merged https://gerrit.wikimedia.org/r/c/operations/dns/+/1051446 and ran `sudo authdns-update` on `dns1004.wikimedia.org`) |
[production] |
17:23 |
<ladsgroup@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 16:00:00 on 11 hosts with reason: Maintenance |
[production] |
17:23 |
<ladsgroup@cumin1002> |
START - Cookbook sre.hosts.downtime for 16:00:00 on 11 hosts with reason: Maintenance |
[production] |
17:23 |
<ladsgroup@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 8:00:00 on db2129.codfw.wmnet with reason: Maintenance |
[production] |
17:22 |
<ladsgroup@cumin1002> |
START - Cookbook sre.hosts.downtime for 8:00:00 on db2129.codfw.wmnet with reason: Maintenance |
[production] |
17:22 |
<ladsgroup@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db2124 (T370903)', diff saved to https://phabricator.wikimedia.org/P67809 and previous config saved to /var/cache/conftool/dbconfig/20240826-172250-ladsgroup.json |
[production] |
17:07 |
<ladsgroup@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db2124', diff saved to https://phabricator.wikimedia.org/P67808 and previous config saved to /var/cache/conftool/dbconfig/20240826-170742-ladsgroup.json |
[production] |
16:54 |
<cgoubert@cumin1002> |
END (PASS) - Cookbook sre.k8s.pool-depool-node (exit_code=0) pool for host wikikube-worker2035.codfw.wmnet |
[production] |
16:54 |
<cgoubert@cumin1002> |
START - Cookbook sre.k8s.pool-depool-node pool for host wikikube-worker2035.codfw.wmnet |
[production] |
16:53 |
<claime> |
homer 'lsw1-b8-codfw*' commit T372878 |
[production] |
16:52 |
<cgoubert@cumin1002> |
END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host wikikube-worker2035.codfw.wmnet with OS bullseye |
[production] |
16:52 |
<ladsgroup@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db2124', diff saved to https://phabricator.wikimedia.org/P67807 and previous config saved to /var/cache/conftool/dbconfig/20240826-165235-ladsgroup.json |
[production] |
16:37 |
<ladsgroup@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db2124 (T370903)', diff saved to https://phabricator.wikimedia.org/P67806 and previous config saved to /var/cache/conftool/dbconfig/20240826-163728-ladsgroup.json |
[production] |
16:32 |
<cgoubert@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on wikikube-worker2035.codfw.wmnet with reason: host reimage |
[production] |
16:30 |
<ladsgroup@cumin1002> |
dbctl commit (dc=all): 'Depooling db2124 (T370903)', diff saved to https://phabricator.wikimedia.org/P67805 and previous config saved to /var/cache/conftool/dbconfig/20240826-163032-ladsgroup.json |
[production] |
16:30 |
<ladsgroup@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 8:00:00 on db2124.codfw.wmnet with reason: Maintenance |
[production] |
16:30 |
<ladsgroup@cumin1002> |
START - Cookbook sre.hosts.downtime for 8:00:00 on db2124.codfw.wmnet with reason: Maintenance |
[production] |
16:30 |
<ladsgroup@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 8:00:00 on db2114.codfw.wmnet with reason: Maintenance |
[production] |
16:29 |
<ladsgroup@cumin1002> |
START - Cookbook sre.hosts.downtime for 8:00:00 on db2114.codfw.wmnet with reason: Maintenance |
[production] |
16:29 |
<cgoubert@cumin1002> |
START - Cookbook sre.hosts.downtime for 2:00:00 on wikikube-worker2035.codfw.wmnet with reason: host reimage |
[production] |
16:28 |
<claime> |
homer 'cr*codfw*' commit 'T372878' |
[production] |
16:26 |
<ladsgroup@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 8:00:00 on dbstore1009.eqiad.wmnet with reason: Maintenance |
[production] |
16:25 |
<ladsgroup@cumin1002> |
START - Cookbook sre.hosts.downtime for 8:00:00 on dbstore1009.eqiad.wmnet with reason: Maintenance |
[production] |
16:25 |
<ladsgroup@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db1231 (T370903)', diff saved to https://phabricator.wikimedia.org/P67804 and previous config saved to /var/cache/conftool/dbconfig/20240826-162553-ladsgroup.json |
[production] |
16:25 |
<ladsgroup@cumin1002> |
dbctl commit (dc=all): 'Depooling db1199 (T371742)', diff saved to https://phabricator.wikimedia.org/P67803 and previous config saved to /var/cache/conftool/dbconfig/20240826-162544-ladsgroup.json |
[production] |
16:25 |
<ladsgroup@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 12:00:00 on db1199.eqiad.wmnet with reason: Maintenance |
[production] |
16:25 |
<ladsgroup@cumin1002> |
START - Cookbook sre.hosts.downtime for 12:00:00 on db1199.eqiad.wmnet with reason: Maintenance |
[production] |
16:25 |
<ladsgroup@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db1190 (T371742)', diff saved to https://phabricator.wikimedia.org/P67802 and previous config saved to /var/cache/conftool/dbconfig/20240826-162522-ladsgroup.json |
[production] |
16:13 |
<dancy@deploy1003> |
Stopping before sync operations |
[production] |
16:13 |
<dancy@deploy1003> |
Started scap sync-world: testing |
[production] |
16:10 |
<ladsgroup@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db1231', diff saved to https://phabricator.wikimedia.org/P67801 and previous config saved to /var/cache/conftool/dbconfig/20240826-161039-ladsgroup.json |
[production] |
16:10 |
<cgoubert@cumin1002> |
END (PASS) - Cookbook sre.hosts.move-vlan (exit_code=0) for host <spicerack.netbox.NetboxServer object at 0x7f6bc9767d90> |
[production] |
16:10 |
<cgoubert@cumin1002> |
END (PASS) - Cookbook sre.network.configure-switch-interfaces (exit_code=0) for host wikikube-worker2035 |
[production] |
16:10 |
<ladsgroup@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db1190', diff saved to https://phabricator.wikimedia.org/P67800 and previous config saved to /var/cache/conftool/dbconfig/20240826-161015-ladsgroup.json |
[production] |
16:10 |
<cgoubert@cumin1002> |
START - Cookbook sre.network.configure-switch-interfaces for host wikikube-worker2035 |
[production] |
16:10 |
<cgoubert@cumin1002> |
END (PASS) - Cookbook sre.dns.wipe-cache (exit_code=0) wikikube-worker2035.codfw.wmnet 62.16.192.10.in-addr.arpa 2.6.0.0.6.1.0.0.2.9.1.0.0.1.0.0.2.0.1.0.0.6.8.0.0.0.0.0.0.2.6.2.ip6.arpa on all recursors |
[production] |
16:10 |
<cgoubert@cumin1002> |
START - Cookbook sre.dns.wipe-cache wikikube-worker2035.codfw.wmnet 62.16.192.10.in-addr.arpa 2.6.0.0.6.1.0.0.2.9.1.0.0.1.0.0.2.0.1.0.0.6.8.0.0.0.0.0.0.2.6.2.ip6.arpa on all recursors |
[production] |