2024-06-05
§
|
10:01 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'db2207 (re)pooling @ 100%: Repooling', diff saved to https://phabricator.wikimedia.org/P64083 and previous config saved to /var/cache/conftool/dbconfig/20240605-100117-root.json |
[production] |
10:00 |
<fabfur> |
disabling puppet on cp4037 to test Benthos performances (T358109) |
[production] |
10:00 |
<hnowlan@cumin1002> |
START - Cookbook sre.hosts.reimage for host wikikube-worker1012.eqiad.wmnet with OS bullseye |
[production] |
10:00 |
<mvernon@cumin1002> |
START - Cookbook sre.hosts.reboot-single for host ms-be1057.eqiad.wmnet |
[production] |
10:00 |
<hnowlan@cumin1002> |
START - Cookbook sre.hosts.reimage for host wikikube-worker1011.eqiad.wmnet with OS bullseye |
[production] |
10:00 |
<mvernon@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host ms-be2055.codfw.wmnet |
[production] |
09:59 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.dns.wipe-cache (exit_code=0) netbox.discovery.wmnet. on all recursors |
[production] |
09:59 |
<jmm@cumin2002> |
START - Cookbook sre.dns.wipe-cache netbox.discovery.wmnet. on all recursors |
[production] |
09:59 |
<cgoubert@cumin1002> |
conftool action : set/pooled=yes:weight=10; selector: name=wikikube-worker1001.eqiad.wmnet,cluster=kubernetes,service=kubesvc |
[production] |
09:58 |
<claime> |
pooling and uncordoning wikikube-worker1001 - T351074 |
[production] |
09:57 |
<hnowlan@cumin1002> |
END (PASS) - Cookbook sre.hosts.rename (exit_code=0) from mw1456 to wikikube-worker1012 |
[production] |
09:57 |
<hnowlan@cumin1002> |
END (PASS) - Cookbook sre.network.configure-switch-interfaces (exit_code=0) for host wikikube-worker1012 |
[production] |
09:56 |
<aikochou@deploy1002> |
helmfile [ml-staging-codfw] Ran 'sync' command on namespace 'revertrisk' for release 'main' . |
[production] |
09:55 |
<hnowlan@cumin1002> |
START - Cookbook sre.hosts.reimage for host wikikube-worker1010.eqiad.wmnet with OS bullseye |
[production] |
09:55 |
<hnowlan@cumin1002> |
START - Cookbook sre.hosts.reimage for host wikikube-worker1009.eqiad.wmnet with OS bullseye |
[production] |
09:55 |
<hnowlan@cumin1002> |
START - Cookbook sre.hosts.reimage for host wikikube-worker1008.eqiad.wmnet with OS bullseye |
[production] |
09:55 |
<hnowlan@cumin1002> |
END (PASS) - Cookbook sre.dns.wipe-cache (exit_code=0) wikikube-worker1008.eqiad.wmnet wikikube-worker1009.eqiad.wmnet wikikube-worker1010.eqiad.wmnet wikikube-worker1011.eqiad.wmnet wikikube-worker1012.eqiad.wmnet on all recursors |
[production] |
09:55 |
<hnowlan@cumin1002> |
START - Cookbook sre.dns.wipe-cache wikikube-worker1008.eqiad.wmnet wikikube-worker1009.eqiad.wmnet wikikube-worker1010.eqiad.wmnet wikikube-worker1011.eqiad.wmnet wikikube-worker1012.eqiad.wmnet on all recursors |
[production] |
09:54 |
<hnowlan@cumin1002> |
START - Cookbook sre.network.configure-switch-interfaces for host wikikube-worker1012 |
[production] |
09:54 |
<hnowlan@cumin1002> |
END (PASS) - Cookbook sre.dns.netbox (exit_code=0) |
[production] |
09:54 |
<hnowlan@cumin1002> |
END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Renaming mw1456 to wikikube-worker1012 - hnowlan@cumin1002" |
[production] |
09:54 |
<marostegui@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on db1152.eqiad.wmnet with reason: host reimage |
[production] |
09:54 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.dns.wipe-cache (exit_code=0) netbox.discovery.wmnet. on all recursors |
[production] |
09:54 |
<jmm@cumin2002> |
START - Cookbook sre.dns.wipe-cache netbox.discovery.wmnet. on all recursors |
[production] |
09:54 |
<jmm@cumin2002> |
START - Cookbook sre.netbox.restart-reboot rolling reboot on A:netbox |
[production] |
09:53 |
<hnowlan@cumin1002> |
START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Renaming mw1456 to wikikube-worker1012 - hnowlan@cumin1002" |
[production] |
09:53 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'db1227 (re)pooling @ 10%: Repooling', diff saved to https://phabricator.wikimedia.org/P64082 and previous config saved to /var/cache/conftool/dbconfig/20240605-095336-root.json |
[production] |
09:53 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'db1186 (re)pooling @ 75%: Repooling', diff saved to https://phabricator.wikimedia.org/P64081 and previous config saved to /var/cache/conftool/dbconfig/20240605-095303-root.json |
[production] |
09:52 |
<hnowlan@cumin1002> |
END (PASS) - Cookbook sre.hosts.rename (exit_code=0) from mw1428 to wikikube-worker1011 |
[production] |
09:52 |
<hnowlan@cumin1002> |
END (PASS) - Cookbook sre.network.configure-switch-interfaces (exit_code=0) for host wikikube-worker1011 |
[production] |
09:51 |
<marostegui@cumin1002> |
START - Cookbook sre.hosts.downtime for 2:00:00 on db1152.eqiad.wmnet with reason: host reimage |
[production] |
09:51 |
<dcaro@cumin1002> |
START - Cookbook sre.hosts.reboot-single for host cloudcephosd1031.eqiad.wmnet |
[production] |
09:51 |
<hnowlan@cumin1002> |
START - Cookbook sre.dns.netbox |
[production] |
09:51 |
<hnowlan@cumin1002> |
START - Cookbook sre.hosts.rename from mw1456 to wikikube-worker1012 |
[production] |
09:50 |
<hnowlan@cumin1002> |
START - Cookbook sre.network.configure-switch-interfaces for host wikikube-worker1011 |
[production] |
09:50 |
<hnowlan@cumin1002> |
END (PASS) - Cookbook sre.dns.netbox (exit_code=0) |
[production] |
09:50 |
<hnowlan@cumin1002> |
END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Renaming mw1428 to wikikube-worker1011 - hnowlan@cumin1002" |
[production] |
09:49 |
<hnowlan@cumin1002> |
START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Renaming mw1428 to wikikube-worker1011 - hnowlan@cumin1002" |
[production] |
09:46 |
<hnowlan@cumin1002> |
START - Cookbook sre.dns.netbox |
[production] |
09:46 |
<hnowlan@cumin1002> |
START - Cookbook sre.hosts.rename from mw1428 to wikikube-worker1011 |
[production] |
09:46 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'db2207 (re)pooling @ 75%: Repooling', diff saved to https://phabricator.wikimedia.org/P64080 and previous config saved to /var/cache/conftool/dbconfig/20240605-094611-root.json |
[production] |
09:46 |
<hnowlan@cumin1002> |
END (FAIL) - Cookbook sre.hosts.rename (exit_code=99) from mw1428 to wikikube-worker1011 |
[production] |
09:45 |
<hnowlan@cumin1002> |
END (FAIL) - Cookbook sre.dns.netbox (exit_code=99) |
[production] |
09:45 |
<hnowlan@cumin1002> |
END (FAIL) - Cookbook sre.hosts.rename (exit_code=99) from mw1456 to wikikube-worker1012 |
[production] |
09:44 |
<hnowlan@cumin1002> |
END (PASS) - Cookbook sre.hosts.rename (exit_code=0) from mw1410 to wikikube-worker1010 |
[production] |
09:44 |
<hnowlan@cumin1002> |
START - Cookbook sre.hosts.rename from mw1456 to wikikube-worker1012 |
[production] |
09:44 |
<hnowlan@cumin1002> |
END (PASS) - Cookbook sre.network.configure-switch-interfaces (exit_code=0) for host wikikube-worker1010 |
[production] |
09:44 |
<hnowlan@cumin1002> |
START - Cookbook sre.dns.netbox |
[production] |
09:44 |
<claime> |
homer 'cr*eqiad*' commit 'T351074' |
[production] |
09:44 |
<hnowlan@cumin1002> |
START - Cookbook sre.hosts.rename from mw1428 to wikikube-worker1011 |
[production] |