2024-02-22
§
|
18:22 |
<bking@cumin2002> |
START - Cookbook sre.elasticsearch.ban Unbanning all hosts in search_codfw |
[production] |
18:22 |
<hnowlan@cumin1002> |
END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host mw1484.eqiad.wmnet with OS bullseye |
[production] |
18:21 |
<hnowlan@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on mw2384.codfw.wmnet with reason: host reimage |
[production] |
18:18 |
<hnowlan@cumin1002> |
START - Cookbook sre.hosts.downtime for 2:00:00 on mw2384.codfw.wmnet with reason: host reimage |
[production] |
18:17 |
<hnowlan@cumin1002> |
END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host mw1468.eqiad.wmnet with OS bullseye |
[production] |
18:15 |
<arnaudb@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db2152', diff saved to https://phabricator.wikimedia.org/P57753 and previous config saved to /var/cache/conftool/dbconfig/20240222-181502-arnaudb.json |
[production] |
18:14 |
<hnowlan@cumin1002> |
END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host mw1483.eqiad.wmnet with OS bullseye |
[production] |
18:12 |
<hnowlan@cumin1002> |
END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host mw1458.eqiad.wmnet with OS bullseye |
[production] |
18:11 |
<hnowlan@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on mw1485.eqiad.wmnet with reason: host reimage |
[production] |
18:07 |
<hnowlan@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on mw1467.eqiad.wmnet with reason: host reimage |
[production] |
18:04 |
<hnowlan@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on mw1484.eqiad.wmnet with reason: host reimage |
[production] |
18:04 |
<bd808@deploy2002> |
helmfile [codfw] DONE helmfile.d/services/developer-portal: apply |
[production] |
18:04 |
<bd808@deploy2002> |
helmfile [codfw] START helmfile.d/services/developer-portal: apply |
[production] |
18:04 |
<bd808@deploy2002> |
helmfile [eqiad] DONE helmfile.d/services/developer-portal: apply |
[production] |
18:03 |
<hnowlan@cumin1002> |
START - Cookbook sre.hosts.reimage for host mw2384.codfw.wmnet with OS bullseye |
[production] |
18:03 |
<bd808@deploy2002> |
helmfile [eqiad] START helmfile.d/services/developer-portal: apply |
[production] |
18:03 |
<hnowlan@cumin1002> |
END (ERROR) - Cookbook sre.hosts.reimage (exit_code=93) for host mw2384.codfw.wmnet with OS bullseye |
[production] |
18:03 |
<bd808@deploy2002> |
helmfile [staging] DONE helmfile.d/services/developer-portal: apply |
[production] |
18:02 |
<bd808@deploy2002> |
helmfile [staging] START helmfile.d/services/developer-portal: apply |
[production] |
18:01 |
<hnowlan@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on mw1494.eqiad.wmnet with reason: host reimage |
[production] |
17:59 |
<arnaudb@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db2152', diff saved to https://phabricator.wikimedia.org/P57752 and previous config saved to /var/cache/conftool/dbconfig/20240222-175956-arnaudb.json |
[production] |
17:59 |
<hnowlan@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on mw1468.eqiad.wmnet with reason: host reimage |
[production] |
17:57 |
<hnowlan@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on mw1483.eqiad.wmnet with reason: host reimage |
[production] |
17:54 |
<hnowlan@cumin1002> |
START - Cookbook sre.hosts.downtime for 2:00:00 on mw1494.eqiad.wmnet with reason: host reimage |
[production] |
17:54 |
<hnowlan@cumin1002> |
START - Cookbook sre.hosts.downtime for 2:00:00 on mw1483.eqiad.wmnet with reason: host reimage |
[production] |
17:54 |
<hnowlan@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on mw1458.eqiad.wmnet with reason: host reimage |
[production] |
17:54 |
<hnowlan@cumin1002> |
START - Cookbook sre.hosts.downtime for 2:00:00 on mw1484.eqiad.wmnet with reason: host reimage |
[production] |
17:54 |
<hnowlan@cumin1002> |
START - Cookbook sre.hosts.downtime for 2:00:00 on mw1485.eqiad.wmnet with reason: host reimage |
[production] |
17:54 |
<hnowlan@cumin1002> |
START - Cookbook sre.hosts.downtime for 2:00:00 on mw1468.eqiad.wmnet with reason: host reimage |
[production] |
17:52 |
<hnowlan@cumin1002> |
START - Cookbook sre.hosts.downtime for 2:00:00 on mw1467.eqiad.wmnet with reason: host reimage |
[production] |
17:52 |
<hnowlan@cumin1002> |
START - Cookbook sre.hosts.downtime for 2:00:00 on mw1458.eqiad.wmnet with reason: host reimage |
[production] |
17:51 |
<hnowlan@cumin1002> |
START - Cookbook sre.hosts.reimage for host mw2384.codfw.wmnet with OS bullseye |
[production] |
17:45 |
<cdanis@deploy2002> |
helmfile [aux-k8s-eqiad] DONE helmfile.d/aus-k8s-eqiad-services/jaeger: apply |
[production] |
17:44 |
<cdanis@deploy2002> |
helmfile [aux-k8s-eqiad] START helmfile.d/aus-k8s-eqiad-services/jaeger: apply |
[production] |
17:44 |
<arnaudb@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db2152 (T357189)', diff saved to https://phabricator.wikimedia.org/P57751 and previous config saved to /var/cache/conftool/dbconfig/20240222-174449-arnaudb.json |
[production] |
17:44 |
<cdanis@deploy2002> |
helmfile [aux-k8s-eqiad] DONE helmfile.d/aus-k8s-eqiad-services/jaeger: apply |
[production] |
17:43 |
<cdanis@deploy2002> |
helmfile [aux-k8s-eqiad] START helmfile.d/aus-k8s-eqiad-services/jaeger: apply |
[production] |
17:43 |
<cdanis@deploy2002> |
helmfile [aux-k8s-eqiad] DONE helmfile.d/aus-k8s-eqiad-services/jaeger: apply |
[production] |
17:43 |
<cdanis@deploy2002> |
helmfile [aux-k8s-eqiad] START helmfile.d/aus-k8s-eqiad-services/jaeger: apply |
[production] |
17:43 |
<arnaudb@cumin1002> |
dbctl commit (dc=all): 'Depooling db2152 (T357189)', diff saved to https://phabricator.wikimedia.org/P57750 and previous config saved to /var/cache/conftool/dbconfig/20240222-174328-arnaudb.json |
[production] |
17:43 |
<arnaudb@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on db2152.codfw.wmnet with reason: Maintenance |
[production] |
17:43 |
<btullis@deploy2002> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s-services/superset-next: apply |
[production] |
17:43 |
<arnaudb@cumin1002> |
START - Cookbook sre.hosts.downtime for 1 day, 0:00:00 on db2152.codfw.wmnet with reason: Maintenance |
[production] |
17:42 |
<arnaudb@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on db2100.codfw.wmnet with reason: Maintenance |
[production] |
17:42 |
<arnaudb@cumin1002> |
START - Cookbook sre.hosts.downtime for 1 day, 0:00:00 on db2100.codfw.wmnet with reason: Maintenance |
[production] |
17:42 |
<arnaudb@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on db2098.codfw.wmnet with reason: Maintenance |
[production] |
17:42 |
<arnaudb@cumin1002> |
START - Cookbook sre.hosts.downtime for 1 day, 0:00:00 on db2098.codfw.wmnet with reason: Maintenance |
[production] |
17:42 |
<arnaudb@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on dbstore1009.eqiad.wmnet with reason: Maintenance |
[production] |
17:42 |
<hnowlan@cumin1002> |
START - Cookbook sre.hosts.reimage for host mw1494.eqiad.wmnet with OS bullseye |
[production] |
17:41 |
<arnaudb@cumin1002> |
START - Cookbook sre.hosts.downtime for 1 day, 0:00:00 on dbstore1009.eqiad.wmnet with reason: Maintenance |
[production] |