2022-03-31
§
|
20:04 |
<mutante> |
mw2271,mw2272 - canary appserver, rebooting |
[production] |
20:04 |
<sukhe@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host cp2035.codfw.wmnet |
[production] |
20:04 |
<bblack@cumin1001> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host lvs4005.ulsfo.wmnet |
[production] |
20:01 |
<mutante> |
mw2251,mw2252 - canary appserver, rebooting |
[production] |
20:00 |
<bblack@cumin1001> |
START - Cookbook sre.hosts.reboot-single for host lvs4005.ulsfo.wmnet |
[production] |
19:59 |
<dzahn@cumin2002> |
conftool action : set/pooled=no; selector: dc=codfw,name=mw2272.codfw.wmnet |
[production] |
19:59 |
<dzahn@cumin2002> |
conftool action : set/pooled=no; selector: dc=codfw,name=mw2271.codfw.wmnet |
[production] |
19:58 |
<dzahn@cumin2002> |
conftool action : set/pooled=no; selector: dc=codfw,name=mw2252.codfw.wmnet |
[production] |
19:57 |
<dzahn@cumin2002> |
conftool action : set/pooled=no; selector: dc=codfw,name=mw2251.codfw.wmnet |
[production] |
19:55 |
<bblack@cumin1001> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host lvs3006.esams.wmnet |
[production] |
19:46 |
<mutante> |
phab2001 - systemctl restart ssh-phab |
[production] |
19:45 |
<bblack@cumin1001> |
START - Cookbook sre.hosts.reboot-single for host lvs3006.esams.wmnet |
[production] |
19:44 |
<sukhe@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host cp3052.esams.wmnet |
[production] |
19:43 |
<rzl> |
Rolling-restarted zotero to un-wedge wedged pods with offscale high CPU |
[production] |
19:42 |
<rzl@deploy1002> |
helmfile [codfw] DONE helmfile.d/services/zotero: sync |
[production] |
19:42 |
<rzl@deploy1002> |
helmfile [codfw] START helmfile.d/services/zotero: sync |
[production] |
19:38 |
<bblack@cumin1001> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host lvs2008.codfw.wmnet |
[production] |
19:33 |
<sukhe@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host cp5014.eqsin.wmnet |
[production] |
19:31 |
<sukhe@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host cp3052.esams.wmnet |
[production] |
19:28 |
<sukhe@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host cp3051.esams.wmnet |
[production] |
19:28 |
<bblack@cumin1001> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host lvs1016.eqiad.wmnet |
[production] |
19:27 |
<sukhe@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host cp5015.eqsin.wmnet |
[production] |
19:26 |
<bblack@cumin1001> |
START - Cookbook sre.hosts.reboot-single for host lvs2008.codfw.wmnet |
[production] |
19:24 |
<dzahn@cumin2002> |
conftool action : set/pooled=yes; selector: dc=codfw,name=phab2001-vcs.codfw.wmnet |
[production] |
19:24 |
<bblack@cumin1001> |
START - Cookbook sre.hosts.reboot-single for host lvs1016.eqiad.wmnet |
[production] |
19:24 |
<bblack@cumin1001> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host lvs1015.eqiad.wmnet |
[production] |
19:23 |
<bblack@cumin1001> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host lvs1018.eqiad.wmnet |
[production] |
19:21 |
<cwhite> |
remove openjdk-8-jre from eqiad logstash nodes T301770 |
[production] |
19:21 |
<mutante> |
phab2001 - powercycling via mgmt |
[production] |
19:20 |
<bblack@cumin1001> |
START - Cookbook sre.hosts.reboot-single for host lvs1015.eqiad.wmnet |
[production] |
19:20 |
<bblack@cumin1001> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host lvs1014.eqiad.wmnet |
[production] |
19:19 |
<bblack@cumin1001> |
START - Cookbook sre.hosts.reboot-single for host lvs1018.eqiad.wmnet |
[production] |
19:17 |
<dzahn@cumin2002> |
conftool action : set/pooled=no; selector: dc=codfw,name=phab2001-vcs.codfw.wmnet |
[production] |
19:15 |
<bblack@cumin1001> |
START - Cookbook sre.hosts.reboot-single for host lvs1014.eqiad.wmnet |
[production] |
19:15 |
<bblack@cumin1001> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host lvs1013.eqiad.wmnet |
[production] |
19:14 |
<bblack@cumin1001> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host lvs6002.drmrs.wmnet |
[production] |
19:14 |
<sukhe@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host cp3051.esams.wmnet |
[production] |
19:14 |
<mutante> |
phab2001 - git-ssh.codfw - rebooting - might cause pybal alert |
[production] |
19:13 |
<sukhe@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host cp5015.eqsin.wmnet |
[production] |
19:12 |
<sukhe@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host cp4022.ulsfo.wmnet |
[production] |
19:11 |
<bblack@cumin1001> |
START - Cookbook sre.hosts.reboot-single for host lvs1013.eqiad.wmnet |
[production] |
19:09 |
<bblack@cumin1001> |
START - Cookbook sre.hosts.reboot-single for host lvs6002.drmrs.wmnet |
[production] |
19:08 |
<sukhe@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host cp2035.codfw.wmnet |
[production] |
19:07 |
<bblack@cumin1001> |
conftool action : set/pooled=yes; selector: cluster=ml_staging |
[production] |
19:07 |
<sukhe@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host cp1075.eqiad.wmnet |
[production] |
19:07 |
<bblack@cumin1001> |
conftool action : set/weight=1; selector: cluster=ml_staging |
[production] |
19:07 |
<sukhe@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host cp5013.eqsin.wmnet |
[production] |
19:06 |
<sukhe@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host cp3050.esams.wmnet |
[production] |
19:06 |
<bblack@cumin1001> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host lvs5002.eqsin.wmnet |
[production] |
19:05 |
<mutante> |
doc.wikimedia.org - short downtime due to maintenance, rebooting doc1001 |
[production] |