|
2022-04-01
§
|
| 19:00 |
<sukhe@cumin2002> |
END (FAIL) - Cookbook sre.hosts.reboot-single (exit_code=1) for host cp2036.codfw.wmnet |
[production] |
| 19:00 |
<dzahn@cumin2002> |
conftool action : set/pooled=no; selector: dc=eqiad,name=mw1414.wmnet |
[production] |
| 19:00 |
<dzahn@cumin2002> |
conftool action : set/pooled=no; selector: dc=eqiad,name=mw141[4-8].wmnet |
[production] |
| 19:00 |
<dzahn@cumin2002> |
conftool action : set/pooled=no; selector: dc=codfw,name=mw1414.wmnet |
[production] |
| 18:58 |
<dzahn@cumin2002> |
conftool action : set/pooled=no; selector: dc=codfw,name=mw141[4-8].wmnet |
[production] |
| 18:42 |
<sukhe@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host cp2036.codfw.wmnet |
[production] |
| 13:05 |
<dcausse> |
resetting jvmquake flag on all wdqs hosts |
[production] |
| 12:52 |
<dcausse> |
restarting blazegraph on wdqs1006 and resetting jvmquake warning flag |
[production] |
| 11:31 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host sretest1001.eqiad.wmnet |
[production] |
| 11:26 |
<jmm@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host sretest1001.eqiad.wmnet |
[production] |
| 11:01 |
<vgutierrez@cumin1001> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host acmechief2001.codfw.wmnet |
[production] |
| 10:55 |
<vgutierrez@cumin1001> |
START - Cookbook sre.hosts.reboot-single for host acmechief2001.codfw.wmnet |
[production] |
| 10:54 |
<vgutierrez@cumin1001> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host acmechief1001.eqiad.wmnet |
[production] |
| 10:50 |
<vgutierrez@cumin1001> |
START - Cookbook sre.hosts.reboot-single for host acmechief1001.eqiad.wmnet |
[production] |
| 10:47 |
<vgutierrez> |
reboot acme-chief instances to catch up on kernel upgrades |
[production] |
| 10:34 |
<vgutierrez@cumin1001> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ncredir6002.drmrs.wmnet |
[production] |
| 10:29 |
<vgutierrez@cumin1001> |
START - Cookbook sre.hosts.reboot-single for host ncredir6002.drmrs.wmnet |
[production] |
| 10:29 |
<vgutierrez@cumin1001> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ncredir6001.drmrs.wmnet |
[production] |
| 10:21 |
<vgutierrez@cumin1001> |
START - Cookbook sre.hosts.reboot-single for host ncredir6001.drmrs.wmnet |
[production] |
| 10:20 |
<vgutierrez@cumin1001> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ncredir5002.eqsin.wmnet |
[production] |
| 10:14 |
<vgutierrez@cumin1001> |
START - Cookbook sre.hosts.reboot-single for host ncredir5002.eqsin.wmnet |
[production] |
| 10:06 |
<vgutierrez> |
vgutierrez@puppetmaster2001:~$ sudo -i rm /var/run/confd-template/.ml-staging-ctrl*.err |
[production] |
| 10:04 |
<vgutierrez> |
vgutierrez@puppetmaster1001:~$ sudo -i rm /var/run/confd-template/.ml-staging-ctrl*.err |
[production] |
| 10:03 |
<vgutierrez@cumin1001> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ncredir5001.eqsin.wmnet |
[production] |
| 09:57 |
<vgutierrez@cumin1001> |
START - Cookbook sre.hosts.reboot-single for host ncredir5001.eqsin.wmnet |
[production] |
| 09:47 |
<vgutierrez@cumin1001> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ncredir4002.ulsfo.wmnet |
[production] |
| 09:43 |
<vgutierrez@cumin1001> |
START - Cookbook sre.hosts.reboot-single for host ncredir4002.ulsfo.wmnet |
[production] |
| 09:43 |
<vgutierrez@cumin1001> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ncredir4001.ulsfo.wmnet |
[production] |
| 09:37 |
<vgutierrez@cumin1001> |
START - Cookbook sre.hosts.reboot-single for host ncredir4001.ulsfo.wmnet |
[production] |
| 09:35 |
<vgutierrez@cumin1001> |
END (FAIL) - Cookbook sre.hosts.reboot-single (exit_code=1) for host ncredir3002.esams.wmnet |
[production] |
| 09:24 |
<vgutierrez@cumin1001> |
START - Cookbook sre.hosts.reboot-single for host ncredir3002.esams.wmnet |
[production] |
| 09:24 |
<vgutierrez@cumin1001> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ncredir3001.esams.wmnet |
[production] |
| 09:18 |
<vgutierrez@cumin1001> |
START - Cookbook sre.hosts.reboot-single for host ncredir3001.esams.wmnet |
[production] |
| 09:16 |
<vgutierrez@cumin1001> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ncredir2002.codfw.wmnet |
[production] |
| 09:10 |
<vgutierrez@cumin1001> |
START - Cookbook sre.hosts.reboot-single for host ncredir2002.codfw.wmnet |
[production] |
| 09:10 |
<vgutierrez@cumin1001> |
END (FAIL) - Cookbook sre.hosts.reboot-single (exit_code=1) for host ncredir2001.codfw.wmnet |
[production] |
| 08:59 |
<vgutierrez@cumin1001> |
START - Cookbook sre.hosts.reboot-single for host ncredir2001.codfw.wmnet |
[production] |
| 08:58 |
<vgutierrez@cumin1001> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ncredir1002.eqiad.wmnet |
[production] |
| 08:54 |
<vgutierrez@cumin1001> |
START - Cookbook sre.hosts.reboot-single for host ncredir1002.eqiad.wmnet |
[production] |
| 08:53 |
<vgutierrez@cumin1001> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ncredir1001.eqiad.wmnet |
[production] |
| 08:49 |
<vgutierrez@cumin1001> |
START - Cookbook sre.hosts.reboot-single for host ncredir1001.eqiad.wmnet |
[production] |
| 08:48 |
<vgutierrez@cumin1001> |
END (FAIL) - Cookbook sre.hosts.reboot-single (exit_code=99) for host ncredir1001.eqiad.wmnet |
[production] |
| 08:48 |
<vgutierrez@cumin1001> |
START - Cookbook sre.hosts.reboot-single for host ncredir1001.eqiad.wmnet |
[production] |
| 08:44 |
<vgutierrez@cumin1001> |
END (FAIL) - Cookbook sre.hosts.reboot-cluster (exit_code=99) |
[production] |
| 08:44 |
<vgutierrez@cumin1001> |
START - Cookbook sre.hosts.reboot-cluster |
[production] |
| 08:42 |
<vgutierrez> |
rolling restart of ncredir instances to catch up on kernel upgrades |
[production] |
| 06:54 |
<XioNoX> |
traffic engineering in drmrs to prevent link saturation |
[production] |