|
2026-05-21
§
|
| 14:42 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.drain-node for draining ganeti node ganeti1028.eqiad.wmnet |
[production] |
| 14:42 |
<klausman@cumin1003> |
END (PASS) - Cookbook sre.k8s.reboot-nodes (exit_code=0) rolling reboot on A:ml-serve-worker-eqiad |
[production] |
| 14:42 |
<klausman@cumin1003> |
END (PASS) - Cookbook sre.k8s.pool-depool-node (exit_code=0) pool for host ml-serve1011.eqiad.wmnet |
[production] |
| 14:42 |
<klausman@cumin1003> |
START - Cookbook sre.k8s.pool-depool-node pool for host ml-serve1011.eqiad.wmnet |
[production] |
| 14:41 |
<javiermonton@deploy1003> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s-services/webrequest-page-view-next: apply |
[production] |
| 14:41 |
<javiermonton@deploy1003> |
helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/webrequest-page-view-next: apply |
[production] |
| 14:40 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance es2039', diff saved to https://phabricator.wikimedia.org/P92795 and previous config saved to /var/cache/conftool/dbconfig/20260521-144055-fceratto.json |
[production] |
| 14:39 |
<andrew@cloudcumin1001> |
END (PASS) - Cookbook wmcs.ceph.roll_reboot_mons (exit_code=0) |
[admin] |
| 14:39 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host maps1012.eqiad.wmnet |
[production] |
| 14:38 |
<elukey@cumin1003> |
END (PASS) - Cookbook sre.dns.wipe-cache (exit_code=0) pki.discovery.wmnet. on all recursors |
[production] |
| 14:37 |
<elukey@cumin1003> |
START - Cookbook sre.dns.wipe-cache pki.discovery.wmnet. on all recursors |
[production] |
| 14:37 |
<klausman@cumin1003> |
END (PASS) - Cookbook sre.k8s.pool-depool-node (exit_code=0) depool for host ml-serve1011.eqiad.wmnet |
[production] |
| 14:35 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.ganeti.drain-node (exit_code=0) for draining ganeti node ganeti1027.eqiad.wmnet |
[production] |
| 14:35 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ganeti1027.eqiad.wmnet |
[production] |
| 14:32 |
<klausman@cumin1003> |
START - Cookbook sre.k8s.pool-depool-node depool for host ml-serve1011.eqiad.wmnet |
[production] |
| 14:32 |
<jmm@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host maps1012.eqiad.wmnet |
[production] |
| 14:32 |
<klausman@cumin1003> |
END (PASS) - Cookbook sre.k8s.pool-depool-node (exit_code=0) pool for host ml-serve1010.eqiad.wmnet |
[production] |
| 14:32 |
<klausman@cumin1003> |
START - Cookbook sre.k8s.pool-depool-node pool for host ml-serve1010.eqiad.wmnet |
[production] |
| 14:30 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance es2039', diff saved to https://phabricator.wikimedia.org/P92793 and previous config saved to /var/cache/conftool/dbconfig/20260521-143045-fceratto.json |
[production] |
| 14:30 |
<elukey@cumin1003> |
END (PASS) - Cookbook sre.dns.wipe-cache (exit_code=0) pki.discovery.wmnet. on all recursors |
[production] |
| 14:30 |
<elukey@cumin1003> |
START - Cookbook sre.dns.wipe-cache pki.discovery.wmnet. on all recursors |
[production] |
| 14:29 |
<elukey@cumin1003> |
START - Cookbook sre.pki.restart-reboot rolling reboot on A:pki |
[production] |
| 14:29 |
<jmm@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host ganeti1027.eqiad.wmnet |
[production] |
| 14:29 |
<andrew@cloudcumin1001> |
START - Cookbook wmcs.ceph.roll_reboot_mons |
[admin] |
| 14:28 |
<andrew@cloudcumin1001> |
END (PASS) - Cookbook wmcs.ceph.roll_reboot_mons (exit_code=0) |
[admin] |
| 14:27 |
<slyngshede@cumin1003> |
END (FAIL) - Cookbook sre.cdn.roll-reboot (exit_code=1) rolling reboot on P{cp601[5-6].drmrs.wmnet} and A:cp |
[production] |
| 14:26 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.drain-node for draining ganeti node ganeti1027.eqiad.wmnet |
[production] |
| 14:26 |
<javiermonton@deploy1003> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s-services/webrequest-page-view-next: apply |
[production] |
| 14:26 |
<javiermonton@deploy1003> |
helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/webrequest-page-view-next: apply |
[production] |
| 14:25 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.ganeti.drain-node (exit_code=0) for draining ganeti node ganeti1054.eqiad.wmnet |
[production] |
| 14:25 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ganeti1054.eqiad.wmnet |
[production] |
| 14:24 |
<klausman@cumin1003> |
END (PASS) - Cookbook sre.k8s.pool-depool-node (exit_code=0) depool for host ml-serve1010.eqiad.wmnet |
[production] |
| 14:21 |
<javiermonton@deploy1003> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s-services/webrequest-page-view-next: apply |
[production] |
| 14:21 |
<javiermonton@deploy1003> |
helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/webrequest-page-view-next: apply |
[production] |
| 14:21 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host maps1011.eqiad.wmnet |
[production] |
| 14:20 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance es2039 (T426633)', diff saved to https://phabricator.wikimedia.org/P92792 and previous config saved to /var/cache/conftool/dbconfig/20260521-142037-fceratto.json |
[production] |
| 14:19 |
<jmm@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host ganeti1054.eqiad.wmnet |
[production] |
| 14:19 |
<javiermonton@deploy1003> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s-services/webrequest-page-view-next: apply |
[production] |
| 14:19 |
<javiermonton@deploy1003> |
helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/webrequest-page-view-next: apply |
[production] |
| 14:17 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.drain-node for draining ganeti node ganeti1054.eqiad.wmnet |
[production] |
| 14:17 |
<andrew@cloudcumin1001> |
START - Cookbook wmcs.ceph.roll_reboot_mons |
[admin] |
| 14:17 |
<andrew@cloudcumin1001> |
END (ERROR) - Cookbook wmcs.ceph.roll_reboot_mons (exit_code=97) |
[admin] |
| 14:17 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.ganeti.drain-node (exit_code=0) for draining ganeti node ganeti1053.eqiad.wmnet |
[production] |
| 14:16 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ganeti1053.eqiad.wmnet |
[production] |
| 14:16 |
<andrew@cloudcumin1001> |
START - Cookbook wmcs.ceph.roll_reboot_mons |
[admin] |
| 14:14 |
<klausman@cumin1003> |
START - Cookbook sre.k8s.pool-depool-node depool for host ml-serve1010.eqiad.wmnet |
[production] |
| 14:14 |
<klausman@cumin1003> |
END (PASS) - Cookbook sre.k8s.pool-depool-node (exit_code=0) pool for host ml-serve1009.eqiad.wmnet |
[production] |
| 14:14 |
<klausman@cumin1003> |
START - Cookbook sre.k8s.pool-depool-node pool for host ml-serve1009.eqiad.wmnet |
[production] |
| 14:13 |
<brouberol@deploy1003> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/admin 'apply'. |
[production] |
| 14:13 |
<jmm@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host maps1011.eqiad.wmnet |
[production] |