2025-04-30
§
|
10:46 |
<hnowlan@deploy1003> |
helmfile [eqiad] START helmfile.d/services/mw-cron: apply |
[production] |
10:45 |
<jmm@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host ganeti2035.codfw.wmnet |
[production] |
10:41 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.drain-node for draining ganeti node ganeti2035.codfw.wmnet |
[production] |
10:40 |
<jmm@cumin2002> |
END (FAIL) - Cookbook sre.ganeti.drain-node (exit_code=99) for draining ganeti node ganeti2033.codfw.wmnet |
[production] |
10:40 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.drain-node for draining ganeti node ganeti2033.codfw.wmnet |
[production] |
10:40 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.ganeti.drain-node (exit_code=0) for draining ganeti node ganeti2031.codfw.wmnet |
[production] |
10:39 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ganeti2031.codfw.wmnet |
[production] |
10:33 |
<moritzm> |
installing curl security updates |
[production] |
10:32 |
<jmm@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host ganeti2031.codfw.wmnet |
[production] |
10:24 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.drain-node for draining ganeti node ganeti2031.codfw.wmnet |
[production] |
10:23 |
<jmm@cumin2002> |
END (FAIL) - Cookbook sre.ganeti.drain-node (exit_code=99) for draining ganeti node ganeti2030.codfw.wmnet |
[production] |
10:16 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.drain-node for draining ganeti node ganeti2030.codfw.wmnet |
[production] |
10:16 |
<fnegri@cumin1002> |
END (FAIL) - Cookbook sre.wikireplicas.add-wiki (exit_code=99) for database nupwiki (T390714) |
[production] |
10:15 |
<fnegri@cumin1002> |
START - Cookbook sre.wikireplicas.add-wiki for database nupwiki (T390714) |
[production] |
10:14 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.ganeti.drain-node (exit_code=0) for draining ganeti node ganeti2022.codfw.wmnet |
[production] |
10:13 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ganeti2022.codfw.wmnet |
[production] |
10:06 |
<jmm@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host ganeti2022.codfw.wmnet |
[production] |
10:01 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.drain-node for draining ganeti node ganeti2022.codfw.wmnet |
[production] |
09:55 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.ganeti.drain-node (exit_code=0) for draining ganeti node ganeti2021.codfw.wmnet |
[production] |
09:55 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ganeti2021.codfw.wmnet |
[production] |
09:48 |
<jmm@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host ganeti2021.codfw.wmnet |
[production] |
09:41 |
<klausman@cumin1002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ml-lab1002.eqiad.wmnet |
[production] |
09:38 |
<elukey@deploy1003> |
helmfile [ml-serve-codfw] Ran 'sync' command on namespace 'revision-models' for release 'main' . |
[production] |
09:38 |
<elukey@deploy1003> |
helmfile [ml-serve-codfw] Ran 'sync' command on namespace 'revertrisk' for release 'main' . |
[production] |
09:38 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.drain-node for draining ganeti node ganeti2021.codfw.wmnet |
[production] |
09:36 |
<elukey@deploy1003> |
helmfile [ml-serve-codfw] Ran 'sync' command on namespace 'readability' for release 'main' . |
[production] |
09:35 |
<klausman@cumin1002> |
START - Cookbook sre.hosts.reboot-single for host ml-lab1002.eqiad.wmnet |
[production] |
09:34 |
<elukey@deploy1003> |
helmfile [ml-serve-codfw] Ran 'sync' command on namespace 'logo-detection' for release 'main' . |
[production] |
09:32 |
<elukey@deploy1003> |
helmfile [ml-serve-codfw] Ran 'sync' command on namespace 'llm' for release 'main' . |
[production] |
09:31 |
<elukey@deploy1003> |
helmfile [ml-serve-codfw] Ran 'sync' command on namespace 'article-models' for release 'main' . |
[production] |
09:31 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.ganeti.drain-node (exit_code=0) for draining ganeti node ganeti2020.codfw.wmnet |
[production] |
09:31 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ganeti2020.codfw.wmnet |
[production] |
09:30 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'es2031 (re)pooling @ 100%: Repooling', diff saved to https://phabricator.wikimedia.org/P75695 and previous config saved to /var/cache/conftool/dbconfig/20250430-093053-root.json |
[production] |
09:30 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'es1026 (re)pooling @ 100%: Repooling', diff saved to https://phabricator.wikimedia.org/P75694 and previous config saved to /var/cache/conftool/dbconfig/20250430-093040-root.json |
[production] |
09:30 |
<elukey@deploy1003> |
helmfile [ml-serve-codfw] Ran 'sync' command on namespace 'article-descriptions' for release 'main' . |
[production] |
09:29 |
<elukey@deploy1003> |
helmfile [ml-serve-codfw] Ran 'sync' command on namespace 'revscoring-drafttopic' for release 'main' . |
[production] |
09:28 |
<elukey@deploy1003> |
helmfile [ml-serve-codfw] Ran 'sync' command on namespace 'revscoring-draftquality' for release 'main' . |
[production] |
09:28 |
<godog> |
bounce prometheus-statsd-exporter on stat1011 - T389344 |
[production] |
09:27 |
<elukey@deploy1003> |
helmfile [ml-serve-codfw] Ran 'sync' command on namespace 'revscoring-articletopic' for release 'main' . |
[production] |
09:26 |
<elukey@deploy1003> |
helmfile [ml-serve-codfw] Ran 'sync' command on namespace 'revscoring-articlequality' for release 'main' . |
[production] |
09:24 |
<jmm@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host ganeti2020.codfw.wmnet |
[production] |
09:22 |
<elukey@deploy1003> |
helmfile [ml-serve-codfw] Ran 'sync' command on namespace 'revscoring-editquality-goodfaith' for release 'main' . |
[production] |
09:18 |
<elukey@deploy1003> |
helmfile [ml-serve-codfw] Ran 'sync' command on namespace 'revscoring-editquality-damaging' for release 'main' . |
[production] |
09:17 |
<elukey> |
manual restart of the waterline service on maps1009 |
[production] |
09:17 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.drain-node for draining ganeti node ganeti2020.codfw.wmnet |
[production] |
09:16 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host bast7001.wikimedia.org |
[production] |
09:15 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'es2031 (re)pooling @ 75%: Repooling', diff saved to https://phabricator.wikimedia.org/P75693 and previous config saved to /var/cache/conftool/dbconfig/20250430-091547-root.json |
[production] |
09:15 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'es1026 (re)pooling @ 75%: Repooling', diff saved to https://phabricator.wikimedia.org/P75692 and previous config saved to /var/cache/conftool/dbconfig/20250430-091534-root.json |
[production] |
09:12 |
<vgutierrez@cumin1002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host lvs1013.eqiad.wmnet |
[production] |
09:10 |
<jmm@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host bast7001.wikimedia.org |
[production] |