2025-07-17
§
|
11:24 |
<stevemunene@cumin1003> |
END (PASS) - Cookbook sre.hadoop.init-hadoop-workers (exit_code=0) for hosts an-worker1176.eqiad.wmnet |
[production] |
11:24 |
<elukey@cumin1003> |
START - Cookbook sre.hosts.provision for host ml-serve1012.mgmt.eqiad.wmnet with chassis set policy FORCE_RESTART |
[production] |
11:22 |
<stevemunene@cumin1003> |
START - Cookbook sre.hadoop.init-hadoop-workers for hosts an-worker1176.eqiad.wmnet |
[production] |
11:22 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'db2227 (re)pooling @ 25%: 10', diff saved to https://phabricator.wikimedia.org/P79325 and previous config saved to /var/cache/conftool/dbconfig/20250717-112220-root.json |
[production] |
11:17 |
<marostegui> |
Restart pc4 T399540 |
[production] |
11:17 |
<marostegui@cumin1002> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1:00:00 on pc2014.codfw.wmnet,pc1014.eqiad.wmnet with reason: Maintenance |
[production] |
11:15 |
<elukey@cumin1003> |
END (PASS) - Cookbook sre.ganeti.reboot-vm (exit_code=0) for VM install1004.wikimedia.org |
[production] |
11:14 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'db1166 (re)pooling @ 25%: 10', diff saved to https://phabricator.wikimedia.org/P79323 and previous config saved to /var/cache/conftool/dbconfig/20250717-111454-root.json |
[production] |
11:14 |
<marostegui@cumin1002> |
END (PASS) - Cookbook sre.mysql.parsercache (exit_code=0) |
[production] |
11:14 |
<marostegui@cumin1002> |
START - Cookbook sre.mysql.parsercache |
[production] |
11:11 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Depool db2227 for migration to mariadb 10.11', diff saved to https://phabricator.wikimedia.org/P79321 and previous config saved to /var/cache/conftool/dbconfig/20250717-111132-marostegui.json |
[production] |
11:11 |
<marostegui@cumin1002> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1:00:00 on db2227.codfw.wmnet with reason: Maintenance |
[production] |
11:08 |
<elukey@cumin1003> |
START - Cookbook sre.ganeti.reboot-vm for VM install1004.wikimedia.org |
[production] |
11:04 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Depool db1166 for migration to mariadb 10.11', diff saved to https://phabricator.wikimedia.org/P79320 and previous config saved to /var/cache/conftool/dbconfig/20250717-110405-marostegui.json |
[production] |
11:04 |
<marostegui@cumin1002> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1:00:00 on db1166.eqiad.wmnet with reason: Maintenance |
[production] |
11:00 |
<elukey@cumin1003> |
END (ERROR) - Cookbook sre.hosts.provision (exit_code=97) for host ml-serve1012.mgmt.eqiad.wmnet with chassis set policy FORCE_RESTART |
[production] |
10:57 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Depooling db1182 (T399249)', diff saved to https://phabricator.wikimedia.org/P79319 and previous config saved to /var/cache/conftool/dbconfig/20250717-105741-marostegui.json |
[production] |
10:57 |
<marostegui@cumin1002> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 6:00:00 on db1182.eqiad.wmnet with reason: Maintenance |
[production] |
10:57 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db1162 (T399249)', diff saved to https://phabricator.wikimedia.org/P79318 and previous config saved to /var/cache/conftool/dbconfig/20250717-105719-marostegui.json |
[production] |
10:52 |
<jiji@deploy1003> |
helmfile [codfw] DONE helmfile.d/services/mw-experimental: apply |
[production] |
10:51 |
<jiji@deploy1003> |
helmfile [codfw] START helmfile.d/services/mw-experimental: apply |
[production] |
10:50 |
<jiji@deploy1003> |
helmfile [eqiad] DONE helmfile.d/services/mw-experimental: apply |
[production] |
10:49 |
<jiji@deploy1003> |
helmfile [eqiad] START helmfile.d/services/mw-experimental: apply |
[production] |
10:49 |
<elukey@cumin1003> |
START - Cookbook sre.hosts.provision for host ml-serve1012.mgmt.eqiad.wmnet with chassis set policy FORCE_RESTART |
[production] |
10:49 |
<jiji@deploy1003> |
helmfile [eqiad] DONE helmfile.d/services/mw-experimental: apply |
[production] |
10:48 |
<jiji@deploy1003> |
helmfile [eqiad] START helmfile.d/services/mw-experimental: apply |
[production] |
10:48 |
<elukey@cumin1003> |
END (FAIL) - Cookbook sre.hosts.provision (exit_code=99) for host ml-serve1012.mgmt.eqiad.wmnet with chassis set policy FORCE_RESTART |
[production] |
10:48 |
<elukey@cumin1003> |
START - Cookbook sre.hosts.provision for host ml-serve1012.mgmt.eqiad.wmnet with chassis set policy FORCE_RESTART |
[production] |
10:42 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db1162', diff saved to https://phabricator.wikimedia.org/P79317 and previous config saved to /var/cache/conftool/dbconfig/20250717-104211-marostegui.json |
[production] |
10:28 |
<jgiannelos@deploy1003> |
helmfile [codfw] DONE helmfile.d/services/mobileapps: apply |
[production] |
10:27 |
<jgiannelos@deploy1003> |
helmfile [codfw] START helmfile.d/services/mobileapps: apply |
[production] |
10:27 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db1162', diff saved to https://phabricator.wikimedia.org/P79316 and previous config saved to /var/cache/conftool/dbconfig/20250717-102704-marostegui.json |
[production] |
10:24 |
<jgiannelos@deploy1003> |
helmfile [eqiad] DONE helmfile.d/services/mobileapps: apply |
[production] |
10:24 |
<jgiannelos@deploy1003> |
helmfile [eqiad] START helmfile.d/services/mobileapps: apply |
[production] |
10:23 |
<elukey@cumin1003> |
END (FAIL) - Cookbook sre.hosts.provision (exit_code=99) for host ml-serve1012.mgmt.eqiad.wmnet with chassis set policy FORCE_RESTART |
[production] |
10:23 |
<jgiannelos@deploy1003> |
helmfile [staging] DONE helmfile.d/services/mobileapps: apply |
[production] |
10:23 |
<jgiannelos@deploy1003> |
helmfile [staging] START helmfile.d/services/mobileapps: apply |
[production] |
10:18 |
<elukey@cumin1003> |
START - Cookbook sre.hosts.provision for host ml-serve1012.mgmt.eqiad.wmnet with chassis set policy FORCE_RESTART |
[production] |
10:16 |
<elukey@cumin1003> |
END (FAIL) - Cookbook sre.hosts.provision (exit_code=99) for host ml-serve1012.mgmt.eqiad.wmnet with chassis set policy FORCE_RESTART |
[production] |
10:16 |
<cmooney@cumin1003> |
END (PASS) - Cookbook sre.network.peering (exit_code=0) with action 'configure' for AS: 30182 |
[production] |
10:16 |
<elukey@cumin1003> |
START - Cookbook sre.hosts.provision for host ml-serve1012.mgmt.eqiad.wmnet with chassis set policy FORCE_RESTART |
[production] |
10:15 |
<elukey@cumin1003> |
END (FAIL) - Cookbook sre.hosts.provision (exit_code=99) for host ml-serve1012.mgmt.eqiad.wmnet with chassis set policy FORCE_RESTART |
[production] |
10:14 |
<cmooney@cumin1003> |
START - Cookbook sre.network.peering with action 'configure' for AS: 30182 |
[production] |
10:14 |
<elukey@cumin1003> |
START - Cookbook sre.hosts.provision for host ml-serve1012.mgmt.eqiad.wmnet with chassis set policy FORCE_RESTART |
[production] |
10:11 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db1162 (T399249)', diff saved to https://phabricator.wikimedia.org/P79315 and previous config saved to /var/cache/conftool/dbconfig/20250717-101156-marostegui.json |
[production] |
09:36 |
<jakob@deploy1003> |
helmfile [eqiad] DONE helmfile.d/services/wikidata-query-gui: apply |
[production] |
09:36 |
<jakob@deploy1003> |
helmfile [eqiad] START helmfile.d/services/wikidata-query-gui: apply |
[production] |
09:35 |
<jakob@deploy1003> |
helmfile [codfw] DONE helmfile.d/services/wikidata-query-gui: apply |
[production] |
09:35 |
<jakob@deploy1003> |
helmfile [codfw] START helmfile.d/services/wikidata-query-gui: apply |
[production] |
09:34 |
<jakob@deploy1003> |
helmfile [staging] DONE helmfile.d/services/wikidata-query-gui: apply |
[production] |