2023-11-16
§
|
14:51 |
<cgoubert@deploy2002> |
helmfile [codfw] DONE helmfile.d/services/mw-api-int: apply |
[production] |
14:51 |
<cgoubert@deploy2002> |
helmfile [codfw] START helmfile.d/services/mw-api-int: apply |
[production] |
14:51 |
<cgoubert@deploy2002> |
helmfile [eqiad] DONE helmfile.d/services/mw-web: apply |
[production] |
14:50 |
<cgoubert@deploy2002> |
helmfile [eqiad] START helmfile.d/services/mw-web: apply |
[production] |
14:50 |
<cgoubert@deploy2002> |
helmfile [codfw] DONE helmfile.d/services/mw-web: apply |
[production] |
14:50 |
<cgoubert@deploy2002> |
helmfile [codfw] START helmfile.d/services/mw-web: apply |
[production] |
14:50 |
<cgoubert@deploy2002> |
helmfile [eqiad] DONE helmfile.d/services/mw-debug: apply |
[production] |
14:49 |
<cgoubert@deploy2002> |
helmfile [eqiad] START helmfile.d/services/mw-debug: apply |
[production] |
14:49 |
<cgoubert@deploy2002> |
helmfile [codfw] DONE helmfile.d/services/mw-debug: apply |
[production] |
14:49 |
<arnaudb@cumin1001> |
START - Cookbook sre.hosts.decommission for hosts db1136.eqiad.wmnet |
[production] |
14:49 |
<cgoubert@deploy2002> |
helmfile [codfw] START helmfile.d/services/mw-debug: apply |
[production] |
14:48 |
<claime> |
Redeploying mw-on-k8s for T350430 |
[production] |
14:46 |
<ayounsi@cumin1001> |
END (PASS) - Cookbook sre.network.peering (exit_code=0) with action 'configure' for AS: 141626 |
[production] |
14:45 |
<ayounsi@cumin1001> |
START - Cookbook sre.network.peering with action 'configure' for AS: 141626 |
[production] |
14:43 |
<jbond> |
re-enable puppet on puppet7 agents |
[production] |
14:43 |
<kartik@deploy2002> |
Finished scap: Backport for [[gerrit:974242|TranslatablePageMarker: Add patrol status for translatable page (T351273)]] (duration: 21m 41s) |
[production] |
14:37 |
<kartik@deploy2002> |
kartik and abi: Continuing with sync |
[production] |
14:23 |
<kartik@deploy2002> |
kartik and abi: Backport for [[gerrit:974242|TranslatablePageMarker: Add patrol status for translatable page (T351273)]] synced to the testservers (https://wikitech.wikimedia.org/wiki/Mwdebug) |
[production] |
14:21 |
<kartik@deploy2002> |
Started scap: Backport for [[gerrit:974242|TranslatablePageMarker: Add patrol status for translatable page (T351273)]] |
[production] |
14:20 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.puppet.migrate-role (exit_code=0) for role: kafka::monitoring_bullseye |
[production] |
14:15 |
<jbond> |
stop puppet on puppet7 agents to debug puppet performance |
[production] |
14:10 |
<hnowlan@cumin1001> |
END (PASS) - Cookbook sre.loadbalancer.restart-pybal (exit_code=0) rolling-restart of pybal on P{lvs1019*,lvs2013*} and A:lvs (T349796) |
[production] |
14:09 |
<hnowlan@cumin1001> |
START - Cookbook sre.loadbalancer.restart-pybal rolling-restart of pybal on P{lvs1019*,lvs2013*} and A:lvs (T349796) |
[production] |
14:08 |
<hnowlan@cumin1001> |
END (PASS) - Cookbook sre.loadbalancer.restart-pybal (exit_code=0) rolling-restart of pybal on P{lvs1020*,lvs2014*} and A:lvs (T349796) |
[production] |
14:07 |
<jmm@cumin2002> |
START - Cookbook sre.puppet.migrate-role for role: kafka::monitoring_bullseye |
[production] |
14:07 |
<hnowlan@cumin1001> |
START - Cookbook sre.loadbalancer.restart-pybal rolling-restart of pybal on P{lvs1020*,lvs2014*} and A:lvs (T349796) |
[production] |
14:03 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.puppet.migrate-role (exit_code=0) for role: prometheus |
[production] |
13:49 |
<jmm@cumin2002> |
START - Cookbook sre.puppet.migrate-role for role: prometheus |
[production] |
13:47 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ms-be2050.codfw.wmnet |
[production] |
13:44 |
<jynus> |
restart bacula at backup1001 |
[production] |
13:40 |
<jmm@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host ms-be2050.codfw.wmnet |
[production] |
13:39 |
<jbond@cumin1001> |
END (PASS) - Cookbook sre.puppet.migrate-host (exit_code=0) for host backup2001.codfw.wmnet |
[production] |
13:37 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.puppet.migrate-host (exit_code=0) for host ms-be2050.codfw.wmnet |
[production] |
13:34 |
<sergi0> |
stat1008: Add `sowiki`, `stwiki`, `tgwiki` and `ugwiki` to `/srv/published/datasets/one-off/research-mwaddlink/wikis.txt` (T340944) |
[production] |
13:33 |
<jbond@cumin1001> |
START - Cookbook sre.puppet.migrate-host for host backup2001.codfw.wmnet |
[production] |
13:30 |
<jbond@cumin1001> |
END (PASS) - Cookbook sre.puppet.migrate-host (exit_code=0) for host dbprov2001.codfw.wmnet |
[production] |
13:29 |
<jmm@cumin2002> |
START - Cookbook sre.puppet.migrate-host for host ms-be2050.codfw.wmnet |
[production] |
13:28 |
<jmm@cumin2002> |
END (FAIL) - Cookbook sre.puppet.migrate-host (exit_code=99) for host ms-be2050.codfw.wmnet |
[production] |
13:21 |
<jbond@cumin1001> |
START - Cookbook sre.puppet.migrate-host for host dbprov2001.codfw.wmnet |
[production] |
13:19 |
<jbond@cumin1001> |
END (PASS) - Cookbook sre.puppet.migrate-host (exit_code=0) for host backup1001.eqiad.wmnet |
[production] |
13:17 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ms-fe1014.eqiad.wmnet |
[production] |
13:10 |
<jbond@cumin1001> |
START - Cookbook sre.puppet.migrate-host for host backup1001.eqiad.wmnet |
[production] |
13:09 |
<jbond@cumin1001> |
END (PASS) - Cookbook sre.puppet.migrate-host (exit_code=0) for host db1133.eqiad.wmnet |
[production] |
13:09 |
<jmm@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host ms-fe1014.eqiad.wmnet |
[production] |
13:02 |
<jbond@cumin1001> |
START - Cookbook sre.puppet.migrate-host for host db1133.eqiad.wmnet |
[production] |
13:00 |
<arnaudb@cumin1001> |
START - Cookbook sre.mysql.clone of db1141.eqiad.wmnet onto db1241.eqiad.wmnet |
[production] |
12:56 |
<arnaudb@cumin1001> |
dbctl commit (dc=all): 'cloning db1141 - T350458', diff saved to https://phabricator.wikimedia.org/P53516 and previous config saved to /var/cache/conftool/dbconfig/20231116-125649-arnaudb.json |
[production] |
12:56 |
<cmooney@cumin1001> |
END (PASS) - Cookbook sre.deploy.python-code (exit_code=0) homer to cumin2002.codfw.wmnet,cumin1001.eqiad.wmnet with reason: Release v0.6.4 - cmooney@cumin1001 |
[production] |
12:55 |
<arnaudb@cumin1001> |
dbctl commit (dc=all): 'cloning db1141 - T350458', diff saved to https://phabricator.wikimedia.org/P53515 and previous config saved to /var/cache/conftool/dbconfig/20231116-125515-arnaudb.json |
[production] |
12:55 |
<arnaudb@cumin1001> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on db1241.eqiad.wmnet with reason: provisionning db1241.eqiad.wmnet - T344036 |
[production] |