|
2025-11-24
§
|
| 12:54 |
<gehel@cumin2002> |
START - Cookbook sre.hosts.reboot-cluster |
[production] |
| 12:49 |
<gehel@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host wdqs2025.codfw.wmnet |
[production] |
| 12:47 |
<marostegui@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 4:00:00 on db1223.eqiad.wmnet with reason: Maintenance |
[production] |
| 12:45 |
<bwojtowicz@deploy2002> |
helmfile [ml-staging-codfw] Ran 'sync' command on namespace 'experimental' for release 'main' . |
[production] |
| 12:42 |
<gehel@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host wdqs2025.codfw.wmnet |
[production] |
| 12:32 |
<aikochou@deploy2002> |
helmfile [ml-staging-codfw] Ran 'sync' command on namespace 'revise-tone-task-generator' for release 'main' . |
[production] |
| 12:23 |
<marostegui@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 4:00:00 on dbstore1007.eqiad.wmnet with reason: Maintenance |
[production] |
| 12:17 |
<marostegui@cumin1003> |
END (PASS) - Cookbook sre.mysql.pool (exit_code=0) db1187 gradually with 4 steps - repool after schema change test |
[production] |
| 12:13 |
<marostegui@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 4:00:00 on db1240.eqiad.wmnet with reason: Maintenance |
[production] |
| 12:13 |
<marostegui@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db1212 (T410531)', diff saved to https://phabricator.wikimedia.org/P85515 and previous config saved to /var/cache/conftool/dbconfig/20251124-121341-marostegui.json |
[production] |
| 12:02 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host idp2005.wikimedia.org |
[production] |
| 12:01 |
<moritzm> |
installing Squid security updates |
[production] |
| 11:58 |
<jmm@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host idp2005.wikimedia.org |
[production] |
| 11:58 |
<marostegui@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db1212', diff saved to https://phabricator.wikimedia.org/P85513 and previous config saved to /var/cache/conftool/dbconfig/20251124-115834-marostegui.json |
[production] |
| 11:58 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host idp-test1005.wikimedia.org |
[production] |
| 11:56 |
<daniel@deploy2002> |
helmfile [codfw] DONE helmfile.d/services/rest-gateway: apply |
[production] |
| 11:56 |
<daniel@deploy2002> |
helmfile [codfw] START helmfile.d/services/rest-gateway: apply |
[production] |
| 11:54 |
<jmm@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host idp-test1005.wikimedia.org |
[production] |
| 11:53 |
<daniel@deploy2002> |
helmfile [eqiad] DONE helmfile.d/services/rest-gateway: apply |
[production] |
| 11:52 |
<daniel@deploy2002> |
helmfile [eqiad] START helmfile.d/services/rest-gateway: apply |
[production] |
| 11:46 |
<cgoubert@deploy2002> |
helmfile [staging] DONE helmfile.d/services/rest-gateway: apply |
[production] |
| 11:46 |
<cgoubert@deploy2002> |
helmfile [staging] START helmfile.d/services/rest-gateway: apply |
[production] |
| 11:44 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host idp-test2005.wikimedia.org |
[production] |
| 11:43 |
<marostegui@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db1212', diff saved to https://phabricator.wikimedia.org/P85511 and previous config saved to /var/cache/conftool/dbconfig/20251124-114326-marostegui.json |
[production] |
| 11:40 |
<jmm@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host idp-test2005.wikimedia.org |
[production] |
| 11:31 |
<marostegui@cumin1003> |
START - Cookbook sre.mysql.pool db1187 gradually with 4 steps - repool after schema change test |
[production] |
| 11:28 |
<marostegui@cumin1003> |
dbctl commit (dc=all): 'Depooling db1187 (T299441)', diff saved to https://phabricator.wikimedia.org/P85509 and previous config saved to /var/cache/conftool/dbconfig/20251124-112850-marostegui.json |
[production] |
| 11:28 |
<marostegui@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 4:00:00 on db1187.eqiad.wmnet with reason: Maintenance |
[production] |
| 11:28 |
<marostegui@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db1212 (T410531)', diff saved to https://phabricator.wikimedia.org/P85508 and previous config saved to /var/cache/conftool/dbconfig/20251124-112819-marostegui.json |
[production] |
| 11:26 |
<marostegui@cumin1003> |
END (ERROR) - Cookbook sre.mysql.pool (exit_code=97) db1187 gradually with 4 steps - repool after schema change test |
[production] |
| 11:25 |
<cgoubert@deploy2002> |
helmfile [staging] DONE helmfile.d/services/rest-gateway: apply |
[production] |
| 11:25 |
<cgoubert@deploy2002> |
helmfile [staging] START helmfile.d/services/rest-gateway: apply |
[production] |
| 11:24 |
<gehel@cumin1003> |
END (PASS) - Cookbook sre.hosts.reboot-cluster (exit_code=0) |
[production] |
| 11:23 |
<marostegui@cumin1003> |
START - Cookbook sre.mysql.pool db1187 gradually with 4 steps - repool after schema change test |
[production] |
| 11:23 |
<marostegui@cumin1003> |
dbctl commit (dc=all): 'Depooling db1212 (T410531)', diff saved to https://phabricator.wikimedia.org/P85506 and previous config saved to /var/cache/conftool/dbconfig/20251124-112306-marostegui.json |
[production] |
| 11:22 |
<marostegui@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 8:00:00 on 6 hosts with reason: Maintenance |
[production] |
| 11:22 |
<marostegui@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 4:00:00 on db1212.eqiad.wmnet with reason: Maintenance |
[production] |
| 11:22 |
<marostegui@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db1198 (T410531)', diff saved to https://phabricator.wikimedia.org/P85505 and previous config saved to /var/cache/conftool/dbconfig/20251124-112231-marostegui.json |
[production] |
| 11:21 |
<marostegui@cumin1003> |
dbctl commit (dc=all): 'Depooling db1187 (T299441)', diff saved to https://phabricator.wikimedia.org/P85504 and previous config saved to /var/cache/conftool/dbconfig/20251124-112111-marostegui.json |
[production] |
| 11:21 |
<marostegui@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 4:00:00 on db1187.eqiad.wmnet with reason: Maintenance |
[production] |
| 11:07 |
<marostegui@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db1198', diff saved to https://phabricator.wikimedia.org/P85503 and previous config saved to /var/cache/conftool/dbconfig/20251124-110723-marostegui.json |
[production] |
| 10:57 |
<cgoubert@deploy2002> |
helmfile [codfw] DONE helmfile.d/services/rest-gateway: apply |
[production] |
| 10:56 |
<cgoubert@deploy2002> |
helmfile [codfw] START helmfile.d/services/rest-gateway: apply |
[production] |
| 10:56 |
<cgoubert@deploy2002> |
helmfile [eqiad] DONE helmfile.d/services/rest-gateway: apply |
[production] |
| 10:56 |
<cgoubert@deploy2002> |
helmfile [eqiad] START helmfile.d/services/rest-gateway: apply |
[production] |
| 10:56 |
<btullis@deploy2002> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s-services/growthbook: apply |
[production] |
| 10:56 |
<btullis@deploy2002> |
helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/growthbook: apply |
[production] |
| 10:56 |
<cgoubert@deploy2002> |
helmfile [eqiad] DONE helmfile.d/services/rest-gateway: apply |
[production] |
| 10:55 |
<cgoubert@deploy2002> |
helmfile [eqiad] START helmfile.d/services/rest-gateway: apply |
[production] |
| 10:52 |
<cgoubert@deploy2002> |
helmfile [codfw] DONE helmfile.d/services/api-gateway: apply |
[production] |