|
2026-05-27
§
|
| 16:38 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db1224', diff saved to https://phabricator.wikimedia.org/P93290 and previous config saved to /var/cache/conftool/dbconfig/20260527-163808-fceratto.json |
[production] |
| 16:37 |
<cwilliams@cumin1003> |
END (PASS) - Cookbook sre.mysql.pool (exit_code=0) pool db2163: Repooling after testing patch |
[production] |
| 16:28 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db1224', diff saved to https://phabricator.wikimedia.org/P93287 and previous config saved to /var/cache/conftool/dbconfig/20260527-162800-fceratto.json |
[production] |
| 16:17 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db1224 (T426633)', diff saved to https://phabricator.wikimedia.org/P93285 and previous config saved to /var/cache/conftool/dbconfig/20260527-161753-fceratto.json |
[production] |
| 16:14 |
<otto@deploy1003> |
helmfile [codfw] DONE helmfile.d/services/eventstreams: apply |
[production] |
| 16:13 |
<otto@deploy1003> |
helmfile [codfw] START helmfile.d/services/eventstreams: apply |
[production] |
| 16:13 |
<otto@deploy1003> |
helmfile [eqiad] DONE helmfile.d/services/eventstreams: apply |
[production] |
| 16:12 |
<otto@deploy1003> |
helmfile [eqiad] START helmfile.d/services/eventstreams: apply |
[production] |
| 16:11 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Depooling db1224 (T426633)', diff saved to https://phabricator.wikimedia.org/P93284 and previous config saved to /var/cache/conftool/dbconfig/20260527-161101-fceratto.json |
[production] |
| 16:10 |
<fceratto@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on db1224.eqiad.wmnet with reason: Maintenance |
[production] |
| 16:10 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db1220 (T426633)', diff saved to https://phabricator.wikimedia.org/P93283 and previous config saved to /var/cache/conftool/dbconfig/20260527-161034-fceratto.json |
[production] |
| 16:10 |
<otto@deploy1003> |
helmfile [staging] DONE helmfile.d/services/eventstreams: apply |
[production] |
| 16:10 |
<cwilliams@cumin1003> |
END (PASS) - Cookbook sre.mysql.pool (exit_code=0) pool db1178: Recovering from failure in cookbook |
[production] |
| 16:10 |
<otto@deploy1003> |
helmfile [staging] START helmfile.d/services/eventstreams: apply |
[production] |
| 16:05 |
<sukhe@cumin1003> |
END (ERROR) - Cookbook sre.hosts.reimage (exit_code=97) for host durum5003.eqsin.wmnet with OS trixie |
[production] |
| 16:03 |
<brett@cumin2002> |
cookbooks.sre.cdn.roll-reboot finished rebooting cp6016.drmrs.wmnet |
[production] |
| 16:00 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db1220', diff saved to https://phabricator.wikimedia.org/P93280 and previous config saved to /var/cache/conftool/dbconfig/20260527-160027-fceratto.json |
[production] |
| 15:59 |
<brett@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host lvs1017.eqiad.wmnet |
[production] |
| 15:53 |
<cwilliams@cumin1003> |
END (PASS) - Cookbook sre.hosts.remove-downtime (exit_code=0) for db2163.codfw.wmnet |
[production] |
| 15:53 |
<cwilliams@cumin1003> |
START - Cookbook sre.hosts.remove-downtime for db2163.codfw.wmnet |
[production] |
| 15:52 |
<brett@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host lvs1017.eqiad.wmnet |
[production] |
| 15:52 |
<cwilliams@cumin1003> |
START - Cookbook sre.mysql.pool pool db2163: Repooling after testing patch |
[production] |
| 15:52 |
<brett@cumin2002> |
START - Cookbook sre.cdn.roll-reboot rolling reboot on P{cp6016.drmrs.wmnet,cp[1112,1114].eqiad.wmnet,cp[5024,5031-5032].eqsin.wmnet} and A:cp |
[production] |
| 15:51 |
<cwilliams@cumin1003> |
END (PASS) - Cookbook sre.mysql.depool (exit_code=0) depool db2163: Testing cookbook |
[production] |
| 15:50 |
<cwilliams@cumin1003> |
START - Cookbook sre.mysql.depool depool db2163: Testing cookbook |
[production] |
| 15:50 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db1220', diff saved to https://phabricator.wikimedia.org/P93276 and previous config saved to /var/cache/conftool/dbconfig/20260527-155019-fceratto.json |
[production] |
| 15:45 |
<javiermonton@deploy1003> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s-services/webrequest-page-view-next: apply |
[production] |
| 15:45 |
<javiermonton@deploy1003> |
helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/webrequest-page-view-next: apply |
[production] |
| 15:40 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db1220 (T426633)', diff saved to https://phabricator.wikimedia.org/P93274 and previous config saved to /var/cache/conftool/dbconfig/20260527-154011-fceratto.json |
[production] |
| 15:33 |
<cwilliams@cumin1003> |
END (PASS) - Cookbook sre.mysql.major-upgrade (exit_code=0) |
[production] |
| 15:33 |
<cwilliams@cumin1003> |
END (PASS) - Cookbook sre.mysql.pool (exit_code=0) pool db2163: Migration of db2163.codfw.wmnet completed |
[production] |
| 15:32 |
<cwilliams@cumin1003> |
START - Cookbook sre.mysql.pool pool db2163: Migration of db2163.codfw.wmnet completed |
[production] |
| 15:32 |
<cwilliams@cumin1003> |
END (ERROR) - Cookbook sre.mysql.pool (exit_code=97) pool db2163: Migration of db2163.codfw.wmnet completed |
[production] |
| 15:24 |
<cwilliams@cumin1003> |
START - Cookbook sre.mysql.pool pool db1178: Recovering from failure in cookbook |
[production] |
| 15:22 |
<cwilliams@cumin1003> |
END (PASS) - Cookbook sre.hosts.remove-downtime (exit_code=0) for db1178.eqiad.wmnet |
[production] |
| 15:22 |
<cwilliams@cumin1003> |
START - Cookbook sre.hosts.remove-downtime for db1178.eqiad.wmnet |
[production] |
| 15:19 |
<sukhe@cumin1003> |
START - Cookbook sre.hosts.reimage for host durum5003.eqsin.wmnet with OS trixie |
[production] |
| 15:19 |
<cdanis> |
💙cdanis@cp4047.ulsfo.wmnet ~ 🕦☕ sudo apt install lua5.4-ciderbloom lua5.4-ciderbloom-dbgsym |
[production] |
| 15:13 |
<cdanis> |
💙cdanis@cp5026.eqsin.wmnet ~ 🕚☕ sudo apt install lua5.4-ciderbloom lua5.4-ciderbloom-dbgsym |
[production] |
| 15:12 |
<javiermonton@deploy1003> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s-services/webrequest-page-view-next: apply |
[production] |
| 15:12 |
<javiermonton@deploy1003> |
helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/webrequest-page-view-next: apply |
[production] |
| 15:11 |
<javiermonton@deploy1003> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s-services/webrequest-page-view-next: apply |
[production] |
| 15:11 |
<javiermonton@deploy1003> |
helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/webrequest-page-view-next: apply |
[production] |
| 15:11 |
<cwilliams@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on db1178.eqiad.wmnet with reason: Icinga wait failed during run |
[production] |
| 15:10 |
<javiermonton@deploy1003> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s-services/webrequest-page-view-next: apply |
[production] |
| 15:10 |
<javiermonton@deploy1003> |
helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/webrequest-page-view-next: apply |
[production] |
| 15:10 |
<javiermonton@deploy1003> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s-services/webrequest-page-view-next: apply |
[production] |
| 15:09 |
<javiermonton@deploy1003> |
helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/webrequest-page-view-next: apply |
[production] |
| 15:09 |
<cdanis> |
💔cdanis@apt1002.wikimedia.org ~ 🕚☕ sudo -i reprepro --component main --restrict cidergrinder update trixie-wikimedia |
[production] |
| 15:08 |
<javiermonton@deploy1003> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s-services/webrequest-page-view-next: apply |
[production] |