|
2026-05-27
§
|
| 09:34 |
<jayme@deploy1003> |
helmfile [staging-codfw] START helmfile.d/admin 'apply'. |
[production] |
| 09:28 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Depooling db2173 (T426633)', diff saved to https://phabricator.wikimedia.org/P93202 and previous config saved to /var/cache/conftool/dbconfig/20260527-092842-fceratto.json |
[production] |
| 09:28 |
<fceratto@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on db2173.codfw.wmnet with reason: Maintenance |
[production] |
| 09:28 |
<cwilliams@cumin1003> |
START - Cookbook sre.mysql.pool pool db1203: Migration of db1203.eqiad.wmnet completed |
[production] |
| 09:28 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db2170 (T426633)', diff saved to https://phabricator.wikimedia.org/P93200 and previous config saved to /var/cache/conftool/dbconfig/20260527-092814-fceratto.json |
[production] |
| 09:27 |
<marostegui@cumin1003> |
START - Cookbook sre.hosts.reimage for host es1050.eqiad.wmnet with OS trixie |
[production] |
| 09:26 |
<marostegui@cumin1003> |
END (PASS) - Cookbook sre.mysql.depool (exit_code=0) depool es1050: Upgrading es1050.eqiad.wmnet |
[production] |
| 09:25 |
<marostegui@cumin1003> |
START - Cookbook sre.mysql.depool depool es1050: Upgrading es1050.eqiad.wmnet |
[production] |
| 09:25 |
<marostegui@cumin1003> |
START - Cookbook sre.mysql.major-upgrade |
[production] |
| 09:25 |
<marostegui@cumin1003> |
END (PASS) - Cookbook sre.mysql.pool (exit_code=0) pool es1050: repool after maintenance |
[production] |
| 09:25 |
<marostegui@cumin1003> |
START - Cookbook sre.mysql.pool pool es1050: repool after maintenance |
[production] |
| 09:24 |
<cwilliams@cumin1003> |
START - Cookbook sre.mysql.pool pool db2166: Migration of db2166.codfw.wmnet completed |
[production] |
| 09:23 |
<marostegui@cumin1003> |
END (PASS) - Cookbook sre.mysql.pool (exit_code=0) pool es2051: repool after maintenance |
[production] |
| 09:19 |
<cwilliams@cumin1003> |
END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host db1203.eqiad.wmnet with OS trixie |
[production] |
| 09:18 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db2170', diff saved to https://phabricator.wikimedia.org/P93196 and previous config saved to /var/cache/conftool/dbconfig/20260527-091806-fceratto.json |
[production] |
| 09:16 |
<cwilliams@cumin1003> |
END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host db2166.codfw.wmnet with OS trixie |
[production] |
| 09:08 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db2170', diff saved to https://phabricator.wikimedia.org/P93194 and previous config saved to /var/cache/conftool/dbconfig/20260527-090759-fceratto.json |
[production] |
| 09:03 |
<fabfur@cumin1003> |
conftool action : set/pooled=yes; selector: name=cp3074.* |
[production] |
| 09:03 |
<fabfur@cumin1003> |
conftool action : set/pooled=yes; selector: name=cp3066.* |
[production] |
| 09:02 |
<fabfur> |
repooling cp3074 and cp3066 (T419825) |
[production] |
| 09:02 |
<slyngshede@cumin1003> |
END (PASS) - Cookbook sre.hosts.remove-downtime (exit_code=0) for cp6015.drmrs.wmnet |
[production] |
| 09:02 |
<slyngshede@cumin1003> |
START - Cookbook sre.hosts.remove-downtime for cp6015.drmrs.wmnet |
[production] |
| 09:02 |
<cwilliams@cumin1003> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on db1203.eqiad.wmnet with reason: host reimage |
[production] |
| 09:02 |
<slyngshede@cumin1003> |
conftool action : set/pooled=yes; selector: name=cp6015.* |
[production] |
| 08:59 |
<cwilliams@cumin1003> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on db2166.codfw.wmnet with reason: host reimage |
[production] |
| 08:57 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db2170 (T426633)', diff saved to https://phabricator.wikimedia.org/P93193 and previous config saved to /var/cache/conftool/dbconfig/20260527-085751-fceratto.json |
[production] |
| 08:55 |
<cwilliams@cumin1003> |
START - Cookbook sre.hosts.downtime for 2:00:00 on db1203.eqiad.wmnet with reason: host reimage |
[production] |
| 08:54 |
<Emperor> |
restart swift on ms-fe2011 T360913 |
[production] |
| 08:54 |
<jayme@deploy1003> |
helmfile [aux-k8s-codfw] DONE helmfile.d/admin 'apply'. |
[production] |
| 08:54 |
<cwilliams@cumin1003> |
START - Cookbook sre.hosts.downtime for 2:00:00 on db2166.codfw.wmnet with reason: host reimage |
[production] |
| 08:54 |
<jayme@deploy1003> |
helmfile [aux-k8s-codfw] START helmfile.d/admin 'apply'. |
[production] |
| 08:53 |
<jayme@deploy1003> |
helmfile [aux-k8s-eqiad] DONE helmfile.d/admin 'apply'. |
[production] |
| 08:53 |
<jayme@deploy1003> |
helmfile [aux-k8s-eqiad] START helmfile.d/admin 'apply'. |
[production] |
| 08:53 |
<jayme@deploy1003> |
helmfile [dse-k8s-codfw] DONE helmfile.d/admin 'apply'. |
[production] |
| 08:53 |
<jayme@deploy1003> |
helmfile [dse-k8s-codfw] START helmfile.d/admin 'apply'. |
[production] |
| 08:53 |
<jayme@deploy1003> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/admin 'apply'. |
[production] |
| 08:52 |
<jayme@deploy1003> |
helmfile [dse-k8s-eqiad] START helmfile.d/admin 'apply'. |
[production] |
| 08:52 |
<jayme@deploy1003> |
helmfile [ml-serve-codfw] DONE helmfile.d/admin 'apply'. |
[production] |
| 08:52 |
<jayme@deploy1003> |
helmfile [ml-serve-codfw] START helmfile.d/admin 'apply'. |
[production] |
| 08:52 |
<jayme@deploy1003> |
helmfile [ml-serve-eqiad] DONE helmfile.d/admin 'apply'. |
[production] |
| 08:52 |
<jayme@deploy1003> |
helmfile [ml-serve-eqiad] START helmfile.d/admin 'apply'. |
[production] |
| 08:52 |
<jayme@deploy1003> |
helmfile [codfw] DONE helmfile.d/admin 'apply'. |
[production] |
| 08:51 |
<jayme@deploy1003> |
helmfile [codfw] START helmfile.d/admin 'apply'. |
[production] |
| 08:51 |
<jayme@deploy1003> |
helmfile [eqiad] DONE helmfile.d/admin 'apply'. |
[production] |
| 08:51 |
<fabfur@cumin1003> |
conftool action : set/pooled=no; selector: name=cp3066.* |
[production] |
| 08:51 |
<fabfur@cumin1003> |
conftool action : set/pooled=no; selector: name=cp3074.* |
[production] |
| 08:51 |
<jayme@deploy1003> |
helmfile [eqiad] START helmfile.d/admin 'apply'. |
[production] |
| 08:50 |
<fabfur> |
depooling and installing haproxy-awslc on cp3074 and cp3066 (T419825) |
[production] |
| 08:50 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Depooling db2170 (T426633)', diff saved to https://phabricator.wikimedia.org/P93191 and previous config saved to /var/cache/conftool/dbconfig/20260527-085024-fceratto.json |
[production] |
| 08:50 |
<fceratto@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on db2170.codfw.wmnet with reason: Maintenance |
[production] |