2025-07-18
§
|
13:45 |
<marostegui@cumin1002> |
START - Cookbook sre.mysql.pool db2242 gradually with 4 steps - Upgrade of db2242.codfw.wmnet completed |
[production] |
13:41 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'db1212 (re)pooling @ 50%: 10', diff saved to https://phabricator.wikimedia.org/P79400 and previous config saved to /var/cache/conftool/dbconfig/20250718-134144-root.json |
[production] |
13:40 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'es1048 (re)pooling @ 100%: Repooling', diff saved to https://phabricator.wikimedia.org/P79399 and previous config saved to /var/cache/conftool/dbconfig/20250718-134021-root.json |
[production] |
13:39 |
<marostegui@cumin1002> |
END (PASS) - Cookbook sre.mysql.depool (exit_code=0) db2242 - Upgrading db2242.codfw.wmnet |
[production] |
13:39 |
<marostegui@cumin1002> |
START - Cookbook sre.mysql.depool db2242 - Upgrading db2242.codfw.wmnet |
[production] |
13:39 |
<marostegui@cumin1002> |
START - Cookbook sre.mysql.upgrade for db2242.codfw.wmnet |
[production] |
13:38 |
<marostegui@cumin1002> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1:00:00 on db2242.codfw.wmnet with reason: Maintenance |
[production] |
13:37 |
<elukey@cumin1003> |
END (ERROR) - Cookbook sre.hosts.reimage (exit_code=97) for host ml-serve1012.eqiad.wmnet with OS bookworm |
[production] |
13:35 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Depooling db2149 (T399249)', diff saved to https://phabricator.wikimedia.org/P79397 and previous config saved to /var/cache/conftool/dbconfig/20250718-133533-marostegui.json |
[production] |
13:35 |
<marostegui@cumin1002> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 6:00:00 on db2149.codfw.wmnet with reason: Maintenance |
[production] |
13:34 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db1259 (T399249)', diff saved to https://phabricator.wikimedia.org/P79396 and previous config saved to /var/cache/conftool/dbconfig/20250718-133424-marostegui.json |
[production] |
13:30 |
<elukey@cumin1003> |
START - Cookbook sre.hosts.reimage for host ml-serve1012.eqiad.wmnet with OS bookworm |
[production] |
13:26 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'db1212 (re)pooling @ 25%: 10', diff saved to https://phabricator.wikimedia.org/P79395 and previous config saved to /var/cache/conftool/dbconfig/20250718-132638-root.json |
[production] |
13:25 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'es1048 (re)pooling @ 75%: Repooling', diff saved to https://phabricator.wikimedia.org/P79394 and previous config saved to /var/cache/conftool/dbconfig/20250718-132515-root.json |
[production] |
13:23 |
<jynus@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 3 days, 0:00:00 on backup1007.eqiad.wmnet with reason: failed disk |
[production] |
13:19 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db1259', diff saved to https://phabricator.wikimedia.org/P79393 and previous config saved to /var/cache/conftool/dbconfig/20250718-131917-marostegui.json |
[production] |
13:17 |
<fceratto@deploy1003> |
helmfile [aux-k8s-eqiad] 'sync' command on namespace 'zarcillo' for release 'main' . |
[production] |
13:17 |
<fceratto@deploy1003> |
helmfile [aux-k8s-eqiad] 'sync' command on namespace 'zarcillo' for release 'main' . |
[production] |
13:16 |
<fceratto@deploy1003> |
helmfile [aux-k8s-eqiad] 'sync' command on namespace 'zarcillo' for release 'main' . |
[production] |
13:15 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Depool db1212 for migration to mariadb 10.11', diff saved to https://phabricator.wikimedia.org/P79392 and previous config saved to /var/cache/conftool/dbconfig/20250718-131554-marostegui.json |
[production] |
13:15 |
<marostegui@cumin1002> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1:00:00 on db1212.eqiad.wmnet with reason: Maintenance |
[production] |
13:15 |
<fceratto@deploy1003> |
helmfile [aux-k8s-eqiad] 'sync' command on namespace 'zarcillo' for release 'main' . |
[production] |
13:15 |
<marostegui@cumin1002> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 3:00:00 on 10 hosts with reason: Maintenance |
[production] |
13:14 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'db1198 (re)pooling @ 100%: 10', diff saved to https://phabricator.wikimedia.org/P79391 and previous config saved to /var/cache/conftool/dbconfig/20250718-131431-root.json |
[production] |
13:14 |
<fceratto@deploy1003> |
helmfile [aux-k8s-eqiad] 'sync' command on namespace 'zarcillo' for release 'main' . |
[production] |
13:12 |
<fceratto@deploy1003> |
helmfile [aux-k8s-eqiad] 'sync' command on namespace 'zarcillo' for release 'main' . |
[production] |
13:12 |
<gmodena@deploy1003> |
helmfile [staging] DONE helmfile.d/services/mw-page-content-change-enrich: apply |
[production] |
13:12 |
<gmodena@deploy1003> |
helmfile [staging] START helmfile.d/services/mw-page-content-change-enrich: apply |
[production] |
13:12 |
<fceratto@deploy1003> |
helmfile [aux-k8s-eqiad] 'sync' command on namespace 'zarcillo' for release 'main' . |
[production] |
13:10 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'es1048 (re)pooling @ 65%: Repooling', diff saved to https://phabricator.wikimedia.org/P79390 and previous config saved to /var/cache/conftool/dbconfig/20250718-131009-root.json |
[production] |
13:09 |
<fceratto@deploy1003> |
helmfile [aux-k8s-eqiad] 'sync' command on namespace 'zarcillo' for release 'main' . |
[production] |
13:09 |
<fceratto@deploy1003> |
helmfile [aux-k8s-eqiad] 'sync' command on namespace 'zarcillo' for release 'main' . |
[production] |
13:07 |
<fceratto@deploy1003> |
helmfile [aux-k8s-eqiad] 'sync' command on namespace 'zarcillo' for release 'main' . |
[production] |
13:05 |
<fceratto@deploy1003> |
helmfile [aux-k8s-eqiad] 'sync' command on namespace 'zarcillo' for release 'main' . |
[production] |
13:05 |
<gmodena@deploy1003> |
helmfile [staging] DONE helmfile.d/services/mw-page-content-change-enrich: apply |
[production] |
13:05 |
<gmodena@deploy1003> |
helmfile [staging] START helmfile.d/services/mw-page-content-change-enrich: apply |
[production] |
13:04 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db1259', diff saved to https://phabricator.wikimedia.org/P79389 and previous config saved to /var/cache/conftool/dbconfig/20250718-130410-marostegui.json |
[production] |
13:02 |
<brouberol@deploy1003> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/admin 'apply'. |
[production] |
13:02 |
<brouberol@deploy1003> |
helmfile [dse-k8s-eqiad] START helmfile.d/admin 'apply'. |
[production] |
12:59 |
<jelto@deploy1003> |
helmfile [aux-k8s-eqiad] DONE helmfile.d/services/miscweb: apply |
[production] |
12:59 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'db1198 (re)pooling @ 75%: 10', diff saved to https://phabricator.wikimedia.org/P79388 and previous config saved to /var/cache/conftool/dbconfig/20250718-125925-root.json |
[production] |
12:59 |
<jelto@deploy1003> |
helmfile [aux-k8s-eqiad] START helmfile.d/services/miscweb: apply |
[production] |
12:58 |
<jelto@deploy1003> |
helmfile [aux-k8s-codfw] DONE helmfile.d/services/miscweb: apply |
[production] |
12:58 |
<jelto@deploy1003> |
helmfile [aux-k8s-codfw] START helmfile.d/services/miscweb: apply |
[production] |
12:57 |
<jelto@deploy1003> |
helmfile [eqiad] DONE helmfile.d/services/miscweb: apply |
[production] |
12:56 |
<jelto@deploy1003> |
helmfile [eqiad] START helmfile.d/services/miscweb: apply |
[production] |
12:56 |
<jelto@deploy1003> |
helmfile [codfw] DONE helmfile.d/services/miscweb: apply |
[production] |
12:56 |
<jelto@deploy1003> |
helmfile [codfw] START helmfile.d/services/miscweb: apply |
[production] |
12:55 |
<jelto@deploy1003> |
helmfile [staging] DONE helmfile.d/services/miscweb: apply |
[production] |
12:55 |
<jelto@deploy1003> |
helmfile [staging] START helmfile.d/services/miscweb: apply |
[production] |