2025-07-10
§
|
10:04 |
<jgiannelos@deploy1003> |
helmfile [staging] START helmfile.d/services/changeprop: apply |
[production] |
10:04 |
<vgutierrez> |
resetting eqiad.resource-topic offsets for cp5017 consumer group |
[production] |
09:45 |
<hnowlan@deploy1003> |
helmfile [eqiad] DONE helmfile.d/services/changeprop: apply |
[production] |
09:45 |
<hnowlan@deploy1003> |
helmfile [eqiad] START helmfile.d/services/changeprop: apply |
[production] |
09:44 |
<hnowlan@deploy1003> |
helmfile [codfw] DONE helmfile.d/services/changeprop: apply |
[production] |
09:44 |
<hnowlan@deploy1003> |
helmfile [codfw] START helmfile.d/services/changeprop: apply |
[production] |
09:43 |
<moritzm> |
installing initramfs-tools bugfix updates from Bookworm point release |
[production] |
09:31 |
<dcaro@cloudcumin1001> |
END (FAIL) - Cookbook wmcs.toolforge.component.deploy (exit_code=99) for component jobs-cli |
[toolsbeta] |
09:30 |
<dcaro@cloudcumin1001> |
START - Cookbook wmcs.toolforge.component.deploy for component jobs-cli |
[toolsbeta] |
09:26 |
<dcaro@cloudcumin1001> |
END (FAIL) - Cookbook wmcs.toolforge.component.deploy (exit_code=99) for component jobs-cli |
[toolsbeta] |
09:26 |
<dcaro@cloudcumin1001> |
START - Cookbook wmcs.toolforge.component.deploy for component jobs-cli |
[toolsbeta] |
09:15 |
<fceratto@cumin1002> |
END (PASS) - Cookbook sre.mysql.pool (exit_code=0) db2240 gradually with 4 steps - Pooling in |
[production] |
09:15 |
<fceratto@cumin1002> |
START - Cookbook sre.mysql.pool db2240 gradually with 4 steps - Pooling in |
[production] |
09:14 |
<fceratto@cumin1002> |
END (PASS) - Cookbook sre.mysql.pool (exit_code=0) db2161 gradually with 4 steps - Pooling in |
[production] |
09:14 |
<fceratto@cumin1002> |
START - Cookbook sre.mysql.pool db2161 gradually with 4 steps - Pooling in |
[production] |
09:12 |
<fceratto@cumin1002> |
dbctl commit (dc=all): 'Update db2240 T397163', diff saved to https://phabricator.wikimedia.org/P78865 and previous config saved to /var/cache/conftool/dbconfig/20250710-091250-fceratto.json |
[production] |
09:05 |
<vgutierrez> |
restarting purged on cp5017 |
[production] |
09:02 |
<brouberol@deploy1003> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/admin 'apply'. |
[production] |
09:02 |
<brouberol@deploy1003> |
helmfile [dse-k8s-eqiad] START helmfile.d/admin 'apply'. |
[production] |
08:53 |
<slyngshede@cumin1003> |
END (PASS) - Cookbook sre.cdn.roll-upgrade-haproxy (exit_code=0) rolling upgrade of HAProxy on A:cp-text_codfw and A:cp - 2.8.15 upgrade (T398720) |
[production] |
08:51 |
<slyngshede@cumin1003> |
END (PASS) - Cookbook sre.cdn.roll-upgrade-haproxy (exit_code=0) rolling upgrade of HAProxy on A:cp-upload_codfw and A:cp - 2.8.15 upgrade (T398720) |
[production] |
08:45 |
<moritzm> |
installing setuptools security updates |
[production] |
08:40 |
<hnowlan@deploy1003> |
helmfile [eqiad] DONE helmfile.d/services/changeprop: sync |
[production] |
08:40 |
<hnowlan@deploy1003> |
helmfile [eqiad] START helmfile.d/services/changeprop: sync |
[production] |
08:37 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'db2178 (re)pooling @ 100%: 10', diff saved to https://phabricator.wikimedia.org/P78863 and previous config saved to /var/cache/conftool/dbconfig/20250710-083719-root.json |
[production] |
08:31 |
<klausman@deploy1003> |
helmfile [ml-serve-codfw] DONE helmfile.d/admin 'apply'. |
[production] |
08:30 |
<klausman@deploy1003> |
helmfile [ml-serve-codfw] START helmfile.d/admin 'apply'. |
[production] |
08:22 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'db2178 (re)pooling @ 75%: 10', diff saved to https://phabricator.wikimedia.org/P78861 and previous config saved to /var/cache/conftool/dbconfig/20250710-082213-root.json |
[production] |
08:15 |
<slyngshede@cumin1003> |
START - Cookbook sre.cdn.roll-upgrade-haproxy rolling upgrade of HAProxy on A:cp-upload_codfw and A:cp - 2.8.15 upgrade (T398720) |
[production] |
08:12 |
<slyngshede@cumin1003> |
START - Cookbook sre.cdn.roll-upgrade-haproxy rolling upgrade of HAProxy on A:cp-text_codfw and A:cp - 2.8.15 upgrade (T398720) |
[production] |
08:11 |
<aklapper@deploy1003> |
rebuilt and synchronized wikiversions files: group2 to 1.45.0-wmf.9 refs T392179 |
[production] |
08:10 |
<moritzm> |
installing containerd security updates |
[production] |
08:07 |
<klausman@cumin1002> |
conftool action : set/pooled=false; selector: dnsdisc=inference,name=codfw |
[production] |
08:07 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'db2178 (re)pooling @ 50%: 10', diff saved to https://phabricator.wikimedia.org/P78860 and previous config saved to /var/cache/conftool/dbconfig/20250710-080708-root.json |
[production] |
08:07 |
<klausman@cumin1002> |
conftool action : get/pooled; selector: dnsdisc=inference,name=codfw |
[production] |
08:05 |
<klausman> |
Depooling Liftwing prod in codfw so we can roll out some changes that restart all services (cf. T398533) |
[production] |
08:00 |
<moritzm> |
installing python-urllib3 security updates |
[production] |
07:55 |
<marostegui@cumin1002> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on db1213.eqiad.wmnet with reason: Maintenance |
[production] |
07:54 |
<marostegui@cumin1002> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on es1047.eqiad.wmnet with reason: Maintenance |
[production] |
07:52 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'db2178 (re)pooling @ 25%: 10', diff saved to https://phabricator.wikimedia.org/P78859 and previous config saved to /var/cache/conftool/dbconfig/20250710-075202-root.json |
[production] |
07:50 |
<vgutierrez> |
switching to upload cert globally on upload CDN cluster - T394484 |
[production] |
07:47 |
<elukey@deploy1003> |
helmfile [staging] DONE helmfile.d/services/machinetranslation: sync |
[production] |
07:44 |
<elukey@deploy1003> |
helmfile [staging] START helmfile.d/services/machinetranslation: sync |
[production] |
07:44 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Depool db2178 for migration to mariadb 10.11', diff saved to https://phabricator.wikimedia.org/P78858 and previous config saved to /var/cache/conftool/dbconfig/20250710-074432-marostegui.json |
[production] |
07:44 |
<root@cumin1002> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1:00:00 on db2178.codfw.wmnet with reason: Maintenance |
[production] |
07:44 |
<slyngshede@cumin1003> |
END (PASS) - Cookbook sre.cdn.roll-upgrade-haproxy (exit_code=0) rolling upgrade of HAProxy on A:cp-upload_magru and A:cp - 2.8.15 upgrade (T398720) |
[production] |
07:39 |
<slyngshede@cumin1003> |
END (PASS) - Cookbook sre.cdn.roll-upgrade-haproxy (exit_code=0) rolling upgrade of HAProxy on A:cp-text_magru and A:cp - 2.8.15 upgrade (T398720) |
[production] |
07:39 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'db1210 (re)pooling @ 100%: 10', diff saved to https://phabricator.wikimedia.org/P78857 and previous config saved to /var/cache/conftool/dbconfig/20250710-073907-root.json |
[production] |
07:31 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'db2228 (re)pooling @ 100%: 10', diff saved to https://phabricator.wikimedia.org/P78856 and previous config saved to /var/cache/conftool/dbconfig/20250710-073123-root.json |
[production] |
07:29 |
<hashar> |
Restarting CI Jenkins |
[production] |