|
2026-05-13
§
|
| 10:55 |
<jiji@deploy1003> |
helmfile [codfw] START helmfile.d/services/ratelimit: apply |
[production] |
| 10:55 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host install6003.wikimedia.org |
[production] |
| 10:52 |
<moritzm> |
installing Linux 5.10.251-4 on all Bullseye hosts |
[production] |
| 10:49 |
<elukey@cumin1003> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on pki2002.codfw.wmnet with reason: host reimage |
[production] |
| 10:48 |
<jmm@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host install6003.wikimedia.org |
[production] |
| 10:42 |
<elukey@cumin1003> |
START - Cookbook sre.hosts.downtime for 2:00:00 on pki2002.codfw.wmnet with reason: host reimage |
[production] |
| 10:40 |
<jiji@deploy1003> |
helmfile [eqiad] DONE helmfile.d/services/mw-mcrouter: apply |
[production] |
| 10:39 |
<jiji@deploy1003> |
helmfile [eqiad] START helmfile.d/services/mw-mcrouter: apply |
[production] |
| 10:39 |
<jiji@deploy1003> |
helmfile [codfw] DONE helmfile.d/services/mw-mcrouter: apply |
[production] |
| 10:39 |
<jiji@deploy1003> |
helmfile [codfw] START helmfile.d/services/mw-mcrouter: apply |
[production] |
| 10:35 |
<marostegui@cumin1003> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on db2220.codfw.wmnet with reason: host reimage |
[production] |
| 10:33 |
<topranks> |
switch eqsin core router ibgp path to route via switches T424611 |
[production] |
| 10:26 |
<marostegui@cumin1003> |
START - Cookbook sre.hosts.downtime for 2:00:00 on db2220.codfw.wmnet with reason: host reimage |
[production] |
| 10:25 |
<elukey@cumin1003> |
START - Cookbook sre.hosts.reimage for host pki2002.codfw.wmnet with OS trixie |
[production] |
| 10:24 |
<elukey@cumin1003> |
END (PASS) - Cookbook sre.hosts.provision (exit_code=0) for host pki2002.mgmt.codfw.wmnet with chassis set policy GRACEFUL_RESTART and with Dell SCP reboot policy GRACEFUL |
[production] |
| 10:22 |
<elukey@cumin1003> |
START - Cookbook sre.hosts.provision for host pki2002.mgmt.codfw.wmnet with chassis set policy GRACEFUL_RESTART and with Dell SCP reboot policy GRACEFUL |
[production] |
| 10:21 |
<elukey@cumin1003> |
END (PASS) - Cookbook sre.hardware.upgrade-firmware (exit_code=0) upgrade firmware for hosts pki2002.codfw.wmnet |
[production] |
| 10:17 |
<jayme@deploy1003> |
helmfile [eqiad] DONE helmfile.d/services/ratelimit: apply |
[production] |
| 10:16 |
<jmm@deploy1003> |
helmfile [eqiad] DONE helmfile.d/services/proton: apply |
[production] |
| 10:16 |
<jayme@deploy1003> |
helmfile [eqiad] START helmfile.d/services/ratelimit: apply |
[production] |
| 10:16 |
<jayme@deploy1003> |
helmfile [codfw] DONE helmfile.d/services/ratelimit: apply |
[production] |
| 10:15 |
<jmm@deploy1003> |
helmfile [eqiad] START helmfile.d/services/proton: apply |
[production] |
| 10:15 |
<jayme@deploy1003> |
helmfile [codfw] START helmfile.d/services/ratelimit: apply |
[production] |
| 10:14 |
<jayme@deploy1003> |
helmfile [staging] DONE helmfile.d/services/ratelimit: apply |
[production] |
| 10:14 |
<jayme@deploy1003> |
helmfile [staging] START helmfile.d/services/ratelimit: apply |
[production] |
| 10:12 |
<jayme@deploy1003> |
helmfile [staging] DONE helmfile.d/services/ratelimit: apply |
[production] |
| 10:12 |
<jayme@deploy1003> |
helmfile [staging] START helmfile.d/services/ratelimit: apply |
[production] |
| 10:10 |
<moritzm> |
installing Apache security updates on Bullseye |
[production] |
| 10:09 |
<atsuko@deploy1003> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s-services/opensearch-ttmserver-test: apply |
[production] |
| 10:09 |
<atsuko@deploy1003> |
helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/opensearch-ttmserver-test: apply |
[production] |
| 10:06 |
<marostegui@cumin1003> |
START - Cookbook sre.hosts.reimage for host db2220.codfw.wmnet with OS trixie |
[production] |
| 10:05 |
<jmm@deploy1003> |
helmfile [codfw] DONE helmfile.d/services/proton: apply |
[production] |
| 10:05 |
<jiji@cumin1003> |
END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host mc1064.eqiad.wmnet with OS bullseye |
[production] |
| 10:04 |
<jmm@deploy1003> |
helmfile [codfw] START helmfile.d/services/proton: apply |
[production] |
| 10:03 |
<marostegui@cumin1003> |
END (PASS) - Cookbook sre.mysql.depool (exit_code=0) depool db2220: Reimage to Trixie |
[production] |
| 10:02 |
<marostegui@cumin1003> |
START - Cookbook sre.mysql.depool depool db2220: Reimage to Trixie |
[production] |
| 10:02 |
<marostegui@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 5:00:00 on db2220.codfw.wmnet with reason: Reimage to Trixie |
[production] |
| 10:02 |
<jmm@deploy1003> |
helmfile [staging] DONE helmfile.d/services/proton: apply |
[production] |
| 10:01 |
<jmm@deploy1003> |
helmfile [staging] START helmfile.d/services/proton: apply |
[production] |
| 09:59 |
<marostegui@cumin1003> |
dbctl commit (dc=all): 'Depool db2220 T426142', diff saved to https://phabricator.wikimedia.org/P92500 and previous config saved to /var/cache/conftool/dbconfig/20260513-095934-marostegui.json |
[production] |
| 09:58 |
<marostegui@cumin1003> |
dbctl commit (dc=all): 'Promote db2218 to s7 primary T426142', diff saved to https://phabricator.wikimedia.org/P92499 and previous config saved to /var/cache/conftool/dbconfig/20260513-095814-marostegui.json |
[production] |
| 09:58 |
<atsuko@deploy1003> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s-services/opensearch-ttmserver-test: apply |
[production] |
| 09:58 |
<atsuko@deploy1003> |
helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/opensearch-ttmserver-test: apply |
[production] |
| 09:57 |
<jiji@cumin1003> |
END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host mc1062.eqiad.wmnet with OS bullseye |
[production] |
| 09:56 |
<moritzm> |
installing distro-info-data updates from Bookworm point release |
[production] |
| 09:54 |
<marostegui> |
Starting s7 codfw failover from db2220 to db2218 - T426142 |
[production] |
| 09:53 |
<marostegui@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1:00:00 on 28 hosts with reason: Primary switchover s7 T426142 |
[production] |
| 09:53 |
<jiji@cumin1003> |
END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host mc1061.eqiad.wmnet with OS bullseye |
[production] |
| 09:53 |
<marostegui@cumin1003> |
dbctl commit (dc=all): 'Set db2218 with weight 0 T426142', diff saved to https://phabricator.wikimedia.org/P92498 and previous config saved to /var/cache/conftool/dbconfig/20260513-095337-marostegui.json |
[production] |
| 09:51 |
<moritzm> |
installing ca-certificates update from Bookworm point release |
[production] |