|
2025-10-22
§
|
| 19:55 |
<ebernhardson@deploy2002> |
helmfile [eqiad] DONE helmfile.d/services/cirrus-streaming-updater: apply |
[production] |
| 19:54 |
<ebernhardson@deploy2002> |
helmfile [eqiad] START helmfile.d/services/cirrus-streaming-updater: apply |
[production] |
| 19:51 |
<ebernhardson@deploy2002> |
helmfile [eqiad] DONE helmfile.d/services/cirrus-streaming-updater: apply |
[production] |
| 19:51 |
<ebernhardson@deploy2002> |
helmfile [eqiad] START helmfile.d/services/cirrus-streaming-updater: apply |
[production] |
| 19:33 |
<andrew@cumin2002> |
START - Cookbook sre.hosts.reimage for host cloudcontrol2010-dev.codfw.wmnet with OS trixie |
[production] |
| 19:32 |
<andrew@cumin2002> |
END (ERROR) - Cookbook sre.hosts.reimage (exit_code=97) for host cloudcontrol2010-dev.codfw.wmnet with OS trixie |
[production] |
| 19:27 |
<andrew@cumin2002> |
START - Cookbook sre.hosts.reimage for host cloudcontrol2010-dev.codfw.wmnet with OS trixie |
[production] |
| 19:27 |
<andrew@cumin2002> |
END (ERROR) - Cookbook sre.hosts.reimage (exit_code=97) for host cloudcontrol2010-dev.codfw.wmnet with OS trixie |
[production] |
| 19:11 |
<jhathaway@cumin1002> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 4:00:00 on sretest2001.codfw.wmnet with reason: sleep test |
[production] |
| 19:07 |
<andrew@cumin2002> |
START - Cookbook sre.hosts.reimage for host cloudcontrol2010-dev.codfw.wmnet with OS trixie |
[production] |
| 19:06 |
<andrew@cumin2002> |
END (ERROR) - Cookbook sre.hosts.reimage (exit_code=97) for host cloudcontrol2010-dev.codfw.wmnet with OS trixie |
[production] |
| 19:06 |
<sukhe> |
sudo cumin "A:cp" "run-puppet-agent --enable 'merging CR 1198132'" |
[production] |
| 18:53 |
<sukhe> |
sudo cumin "A:cp" "disable-puppet 'merging CR 1198132'" |
[production] |
| 18:40 |
<ejegg> |
fundraising civicrm upgraded from b82b0ef5 to 1bade506 |
[production] |
| 18:39 |
<bking@cumin2002> |
END (PASS) - Cookbook sre.wdqs.data-transfer (exit_code=0) (T406920, Update outdated categories info) xfer categories from wdqs1011.eqiad.wmnet -> wdqs1026.eqiad.wmnet, repooling both afterwards |
[production] |
| 18:38 |
<ejegg> |
payments-wiki upgraded from ea963482 to 3753f979 |
[production] |
| 18:34 |
<bking@cumin2002> |
START - Cookbook sre.wdqs.data-transfer (T406920, Update outdated categories info) xfer categories from wdqs1011.eqiad.wmnet -> wdqs1026.eqiad.wmnet, repooling both afterwards |
[production] |
| 18:34 |
<bking@cumin2002> |
END (PASS) - Cookbook sre.wdqs.data-transfer (exit_code=0) (T406920, Update outdated categories info) xfer categories from wdqs1011.eqiad.wmnet -> wdqs1025.eqiad.wmnet, repooling both afterwards |
[production] |
| 18:29 |
<bking@cumin2002> |
START - Cookbook sre.wdqs.data-transfer (T406920, Update outdated categories info) xfer categories from wdqs1011.eqiad.wmnet -> wdqs1025.eqiad.wmnet, repooling both afterwards |
[production] |
| 18:28 |
<andrew@cumin2002> |
START - Cookbook sre.hosts.reimage for host cloudcontrol2010-dev.codfw.wmnet with OS trixie |
[production] |
| 18:18 |
<cmooney@cumin1003> |
START - Cookbook sre.hosts.reimage for host sretest1005.eqiad.wmnet with OS trixie |
[production] |
| 18:17 |
<cmooney@cumin1003> |
END (ERROR) - Cookbook sre.hosts.reimage (exit_code=97) for host sretest1005.eqiad.wmnet with OS trixie |
[production] |
| 18:16 |
<dancy@deploy2002> |
rebuilt and synchronized wikiversions files: group1 to 1.45.0-wmf.24 refs T405680 |
[production] |
| 18:11 |
<dzahn@cumin2002> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 30 days, 0:00:00 on zuul2001.codfw.wmnet with reason: still in setup |
[production] |
| 18:09 |
<dzahn@cumin2002> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 30 days, 0:00:00 on zuul1001.eqiad.wmnet with reason: still in setup |
[production] |
| 18:09 |
<Amir1> |
deleting local user_password on sul wikis (T104500) |
[production] |
| 18:08 |
<dzahn@cumin2002> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 30 days, 0:00:00 on zuul2001.codfw.wmnet with reason: still in setup |
[production] |
| 17:53 |
<Amir1> |
mwscript-k8s --dblist=small --follow -- purgeUserOptions.php --login-age 11 (T406724) |
[production] |
| 17:38 |
<sukhe@cumin1003> |
END (PASS) - Cookbook sre.cdn.roll-reboot (exit_code=0) rolling reboot on A:cp-text_codfw and A:cp |
[production] |
| 17:37 |
<sukhe@cumin1003> |
cookbooks.sre.cdn.roll-reboot finished rebooting cp2041.codfw.wmnet |
[production] |
| 17:31 |
<cmooney@cumin1003> |
START - Cookbook sre.hosts.reimage for host sretest1005.eqiad.wmnet with OS trixie |
[production] |
| 17:30 |
<sukhe@cumin1003> |
END (PASS) - Cookbook sre.cdn.roll-reboot (exit_code=0) rolling reboot on A:cp-upload_codfw and A:cp |
[production] |
| 17:30 |
<sukhe@cumin1003> |
cookbooks.sre.cdn.roll-reboot finished rebooting cp2042.codfw.wmnet |
[production] |
| 17:12 |
<cmooney@cumin1003> |
END (ERROR) - Cookbook sre.hosts.reimage (exit_code=97) for host sretest1005.eqiad.wmnet with OS trixie |
[production] |
| 17:12 |
<kamila@cumin1003> |
END (PASS) - Cookbook sre.dns.netbox (exit_code=0) |
[production] |
| 17:10 |
<kamila@cumin1003> |
START - Cookbook sre.dns.netbox |
[production] |
| 16:59 |
<cmooney@cumin1003> |
START - Cookbook sre.hosts.reimage for host sretest1005.eqiad.wmnet with OS trixie |
[production] |
| 16:59 |
<ejegg> |
SmashPig upgraded from b1f04532 to ecba7d88 |
[production] |
| 16:58 |
<sukhe@cumin1003> |
cookbooks.sre.cdn.roll-reboot finished rebooting cp2039.codfw.wmnet |
[production] |
| 16:57 |
<cmooney@cumin1003> |
END (PASS) - Cookbook sre.hosts.provision (exit_code=0) for host sretest1005.mgmt.eqiad.wmnet with chassis set policy FORCE_RESTART and with Dell SCP reboot policy FORCED |
[production] |
| 16:51 |
<sukhe@cumin1003> |
cookbooks.sre.cdn.roll-reboot finished rebooting cp2040.codfw.wmnet |
[production] |
| 16:44 |
<cmooney@cumin1003> |
START - Cookbook sre.hosts.provision for host sretest1005.mgmt.eqiad.wmnet with chassis set policy FORCE_RESTART and with Dell SCP reboot policy FORCED |
[production] |
| 16:44 |
<cmooney@cumin1003> |
END (FAIL) - Cookbook sre.hosts.provision (exit_code=99) for host sretest1005.mgmt.eqiad.wmnet with chassis set policy FORCE_RESTART and with Dell SCP reboot policy FORCED |
[production] |
| 16:40 |
<kamila@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 7 days, 0:00:00 on wikikube-worker2203.codfw.wmnet with reason: host unresponsive |
[production] |
| 16:39 |
<cmooney@cumin1003> |
START - Cookbook sre.hosts.provision for host sretest1005.mgmt.eqiad.wmnet with chassis set policy FORCE_RESTART and with Dell SCP reboot policy FORCED |
[production] |
| 16:39 |
<kamila@cumin1003> |
END (PASS) - Cookbook sre.k8s.pool-depool-node (exit_code=0) depool for host wikikube-worker2203.codfw.wmnet |
[production] |
| 16:38 |
<kamila@cumin1003> |
START - Cookbook sre.k8s.pool-depool-node depool for host wikikube-worker2203.codfw.wmnet |
[production] |
| 16:23 |
<cmooney@cumin1003> |
END (FAIL) - Cookbook sre.hosts.provision (exit_code=99) for host sretest1005.mgmt.eqiad.wmnet with chassis set policy FORCE_RESTART and with Dell SCP reboot policy FORCED |
[production] |
| 16:23 |
<cmooney@cumin1003> |
START - Cookbook sre.hosts.provision for host sretest1005.mgmt.eqiad.wmnet with chassis set policy FORCE_RESTART and with Dell SCP reboot policy FORCED |
[production] |
| 16:16 |
<sukhe@cumin1003> |
cookbooks.sre.cdn.roll-reboot finished rebooting cp2037.codfw.wmnet |
[production] |