|
2025-05-10
§
|
| 19:58 |
<lucaswerkmeister> |
webservice restart (per request on behalf of tool maintainer, as the bastion is having issues atm) |
[tools.letaxobot] |
| 17:35 |
<lucaswerkmeister> |
root@tools-bastion-13:~# systemctl restart sssd-sudo{,.socket} # looks like the reset-failed didn’t work properly, systemd didn’t even try to start the service again afaict (T393732) |
[tools] |
| 17:33 |
<lucaswerkmeister> |
root@tools-bastion-13:~# systemctl reset-failed sssd-{pam,sudo}.service && systemctl restart sssd-pam{,-priv}.socket # try to reset the rate limits this way (T393732) |
[tools] |
| 16:22 |
<lucaswerkmeister> |
systemctl restart sssd-{pam{,-priv},sudo}.socket # service-start-limit-hit, T393732? |
[tools] |
| 14:10 |
<lucaswerkmeister> |
root@tools-bastion-13:~# systemctl restart sssd-sudo.socket # service-start-limit-hit, T393732? |
[tools] |
| 11:53 |
<lucaswerkmeister> |
T393732 note: restart of sssd-pam.service actually failed, “may be requested by dependency only”; overall it still seems to have worked though (so next time restarting the sockets is probably sufficient) |
[tools] |
| 11:52 |
<lucaswerkmeister> |
root@tools-bastion-13:~# systemctl restart sssd-pam{,{,-priv}.socket} # all three failed with start-limit-hit / Start request repeated too quickly; T393732? |
[tools] |
| 00:41 |
<dani@deploy1003> |
helmfile [codfw] DONE helmfile.d/services/miscweb: apply |
[production] |
| 00:41 |
<dani@deploy1003> |
helmfile [codfw] START helmfile.d/services/miscweb: apply |
[production] |
| 00:41 |
<dani@deploy1003> |
helmfile [eqiad] DONE helmfile.d/services/miscweb: apply |
[production] |
| 00:41 |
<dani@deploy1003> |
helmfile [eqiad] START helmfile.d/services/miscweb: apply |
[production] |
| 00:41 |
<dani@deploy1003> |
helmfile [staging] DONE helmfile.d/services/miscweb: apply |
[production] |
| 00:41 |
<dani@deploy1003> |
helmfile [staging] START helmfile.d/services/miscweb: apply |
[production] |
| 00:23 |
<dani@deploy1003> |
helmfile [codfw] DONE helmfile.d/services/miscweb: apply |
[production] |
| 00:22 |
<dani@deploy1003> |
helmfile [codfw] START helmfile.d/services/miscweb: apply |
[production] |
| 00:22 |
<dani@deploy1003> |
helmfile [eqiad] DONE helmfile.d/services/miscweb: apply |
[production] |
| 00:22 |
<dani@deploy1003> |
helmfile [eqiad] START helmfile.d/services/miscweb: apply |
[production] |
| 00:22 |
<dani@deploy1003> |
helmfile [staging] DONE helmfile.d/services/miscweb: apply |
[production] |
| 00:22 |
<dani@deploy1003> |
helmfile [staging] START helmfile.d/services/miscweb: apply |
[production] |
| 00:16 |
<dani@deploy1003> |
helmfile [codfw] DONE helmfile.d/services/miscweb: apply |
[production] |
| 00:16 |
<dani@deploy1003> |
helmfile [codfw] START helmfile.d/services/miscweb: apply |
[production] |
| 00:16 |
<dani@deploy1003> |
helmfile [eqiad] DONE helmfile.d/services/miscweb: apply |
[production] |
| 00:15 |
<dani@deploy1003> |
helmfile [eqiad] START helmfile.d/services/miscweb: apply |
[production] |
| 00:15 |
<dani@deploy1003> |
helmfile [staging] DONE helmfile.d/services/miscweb: apply |
[production] |
| 00:15 |
<dani@deploy1003> |
helmfile [staging] START helmfile.d/services/miscweb: apply |
[production] |
|
2025-05-09
§
|
| 23:02 |
<vriley@cumin1002> |
END (FAIL) - Cookbook sre.hosts.reimage (exit_code=99) for host thanos-fe1007.eqiad.wmnet with OS bullseye |
[production] |
| 22:18 |
<raymond-ndibe@cloudcumin1001> |
END (PASS) - Cookbook wmcs.toolforge.component.deploy (exit_code=0) for component builds-api |
[toolsbeta] |
| 22:11 |
<raymond-ndibe@cloudcumin1001> |
START - Cookbook wmcs.toolforge.component.deploy for component builds-api |
[toolsbeta] |
| 22:10 |
<wmbot~bd808@tools-bastion-12> |
Deployed container built from 8601a403 |
[tools.gitlab-content] |
| 22:10 |
<raymond-ndibe@cloudcumin1001> |
END (PASS) - Cookbook wmcs.toolforge.component.deploy (exit_code=0) for component builds-api |
[toolsbeta] |
| 22:10 |
<wmbot~bd808@tools-bastion-12> |
Built container from 8601a403 |
[tools.gitlab-content] |
| 22:10 |
<vriley@cumin1002> |
START - Cookbook sre.hosts.reimage for host thanos-fe1007.eqiad.wmnet with OS bullseye |
[production] |
| 22:09 |
<vriley@cumin1002> |
END (FAIL) - Cookbook sre.hosts.provision (exit_code=99) for host thanos-fe1007.mgmt.eqiad.wmnet with chassis set policy FORCE_RESTART and with Dell SCP reboot policy FORCED |
[production] |
| 22:08 |
<raymond-ndibe@cloudcumin1001> |
START - Cookbook wmcs.toolforge.component.deploy for component builds-api |
[toolsbeta] |
| 22:03 |
<vriley@cumin1002> |
START - Cookbook sre.hosts.provision for host thanos-fe1007.mgmt.eqiad.wmnet with chassis set policy FORCE_RESTART and with Dell SCP reboot policy FORCED |
[production] |
| 22:01 |
<raymond-ndibe@cloudcumin1001> |
END (FAIL) - Cookbook wmcs.toolforge.component.deploy (exit_code=99) for component builds-api |
[toolsbeta] |
| 22:00 |
<raymond-ndibe@cloudcumin1001> |
START - Cookbook wmcs.toolforge.component.deploy for component builds-api |
[toolsbeta] |
| 21:57 |
<vriley@cumin1002> |
END (FAIL) - Cookbook sre.hosts.reimage (exit_code=99) for host thanos-fe1007.eqiad.wmnet with OS bullseye |
[production] |
| 21:56 |
<raymond-ndibe@cloudcumin1001> |
END (FAIL) - Cookbook wmcs.toolforge.component.deploy (exit_code=99) for component builds-api |
[toolsbeta] |
| 21:56 |
<raymond-ndibe@cloudcumin1001> |
START - Cookbook wmcs.toolforge.component.deploy for component builds-api |
[toolsbeta] |
| 21:54 |
<raymond-ndibe@cloudcumin1001> |
END (FAIL) - Cookbook wmcs.toolforge.component.deploy (exit_code=99) for component builds-api |
[toolsbeta] |
| 21:54 |
<raymond-ndibe@cloudcumin1001> |
START - Cookbook wmcs.toolforge.component.deploy for component builds-api |
[toolsbeta] |