2024-07-15
§
|
12:30 |
<dcausse@deploy1002> |
helmfile [staging] START helmfile.d/services/rdf-streaming-updater: apply |
[production] |
12:16 |
<dcausse@deploy1002> |
helmfile [staging] DONE helmfile.d/services/rdf-streaming-updater: apply |
[production] |
12:15 |
<dcausse@deploy1002> |
helmfile [staging] START helmfile.d/services/rdf-streaming-updater: apply |
[production] |
11:32 |
<marostegui> |
test |
[production] |
11:31 |
<marostegui> |
Reboot stashbot |
[production] |
11:25 |
<cgoubert@deploy1002> |
helmfile [eqiad] DONE helmfile.d/services/changeprop-jobqueue: apply |
[production] |
11:24 |
<cgoubert@deploy1002> |
helmfile [eqiad] START helmfile.d/services/changeprop-jobqueue: apply |
[production] |
11:11 |
<cgoubert@deploy1002> |
helmfile [codfw] DONE helmfile.d/services/changeprop-jobqueue: apply |
[production] |
11:11 |
<cgoubert@deploy1002> |
helmfile [codfw] START helmfile.d/services/changeprop-jobqueue: apply |
[production] |
11:11 |
<claime> |
Increasing webVideoTranscodePrioritized concurrency in changeprop-jobqueue |
[production] |
11:09 |
<cgoubert@deploy1002> |
helmfile [staging] DONE helmfile.d/services/changeprop-jobqueue: apply |
[production] |
11:08 |
<cgoubert@deploy1002> |
helmfile [staging] START helmfile.d/services/changeprop-jobqueue: apply |
[production] |
11:08 |
<cgoubert@deploy1002> |
helmfile [staging] START helmfile.d/services/changeprop-jobqueue: apply |
[production] |
10:21 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Depooling db2116 (T367856)', diff saved to https://phabricator.wikimedia.org/P66480 and previous config saved to /var/cache/conftool/dbconfig/20240715-102117-marostegui.json |
[production] |
10:21 |
<marostegui@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on db2116.codfw.wmnet with reason: Maintenance |
[production] |
10:20 |
<marostegui@cumin1002> |
START - Cookbook sre.hosts.downtime for 1 day, 0:00:00 on db2116.codfw.wmnet with reason: Maintenance |
[production] |
09:59 |
<ayounsi@cumin1002> |
END (PASS) - Cookbook sre.network.peering (exit_code=0) with action 'email' for AS: 52999 |
[production] |
09:59 |
<ayounsi@cumin1002> |
START - Cookbook sre.network.peering with action 'email' for AS: 52999 |
[production] |
09:58 |
<ayounsi@cumin1002> |
END (PASS) - Cookbook sre.network.peering (exit_code=0) with action 'email' for AS: 270361 |
[production] |
09:58 |
<ayounsi@cumin1002> |
START - Cookbook sre.network.peering with action 'email' for AS: 270361 |
[production] |
09:58 |
<ayounsi@cumin1002> |
END (PASS) - Cookbook sre.network.peering (exit_code=0) with action 'email' for AS: 262293 |
[production] |
09:58 |
<ayounsi@cumin1002> |
START - Cookbook sre.network.peering with action 'email' for AS: 262293 |
[production] |
09:58 |
<ayounsi@cumin1002> |
END (PASS) - Cookbook sre.network.peering (exit_code=0) with action 'email' for AS: 61941 |
[production] |
09:57 |
<ayounsi@cumin1002> |
START - Cookbook sre.network.peering with action 'email' for AS: 61941 |
[production] |
09:56 |
<ayounsi@cumin1002> |
END (PASS) - Cookbook sre.network.peering (exit_code=0) with action 'configure' for AS: 49544 |
[production] |
09:54 |
<ayounsi@cumin1002> |
START - Cookbook sre.network.peering with action 'configure' for AS: 49544 |
[production] |
09:29 |
<claime> |
manually removing mw1349.eqiad.wmnet mw1350.eqiad.wmnet mw1351.eqiad.wmnet from k8s following reimage to videoscalers - T351074 |
[production] |
09:25 |
<dcausse@deploy1002> |
helmfile [staging] DONE helmfile.d/services/rdf-streaming-updater: apply |
[production] |
09:22 |
<dcausse@deploy1002> |
helmfile [staging] START helmfile.d/services/rdf-streaming-updater: apply |
[production] |
09:19 |
<marostegui> |
Deploy schema change on s7 eqiad db1170 dbmaint T367856 |
[production] |
09:18 |
<marostegui@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on db1170.eqiad.wmnet with reason: Long schema change |
[production] |
09:18 |
<marostegui@cumin1002> |
START - Cookbook sre.hosts.downtime for 1 day, 0:00:00 on db1170.eqiad.wmnet with reason: Long schema change |
[production] |
09:18 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Depooling db1170 (T367856)', diff saved to https://phabricator.wikimedia.org/P66479 and previous config saved to /var/cache/conftool/dbconfig/20240715-091800-marostegui.json |
[production] |
09:17 |
<marostegui@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on db1170.eqiad.wmnet with reason: Maintenance |
[production] |
09:17 |
<marostegui@cumin1002> |
START - Cookbook sre.hosts.downtime for 1 day, 0:00:00 on db1170.eqiad.wmnet with reason: Maintenance |
[production] |
09:16 |
<elukey@cumin1002> |
END (FAIL) - Cookbook sre.network.tls (exit_code=99) for network device lsw1-d3-codfw |
[production] |
09:15 |
<marostegui> |
Deploy schema change on s7 codfw db2121 dbmaint T367856 |
[production] |
09:15 |
<marostegui@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on db2121.codfw.wmnet with reason: Long schema change |
[production] |
09:14 |
<marostegui@cumin1002> |
START - Cookbook sre.hosts.downtime for 1 day, 0:00:00 on db2121.codfw.wmnet with reason: Long schema change |
[production] |
09:14 |
<elukey@cumin1002> |
START - Cookbook sre.network.tls for network device lsw1-d3-codfw |
[production] |
09:05 |
<volans@cumin1002> |
dbctl commit (dc=all): 'Depool db2121 T369882', diff saved to https://phabricator.wikimedia.org/P66478 and previous config saved to /var/cache/conftool/dbconfig/20240715-090532-volans.json |
[production] |
08:56 |
<volans@cumin1002> |
dbctl commit (dc=all): 'Promote db2218 to s7 primary T369882', diff saved to https://phabricator.wikimedia.org/P66477 and previous config saved to /var/cache/conftool/dbconfig/20240715-085654-volans.json |
[production] |
08:51 |
<volans> |
Starting s7 codfw failover from db2121 to db2218 - T369882 |
[production] |
08:33 |
<slyngshede@cumin1002> |
END (PASS) - Cookbook sre.ganeti.makevm (exit_code=0) for new host idp2004.wikimedia.org |
[production] |
08:33 |
<slyngshede@cumin1002> |
END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host idp2004.wikimedia.org with OS bookworm |
[production] |
08:22 |
<ayounsi@cumin1002> |
END (PASS) - Cookbook sre.network.peering (exit_code=0) with action 'configure' for AS: 52468 |
[production] |
08:21 |
<ayounsi@cumin1002> |
START - Cookbook sre.network.peering with action 'configure' for AS: 52468 |
[production] |
08:16 |
<slyngshede@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on idp2004.wikimedia.org with reason: host reimage |
[production] |
08:13 |
<slyngshede@cumin1002> |
START - Cookbook sre.hosts.downtime for 2:00:00 on idp2004.wikimedia.org with reason: host reimage |
[production] |
08:12 |
<volans@cumin2002> |
dbctl commit (dc=all): 'Remove db2218 from API T369882', diff saved to https://phabricator.wikimedia.org/P66475 and previous config saved to /var/cache/conftool/dbconfig/20240715-081252-volans.json |
[production] |