|
2026-05-05
§
|
| 09:30 |
<jelto@deploy1003> |
helmfile [aux-k8s-eqiad] DONE helmfile.d/services/miscweb: apply |
[production] |
| 09:30 |
<jelto@deploy1003> |
helmfile [aux-k8s-eqiad] START helmfile.d/services/miscweb: apply |
[production] |
| 09:29 |
<jelto@deploy1003> |
helmfile [aux-k8s-codfw] DONE helmfile.d/services/miscweb: apply |
[production] |
| 09:29 |
<marostegui@cumin1003> |
END (PASS) - Cookbook sre.mysql.depool (exit_code=0) depool db1174: Reimage to Trixie |
[production] |
| 09:29 |
<marostegui@cumin1003> |
END (PASS) - Cookbook sre.mysql.depool (exit_code=0) depool db2221: Reimage to Trixie |
[production] |
| 09:29 |
<jelto@deploy1003> |
helmfile [aux-k8s-codfw] START helmfile.d/services/miscweb: apply |
[production] |
| 09:28 |
<marostegui@cumin1003> |
START - Cookbook sre.mysql.depool depool db1174: Reimage to Trixie |
[production] |
| 09:28 |
<marostegui@cumin1003> |
START - Cookbook sre.mysql.depool depool db2221: Reimage to Trixie |
[production] |
| 09:28 |
<marostegui@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 5:00:00 on db1174.eqiad.wmnet with reason: Reimage to Trixie |
[production] |
| 09:28 |
<aikochou@deploy1003> |
helmfile [ml-serve-codfw] Ran 'sync' command on namespace 'revscoring-articlequality' for release 'main' . |
[production] |
| 09:28 |
<marostegui@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 5:00:00 on db2221.codfw.wmnet with reason: Reimage to Trixie |
[production] |
| 09:26 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db2206 (T419961)', diff saved to https://phabricator.wikimedia.org/P92265 and previous config saved to /var/cache/conftool/dbconfig/20260505-092654-fceratto.json |
[production] |
| 09:26 |
<jelto@deploy1003> |
helmfile [staging] DONE helmfile.d/services/miscweb: apply |
[production] |
| 09:25 |
<jelto@deploy1003> |
helmfile [staging] START helmfile.d/services/miscweb: apply |
[production] |
| 09:24 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db2213 (T419635)', diff saved to https://phabricator.wikimedia.org/P92264 and previous config saved to /var/cache/conftool/dbconfig/20260505-092431-fceratto.json |
[production] |
| 09:18 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Depooling db2206 (T419961)', diff saved to https://phabricator.wikimedia.org/P92263 and previous config saved to /var/cache/conftool/dbconfig/20260505-091808-fceratto.json |
[production] |
| 09:18 |
<fceratto@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on db2206.codfw.wmnet with reason: Maintenance |
[production] |
| 09:14 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db2213', diff saved to https://phabricator.wikimedia.org/P92262 and previous config saved to /var/cache/conftool/dbconfig/20260505-091423-fceratto.json |
[production] |
| 09:13 |
<fceratto@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on db2199.codfw.wmnet with reason: Maintenance |
[production] |
| 09:12 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db2172 (T419961)', diff saved to https://phabricator.wikimedia.org/P92260 and previous config saved to /var/cache/conftool/dbconfig/20260505-091254-fceratto.json |
[production] |
| 09:04 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db2213', diff saved to https://phabricator.wikimedia.org/P92259 and previous config saved to /var/cache/conftool/dbconfig/20260505-090415-fceratto.json |
[production] |
| 09:02 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db2172', diff saved to https://phabricator.wikimedia.org/P92258 and previous config saved to /var/cache/conftool/dbconfig/20260505-090246-fceratto.json |
[production] |
| 08:58 |
<marostegui@cumin1003> |
START - Cookbook sre.mysql.pool pool db2209: after reimage to trixie |
[production] |
| 08:54 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db2213 (T419635)', diff saved to https://phabricator.wikimedia.org/P92256 and previous config saved to /var/cache/conftool/dbconfig/20260505-085407-fceratto.json |
[production] |
| 08:52 |
<marostegui@cumin1003> |
END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host db2209.codfw.wmnet with OS trixie |
[production] |
| 08:52 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db2172', diff saved to https://phabricator.wikimedia.org/P92255 and previous config saved to /var/cache/conftool/dbconfig/20260505-085238-fceratto.json |
[production] |
| 08:50 |
<jmm@cumin2002> |
END (FAIL) - Cookbook sre.ganeti.makevm (exit_code=99) for new host install5004.wikimedia.org |
[production] |
| 08:50 |
<moritzm> |
installing augeas security updates |
[production] |
| 08:49 |
<jmm@cumin2002> |
END (FAIL) - Cookbook sre.dns.wipe-cache (exit_code=99) install5004.wikimedia.org on all recursors |
[production] |
| 08:48 |
<jmm@cumin2002> |
START - Cookbook sre.dns.wipe-cache install5004.wikimedia.org on all recursors |
[production] |
| 08:48 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Remove records for VM install5004.wikimedia.org - jmm@cumin2002" |
[production] |
| 08:48 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.dns.netbox (exit_code=0) |
[production] |
| 08:48 |
<jmm@cumin2002> |
START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Remove records for VM install5004.wikimedia.org - jmm@cumin2002" |
[production] |
| 08:46 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Depooling db2213 (T419635)', diff saved to https://phabricator.wikimedia.org/P92254 and previous config saved to /var/cache/conftool/dbconfig/20260505-084616-fceratto.json |
[production] |
| 08:46 |
<fceratto@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 12:00:00 on db2213.codfw.wmnet with reason: Maintenance |
[production] |
| 08:42 |
<aikochou@deploy1003> |
helmfile [ml-staging-codfw] Ran 'sync' command on namespace 'revscoring-editquality-reverted' for release 'main' . |
[production] |
| 08:42 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db2172 (T419961)', diff saved to https://phabricator.wikimedia.org/P92253 and previous config saved to /var/cache/conftool/dbconfig/20260505-084231-fceratto.json |
[production] |
| 08:41 |
<aikochou@deploy1003> |
helmfile [ml-staging-codfw] Ran 'sync' command on namespace 'revscoring-editquality-goodfaith' for release 'main' . |
[production] |
| 08:40 |
<aikochou@deploy1003> |
helmfile [ml-staging-codfw] Ran 'sync' command on namespace 'revscoring-editquality-damaging' for release 'main' . |
[production] |
| 08:38 |
<aikochou@deploy1003> |
helmfile [ml-staging-codfw] Ran 'sync' command on namespace 'revscoring-drafttopic' for release 'main' . |
[production] |
| 08:37 |
<jmm@cumin2002> |
START - Cookbook sre.dns.netbox |
[production] |
| 08:37 |
<jmm@cumin2002> |
END (FAIL) - Cookbook sre.dns.netbox (exit_code=99) |
[production] |
| 08:37 |
<aikochou@deploy1003> |
helmfile [ml-staging-codfw] Ran 'sync' command on namespace 'revscoring-draftquality' for release 'main' . |
[production] |
| 08:35 |
<aikochou@deploy1003> |
helmfile [ml-staging-codfw] Ran 'sync' command on namespace 'revscoring-articletopic' for release 'main' . |
[production] |
| 08:34 |
<jelto@deploy1003> |
helmfile [aux-k8s-eqiad] DONE helmfile.d/services/miscweb: apply |
[production] |
| 08:34 |
<jelto@deploy1003> |
helmfile [aux-k8s-eqiad] START helmfile.d/services/miscweb: apply |
[production] |
| 08:34 |
<ayounsi@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 20:00:00 on 13 hosts with reason: switches replacement |
[production] |
| 08:33 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Depooling db2172 (T419961)', diff saved to https://phabricator.wikimedia.org/P92252 and previous config saved to /var/cache/conftool/dbconfig/20260505-083356-fceratto.json |
[production] |
| 08:33 |
<fceratto@cumin1003> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on db2172.codfw.wmnet with reason: Maintenance |
[production] |
| 08:33 |
<fceratto@cumin1003> |
dbctl commit (dc=all): 'Repooling after maintenance db2155 (T419961)', diff saved to https://phabricator.wikimedia.org/P92251 and previous config saved to /var/cache/conftool/dbconfig/20260505-083326-fceratto.json |
[production] |