2023-03-20
§
|
18:15 |
<akosiaris@deploy2002> |
helmfile [eqiad] START helmfile.d/services/changeprop: sync |
[production] |
18:15 |
<akosiaris@deploy2002> |
helmfile [staging] DONE helmfile.d/services/changeprop: sync |
[production] |
18:15 |
<akosiaris@deploy2002> |
helmfile [staging] START helmfile.d/services/changeprop: sync |
[production] |
18:11 |
<akosiaris@deploy2002> |
helmfile [codfw] DONE helmfile.d/services/api-gateway: sync |
[production] |
18:11 |
<akosiaris@deploy2002> |
helmfile [codfw] START helmfile.d/services/api-gateway: sync |
[production] |
18:11 |
<akosiaris@deploy2002> |
helmfile [eqiad] DONE helmfile.d/services/api-gateway: sync |
[production] |
18:11 |
<akosiaris@deploy2002> |
helmfile [eqiad] START helmfile.d/services/api-gateway: sync |
[production] |
18:11 |
<akosiaris@deploy2002> |
helmfile [staging] DONE helmfile.d/services/api-gateway: sync |
[production] |
18:11 |
<akosiaris@deploy2002> |
helmfile [staging] START helmfile.d/services/api-gateway: sync |
[production] |
18:05 |
<mutante> |
miscweb1003 - syntax error in httpd config due to "Unknown Authn provider: ldap" - comes from static-rt vhost (T331896) |
[production] |
18:04 |
<sukhe@cumin2002> |
END (PASS) - Cookbook sre.hosts.remove-downtime (exit_code=0) for lvs1019.eqiad.wmnet |
[production] |
18:04 |
<sukhe@cumin2002> |
START - Cookbook sre.hosts.remove-downtime for lvs1019.eqiad.wmnet |
[production] |
17:59 |
<mutante> |
when applying apache role for the first time on new hosts we still have the same old conflict: miscweb1003 - manual "a2dismod mpm_event" to be able to let puppet enable mod PHP (T196968) |
[production] |
17:57 |
<dzahn@cumin2002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2 days, 0:00:00 on miscweb1003.eqiad.wmnet with reason: maintenance |
[production] |
17:57 |
<dzahn@cumin2002> |
START - Cookbook sre.hosts.downtime for 2 days, 0:00:00 on miscweb1003.eqiad.wmnet with reason: maintenance |
[production] |
17:55 |
<sukhe@cumin2002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 0:40:00 on lvs1019.eqiad.wmnet with reason: reboot for kernel update |
[production] |
17:55 |
<sukhe@cumin2002> |
START - Cookbook sre.hosts.downtime for 0:40:00 on lvs1019.eqiad.wmnet with reason: reboot for kernel update |
[production] |
17:26 |
<akosiaris> |
disable puppet on rdb*, netbox*, ores*, registry* |
[production] |
17:14 |
<sukhe@cumin2002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 0:40:00 on lvs3006.esams.wmnet with reason: reboot for kernel update |
[production] |
17:14 |
<sukhe@cumin2002> |
START - Cookbook sre.hosts.downtime for 0:40:00 on lvs3006.esams.wmnet with reason: reboot for kernel update |
[production] |
17:14 |
<sukhe@cumin2002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 0:40:00 on lvs2009.codfw.wmnet,lvs1019.eqiad.wmnet with reason: reboot for kernel update |
[production] |
17:14 |
<sukhe@cumin2002> |
START - Cookbook sre.hosts.downtime for 0:40:00 on lvs2009.codfw.wmnet,lvs1019.eqiad.wmnet with reason: reboot for kernel update |
[production] |
16:43 |
<hnowlan@deploy2002> |
helmfile [codfw] DONE helmfile.d/services/changeprop-jobqueue: apply |
[production] |
16:43 |
<hnowlan@deploy2002> |
helmfile [codfw] START helmfile.d/services/changeprop-jobqueue: apply |
[production] |
16:36 |
<hnowlan@deploy2002> |
helmfile [codfw] DONE helmfile.d/services/changeprop-jobqueue: apply |
[production] |
16:36 |
<hnowlan@deploy2002> |
helmfile [codfw] START helmfile.d/services/changeprop-jobqueue: apply |
[production] |
16:32 |
<hnowlan@deploy1002> |
helmfile [codfw] DONE helmfile.d/services/changeprop-jobqueue: apply |
[production] |
16:22 |
<hnowlan@deploy1002> |
helmfile [codfw] START helmfile.d/services/changeprop-jobqueue: apply |
[production] |
16:21 |
<hnowlan@deploy1002> |
helmfile [codfw] DONE helmfile.d/services/changeprop-jobqueue: apply |
[production] |
16:10 |
<hnowlan@deploy1002> |
helmfile [codfw] START helmfile.d/services/changeprop-jobqueue: apply |
[production] |
15:52 |
<cmjohnson@cumin1001> |
END (FAIL) - Cookbook sre.hosts.reimage (exit_code=99) for host thanos-fe1004.eqiad.wmnet with OS bullseye |
[production] |
14:56 |
<dcausse@deploy2002> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s-services/mediawiki-page-content-change-enrichment: apply |
[production] |
14:56 |
<dcausse@deploy2002> |
helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/mediawiki-page-content-change-enrichment: apply |
[production] |
14:56 |
<cmjohnson@cumin1001> |
START - Cookbook sre.hosts.reimage for host thanos-fe1004.eqiad.wmnet with OS bullseye |
[production] |
14:56 |
<dcausse@deploy2002> |
helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/mediawiki-page-content-change-enrichment: apply |
[production] |
14:53 |
<cmjohnson@cumin1001> |
END (FAIL) - Cookbook sre.hosts.reimage (exit_code=99) for host ms-fe1013.eqiad.wmnet with OS bullseye |
[production] |
14:53 |
<cmjohnson@cumin1001> |
START - Cookbook sre.hosts.reimage for host ms-fe1013.eqiad.wmnet with OS bullseye |
[production] |
14:51 |
<ayounsi@cumin1001> |
END (PASS) - Cookbook sre.network.peering (exit_code=0) with action 'configure' for AS: 2552 |
[production] |
14:49 |
<ayounsi@cumin1001> |
START - Cookbook sre.network.peering with action 'configure' for AS: 2552 |
[production] |
14:49 |
<bking@deploy2002> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s-services/mediawiki-page-content-change-enrichment: apply |
[production] |
14:49 |
<bking@deploy2002> |
helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/mediawiki-page-content-change-enrichment: apply |
[production] |
14:39 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'Depool es2029 and promote es2027 to es3 master', diff saved to https://phabricator.wikimedia.org/P45896 and previous config saved to /var/cache/conftool/dbconfig/20230320-143951-root.json |
[production] |
14:35 |
<bking@deploy2002> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s-services/mediawiki-page-content-change-enrichment: apply |
[production] |
14:35 |
<bking@deploy2002> |
helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/mediawiki-page-content-change-enrichment: apply |
[production] |
14:30 |
<sukhe@cumin2002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1:00:00 on lvs2008.codfw.wmnet with reason: T326564 |
[production] |
14:29 |
<sukhe@cumin2002> |
START - Cookbook sre.hosts.downtime for 1:00:00 on lvs2008.codfw.wmnet with reason: T326564 |
[production] |
14:17 |
<bking@deploy2002> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s-services/mediawiki-page-content-change-enrichment: apply |
[production] |
14:17 |
<bking@deploy2002> |
helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/mediawiki-page-content-change-enrichment: apply |
[production] |
14:17 |
<kharlan@deploy2002> |
helmfile [codfw] DONE helmfile.d/services/changeprop-jobqueue: apply |
[production] |
14:11 |
<TheresNoTime> |
close UTC afternoon backport window |
[production] |