|
2025-10-29
§
|
| 13:56 |
<stevemunene@cumin1003> |
END (PASS) - Cookbook sre.druid.roll-restart-workers (exit_code=0) for Druid public cluster: Roll restart of Druid jvm daemons. |
[production] |
| 13:43 |
<gehel> |
deploying envoy 1.32.12-1 + restart on W[CD]QS nodes - T404867 |
[production] |
| 13:40 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host tcp-proxy3002.esams.wmnet with OS trixie |
[production] |
| 13:31 |
<kharlan@deploy2002> |
Finished scap sync-world: Backport for [[gerrit:1199762|product_metrics/suggested_investigations_interaction: add performer_groups (T404177)]] (duration: 14m 48s) |
[production] |
| 13:31 |
<moritzm> |
upgrade Envoy on debmonitor* T405808 |
[production] |
| 13:31 |
<cgoubert@deploy2002> |
helmfile [codfw] DONE helmfile.d/services/api-gateway: apply |
[production] |
| 13:30 |
<cgoubert@deploy2002> |
helmfile [codfw] START helmfile.d/services/api-gateway: apply |
[production] |
| 13:30 |
<cgoubert@deploy2002> |
helmfile [eqiad] DONE helmfile.d/services/api-gateway: apply |
[production] |
| 13:29 |
<cgoubert@deploy2002> |
helmfile [eqiad] START helmfile.d/services/api-gateway: apply |
[production] |
| 13:29 |
<cgoubert@deploy2002> |
helmfile [staging] DONE helmfile.d/services/api-gateway: apply |
[production] |
| 13:28 |
<cgoubert@deploy2002> |
helmfile [staging] START helmfile.d/services/api-gateway: apply |
[production] |
| 13:27 |
<kharlan@deploy2002> |
kharlan: Continuing with sync |
[production] |
| 13:26 |
<cgoubert@deploy2002> |
helmfile [codfw] DONE helmfile.d/services/rest-gateway: apply |
[production] |
| 13:24 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on tcp-proxy3002.esams.wmnet with reason: host reimage |
[production] |
| 13:23 |
<cgoubert@deploy2002> |
helmfile [codfw] START helmfile.d/services/rest-gateway: apply |
[production] |
| 13:23 |
<cgoubert@deploy2002> |
helmfile [eqiad] DONE helmfile.d/services/rest-gateway: apply |
[production] |
| 13:22 |
<cgoubert@deploy2002> |
helmfile [eqiad] START helmfile.d/services/rest-gateway: apply |
[production] |
| 13:19 |
<kharlan@deploy2002> |
kharlan: Backport for [[gerrit:1199762|product_metrics/suggested_investigations_interaction: add performer_groups (T404177)]] synced to the testservers (see https://wikitech.wikimedia.org/wiki/Mwdebug). Changes can now be verified there. |
[production] |
| 13:18 |
<jmm@cumin2002> |
START - Cookbook sre.hosts.downtime for 2:00:00 on tcp-proxy3002.esams.wmnet with reason: host reimage |
[production] |
| 13:17 |
<kharlan@deploy2002> |
Started scap sync-world: Backport for [[gerrit:1199762|product_metrics/suggested_investigations_interaction: add performer_groups (T404177)]] |
[production] |
| 13:14 |
<cgoubert@deploy2002> |
helmfile [staging] DONE helmfile.d/services/rest-gateway: apply |
[production] |
| 13:14 |
<cgoubert@deploy2002> |
helmfile [staging] START helmfile.d/services/rest-gateway: apply |
[production] |
| 13:07 |
<cgoubert@deploy2002> |
helmfile [staging] DONE helmfile.d/services/rest-gateway: apply |
[production] |
| 13:07 |
<cgoubert@deploy2002> |
helmfile [staging] START helmfile.d/services/rest-gateway: apply |
[production] |
| 13:05 |
<stevemunene@cumin1003> |
START - Cookbook sre.druid.roll-restart-workers for Druid public cluster: Roll restart of Druid jvm daemons. |
[production] |
| 13:04 |
<klausman@deploy2002> |
helmfile [ml-serve-codfw] DONE helmfile.d/admin 'apply'. |
[production] |
| 13:04 |
<klausman@deploy2002> |
helmfile [ml-serve-codfw] START helmfile.d/admin 'apply'. |
[production] |
| 13:03 |
<cgoubert@deploy2002> |
helmfile [staging] DONE helmfile.d/services/rest-gateway: apply |
[production] |
| 13:03 |
<stevemunene@cumin1003> |
END (PASS) - Cookbook sre.druid.roll-restart-workers (exit_code=0) for Druid analytics cluster: Roll restart of Druid jvm daemons. |
[production] |
| 13:03 |
<cgoubert@deploy2002> |
helmfile [staging] START helmfile.d/services/rest-gateway: apply |
[production] |
| 12:55 |
<jmm@cumin2002> |
START - Cookbook sre.hosts.reimage for host tcp-proxy3002.esams.wmnet with OS trixie |
[production] |
| 12:50 |
<cgoubert@deploy2002> |
helmfile [staging] DONE helmfile.d/services/rest-gateway: apply |
[production] |
| 12:50 |
<cgoubert@deploy2002> |
helmfile [staging] START helmfile.d/services/rest-gateway: apply |
[production] |
| 12:46 |
<cgoubert@deploy2002> |
helmfile [staging] DONE helmfile.d/services/rest-gateway: apply |
[production] |
| 12:46 |
<cgoubert@deploy2002> |
helmfile [staging] START helmfile.d/services/rest-gateway: apply |
[production] |
| 12:46 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host tcp-proxy7001.magru.wmnet with OS trixie |
[production] |
| 12:45 |
<brouberol@deploy2002> |
helmfile [dse-k8s-eqiad] DONE helmfile.d/admin 'apply'. |
[production] |
| 12:44 |
<brouberol@deploy2002> |
helmfile [dse-k8s-eqiad] START helmfile.d/admin 'apply'. |
[production] |
| 12:43 |
<klausman@deploy2002> |
helmfile [ml-serve-eqiad] DONE helmfile.d/admin 'apply'. |
[production] |
| 12:43 |
<klausman@deploy2002> |
helmfile [ml-serve-eqiad] START helmfile.d/admin 'apply'. |
[production] |
| 12:33 |
<cgoubert@deploy2002> |
helmfile [staging] DONE helmfile.d/services/rest-gateway: apply |
[production] |
| 12:33 |
<cgoubert@deploy2002> |
helmfile [staging] START helmfile.d/services/rest-gateway: apply |
[production] |
| 12:32 |
<cgoubert@deploy2002> |
helmfile [staging] DONE helmfile.d/services/rest-gateway: apply |
[production] |
| 12:32 |
<cgoubert@deploy2002> |
helmfile [staging] START helmfile.d/services/rest-gateway: apply |
[production] |
| 12:31 |
<cgoubert@deploy2002> |
helmfile [staging] DONE helmfile.d/services/rest-gateway: apply |
[production] |
| 12:30 |
<cgoubert@deploy2002> |
helmfile [staging] START helmfile.d/services/rest-gateway: apply |
[production] |
| 12:29 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on tcp-proxy7001.magru.wmnet with reason: host reimage |
[production] |
| 12:26 |
<cgoubert@deploy2002> |
helmfile [staging] DONE helmfile.d/services/rest-gateway: apply |
[production] |
| 12:23 |
<jmm@cumin2002> |
START - Cookbook sre.hosts.downtime for 2:00:00 on tcp-proxy7001.magru.wmnet with reason: host reimage |
[production] |
| 12:20 |
<cgoubert@deploy2002> |
helmfile [staging] START helmfile.d/services/rest-gateway: apply |
[production] |