2023-03-07
§
|
15:17 |
<marostegui@cumin1001> |
START - Cookbook sre.hosts.downtime for 12:00:00 on db2099.codfw.wmnet with reason: Maintenance |
[production] |
15:16 |
<sukhe@cumin2002> |
START - Cookbook sre.hosts.downtime for 2:00:00 on durum1001.eqiad.wmnet with reason: host reimage |
[production] |
15:16 |
<Emperor> |
pool ms-fe1009 T329073 |
[production] |
15:16 |
<marostegui@cumin1001> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 12:00:00 on db1102.eqiad.wmnet with reason: Maintenance |
[production] |
15:16 |
<marostegui@cumin1001> |
START - Cookbook sre.hosts.downtime for 12:00:00 on db1102.eqiad.wmnet with reason: Maintenance |
[production] |
15:16 |
<Emperor> |
pool moss-fe1001 T329073 |
[production] |
15:15 |
<akosiaris@deploy1002> |
helmfile [eqiad] START helmfile.d/services/mw-web: sync |
[production] |
15:15 |
<akosiaris@deploy1002> |
helmfile [eqiad] [main] DONE helmfile.d/services/mw-jobrunner : sync |
[production] |
15:15 |
<akosiaris@deploy1002> |
helmfile [eqiad] [canary] DONE helmfile.d/services/mw-jobrunner : sync |
[production] |
15:15 |
<akosiaris@deploy1002> |
helmfile [eqiad] [canary] START helmfile.d/services/mw-jobrunner : sync |
[production] |
15:15 |
<akosiaris@deploy1002> |
helmfile [eqiad] [main] START helmfile.d/services/mw-jobrunner : sync |
[production] |
15:15 |
<akosiaris@deploy1002> |
helmfile [eqiad] DONE helmfile.d/services/mw-debug: sync |
[production] |
15:11 |
<akosiaris@deploy1002> |
helmfile [eqiad] START helmfile.d/services/mw-debug: sync |
[production] |
15:11 |
<akosiaris@deploy1002> |
helmfile [eqiad] DONE helmfile.d/services/mw-api-int: sync |
[production] |
15:11 |
<akosiaris@deploy1002> |
helmfile [eqiad] START helmfile.d/services/mw-api-int: sync |
[production] |
15:11 |
<cmjohnson@cumin1001> |
START - Cookbook sre.hardware.upgrade-firmware upgrade firmware for hosts ['cloudcephosd1039'] |
[production] |
15:11 |
<akosiaris@deploy1002> |
helmfile [eqiad] DONE helmfile.d/services/mw-api-ext: sync |
[production] |
15:09 |
<cmjohnson@cumin1001> |
END (PASS) - Cookbook sre.hardware.upgrade-firmware (exit_code=0) upgrade firmware for hosts ['cloudcephosd1038'] |
[production] |
15:06 |
<akosiaris@deploy1002> |
helmfile [eqiad] START helmfile.d/services/mw-api-ext: sync |
[production] |
15:06 |
<sukhe@cumin2002> |
START - Cookbook sre.ganeti.reimage for host durum1001.eqiad.wmnet with OS bullseye |
[production] |
15:06 |
<akosiaris@deploy1002> |
helmfile [eqiad] DONE helmfile.d/services/mobileapps: sync |
[production] |
15:06 |
<akosiaris@deploy1002> |
helmfile [eqiad] START helmfile.d/services/mobileapps: sync |
[production] |
15:06 |
<akosiaris@deploy1002> |
helmfile [eqiad] DONE helmfile.d/services/miscweb: sync |
[production] |
15:04 |
<akosiaris@cumin1001> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on kubernetes1021.eqiad.wmnet with reason: host reimage |
[production] |
15:04 |
<bblack> |
dns1001 - restarted prometheus-bird-exporter |
[production] |
15:04 |
<akosiaris@deploy1002> |
helmfile [eqiad] START helmfile.d/services/miscweb: sync |
[production] |
15:04 |
<akosiaris@deploy1002> |
helmfile [eqiad] DONE helmfile.d/services/mathoid: sync |
[production] |
15:04 |
<akosiaris@deploy1002> |
helmfile [eqiad] START helmfile.d/services/mathoid: sync |
[production] |
15:04 |
<akosiaris@deploy1002> |
helmfile [eqiad] DONE helmfile.d/services/linkrecommendation: sync |
[production] |
15:02 |
<akosiaris@deploy1002> |
helmfile [eqiad] START helmfile.d/services/linkrecommendation: sync |
[production] |
15:02 |
<akosiaris@deploy1002> |
helmfile [eqiad] DONE helmfile.d/services/image-suggestion: sync |
[production] |
15:02 |
<akosiaris@deploy1002> |
helmfile [eqiad] START helmfile.d/services/image-suggestion: sync |
[production] |
15:02 |
<akosiaris@deploy1002> |
helmfile [eqiad] DONE helmfile.d/services/SERVICE_NAME: sync |
[production] |
15:02 |
<akosiaris@deploy1002> |
helmfile [eqiad] START helmfile.d/services/SERVICE_NAME: sync |
[production] |
15:02 |
<akosiaris@deploy1002> |
helmfile [eqiad] DONE helmfile.d/services/eventstreams-internal: sync |
[production] |
15:02 |
<akosiaris@deploy1002> |
helmfile [eqiad] START helmfile.d/services/eventstreams-internal: sync |
[production] |
15:01 |
<akosiaris@deploy1002> |
helmfile [eqiad] DONE helmfile.d/services/eventstreams: sync |
[production] |
15:01 |
<akosiaris@cumin1001> |
START - Cookbook sre.hosts.downtime for 2:00:00 on kubernetes1021.eqiad.wmnet with reason: host reimage |
[production] |
15:01 |
<akosiaris@deploy1002> |
helmfile [eqiad] START helmfile.d/services/eventstreams: sync |
[production] |
15:01 |
<akosiaris@deploy1002> |
helmfile [eqiad] DONE helmfile.d/services/eventgate-main: sync |
[production] |
15:01 |
<sukhe> |
repooling dns1001: authdns-update can now be run again |
[production] |
15:01 |
<akosiaris@deploy1002> |
helmfile [eqiad] START helmfile.d/services/eventgate-main: sync |
[production] |
15:01 |
<akosiaris@deploy1002> |
helmfile [eqiad] DONE helmfile.d/services/eventgate-logging-external: sync |
[production] |
15:00 |
<akosiaris@deploy1002> |
helmfile [eqiad] START helmfile.d/services/eventgate-logging-external: sync |
[production] |
15:00 |
<akosiaris@deploy1002> |
helmfile [eqiad] DONE helmfile.d/services/eventgate-analytics-external: sync |
[production] |
15:00 |
<akosiaris@deploy1002> |
helmfile [eqiad] START helmfile.d/services/eventgate-analytics-external: sync |
[production] |
15:00 |
<akosiaris@deploy1002> |
helmfile [eqiad] DONE helmfile.d/services/eventgate-analytics: sync |
[production] |
15:00 |
<akosiaris@deploy1002> |
helmfile [eqiad] START helmfile.d/services/eventgate-analytics: sync |
[production] |
15:00 |
<akosiaris@deploy1002> |
helmfile [eqiad] DONE helmfile.d/services/echostore: sync |
[production] |
14:59 |
<akosiaris@deploy1002> |
helmfile [eqiad] START helmfile.d/services/echostore: sync |
[production] |