2020-09-15
§
|
09:01 |
<elukey@cumin1001> |
START - Cookbook sre.zookeeper.roll-restart-zookeeper |
[production] |
08:59 |
<elukey@cumin1001> |
END (PASS) - Cookbook sre.zookeeper.roll-restart-zookeeper (exit_code=0) |
[production] |
08:53 |
<elukey> |
roll restart druid zookeeper clusters for openjdk upgrades |
[production] |
08:53 |
<elukey@cumin1001> |
START - Cookbook sre.zookeeper.roll-restart-zookeeper |
[production] |
08:52 |
<elukey@cumin1001> |
END (PASS) - Cookbook sre.druid.roll-restart-workers (exit_code=0) |
[production] |
08:04 |
<elukey@cumin1001> |
START - Cookbook sre.druid.roll-restart-workers |
[production] |
08:02 |
<elukey@cumin1001> |
END (PASS) - Cookbook sre.druid.roll-restart-workers (exit_code=0) |
[production] |
07:19 |
<elukey> |
roll restart druid cluster to pick up openjdk updates |
[production] |
07:19 |
<elukey@cumin1001> |
START - Cookbook sre.druid.roll-restart-workers |
[production] |
2020-09-08
§
|
18:22 |
<elukey> |
rm /srv/prometheus/ops/targets/mjolnir_msearch_eqiad.yaml on prometheus100[3,4] as cleanup after https://gerrit.wikimedia.org/r/621988 - T260305 |
[production] |
15:30 |
<elukey> |
roll restart of hadoop master daemons on an-master100[1,2] after the cookbook failed |
[production] |
15:26 |
<elukey@cumin1001> |
END (FAIL) - Cookbook sre.hadoop.roll-restart-masters (exit_code=99) |
[production] |
15:18 |
<elukey@cumin1001> |
START - Cookbook sre.hadoop.roll-restart-masters |
[production] |
13:34 |
<elukey@cumin1001> |
END (PASS) - Cookbook sre.hadoop.roll-restart-masters (exit_code=0) |
[production] |
13:20 |
<elukey@cumin1001> |
START - Cookbook sre.hadoop.roll-restart-masters |
[production] |
13:14 |
<elukey@cumin1001> |
END (FAIL) - Cookbook sre.hadoop.roll-restart-masters (exit_code=99) |
[production] |
13:14 |
<elukey@cumin1001> |
START - Cookbook sre.hadoop.roll-restart-masters |
[production] |
07:44 |
<elukey> |
roll restart kafka daemons on kafka-jumbo100[7-9] to pick up openjdk upgrades |
[production] |
06:23 |
<elukey> |
roll restart of Hadoop master daemons on an-master100[1,2] to pick up new openjdk settings |
[production] |
2020-09-07
§
|
16:12 |
<elukey@cumin1001> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) |
[production] |
16:10 |
<elukey@cumin1001> |
START - Cookbook sre.hosts.downtime |
[production] |
14:27 |
<elukey@cumin1001> |
END (FAIL) - Cookbook sre.hosts.downtime (exit_code=99) |
[production] |
14:25 |
<elukey@cumin1001> |
END (FAIL) - Cookbook sre.hosts.downtime (exit_code=99) |
[production] |
14:23 |
<elukey@cumin1001> |
START - Cookbook sre.hosts.downtime |
[production] |
14:23 |
<elukey@cumin1001> |
START - Cookbook sre.hosts.downtime |
[production] |
13:28 |
<elukey@cumin1001> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) |
[production] |
13:26 |
<elukey@cumin1001> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) |
[production] |
13:25 |
<elukey@cumin1001> |
START - Cookbook sre.hosts.downtime |
[production] |
13:23 |
<elukey@cumin1001> |
START - Cookbook sre.hosts.downtime |
[production] |
10:37 |
<elukey@cumin1001> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) |
[production] |
10:35 |
<elukey@cumin1001> |
START - Cookbook sre.hosts.downtime |
[production] |
10:02 |
<elukey@cumin1001> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) |
[production] |
10:00 |
<elukey@cumin1001> |
START - Cookbook sre.hosts.downtime |
[production] |
09:09 |
<elukey@cumin1001> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) |
[production] |
09:06 |
<elukey@cumin1001> |
START - Cookbook sre.hosts.downtime |
[production] |