2020-06-12
§
|
15:37 |
<pt1979@cumin2001> |
START - Cookbook sre.hosts.downtime |
[production] |
15:36 |
<hnowlan@deploy1001> |
helmfile [EQIAD] Ran 'sync' command on namespace 'changeprop' for release 'production' . |
[production] |
15:27 |
<akosiaris@cumin1001> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) |
[production] |
15:25 |
<hnowlan@deploy1001> |
helmfile [EQIAD] Ran 'sync' command on namespace 'changeprop' for release 'production' . |
[production] |
15:24 |
<akosiaris@cumin1001> |
END (FAIL) - Cookbook sre.hosts.downtime (exit_code=99) |
[production] |
15:24 |
<akosiaris@cumin1001> |
END (FAIL) - Cookbook sre.hosts.downtime (exit_code=99) |
[production] |
15:24 |
<akosiaris@cumin1001> |
END (FAIL) - Cookbook sre.hosts.downtime (exit_code=99) |
[production] |
15:24 |
<akosiaris@cumin1001> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) |
[production] |
15:22 |
<akosiaris@cumin1001> |
END (FAIL) - Cookbook sre.hosts.downtime (exit_code=99) |
[production] |
15:22 |
<akosiaris@cumin1001> |
END (FAIL) - Cookbook sre.hosts.downtime (exit_code=99) |
[production] |
15:22 |
<akosiaris@cumin1001> |
START - Cookbook sre.hosts.downtime |
[production] |
15:22 |
<akosiaris@cumin1001> |
START - Cookbook sre.hosts.downtime |
[production] |
15:22 |
<akosiaris@cumin1001> |
START - Cookbook sre.hosts.downtime |
[production] |
15:22 |
<akosiaris@cumin1001> |
START - Cookbook sre.hosts.downtime |
[production] |
15:22 |
<akosiaris@cumin1001> |
START - Cookbook sre.hosts.downtime |
[production] |
15:22 |
<akosiaris@cumin1001> |
START - Cookbook sre.hosts.downtime |
[production] |
15:22 |
<akosiaris@cumin1001> |
START - Cookbook sre.hosts.downtime |
[production] |
14:51 |
<elukey> |
repool mw1384 as test |
[production] |
14:31 |
<akosiaris@deploy1001> |
helmfile [CODFW] Ran 'sync' command on namespace 'changeprop' for release 'production' . |
[production] |
14:30 |
<akosiaris> |
bump cpu limits for changeprop another 50% |
[production] |
14:30 |
<akosiaris@deploy1001> |
helmfile [EQIAD] Ran 'sync' command on namespace 'changeprop' for release 'production' . |
[production] |
13:36 |
<akosiaris@deploy1001> |
helmfile [CODFW] Ran 'sync' command on namespace 'changeprop' for release 'production' . |
[production] |
13:34 |
<akosiaris> |
update changeprop in eqiad+codfw for higher CPU limits |
[production] |
13:34 |
<akosiaris@deploy1001> |
helmfile [EQIAD] Ran 'sync' command on namespace 'changeprop' for release 'production' . |
[production] |
13:12 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'Repool db1088 after schema change', diff saved to https://phabricator.wikimedia.org/P11483 and previous config saved to /var/cache/conftool/dbconfig/20200612-131205-marostegui.json |
[production] |
12:40 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'Depool db1088 for schema change', diff saved to https://phabricator.wikimedia.org/P11482 and previous config saved to /var/cache/conftool/dbconfig/20200612-124015-marostegui.json |
[production] |
12:18 |
<filippo@cumin1001> |
END (PASS) - Cookbook sre.hosts.upgrade-and-reboot (exit_code=0) |
[production] |
11:52 |
<filippo@cumin1001> |
START - Cookbook sre.hosts.upgrade-and-reboot |
[production] |
11:23 |
<jmm@cumin1001> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) |
[production] |
11:19 |
<jmm@cumin1001> |
START - Cookbook sre.hosts.reboot-single |
[production] |
11:15 |
<moritzm> |
failover ganeti master in ulsfo to ganeti4003 |
[production] |
11:14 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'Pool db2080 and db2084 into s8 T253217', diff saved to https://phabricator.wikimedia.org/P11481 and previous config saved to /var/cache/conftool/dbconfig/20200612-111422-marostegui.json |
[production] |
11:11 |
<jmm@cumin1001> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) |
[production] |
11:07 |
<jmm@cumin1001> |
START - Cookbook sre.hosts.reboot-single |
[production] |
11:02 |
<jmm@cumin1001> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) |
[production] |
10:58 |
<jmm@cumin1001> |
START - Cookbook sre.hosts.reboot-single |
[production] |
10:39 |
<jmm@cumin1001> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) |
[production] |
10:36 |
<jmm@cumin1001> |
START - Cookbook sre.hosts.reboot-single |
[production] |
10:33 |
<moritzm> |
rolling restart of the ulsfo ganeti cluster |
[production] |
10:21 |
<filippo@cumin1001> |
END (PASS) - Cookbook sre.hosts.upgrade-and-reboot (exit_code=0) |
[production] |
10:02 |
<filippo@cumin1001> |
START - Cookbook sre.hosts.upgrade-and-reboot |
[production] |
10:01 |
<jmm@cumin1001> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) |
[production] |
10:01 |
<filippo@cumin1001> |
END (FAIL) - Cookbook sre.hosts.reboot-single (exit_code=1) |
[production] |
10:01 |
<filippo@cumin1001> |
START - Cookbook sre.hosts.reboot-single |
[production] |
10:01 |
<jmm@cumin1001> |
START - Cookbook sre.hosts.downtime |
[production] |
09:58 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'Include db2084 in dbctl, depooled', diff saved to https://phabricator.wikimedia.org/P11480 and previous config saved to /var/cache/conftool/dbconfig/20200612-095855-marostegui.json |
[production] |
09:58 |
<godog> |
roll-restart thanos-fe / thanos-be for microcode updates |
[production] |
08:51 |
<elukey> |
restart gerrit on gerrit1001 |
[production] |
08:48 |
<elukey> |
update cr1/cr2 analytics filters for T252767 and T252675 |
[production] |
08:44 |
<marostegui> |
Compress InnoDB on db2092 - T254462 |
[production] |