2021-09-10
§
|
21:28 |
<legoktm@deploy1002> |
helmfile [codfw] Ran 'sync' command on namespace 'shellbox-syntaxhighlight' for release 'main' . |
[production] |
21:27 |
<legoktm@deploy1002> |
helmfile [eqiad] Ran 'sync' command on namespace 'shellbox-syntaxhighlight' for release 'main' . |
[production] |
21:21 |
<legoktm@deploy1002> |
helmfile [staging] Ran 'sync' command on namespace 'shellbox-syntaxhighlight' for release 'main' . |
[production] |
20:46 |
<jhuneidi@deploy1002> |
helmfile [eqiad] Ran 'sync' command on namespace 'blubberoid' for release 'production' . |
[production] |
20:44 |
<jhuneidi@deploy1002> |
helmfile [codfw] Ran 'sync' command on namespace 'blubberoid' for release 'production' . |
[production] |
20:42 |
<jhuneidi@deploy1002> |
helmfile [staging] Ran 'sync' command on namespace 'blubberoid' for release 'staging' . |
[production] |
18:34 |
<volans@cumin1001> |
END (FAIL) - Cookbook sre.experimental.reimage (exit_code=99) for host sretest1001.eqiad.wmnet |
[production] |
18:08 |
<volans@cumin1001> |
START - Cookbook sre.experimental.reimage for host sretest1001.eqiad.wmnet |
[production] |
17:16 |
<pt1979@cumin2002> |
END (FAIL) - Cookbook sre.hosts.downtime (exit_code=99) for 2:00:00 on puppetmaster2005.codfw.wmnet with reason: REIMAGE |
[production] |
17:14 |
<pt1979@cumin2002> |
START - Cookbook sre.hosts.downtime for 2:00:00 on puppetmaster2005.codfw.wmnet with reason: REIMAGE |
[production] |
16:42 |
<pt1979@cumin2002> |
END (FAIL) - Cookbook sre.hosts.downtime (exit_code=99) for 2:00:00 on puppetmaster2004.codfw.wmnet with reason: REIMAGE |
[production] |
16:40 |
<pt1979@cumin2002> |
START - Cookbook sre.hosts.downtime for 2:00:00 on puppetmaster2004.codfw.wmnet with reason: REIMAGE |
[production] |
16:14 |
<volans@cumin1001> |
END (FAIL) - Cookbook sre.experimental.reimage (exit_code=99) for host sretest1001.eqiad.wmnet |
[production] |
16:03 |
<volans@cumin1001> |
START - Cookbook sre.experimental.reimage for host sretest1001.eqiad.wmnet |
[production] |
15:39 |
<volans@cumin1001> |
END (FAIL) - Cookbook sre.experimental.reimage (exit_code=99) for host sretest1001.eqiad.wmnet |
[production] |
15:27 |
<volans@cumin1001> |
START - Cookbook sre.experimental.reimage for host sretest1001.eqiad.wmnet |
[production] |
14:48 |
<jiji@deploy1002> |
helmfile [eqiad] Ran 'sync' command on namespace 'mwdebug' for release 'pinkunicorn' . |
[production] |
14:43 |
<jiji@deploy1002> |
helmfile [codfw] Ran 'sync' command on namespace 'mwdebug' for release 'pinkunicorn' . |
[production] |
13:54 |
<jiji@deploy1002> |
helmfile [codfw] Ran 'sync' command on namespace 'mwdebug' for release 'pinkunicorn' . |
[production] |
09:31 |
<XioNoX> |
push pfw policies - T290611 |
[production] |
09:07 |
<mutante> |
planet - deleted all state files for all languages, running fresh update via systemctl start for all languages after proxy changes (T285251) |
[production] |
08:37 |
<jynus> |
upgrade and restart db2139 |
[production] |
08:14 |
<elukey@deploy1002> |
helmfile [ml-serve-eqiad] DONE helmfile.d/admin 'sync'. |
[production] |
08:14 |
<elukey@deploy1002> |
helmfile [ml-serve-eqiad] START helmfile.d/admin 'sync'. |
[production] |
08:14 |
<elukey@deploy1002> |
helmfile [ml-serve-eqiad] DONE helmfile.d/admin 'sync'. |
[production] |
08:13 |
<elukey@deploy1002> |
helmfile [ml-serve-eqiad] START helmfile.d/admin 'sync'. |
[production] |
08:12 |
<elukey@deploy1002> |
helmfile [ml-serve-eqiad] DONE helmfile.d/admin 'sync'. |
[production] |
08:12 |
<elukey@deploy1002> |
helmfile [ml-serve-eqiad] START helmfile.d/admin 'sync'. |
[production] |
07:58 |
<jayme> |
updating rsyslog to 8.1901.0-1~bpo9+wmf2 on kubernetes-workers - T289766 |
[production] |
07:57 |
<moritzm> |
installing ntfs-3g security updates |
[production] |
07:46 |
<jayme@deploy1002> |
helmfile [ml-serve-eqiad] DONE helmfile.d/admin 'sync'. |
[production] |
07:45 |
<jayme@deploy1002> |
helmfile [ml-serve-eqiad] START helmfile.d/admin 'sync'. |
[production] |
07:31 |
<elukey@deploy1002> |
helmfile [ml-serve-eqiad] DONE helmfile.d/admin 'sync'. |
[production] |
07:31 |
<elukey@deploy1002> |
helmfile [ml-serve-eqiad] START helmfile.d/admin 'sync'. |
[production] |
07:25 |
<jayme> |
updating rsyslog to 8.1901.0-1~bpo9+wmf2 on kubernetes-staging - T289766 |
[production] |
07:19 |
<jayme> |
imported rsyslog 8.1901.0-1~bpo9+wmf2 to stretch-wikimedia - T289766 |
[production] |
06:56 |
<effie> |
disable puppet on deploy1002 and mw2254 |
[production] |
06:29 |
<jayme@deploy1002> |
helmfile [codfw] DONE helmfile.d/admin 'sync'. |
[production] |
06:27 |
<jayme@deploy1002> |
helmfile [codfw] START helmfile.d/admin 'sync'. |
[production] |
06:26 |
<jayme@deploy1002> |
helmfile [eqiad] DONE helmfile.d/admin 'sync'. |
[production] |
06:26 |
<jayme@deploy1002> |
helmfile [eqiad] START helmfile.d/admin 'sync'. |
[production] |
06:02 |
<elukey@puppetmaster1001> |
conftool action : set/pooled=inactive; selector: name=mw2280.codfw.wmnet |
[production] |
05:59 |
<jiji@deploy1002> |
helmfile [eqiad] Ran 'sync' command on namespace 'mwdebug' for release 'pinkunicorn' . |
[production] |
05:56 |
<elukey> |
powercycle mw2280 - no tty available in mgmt, no ssh, host frozen |
[production] |
05:55 |
<elukey@puppetmaster1001> |
conftool action : set/pooled=no; selector: name=mw2280.codfw.wmnet |
[production] |
05:54 |
<jiji@deploy1002> |
helmfile [codfw] Ran 'sync' command on namespace 'mwdebug' for release 'pinkunicorn' . |
[production] |
05:45 |
<jiji@deploy1002> |
helmfile [eqiad] Ran 'sync' command on namespace 'mwdebug' for release 'pinkunicorn' . |
[production] |