2021-09-02
§
|
15:53 |
<jiji@cumin1001> |
START - Cookbook sre.hosts.decommission for hosts mc1020.eqiad.wmnet |
[production] |
15:40 |
<jiji@cumin1001> |
END (PASS) - Cookbook sre.hosts.decommission (exit_code=0) for hosts mc1019.eqiad.wmnet |
[production] |
15:31 |
<dzahn@deploy1002> |
helmfile [eqiad] Ran 'sync' command on namespace 'miscweb' for release 'main' . |
[production] |
15:28 |
<dzahn@deploy1002> |
helmfile [codfw] Ran 'sync' command on namespace 'miscweb' for release 'main' . |
[production] |
15:26 |
<jiji@cumin1001> |
START - Cookbook sre.hosts.decommission for hosts mc1019.eqiad.wmnet |
[production] |
15:16 |
<jiji@cumin1001> |
END (FAIL) - Cookbook sre.hosts.decommission (exit_code=99) for hosts mc1033.eqiad.wmnet |
[production] |
15:15 |
<jiji@cumin1001> |
END (PASS) - Cookbook sre.hosts.decommission (exit_code=0) for hosts mc1034.eqiad.wmnet |
[production] |
15:04 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'db2136 (re)pooling @ 100%: Slowly repool after reimage T288803', diff saved to https://phabricator.wikimedia.org/P17178 and previous config saved to /var/cache/conftool/dbconfig/20210902-150412-root.json |
[production] |
14:50 |
<jiji@cumin1001> |
START - Cookbook sre.hosts.decommission for hosts mc1034.eqiad.wmnet |
[production] |
14:49 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'db2136 (re)pooling @ 75%: Slowly repool after reimage T288803', diff saved to https://phabricator.wikimedia.org/P17177 and previous config saved to /var/cache/conftool/dbconfig/20210902-144908-root.json |
[production] |
14:49 |
<jiji@cumin1001> |
START - Cookbook sre.hosts.decommission for hosts mc1033.eqiad.wmnet |
[production] |
14:47 |
<cmjohnson@cumin1001> |
END (PASS) - Cookbook sre.dns.netbox (exit_code=0) |
[production] |
14:44 |
<cmjohnson@cumin1001> |
START - Cookbook sre.dns.netbox |
[production] |
14:39 |
<jayme@deploy1002> |
helmfile [codfw] Ran 'sync' command on namespace 'cxserver' for release 'production' . |
[production] |
14:38 |
<jayme@deploy1002> |
helmfile [eqiad] Ran 'sync' command on namespace 'cxserver' for release 'production' . |
[production] |
14:38 |
<jayme@deploy1002> |
helmfile [staging] Ran 'sync' command on namespace 'cxserver' for release 'staging' . |
[production] |
14:35 |
<jayme@deploy1002> |
helmfile [codfw] Ran 'sync' command on namespace 'wikifeeds' for release 'production' . |
[production] |
14:34 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'db2136 (re)pooling @ 50%: Slowly repool after reimage T288803', diff saved to https://phabricator.wikimedia.org/P17176 and previous config saved to /var/cache/conftool/dbconfig/20210902-143405-root.json |
[production] |
14:33 |
<jayme@deploy1002> |
helmfile [eqiad] Ran 'sync' command on namespace 'wikifeeds' for release 'production' . |
[production] |
14:32 |
<jayme@deploy1002> |
helmfile [staging] Ran 'sync' command on namespace 'wikifeeds' for release 'staging' . |
[production] |
14:22 |
<moritzm> |
installing exiv2 security updates |
[production] |
14:19 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'db2136 (re)pooling @ 25%: Slowly repool after reimage T288803', diff saved to https://phabricator.wikimedia.org/P17175 and previous config saved to /var/cache/conftool/dbconfig/20210902-141901-root.json |
[production] |
14:13 |
<moritzm> |
installing ffmpeg security updates |
[production] |
14:03 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'db2136 (re)pooling @ 10%: Slowly repool after reimage T288803', diff saved to https://phabricator.wikimedia.org/P17174 and previous config saved to /var/cache/conftool/dbconfig/20210902-140357-root.json |
[production] |
14:00 |
<jayme@deploy1002> |
helmfile [codfw] Ran 'sync' command on namespace 'zotero' for release 'production' . |
[production] |
13:57 |
<jayme@deploy1002> |
helmfile [eqiad] Ran 'sync' command on namespace 'zotero' for release 'production' . |
[production] |
13:55 |
<jayme@deploy1002> |
helmfile [staging] Ran 'sync' command on namespace 'zotero' for release 'staging' . |
[production] |
13:48 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'Depool db2136 for upgrade', diff saved to https://phabricator.wikimedia.org/P17173 and previous config saved to /var/cache/conftool/dbconfig/20210902-134838-marostegui.json |
[production] |
13:44 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'db2119 (re)pooling @ 100%: Slowly repool after reimage T288803', diff saved to https://phabricator.wikimedia.org/P17172 and previous config saved to /var/cache/conftool/dbconfig/20210902-134448-root.json |
[production] |
13:42 |
<jayme@deploy1002> |
helmfile [codfw] Ran 'sync' command on namespace 'citoid' for release 'production' . |
[production] |
13:42 |
<jayme@deploy1002> |
helmfile [eqiad] Ran 'sync' command on namespace 'citoid' for release 'production' . |
[production] |
13:41 |
<jayme@deploy1002> |
helmfile [staging] Ran 'sync' command on namespace 'citoid' for release 'staging' . |
[production] |
13:39 |
<jayme@deploy1002> |
helmfile [codfw] Ran 'sync' command on namespace 'termbox' for release 'production' . |
[production] |
13:39 |
<jayme@deploy1002> |
helmfile [eqiad] Ran 'sync' command on namespace 'termbox' for release 'production' . |
[production] |
13:38 |
<jayme@deploy1002> |
helmfile [staging] Ran 'sync' command on namespace 'termbox' for release 'test' . |
[production] |
13:38 |
<jayme@deploy1002> |
helmfile [staging] Ran 'sync' command on namespace 'termbox' for release 'staging' . |
[production] |
13:36 |
<jayme@deploy1002> |
helmfile [codfw] Ran 'sync' command on namespace 'blubberoid' for release 'production' . |
[production] |
13:35 |
<jayme@deploy1002> |
helmfile [eqiad] Ran 'sync' command on namespace 'blubberoid' for release 'production' . |
[production] |
13:29 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'db2119 (re)pooling @ 75%: Slowly repool after reimage T288803', diff saved to https://phabricator.wikimedia.org/P17171 and previous config saved to /var/cache/conftool/dbconfig/20210902-132945-root.json |
[production] |
13:29 |
<jayme@deploy1002> |
helmfile [staging] Ran 'sync' command on namespace 'blubberoid' for release 'staging' . |
[production] |
13:24 |
<jbond@cumin1001> |
END (FAIL) - Cookbook sre.hosts.downtime (exit_code=99) for 2:00:00 on sretest1002.eqiad.wmnet with reason: REIMAGE |
[production] |
13:22 |
<jbond@cumin1001> |
START - Cookbook sre.hosts.downtime for 2:00:00 on sretest1002.eqiad.wmnet with reason: REIMAGE |
[production] |
13:14 |
<jbond> |
reimage sretest1002 (not sretest1001) |
[production] |
13:14 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'db2119 (re)pooling @ 50%: Slowly repool after reimage T288803', diff saved to https://phabricator.wikimedia.org/P17169 and previous config saved to /var/cache/conftool/dbconfig/20210902-131441-root.json |
[production] |
13:14 |
<jbond> |
reimage sretest1001 |
[production] |
12:59 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'db2119 (re)pooling @ 25%: Slowly repool after reimage T288803', diff saved to https://phabricator.wikimedia.org/P17168 and previous config saved to /var/cache/conftool/dbconfig/20210902-125937-root.json |
[production] |
12:55 |
<jbond> |
disable puppet fleet wide to roll out 715728 |
[production] |
12:44 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'db2119 (re)pooling @ 10%: Slowly repool after reimage T288803', diff saved to https://phabricator.wikimedia.org/P17167 and previous config saved to /var/cache/conftool/dbconfig/20210902-124434-root.json |
[production] |
12:42 |
<marostegui> |
Upgrade db2119 |
[production] |
12:41 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'Depool db2119 for upgrade', diff saved to https://phabricator.wikimedia.org/P17166 and previous config saved to /var/cache/conftool/dbconfig/20210902-124102-marostegui.json |
[production] |