2022-01-13
§
|
15:47 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.reboot-vm for VM aphlict1001.eqiad.wmnet |
[production] |
15:42 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.ganeti.reboot-vm (exit_code=0) for VM flowspec1001.eqiad.wmnet |
[production] |
15:40 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.reboot-vm for VM flowspec1001.eqiad.wmnet |
[production] |
15:36 |
<bking@cumin1001> |
END (FAIL) - Cookbook sre.hosts.reimage (exit_code=99) for host elastic2051.codfw.wmnet with OS stretch |
[production] |
15:28 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.ganeti.reboot-vm (exit_code=0) for VM ldap-replica1004.wikimedia.org |
[production] |
15:26 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.reboot-vm for VM ldap-replica1004.wikimedia.org |
[production] |
15:23 |
<hnowlan@cumin1001> |
START - Cookbook sre.hosts.reimage for host restbase2009.codfw.wmnet with OS buster |
[production] |
15:23 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.ganeti.reboot-vm (exit_code=0) for VM ldap-replica1003.wikimedia.org |
[production] |
15:21 |
<hnowlan@cumin1001> |
END (ERROR) - Cookbook sre.hosts.reimage (exit_code=97) for host restbase2009.codfw.wmnet with OS buster |
[production] |
15:20 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.reboot-vm for VM ldap-replica1003.wikimedia.org |
[production] |
15:17 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.ganeti.reboot-vm (exit_code=0) for VM seaborgium.wikimedia.org |
[production] |
15:15 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.reboot-vm for VM seaborgium.wikimedia.org |
[production] |
15:10 |
<bking@cumin1001> |
START - Cookbook sre.hosts.reimage for host elastic2051.codfw.wmnet with OS stretch |
[production] |
15:07 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.ganeti.reboot-vm (exit_code=0) for VM urldownloader1002.wikimedia.org |
[production] |
15:03 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.reboot-vm for VM urldownloader1002.wikimedia.org |
[production] |
14:56 |
<mmandere> |
cp3053: upgrade varnish to 6.0.9-1wm1 T298758 |
[production] |
14:56 |
<hnowlan@cumin1001> |
START - Cookbook sre.hosts.reimage for host restbase2009.codfw.wmnet with OS buster |
[production] |
14:47 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.ganeti.reboot-vm (exit_code=0) for VM idp1001.wikimedia.org |
[production] |
14:47 |
<moritzm> |
systemctl reset-failed ifup@ens5.service on idp1001 T273026 |
[production] |
14:39 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.reboot-vm for VM idp1001.wikimedia.org |
[production] |
14:15 |
<moritzm> |
switch ml-etcd1003 to DRBD (needed to be able to shuffle instances around for the Ganeti buster update) |
[production] |
14:14 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1:00:00 on ml-etcd1003.eqiad.wmnet with reason: switch to drbd storage |
[production] |
14:14 |
<jmm@cumin2002> |
START - Cookbook sre.hosts.downtime for 1:00:00 on ml-etcd1003.eqiad.wmnet with reason: switch to drbd storage |
[production] |
13:53 |
<mmandere@cumin1001> |
conftool action : set/pooled=yes; selector: name=cp6009.drmrs.wmnet |
[production] |
13:49 |
<moritzm> |
switch ml-etcd1002 to DRBD (needed to be able to shuffle instances around for the Ganeti buster update) |
[production] |
13:48 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1:00:00 on ml-etcd1002.eqiad.wmnet with reason: switch to drbd storage |
[production] |
13:48 |
<jmm@cumin2002> |
START - Cookbook sre.hosts.downtime for 1:00:00 on ml-etcd1002.eqiad.wmnet with reason: switch to drbd storage |
[production] |
13:45 |
<mmandere@cumin1001> |
conftool action : set/pooled=yes; selector: name=cp6001.drmrs.wmnet |
[production] |
13:35 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.ganeti.reboot-vm (exit_code=0) for VM urldownloader1001.wikimedia.org |
[production] |
13:33 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.reboot-vm for VM urldownloader1001.wikimedia.org |
[production] |
13:23 |
<moritzm> |
switch ml-etcd1001 to DRBD (needed to be able to shuffle instances around for the Ganeti buster update) |
[production] |
13:21 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1:00:00 on ml-etcd1001.eqiad.wmnet with reason: switch to drbd storage |
[production] |
13:21 |
<jmm@cumin2002> |
START - Cookbook sre.hosts.downtime for 1:00:00 on ml-etcd1001.eqiad.wmnet with reason: switch to drbd storage |
[production] |
13:10 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.ganeti.reboot-vm (exit_code=0) for VM cloudbackup1001-dev.eqiad.wmnet |
[production] |
13:08 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.reboot-vm for VM cloudbackup1001-dev.eqiad.wmnet |
[production] |
12:43 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'es1022 (re)pooling @ 100%: repooling after reimage', diff saved to https://phabricator.wikimedia.org/P18731 and previous config saved to /var/cache/conftool/dbconfig/20220113-124307-root.json |
[production] |
12:43 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'Remove contributions group from s3 eqiad T263127', diff saved to https://phabricator.wikimedia.org/P18730 and previous config saved to /var/cache/conftool/dbconfig/20220113-124300-marostegui.json |
[production] |
12:41 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'Remove all special groups from s3 codfw T263127', diff saved to https://phabricator.wikimedia.org/P18729 and previous config saved to /var/cache/conftool/dbconfig/20220113-124140-marostegui.json |
[production] |
12:37 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'Remove weight from es1021', diff saved to https://phabricator.wikimedia.org/P18728 and previous config saved to /var/cache/conftool/dbconfig/20220113-123744-marostegui.json |
[production] |
12:30 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.ganeti.reboot-vm (exit_code=0) for VM cloudbackup1002-dev.eqiad.wmnet |
[production] |
12:28 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'es1022 (re)pooling @ 75%: repooling after reimage', diff saved to https://phabricator.wikimedia.org/P18727 and previous config saved to /var/cache/conftool/dbconfig/20220113-122803-root.json |
[production] |
12:27 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.reboot-vm for VM cloudbackup1002-dev.eqiad.wmnet |
[production] |
12:23 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.ganeti.reboot-vm (exit_code=0) for VM ldap-corp1001.wikimedia.org |
[production] |
12:21 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.reboot-vm for VM ldap-corp1001.wikimedia.org |
[production] |
12:13 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'es1022 (re)pooling @ 60%: repooling after reimage', diff saved to https://phabricator.wikimedia.org/P18726 and previous config saved to /var/cache/conftool/dbconfig/20220113-121300-root.json |
[production] |
12:03 |
<btullis@cumin1001> |
END (PASS) - Cookbook sre.ganeti.reboot-vm (exit_code=0) for VM eventlog1003.eqiad.wmnet |
[production] |
11:59 |
<btullis@cumin1001> |
START - Cookbook sre.ganeti.reboot-vm for VM eventlog1003.eqiad.wmnet |
[production] |
11:57 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'es1022 (re)pooling @ 50%: repooling after reimage', diff saved to https://phabricator.wikimedia.org/P18725 and previous config saved to /var/cache/conftool/dbconfig/20220113-115756-root.json |
[production] |
11:42 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'es1022 (re)pooling @ 40%: repooling after reimage', diff saved to https://phabricator.wikimedia.org/P18724 and previous config saved to /var/cache/conftool/dbconfig/20220113-114252-root.json |
[production] |
11:34 |
<btullis@cumin1001> |
END (PASS) - Cookbook sre.ganeti.reboot-vm (exit_code=0) for VM kafka-test1010.eqiad.wmnet |
[production] |