2022-01-13
§
|
17:52 |
<bking@cumin2002> |
START - Cookbook sre.hosts.reimage for host elastic2051.codfw.wmnet with OS stretch |
[production] |
17:49 |
<bking@cumin2002> |
END (FAIL) - Cookbook sre.hosts.reimage (exit_code=99) for host elastic2051.codfw.wmnet with OS stretch |
[production] |
17:45 |
<hnowlan@cumin1001> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on maps1005.eqiad.wmnet with reason: requires resync after planet sync |
[production] |
17:45 |
<hnowlan@cumin1001> |
START - Cookbook sre.hosts.downtime for 1 day, 0:00:00 on maps1005.eqiad.wmnet with reason: requires resync after planet sync |
[production] |
17:37 |
<hnowlan@cumin1001> |
END (FAIL) - Cookbook sre.postgresql.postgres-init (exit_code=99) |
[production] |
17:34 |
<hnowlan@cumin1001> |
START - Cookbook sre.postgresql.postgres-init |
[production] |
17:33 |
<hnowlan@cumin1001> |
END (FAIL) - Cookbook sre.postgresql.postgres-init (exit_code=99) |
[production] |
17:29 |
<hnowlan@cumin1001> |
START - Cookbook sre.postgresql.postgres-init |
[production] |
17:29 |
<hnowlan@cumin1001> |
END (FAIL) - Cookbook sre.postgresql.postgres-init (exit_code=99) |
[production] |
17:29 |
<hnowlan@cumin1001> |
START - Cookbook sre.postgresql.postgres-init |
[production] |
17:28 |
<hnowlan@cumin1001> |
END (FAIL) - Cookbook sre.postgresql.postgres-init (exit_code=99) |
[production] |
17:28 |
<hnowlan@cumin1001> |
START - Cookbook sre.postgresql.postgres-init |
[production] |
17:22 |
<bking@cumin2002> |
START - Cookbook sre.hosts.reimage for host elastic2051.codfw.wmnet with OS stretch |
[production] |
17:22 |
<bking@cumin2002> |
END (FAIL) - Cookbook sre.hosts.reimage (exit_code=99) for host elastic2051.codfw.wmnet with OS stretch |
[production] |
17:11 |
<bking@cumin2002> |
START - Cookbook sre.hosts.reimage for host elastic2051.codfw.wmnet with OS stretch |
[production] |
17:07 |
<bking@cumin2002> |
END (FAIL) - Cookbook sre.hosts.reimage (exit_code=99) for host elastic2051.codfw.wmnet with OS stretch |
[production] |
17:01 |
<hnowlan@cumin1001> |
END (FAIL) - Cookbook sre.hosts.reimage (exit_code=99) for host restbase2009.codfw.wmnet with OS buster |
[production] |
16:34 |
<hnowlan@cumin1001> |
START - Cookbook sre.hosts.reimage for host restbase2009.codfw.wmnet with OS buster |
[production] |
16:27 |
<moritzm> |
import maps-deduped-tilelist 0.0.5 to buster-wikimedia/main T297408 |
[production] |
16:02 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.ganeti.reboot-vm (exit_code=0) for VM cuminunpriv1001.eqiad.wmnet |
[production] |
16:00 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.reboot-vm for VM cuminunpriv1001.eqiad.wmnet |
[production] |
15:50 |
<bking@cumin2002> |
START - Cookbook sre.hosts.reimage for host elastic2051.codfw.wmnet with OS stretch |
[production] |
15:50 |
<hnowlan@cumin1001> |
END (FAIL) - Cookbook sre.hosts.reimage (exit_code=99) for host restbase2009.codfw.wmnet with OS buster |
[production] |
15:49 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.ganeti.reboot-vm (exit_code=0) for VM aphlict1001.eqiad.wmnet |
[production] |
15:47 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.reboot-vm for VM aphlict1001.eqiad.wmnet |
[production] |
15:42 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.ganeti.reboot-vm (exit_code=0) for VM flowspec1001.eqiad.wmnet |
[production] |
15:40 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.reboot-vm for VM flowspec1001.eqiad.wmnet |
[production] |
15:36 |
<bking@cumin1001> |
END (FAIL) - Cookbook sre.hosts.reimage (exit_code=99) for host elastic2051.codfw.wmnet with OS stretch |
[production] |
15:28 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.ganeti.reboot-vm (exit_code=0) for VM ldap-replica1004.wikimedia.org |
[production] |
15:26 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.reboot-vm for VM ldap-replica1004.wikimedia.org |
[production] |
15:23 |
<hnowlan@cumin1001> |
START - Cookbook sre.hosts.reimage for host restbase2009.codfw.wmnet with OS buster |
[production] |
15:23 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.ganeti.reboot-vm (exit_code=0) for VM ldap-replica1003.wikimedia.org |
[production] |
15:21 |
<hnowlan@cumin1001> |
END (ERROR) - Cookbook sre.hosts.reimage (exit_code=97) for host restbase2009.codfw.wmnet with OS buster |
[production] |
15:20 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.reboot-vm for VM ldap-replica1003.wikimedia.org |
[production] |
15:17 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.ganeti.reboot-vm (exit_code=0) for VM seaborgium.wikimedia.org |
[production] |
15:15 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.reboot-vm for VM seaborgium.wikimedia.org |
[production] |
15:10 |
<bking@cumin1001> |
START - Cookbook sre.hosts.reimage for host elastic2051.codfw.wmnet with OS stretch |
[production] |
15:07 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.ganeti.reboot-vm (exit_code=0) for VM urldownloader1002.wikimedia.org |
[production] |
15:03 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.reboot-vm for VM urldownloader1002.wikimedia.org |
[production] |
14:56 |
<mmandere> |
cp3053: upgrade varnish to 6.0.9-1wm1 T298758 |
[production] |
14:56 |
<hnowlan@cumin1001> |
START - Cookbook sre.hosts.reimage for host restbase2009.codfw.wmnet with OS buster |
[production] |
14:47 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.ganeti.reboot-vm (exit_code=0) for VM idp1001.wikimedia.org |
[production] |
14:47 |
<moritzm> |
systemctl reset-failed ifup@ens5.service on idp1001 T273026 |
[production] |
14:39 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.reboot-vm for VM idp1001.wikimedia.org |
[production] |
14:15 |
<moritzm> |
switch ml-etcd1003 to DRBD (needed to be able to shuffle instances around for the Ganeti buster update) |
[production] |
14:14 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1:00:00 on ml-etcd1003.eqiad.wmnet with reason: switch to drbd storage |
[production] |
14:14 |
<jmm@cumin2002> |
START - Cookbook sre.hosts.downtime for 1:00:00 on ml-etcd1003.eqiad.wmnet with reason: switch to drbd storage |
[production] |
13:53 |
<mmandere@cumin1001> |
conftool action : set/pooled=yes; selector: name=cp6009.drmrs.wmnet |
[production] |
13:49 |
<moritzm> |
switch ml-etcd1002 to DRBD (needed to be able to shuffle instances around for the Ganeti buster update) |
[production] |
13:48 |
<jmm@cumin2002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1:00:00 on ml-etcd1002.eqiad.wmnet with reason: switch to drbd storage |
[production] |