2022-11-04
§
|
15:48 |
<pt1979@cumin2002> |
START - Cookbook sre.hardware.upgrade-firmware upgrade firmware for hosts ['cp4052'] |
[production] |
15:43 |
<aikochou@deploy1002> |
helmfile [ml-staging-codfw] Ran 'sync' command on namespace 'articletopic-outlink' for release 'main' . |
[production] |
15:41 |
<aikochou@deploy1002> |
helmfile [ml-staging-codfw] Ran 'sync' command on namespace 'experimental' for release 'main' . |
[production] |
15:00 |
<elukey> |
`elukey@cumin1001:~$ sudo cumin 'ms-fe2*' 'systemctl restart swift-proxy' -b 1 -s 20` |
[production] |
14:52 |
<ladsgroup@cumin1001> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 8:00:00 on dbstore1003.eqiad.wmnet with reason: Maintenance |
[production] |
14:52 |
<ladsgroup@cumin1001> |
START - Cookbook sre.hosts.downtime for 8:00:00 on dbstore1003.eqiad.wmnet with reason: Maintenance |
[production] |
14:52 |
<ladsgroup@cumin1001> |
dbctl commit (dc=all): 'Repooling after maintenance db1196 (T318955)', diff saved to https://phabricator.wikimedia.org/P38159 and previous config saved to /var/cache/conftool/dbconfig/20221104-145225-ladsgroup.json |
[production] |
14:52 |
<vgutierrez@puppetmaster1001> |
conftool action : set/pooled=true; selector: dnsdisc=swift,name=eqiad |
[production] |
14:51 |
<Emperor> |
restart swift-proxy on ms-fe1012 |
[production] |
14:48 |
<elukey> |
restart swift-proxy on ms-fe1011 |
[production] |
14:44 |
<Emperor> |
restart swift-proxy on ms-fe1010 |
[production] |
14:41 |
<pt1979@cumin2002> |
END (FAIL) - Cookbook sre.hosts.provision (exit_code=99) for host dbprov2004.mgmt.codfw.wmnet with reboot policy FORCED |
[production] |
14:37 |
<vgutierrez@puppetmaster1001> |
conftool action : set/pooled=false; selector: dnsdisc=swift,name=eqiad |
[production] |
14:37 |
<ladsgroup@cumin1001> |
dbctl commit (dc=all): 'Repooling after maintenance db1196', diff saved to https://phabricator.wikimedia.org/P38158 and previous config saved to /var/cache/conftool/dbconfig/20221104-143718-ladsgroup.json |
[production] |
14:28 |
<pt1979@cumin2002> |
START - Cookbook sre.hosts.provision for host dbprov2004.mgmt.codfw.wmnet with reboot policy FORCED |
[production] |
14:26 |
<pt1979@cumin2002> |
END (PASS) - Cookbook sre.hardware.upgrade-firmware (exit_code=0) upgrade firmware for hosts ['cp4052'] |
[production] |
14:25 |
<pt1979@cumin2002> |
START - Cookbook sre.hardware.upgrade-firmware upgrade firmware for hosts ['cp4052'] |
[production] |
14:24 |
<pt1979@cumin2002> |
END (FAIL) - Cookbook sre.hosts.provision (exit_code=99) for host dbprov2004.mgmt.codfw.wmnet with reboot policy FORCED |
[production] |
14:23 |
<pt1979@cumin2002> |
END (FAIL) - Cookbook sre.hardware.upgrade-firmware (exit_code=99) upgrade firmware for hosts ['cp4052'] |
[production] |
14:22 |
<ladsgroup@cumin1001> |
dbctl commit (dc=all): 'Repooling after maintenance db1196', diff saved to https://phabricator.wikimedia.org/P38157 and previous config saved to /var/cache/conftool/dbconfig/20221104-142212-ladsgroup.json |
[production] |
14:07 |
<ladsgroup@cumin1001> |
dbctl commit (dc=all): 'Repooling after maintenance db1196 (T318955)', diff saved to https://phabricator.wikimedia.org/P38156 and previous config saved to /var/cache/conftool/dbconfig/20221104-140705-ladsgroup.json |
[production] |
14:04 |
<ladsgroup@cumin1001> |
dbctl commit (dc=all): 'Depooling db1196 (T318955)', diff saved to https://phabricator.wikimedia.org/P38155 and previous config saved to /var/cache/conftool/dbconfig/20221104-140427-ladsgroup.json |
[production] |
14:04 |
<ladsgroup@cumin1001> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 8:00:00 on db1196.eqiad.wmnet with reason: Maintenance |
[production] |
14:04 |
<ladsgroup@cumin1001> |
START - Cookbook sre.hosts.downtime for 8:00:00 on db1196.eqiad.wmnet with reason: Maintenance |
[production] |
14:04 |
<ladsgroup@cumin1001> |
dbctl commit (dc=all): 'Repooling after maintenance db1186 (T318955)', diff saved to https://phabricator.wikimedia.org/P38154 and previous config saved to /var/cache/conftool/dbconfig/20221104-140405-ladsgroup.json |
[production] |
13:58 |
<pt1979@cumin2002> |
START - Cookbook sre.hosts.provision for host dbprov2004.mgmt.codfw.wmnet with reboot policy FORCED |
[production] |
13:58 |
<pt1979@cumin2002> |
END (PASS) - Cookbook sre.network.configure-switch-interfaces (exit_code=0) for host dbprov2004 |
[production] |
13:57 |
<pt1979@cumin2002> |
START - Cookbook sre.network.configure-switch-interfaces for host dbprov2004 |
[production] |
13:56 |
<pt1979@cumin2002> |
END (PASS) - Cookbook sre.dns.netbox (exit_code=0) |
[production] |
13:54 |
<pt1979@cumin2002> |
START - Cookbook sre.dns.netbox |
[production] |
13:49 |
<ladsgroup@cumin1001> |
dbctl commit (dc=all): 'Repooling after maintenance db1186', diff saved to https://phabricator.wikimedia.org/P38153 and previous config saved to /var/cache/conftool/dbconfig/20221104-134859-ladsgroup.json |
[production] |
13:45 |
<pt1979@cumin2002> |
START - Cookbook sre.hardware.upgrade-firmware upgrade firmware for hosts ['cp4052'] |
[production] |
13:33 |
<ladsgroup@cumin1001> |
dbctl commit (dc=all): 'Repooling after maintenance db1186', diff saved to https://phabricator.wikimedia.org/P38152 and previous config saved to /var/cache/conftool/dbconfig/20221104-133353-ladsgroup.json |
[production] |
13:18 |
<ladsgroup@cumin1001> |
dbctl commit (dc=all): 'Repooling after maintenance db1186 (T318955)', diff saved to https://phabricator.wikimedia.org/P38151 and previous config saved to /var/cache/conftool/dbconfig/20221104-131846-ladsgroup.json |
[production] |
13:17 |
<sukhe> |
reprepro -C main include bullseye-wikimedia python-logstash_0.4.6-3_amd64.changes: T321309 |
[production] |
13:16 |
<ladsgroup@cumin1001> |
dbctl commit (dc=all): 'Depooling db1186 (T318955)', diff saved to https://phabricator.wikimedia.org/P38150 and previous config saved to /var/cache/conftool/dbconfig/20221104-131607-ladsgroup.json |
[production] |
13:16 |
<ladsgroup@cumin1001> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 8:00:00 on db1186.eqiad.wmnet with reason: Maintenance |
[production] |
13:15 |
<ladsgroup@cumin1001> |
START - Cookbook sre.hosts.downtime for 8:00:00 on db1186.eqiad.wmnet with reason: Maintenance |
[production] |
13:15 |
<ladsgroup@cumin1001> |
dbctl commit (dc=all): 'Repooling after maintenance db1184 (T318955)', diff saved to https://phabricator.wikimedia.org/P38149 and previous config saved to /var/cache/conftool/dbconfig/20221104-131546-ladsgroup.json |
[production] |
13:11 |
<sukhe> |
reprepro -C main include bullseye-wikimedia prometheus-rdkafka-exporter_0.3_amd64.changes: T321309 |
[production] |
13:10 |
<sukhe> |
reprepro -C main include bullseye-wikimedia file-read-backwards_2.0.0-3_amd64.changes: T321309 |
[production] |
13:09 |
<sukhe> |
reprepro -C main include bullseye-wikimedia fifo-log-demux_0.6.3_amd64.changes: T321309 |
[production] |
13:00 |
<ladsgroup@cumin1001> |
dbctl commit (dc=all): 'Repooling after maintenance db1184', diff saved to https://phabricator.wikimedia.org/P38148 and previous config saved to /var/cache/conftool/dbconfig/20221104-130039-ladsgroup.json |
[production] |
12:45 |
<ladsgroup@cumin1001> |
dbctl commit (dc=all): 'Repooling after maintenance db1184', diff saved to https://phabricator.wikimedia.org/P38147 and previous config saved to /var/cache/conftool/dbconfig/20221104-124533-ladsgroup.json |
[production] |
12:36 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'es2020 (re)pooling @ 100%: After reboot', diff saved to https://phabricator.wikimedia.org/P38146 and previous config saved to /var/cache/conftool/dbconfig/20221104-123606-root.json |
[production] |
12:30 |
<ladsgroup@cumin1001> |
dbctl commit (dc=all): 'Repooling after maintenance db1184 (T318955)', diff saved to https://phabricator.wikimedia.org/P38145 and previous config saved to /var/cache/conftool/dbconfig/20221104-123026-ladsgroup.json |
[production] |
12:27 |
<ladsgroup@cumin1001> |
dbctl commit (dc=all): 'Depooling db1184 (T318955)', diff saved to https://phabricator.wikimedia.org/P38144 and previous config saved to /var/cache/conftool/dbconfig/20221104-122747-ladsgroup.json |
[production] |
12:27 |
<ladsgroup@cumin1001> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 8:00:00 on db1184.eqiad.wmnet with reason: Maintenance |
[production] |
12:27 |
<ladsgroup@cumin1001> |
START - Cookbook sre.hosts.downtime for 8:00:00 on db1184.eqiad.wmnet with reason: Maintenance |
[production] |
12:27 |
<ladsgroup@cumin1001> |
dbctl commit (dc=all): 'Repooling after maintenance db1169 (T318955)', diff saved to https://phabricator.wikimedia.org/P38143 and previous config saved to /var/cache/conftool/dbconfig/20221104-122726-ladsgroup.json |
[production] |