2022-06-21
§
|
15:05 |
<mwdebug-deploy@deploy1002> |
helmfile [eqiad] START helmfile.d/services/mwdebug: apply |
[production] |
15:01 |
<papaul> |
PDU swap for rack a2 complete |
[production] |
15:00 |
<mwdebug-deploy@deploy1002> |
helmfile [codfw] DONE helmfile.d/services/mwdebug: apply |
[production] |
14:59 |
<mwdebug-deploy@deploy1002> |
helmfile [codfw] START helmfile.d/services/mwdebug: apply |
[production] |
14:59 |
<mwdebug-deploy@deploy1002> |
helmfile [eqiad] DONE helmfile.d/services/mwdebug: apply |
[production] |
14:58 |
<mwdebug-deploy@deploy1002> |
helmfile [eqiad] START helmfile.d/services/mwdebug: apply |
[production] |
14:56 |
<aqu> |
RefineSanitize from an-launcher1002: sudo -u analytics kerberos-run-command analytics spark2-submit --class org.wikimedia.analytics.refinery.job.refine.RefineSanitize --master yarn --deploy-mode client /srv/deployment/analytics/refinery/artifacts/org/wikimedia/analytics/refinery/refinery-job-0.1.15.jar --config_file /home/aqu/refine.properties --since "2022-06-19T09:52:00+0000" --until |
[analytics] |
14:24 |
<papaul> |
on going maintenance on ps1-a2-codfw |
[production] |
14:02 |
<mwdebug-deploy@deploy1002> |
helmfile [codfw] DONE helmfile.d/services/mwdebug: apply |
[production] |
13:58 |
<mwdebug-deploy@deploy1002> |
helmfile [codfw] START helmfile.d/services/mwdebug: apply |
[production] |
13:58 |
<mwdebug-deploy@deploy1002> |
helmfile [eqiad] DONE helmfile.d/services/mwdebug: apply |
[production] |
13:54 |
<mvernon@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ms-be1052.eqiad.wmnet |
[production] |
13:52 |
<mwdebug-deploy@deploy1002> |
helmfile [eqiad] START helmfile.d/services/mwdebug: apply |
[production] |
13:49 |
<mvernon@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ms-be2047.codfw.wmnet |
[production] |
13:48 |
<mvernon@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host ms-be1052.eqiad.wmnet |
[production] |
13:46 |
<mvernon@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ms-be1051.eqiad.wmnet |
[production] |
13:39 |
<mvernon@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host ms-be1051.eqiad.wmnet |
[production] |
13:38 |
<mvernon@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ms-be1050.eqiad.wmnet |
[production] |
13:37 |
<mwdebug-deploy@deploy1002> |
helmfile [codfw] DONE helmfile.d/services/mwdebug: apply |
[production] |
13:33 |
<aqu> |
sudo systemctl start monitor_refine_event_sanitized_main_immediate.service on an-launcher1002 |
[analytics] |
13:32 |
<mvernon@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host ms-be1050.eqiad.wmnet |
[production] |
13:31 |
<mvernon@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host ms-be2047.codfw.wmnet |
[production] |
13:30 |
<mwdebug-deploy@deploy1002> |
helmfile [codfw] START helmfile.d/services/mwdebug: apply |
[production] |
13:30 |
<mwdebug-deploy@deploy1002> |
helmfile [eqiad] DONE helmfile.d/services/mwdebug: apply |
[production] |
13:28 |
<daniel@deploy1002> |
Synchronized rpc/: Config: [[gerrit:805775|rpc: Remove unused RunJobs.php (T175146 T243096)]] (duration: 03m 45s) |
[production] |
13:23 |
<mwdebug-deploy@deploy1002> |
helmfile [eqiad] START helmfile.d/services/mwdebug: apply |
[production] |
13:14 |
<mvernon@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ms-be1049.eqiad.wmnet |
[production] |
13:13 |
<mvernon@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ms-be2046.codfw.wmnet |
[production] |
13:05 |
<moritzm> |
installing Linux 5.10.120-1~bpo10+1 on buster hosts with backports kernel |
[production] |
13:02 |
<mvernon@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host ms-be2046.codfw.wmnet |
[production] |
13:01 |
<mvernon@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ms-be2045.codfw.wmnet |
[production] |
12:59 |
<mvernon@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host ms-be1049.eqiad.wmnet |
[production] |
12:57 |
<mvernon@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ms-be1048.eqiad.wmnet |
[production] |
12:56 |
<moritzm> |
installing haproxy security updates on stretch |
[production] |
12:53 |
<mvernon@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host ms-be2045.codfw.wmnet |
[production] |
12:52 |
<mvernon@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ms-be2044.codfw.wmnet |
[production] |
12:52 |
<mvernon@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host ms-be1048.eqiad.wmnet |
[production] |
12:50 |
<mvernon@cumin2002> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ms-be1047.eqiad.wmnet |
[production] |
12:43 |
<moritzm> |
installing python-bottle security updates |
[production] |
12:40 |
<mvernon@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host ms-be1047.eqiad.wmnet |
[production] |
12:39 |
<mvernon@cumin2002> |
START - Cookbook sre.hosts.reboot-single for host ms-be2044.codfw.wmnet |
[production] |
12:36 |
<Rook> |
T302164 #173 upgrading single user container b687ca6aedc745c63b2659124dca0dab01d38173 |
[paws] |
12:25 |
<moritzm> |
reset logster-csp/logster-badpass-priv on mwlog1002, these were removed from Puppet |
[production] |
12:12 |
<jmm@cumin2002> |
END (FAIL) - Cookbook sre.ganeti.addnode (exit_code=99) for new host ganeti4004.ulsfo.wmnet to ganeti01.svc.ulsfo.wmnet |
[production] |
12:12 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.addnode for new host ganeti4004.ulsfo.wmnet to ganeti01.svc.ulsfo.wmnet |
[production] |
12:06 |
<jmm@cumin2002> |
END (FAIL) - Cookbook sre.ganeti.addnode (exit_code=99) for new host ganeti4004.ulsfo.wmnet to ganeti01.svc.ulsfo.wmnet |
[production] |
12:05 |
<jmm@cumin2002> |
START - Cookbook sre.ganeti.addnode for new host ganeti4004.ulsfo.wmnet to ganeti01.svc.ulsfo.wmnet |
[production] |
11:59 |
<mbsantos> |
mbsantos@maps2009 imposm-removebackup-import (T305845) |
[production] |
11:48 |
<Rook> |
806504: Show username on 404 page when logged in | https://gerrit.wikimedia.org/r/c/analytics/quarry/web/+/806504 |
[quarry] |
11:44 |
<jmm@cumin2002> |
END (FAIL) - Cookbook sre.ganeti.addnode (exit_code=99) for new host ganeti4004.ulsfo.wmnet to ganeti01.svc.ulsfo.wmnet |
[production] |