2023-05-03
§
|
14:13 |
<otto@deploy1002> |
helmfile [codfw] DONE helmfile.d/services/eventgate-analytics: apply |
[production] |
14:13 |
<otto@deploy1002> |
helmfile [staging] DONE helmfile.d/services/eventgate-main: apply |
[production] |
14:13 |
<otto@deploy1002> |
helmfile [staging] START helmfile.d/services/eventgate-main: apply |
[production] |
14:13 |
<otto@deploy1002> |
helmfile [codfw] START helmfile.d/services/eventgate-analytics: apply |
[production] |
14:12 |
<otto@deploy1002> |
helmfile [eqiad] DONE helmfile.d/services/eventgate-analytics-external: apply |
[production] |
14:12 |
<otto@deploy1002> |
helmfile [eqiad] START helmfile.d/services/eventgate-analytics-external: apply |
[production] |
14:12 |
<otto@deploy1002> |
helmfile [codfw] DONE helmfile.d/services/eventgate-analytics-external: apply |
[production] |
14:12 |
<otto@deploy1002> |
helmfile [staging] DONE helmfile.d/services/eventgate-analytics: apply |
[production] |
14:11 |
<otto@deploy1002> |
helmfile [staging] START helmfile.d/services/eventgate-analytics: apply |
[production] |
14:11 |
<otto@deploy1002> |
helmfile [codfw] START helmfile.d/services/eventgate-analytics-external: apply |
[production] |
14:11 |
<otto@deploy1002> |
helmfile [eqiad] DONE helmfile.d/services/eventgate-logging-external: apply |
[production] |
14:11 |
<otto@deploy1002> |
helmfile [staging] DONE helmfile.d/services/eventgate-analytics-external: apply |
[production] |
14:11 |
<otto@deploy1002> |
helmfile [staging] START helmfile.d/services/eventgate-analytics-external: apply |
[production] |
14:11 |
<otto@deploy1002> |
helmfile [eqiad] START helmfile.d/services/eventgate-logging-external: apply |
[production] |
14:09 |
<sukhe> |
stop pybal on lvs2007 to drain host for decommissioning |
[production] |
14:09 |
<ladsgroup@cumin1001> |
dbctl commit (dc=all): 'Depooling db1170:3312 (T335838)', diff saved to https://phabricator.wikimedia.org/P47400 and previous config saved to /var/cache/conftool/dbconfig/20230503-140932-ladsgroup.json |
[production] |
14:09 |
<ladsgroup@cumin1001> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on db1170.eqiad.wmnet with reason: Maintenance |
[production] |
14:09 |
<lucaswerkmeister-wmde@deploy1002> |
Finished scap: Backport for [[gerrit:910556|Turn on experimental Parsoid Read Views support, except on commons & wikidata (T335157)]] (duration: 15m 27s) |
[production] |
14:09 |
<ladsgroup@cumin1001> |
START - Cookbook sre.hosts.downtime for 1 day, 0:00:00 on db1170.eqiad.wmnet with reason: Maintenance |
[production] |
14:09 |
<ladsgroup@cumin1001> |
dbctl commit (dc=all): 'Repooling after maintenance db1158 (T335838)', diff saved to https://phabricator.wikimedia.org/P47399 and previous config saved to /var/cache/conftool/dbconfig/20230503-140908-ladsgroup.json |
[production] |
14:05 |
<ladsgroup@cumin1001> |
dbctl commit (dc=all): 'Repooling after maintenance db2169:3316 (T335838)', diff saved to https://phabricator.wikimedia.org/P47398 and previous config saved to /var/cache/conftool/dbconfig/20230503-140540-ladsgroup.json |
[production] |
14:04 |
<otto@deploy1002> |
helmfile [codfw] DONE helmfile.d/services/eventgate-logging-external: apply |
[production] |
14:04 |
<otto@deploy1002> |
helmfile [codfw] START helmfile.d/services/eventgate-logging-external: apply |
[production] |
14:03 |
<herron@cumin1001> |
END (PASS) - Cookbook sre.ganeti.makevm (exit_code=0) for new host kafkamon2003.codfw.wmnet |
[production] |
14:03 |
<herron@cumin1001> |
END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.ganeti.makevm: created new VM kafkamon2003.codfw.wmnet - herron@cumin1001" |
[production] |
14:02 |
<ladsgroup@cumin1001> |
dbctl commit (dc=all): 'Repooling after maintenance db2137:3315', diff saved to https://phabricator.wikimedia.org/P47396 and previous config saved to /var/cache/conftool/dbconfig/20230503-140246-ladsgroup.json |
[production] |
14:02 |
<herron@cumin1001> |
START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.ganeti.makevm: created new VM kafkamon2003.codfw.wmnet - herron@cumin1001" |
[production] |
13:55 |
<lucaswerkmeister-wmde@deploy1002> |
lucaswerkmeister-wmde and cscott: Backport for [[gerrit:910556|Turn on experimental Parsoid Read Views support, except on commons & wikidata (T335157)]] synced to the testservers: mwdebug1001.eqiad.wmnet, mwdebug1002.eqiad.wmnet, mwdebug2001.codfw.wmnet, mwdebug2002.codfw.wmnet |
[production] |
13:54 |
<ladsgroup@cumin1001> |
dbctl commit (dc=all): 'Repooling after maintenance db1158', diff saved to https://phabricator.wikimedia.org/P47395 and previous config saved to /var/cache/conftool/dbconfig/20230503-135402-ladsgroup.json |
[production] |
13:53 |
<lucaswerkmeister-wmde@deploy1002> |
Started scap: Backport for [[gerrit:910556|Turn on experimental Parsoid Read Views support, except on commons & wikidata (T335157)]] |
[production] |
13:52 |
<lucaswerkmeister-wmde@deploy1002> |
Finished scap: Backport for [[gerrit:914437|wblistentityusage: Deprecate wbeu prefix, new output format (T300460 T196962)]] (duration: 27m 54s) |
[production] |
13:50 |
<ladsgroup@cumin1001> |
dbctl commit (dc=all): 'Repooling after maintenance db2169:3316', diff saved to https://phabricator.wikimedia.org/P47394 and previous config saved to /var/cache/conftool/dbconfig/20230503-135034-ladsgroup.json |
[production] |
13:48 |
<cgoubert@cumin1001> |
END (PASS) - Cookbook sre.k8s.reboot-nodes (exit_code=0) rolling reboot on A:wikikube-worker-codfw |
[production] |
13:47 |
<herron@cumin1001> |
END (PASS) - Cookbook sre.dns.wipe-cache (exit_code=0) kafkamon2003.codfw.wmnet on all recursors |
[production] |
13:47 |
<herron@cumin1001> |
START - Cookbook sre.dns.wipe-cache kafkamon2003.codfw.wmnet on all recursors |
[production] |
13:47 |
<herron@cumin1001> |
END (PASS) - Cookbook sre.dns.netbox (exit_code=0) |
[production] |
13:47 |
<herron@cumin1001> |
END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Add records for VM kafkamon2003.codfw.wmnet - herron@cumin1001" |
[production] |
13:47 |
<ladsgroup@cumin1001> |
dbctl commit (dc=all): 'Repooling after maintenance db2137:3315', diff saved to https://phabricator.wikimedia.org/P47393 and previous config saved to /var/cache/conftool/dbconfig/20230503-134740-ladsgroup.json |
[production] |
13:46 |
<herron@cumin1001> |
START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Add records for VM kafkamon2003.codfw.wmnet - herron@cumin1001" |
[production] |
13:43 |
<herron@cumin1001> |
START - Cookbook sre.dns.netbox |
[production] |
13:43 |
<herron@cumin1001> |
START - Cookbook sre.ganeti.makevm for new host kafkamon2003.codfw.wmnet |
[production] |
13:43 |
<slyngshede@cumin1001> |
END (PASS) - Cookbook sre.ganeti.reboot-vm (exit_code=0) for VM idm1001.wikimedia.org |
[production] |
13:41 |
<lucaswerkmeister-wmde@deploy1002> |
lucaswerkmeister-wmde: Backport for [[gerrit:914437|wblistentityusage: Deprecate wbeu prefix, new output format (T300460 T196962)]] synced to the testservers: mwdebug2002.codfw.wmnet, mwdebug2001.codfw.wmnet, mwdebug1001.eqiad.wmnet, mwdebug1002.eqiad.wmnet |
[production] |
13:40 |
<slyngshede@cumin1001> |
START - Cookbook sre.ganeti.reboot-vm for VM idm1001.wikimedia.org |
[production] |
13:40 |
<slyngshede@cumin1001> |
END (PASS) - Cookbook sre.ganeti.reboot-vm (exit_code=0) for VM idm2001.wikimedia.org |
[production] |
13:38 |
<ladsgroup@cumin1001> |
dbctl commit (dc=all): 'Repooling after maintenance db1158', diff saved to https://phabricator.wikimedia.org/P47392 and previous config saved to /var/cache/conftool/dbconfig/20230503-133855-ladsgroup.json |
[production] |
13:36 |
<slyngshede@cumin1001> |
START - Cookbook sre.ganeti.reboot-vm for VM idm2001.wikimedia.org |
[production] |
13:36 |
<slyngshede@cumin1001> |
END (ERROR) - Cookbook sre.ganeti.reboot-vm (exit_code=97) for VM idm-test1001.wikimedia.org |
[production] |
13:35 |
<herron@cumin1001> |
END (FAIL) - Cookbook sre.hosts.reboot-single (exit_code=1) for host kafkamon1003.eqiad.wmnet |
[production] |
13:35 |
<ladsgroup@cumin1001> |
dbctl commit (dc=all): 'Repooling after maintenance db2169:3316', diff saved to https://phabricator.wikimedia.org/P47391 and previous config saved to /var/cache/conftool/dbconfig/20230503-133528-ladsgroup.json |
[production] |