2025-06-12
§
|
11:17 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db1212 (T396130)', diff saved to https://phabricator.wikimedia.org/P77825 and previous config saved to /var/cache/conftool/dbconfig/20250612-111722-marostegui.json |
[production] |
11:14 |
<fceratto@cumin1002> |
dbctl commit (dc=all): 'Depooling db2146 (T395241)', diff saved to https://phabricator.wikimedia.org/P77824 and previous config saved to /var/cache/conftool/dbconfig/20250612-111423-fceratto.json |
[production] |
11:14 |
<fceratto@cumin1002> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on db2146.codfw.wmnet with reason: Maintenance |
[production] |
11:13 |
<fceratto@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db2145 (T395241)', diff saved to https://phabricator.wikimedia.org/P77823 and previous config saved to /var/cache/conftool/dbconfig/20250612-111357-fceratto.json |
[production] |
11:10 |
<jmm@cumin1003> |
END (PASS) - Cookbook sre.ganeti.drain-node (exit_code=0) for draining ganeti node ganeti1051.eqiad.wmnet |
[production] |
11:10 |
<jmm@cumin1003> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ganeti1051.eqiad.wmnet |
[production] |
11:10 |
<fceratto@deploy1003> |
helmfile [aux-k8s-eqiad] 'sync' command on namespace 'zarcillo' for release 'main' . |
[production] |
11:07 |
<fceratto@deploy1003> |
helmfile [aux-k8s-eqiad] 'sync' command on namespace 'zarcillo' for release 'main' . |
[production] |
11:07 |
<vgutierrez> |
use Google Trust Services (GTS) unified TLS certificate on drmrs - T395131 |
[production] |
11:07 |
<andrew@cumin1002> |
START - Cookbook sre.hosts.reimage for host cloudcephosd1014.eqiad.wmnet with OS bullseye |
[production] |
11:05 |
<jmm@cumin1003> |
START - Cookbook sre.hosts.reboot-single for host ganeti1051.eqiad.wmnet |
[production] |
11:05 |
<fceratto@deploy1003> |
helmfile [aux-k8s-eqiad] 'sync' command on namespace 'zarcillo' for release 'main' . |
[production] |
11:02 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db1212', diff saved to https://phabricator.wikimedia.org/P77822 and previous config saved to /var/cache/conftool/dbconfig/20250612-110213-marostegui.json |
[production] |
11:01 |
<jmm@cumin1003> |
START - Cookbook sre.hosts.reimage for host ncredir7004.magru.wmnet with OS bookworm |
[production] |
11:00 |
<jmm@cumin1003> |
END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.ganeti.makevm: created new VM ncredir7004.magru.wmnet - jmm@cumin1003" |
[production] |
11:00 |
<fceratto@deploy1003> |
helmfile [aux-k8s-eqiad] 'sync' command on namespace 'zarcillo' for release 'main' . |
[production] |
11:00 |
<jmm@cumin1003> |
START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.ganeti.makevm: created new VM ncredir7004.magru.wmnet - jmm@cumin1003" |
[production] |
11:00 |
<jmm@cumin1003> |
END (PASS) - Cookbook sre.dns.wipe-cache (exit_code=0) ncredir7004.magru.wmnet on all recursors |
[production] |
10:59 |
<jmm@cumin1003> |
START - Cookbook sre.dns.wipe-cache ncredir7004.magru.wmnet on all recursors |
[production] |
10:59 |
<jmm@cumin1003> |
END (PASS) - Cookbook sre.dns.netbox (exit_code=0) |
[production] |
10:59 |
<jmm@cumin1003> |
END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Add records for VM ncredir7004.magru.wmnet - jmm@cumin1003" |
[production] |
10:58 |
<fceratto@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db2145', diff saved to https://phabricator.wikimedia.org/P77821 and previous config saved to /var/cache/conftool/dbconfig/20250612-105848-fceratto.json |
[production] |
10:57 |
<jmm@cumin1003> |
START - Cookbook sre.ganeti.drain-node for draining ganeti node ganeti1051.eqiad.wmnet |
[production] |
10:56 |
<jmm@cumin1003> |
END (PASS) - Cookbook sre.ganeti.drain-node (exit_code=0) for draining ganeti node ganeti1050.eqiad.wmnet |
[production] |
10:56 |
<jmm@cumin1003> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ganeti1050.eqiad.wmnet |
[production] |
10:50 |
<jmm@cumin1003> |
START - Cookbook sre.hosts.reboot-single for host ganeti1050.eqiad.wmnet |
[production] |
10:50 |
<jmm@cumin1003> |
START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Add records for VM ncredir7004.magru.wmnet - jmm@cumin1003" |
[production] |
10:50 |
<fceratto@deploy1003> |
helmfile [aux-k8s-eqiad] 'sync' command on namespace 'zarcillo' for release 'main' . |
[production] |
10:47 |
<jmm@cumin1003> |
START - Cookbook sre.ganeti.drain-node for draining ganeti node ganeti1050.eqiad.wmnet |
[production] |
10:47 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db1212', diff saved to https://phabricator.wikimedia.org/P77820 and previous config saved to /var/cache/conftool/dbconfig/20250612-104706-marostegui.json |
[production] |
10:44 |
<jmm@cumin1003> |
END (PASS) - Cookbook sre.ganeti.drain-node (exit_code=0) for draining ganeti node ganeti1049.eqiad.wmnet |
[production] |
10:43 |
<jmm@cumin1003> |
END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ganeti1049.eqiad.wmnet |
[production] |
10:43 |
<fceratto@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db2145', diff saved to https://phabricator.wikimedia.org/P77819 and previous config saved to /var/cache/conftool/dbconfig/20250612-104341-fceratto.json |
[production] |
10:43 |
<jmm@cumin1003> |
START - Cookbook sre.dns.netbox |
[production] |
10:43 |
<jmm@cumin1003> |
START - Cookbook sre.ganeti.makevm for new host ncredir7004.magru.wmnet |
[production] |
10:42 |
<jmm@cumin1003> |
END (ERROR) - Cookbook sre.hosts.reimage (exit_code=97) for host ganeti2050.codfw.wmnet with OS bookworm |
[production] |
10:38 |
<jmm@cumin1003> |
START - Cookbook sre.hosts.reboot-single for host ganeti1049.eqiad.wmnet |
[production] |
10:36 |
<cgoubert@deploy1003> |
Finished scap sync-world: 1156288: mediawiki: Add job history limit control - T395885 (duration: 02m 48s) |
[production] |
10:33 |
<cgoubert@deploy1003> |
Started scap sync-world: 1156288: mediawiki: Add job history limit control - T395885 |
[production] |
10:32 |
<jmm@cumin1003> |
START - Cookbook sre.ganeti.drain-node for draining ganeti node ganeti1049.eqiad.wmnet |
[production] |
10:32 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db1212 (T396130)', diff saved to https://phabricator.wikimedia.org/P77818 and previous config saved to /var/cache/conftool/dbconfig/20250612-103159-marostegui.json |
[production] |
10:28 |
<fceratto@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db2145 (T395241)', diff saved to https://phabricator.wikimedia.org/P77817 and previous config saved to /var/cache/conftool/dbconfig/20250612-102834-fceratto.json |
[production] |
10:27 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Depooling db1212 (T396130)', diff saved to https://phabricator.wikimedia.org/P77816 and previous config saved to /var/cache/conftool/dbconfig/20250612-102700-marostegui.json |
[production] |
10:26 |
<marostegui@cumin1002> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 12:00:00 on an-redacteddb1001.eqiad.wmnet,clouddb[1013,1017].eqiad.wmnet,db1154.eqiad.wmnet with reason: Maintenance |
[production] |
10:26 |
<marostegui@cumin1002> |
DONE (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 6:00:00 on db1212.eqiad.wmnet with reason: Maintenance |
[production] |
10:26 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db1198 (T396130)', diff saved to https://phabricator.wikimedia.org/P77815 and previous config saved to /var/cache/conftool/dbconfig/20250612-102630-marostegui.json |
[production] |
10:25 |
<jmm@cumin1003> |
START - Cookbook sre.hosts.reimage for host ganeti2050.codfw.wmnet with OS bookworm |
[production] |
10:24 |
<jmm@cumin1003> |
END (FAIL) - Cookbook sre.ganeti.makevm (exit_code=99) for new host ncredir7004.magru.wmnet |
[production] |
10:23 |
<jmm@cumin1003> |
END (FAIL) - Cookbook sre.dns.netbox (exit_code=99) |
[production] |
10:23 |
<jmm@cumin1003> |
END (ERROR) - Cookbook sre.hosts.reimage (exit_code=97) for host ganeti2050.codfw.wmnet with OS bookworm |
[production] |