2023-11-30
§
|
07:32 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'db1210 (re)pooling @ 1%: Upgrade to 10.6.16 and bookworm', diff saved to https://phabricator.wikimedia.org/P53954 and previous config saved to /var/cache/conftool/dbconfig/20231130-073212-root.json |
[production] |
07:32 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'db1126 (re)pooling @ 1%: Upgrade to 10.6.16 and bookworm', diff saved to https://phabricator.wikimedia.org/P53953 and previous config saved to /var/cache/conftool/dbconfig/20231130-073210-root.json |
[production] |
07:13 |
<marostegui@cumin1001> |
END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host db1210.eqiad.wmnet with OS bookworm |
[production] |
07:09 |
<marostegui@cumin1001> |
END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host db1126.eqiad.wmnet with OS bookworm |
[production] |
06:53 |
<marostegui@cumin1001> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on db1210.eqiad.wmnet with reason: host reimage |
[production] |
06:49 |
<marostegui@cumin1001> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on db1126.eqiad.wmnet with reason: host reimage |
[production] |
06:49 |
<marostegui@cumin1001> |
START - Cookbook sre.hosts.downtime for 2:00:00 on db1210.eqiad.wmnet with reason: host reimage |
[production] |
06:46 |
<marostegui@cumin1001> |
START - Cookbook sre.hosts.downtime for 2:00:00 on db1126.eqiad.wmnet with reason: host reimage |
[production] |
06:45 |
<kart_> |
Updated Apertium to 2023-11-30-061450-production (T270060) |
[production] |
06:44 |
<kartik@deploy2002> |
helmfile [codfw] DONE helmfile.d/services/apertium: apply |
[production] |
06:44 |
<kartik@deploy2002> |
helmfile [codfw] START helmfile.d/services/apertium: apply |
[production] |
06:43 |
<kartik@deploy2002> |
helmfile [eqiad] DONE helmfile.d/services/apertium: apply |
[production] |
06:42 |
<kartik@deploy2002> |
helmfile [eqiad] START helmfile.d/services/apertium: apply |
[production] |
06:40 |
<kartik@deploy2002> |
helmfile [staging] DONE helmfile.d/services/apertium: apply |
[production] |
06:39 |
<kartik@deploy2002> |
helmfile [staging] START helmfile.d/services/apertium: apply |
[production] |
06:36 |
<marostegui@cumin1001> |
START - Cookbook sre.hosts.reimage for host db1126.eqiad.wmnet with OS bookworm |
[production] |
06:36 |
<marostegui@cumin1001> |
START - Cookbook sre.hosts.reimage for host db1210.eqiad.wmnet with OS bookworm |
[production] |
06:33 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'Depool db1210 T351283', diff saved to https://phabricator.wikimedia.org/P53952 and previous config saved to /var/cache/conftool/dbconfig/20231130-063317-root.json |
[production] |
06:32 |
<marostegui@cumin1001> |
dbctl commit (dc=all): 'Depool db1126 T351283', diff saved to https://phabricator.wikimedia.org/P53951 and previous config saved to /var/cache/conftool/dbconfig/20231130-063258-root.json |
[production] |
06:27 |
<marostegui@cumin1001> |
END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host db1159.eqiad.wmnet with OS bookworm |
[production] |
06:08 |
<marostegui@cumin1001> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on db1159.eqiad.wmnet with reason: host reimage |
[production] |
06:05 |
<marostegui@cumin1001> |
START - Cookbook sre.hosts.downtime for 2:00:00 on db1159.eqiad.wmnet with reason: host reimage |
[production] |
05:52 |
<marostegui@cumin1001> |
START - Cookbook sre.hosts.reimage for host db1159.eqiad.wmnet with OS bookworm |
[production] |
05:47 |
<marostegui> |
Failover m3 from db1159 to db1119 - T352149 |
[production] |
05:41 |
<marostegui@cumin1001> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1:00:00 on db[2134,2160].codfw.wmnet,db[1119,1159,1217].eqiad.wmnet with reason: m3 master switchover T352149 |
[production] |
05:41 |
<marostegui@cumin1001> |
START - Cookbook sre.hosts.downtime for 1:00:00 on db[2134,2160].codfw.wmnet,db[1119,1159,1217].eqiad.wmnet with reason: m3 master switchover T352149 |
[production] |
02:49 |
<pt1979@cumin2002> |
END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host kubernetes2060.codfw.wmnet with OS bullseye |
[production] |
02:49 |
<pt1979@cumin2002> |
END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.hosts.reimage: Host reimage - pt1979@cumin2002" |
[production] |
02:47 |
<pt1979@cumin2002> |
START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.hosts.reimage: Host reimage - pt1979@cumin2002" |
[production] |
02:44 |
<pt1979@cumin2002> |
END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host kubernetes2059.codfw.wmnet with OS bullseye |
[production] |
02:43 |
<pt1979@cumin2002> |
END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.hosts.reimage: Host reimage - pt1979@cumin2002" |
[production] |
02:42 |
<pt1979@cumin2002> |
START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.hosts.reimage: Host reimage - pt1979@cumin2002" |
[production] |
02:29 |
<pt1979@cumin2002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on kubernetes2060.codfw.wmnet with reason: host reimage |
[production] |
02:26 |
<pt1979@cumin2002> |
START - Cookbook sre.hosts.downtime for 2:00:00 on kubernetes2060.codfw.wmnet with reason: host reimage |
[production] |
02:22 |
<pt1979@cumin2002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on kubernetes2059.codfw.wmnet with reason: host reimage |
[production] |
02:19 |
<pt1979@cumin2002> |
END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host kubernetes2058.codfw.wmnet with OS bullseye |
[production] |
02:19 |
<pt1979@cumin2002> |
END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.hosts.reimage: Host reimage - pt1979@cumin2002" |
[production] |
02:18 |
<pt1979@cumin2002> |
START - Cookbook sre.hosts.downtime for 2:00:00 on kubernetes2059.codfw.wmnet with reason: host reimage |
[production] |
02:14 |
<pt1979@cumin2002> |
START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.hosts.reimage: Host reimage - pt1979@cumin2002" |
[production] |
02:09 |
<pt1979@cumin2002> |
START - Cookbook sre.hosts.reimage for host kubernetes2060.codfw.wmnet with OS bullseye |
[production] |
02:07 |
<pt1979@cumin2002> |
END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host kubernetes2057.codfw.wmnet with OS bullseye |
[production] |
02:07 |
<pt1979@cumin2002> |
END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.hosts.reimage: Host reimage - pt1979@cumin2002" |
[production] |
02:04 |
<pt1979@cumin2002> |
START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.hosts.reimage: Host reimage - pt1979@cumin2002" |
[production] |
01:56 |
<pt1979@cumin2002> |
START - Cookbook sre.hosts.reimage for host kubernetes2059.codfw.wmnet with OS bullseye |
[production] |
01:56 |
<pt1979@cumin2002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on kubernetes2058.codfw.wmnet with reason: host reimage |
[production] |
01:52 |
<pt1979@cumin2002> |
START - Cookbook sre.hosts.downtime for 2:00:00 on kubernetes2058.codfw.wmnet with reason: host reimage |
[production] |
01:46 |
<pt1979@cumin2002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on kubernetes2057.codfw.wmnet with reason: host reimage |
[production] |
01:43 |
<pt1979@cumin2002> |
START - Cookbook sre.hosts.downtime for 2:00:00 on kubernetes2057.codfw.wmnet with reason: host reimage |
[production] |
01:35 |
<pt1979@cumin2002> |
START - Cookbook sre.hosts.reimage for host kubernetes2058.codfw.wmnet with OS bullseye |
[production] |
01:25 |
<pt1979@cumin2002> |
START - Cookbook sre.hosts.reimage for host kubernetes2057.codfw.wmnet with OS bullseye |
[production] |