2023-07-06
§
|
14:13 |
<btullis@deploy1002> |
helmfile [staging] START helmfile.d/services/datahub: apply on main |
[production] |
14:12 |
<stevemunene@cumin1001> |
START - Cookbook sre.dns.netbox |
[production] |
14:09 |
<btullis@deploy1002> |
helmfile [staging] START helmfile.d/services/datahub: apply on main |
[production] |
14:06 |
<stevemunene@cumin1001> |
START - Cookbook sre.hosts.decommission for hosts analytics1067.eqiad.wmnet |
[production] |
14:05 |
<hnowlan> |
disabling puppet on A:cp-text to test 935464 |
[production] |
14:05 |
<hnowlan@puppetmaster1001> |
conftool action : set/pooled=no; selector: service=ats-be,name=cp2037.codfw.wmnet |
[production] |
14:02 |
<sukhe@cumin2002> |
START - Cookbook sre.hosts.reimage for host dns1004.wikimedia.org with OS bullseye |
[production] |
14:02 |
<sukhe@cumin2002> |
END (ERROR) - Cookbook sre.hosts.reimage (exit_code=97) for host dns1004.wikimedia.org with OS bullseye |
[production] |
14:01 |
<btullis@cumin1001> |
START - Cookbook sre.hosts.reimage for host an-test-worker1003.eqiad.wmnet with OS bullseye |
[production] |
13:56 |
<sukhe@cumin2002> |
START - Cookbook sre.hosts.reimage for host dns1004.wikimedia.org with OS bullseye |
[production] |
13:55 |
<bking@cumin1001> |
START - Cookbook sre.wdqs.data-transfer |
[production] |
13:54 |
<btullis@deploy1002> |
helmfile [staging] DONE helmfile.d/services/datahub: sync on main |
[production] |
13:51 |
<pt1979@cumin2002> |
END (PASS) - Cookbook sre.hosts.dhcp (exit_code=0) for host cloudlb1001.eqiad.wmnet |
[production] |
13:42 |
<btullis@deploy1002> |
helmfile [staging] START helmfile.d/services/datahub: apply on main |
[production] |
13:38 |
<pt1979@cumin2002> |
START - Cookbook sre.hosts.dhcp for host cloudlb1001.eqiad.wmnet |
[production] |
13:34 |
<btullis@deploy1002> |
helmfile [staging] DONE helmfile.d/services/datahub: sync on main |
[production] |
13:33 |
<elukey@cumin1001> |
END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host zookeeper-test1002.eqiad.wmnet with OS bookworm |
[production] |
13:32 |
<pt1979@cumin2002> |
END (PASS) - Cookbook sre.hosts.dhcp (exit_code=0) for host an-test-worker1003.eqiad.wmnet |
[production] |
13:30 |
<stevemunene@cumin1001> |
END (PASS) - Cookbook sre.hosts.decommission (exit_code=0) for hosts analytics1066.eqiad.wmnet |
[production] |
13:30 |
<stevemunene@cumin1001> |
END (PASS) - Cookbook sre.dns.netbox (exit_code=0) |
[production] |
13:30 |
<stevemunene@cumin1001> |
END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: analytics1066.eqiad.wmnet decommissioned, removing all IPs except the asset tag one - stevemunene@cumin1001" |
[production] |
13:29 |
<btullis@deploy1002> |
helmfile [staging] START helmfile.d/services/datahub: apply on main |
[production] |
13:29 |
<pt1979@cumin2002> |
START - Cookbook sre.hosts.dhcp for host an-test-worker1003.eqiad.wmnet |
[production] |
13:29 |
<pt1979@cumin2002> |
END (PASS) - Cookbook sre.hosts.dhcp (exit_code=0) for host an-test-worker1003.eqiad.wmnet |
[production] |
13:24 |
<stevemunene@cumin1001> |
START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: analytics1066.eqiad.wmnet decommissioned, removing all IPs except the asset tag one - stevemunene@cumin1001" |
[production] |
13:22 |
<stevemunene@cumin1001> |
START - Cookbook sre.dns.netbox |
[production] |
13:18 |
<urbanecm@deploy1002> |
Finished scap: Backport for [[gerrit:935815|Enable global abuse filters on almost all projects (T341159)]] (duration: 10m 07s) |
[production] |
13:17 |
<btullis@cumin1001> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 7 days, 0:00:00 on an-worker1095.eqiad.wmnet with reason: Replacing RAID controller battery |
[production] |
13:17 |
<btullis@cumin1001> |
START - Cookbook sre.hosts.downtime for 7 days, 0:00:00 on an-worker1095.eqiad.wmnet with reason: Replacing RAID controller battery |
[production] |
13:14 |
<stevemunene@cumin1001> |
START - Cookbook sre.hosts.decommission for hosts analytics1066.eqiad.wmnet |
[production] |
13:12 |
<stevemunene@cumin1001> |
END (PASS) - Cookbook sre.hosts.decommission (exit_code=0) for hosts analytics1065.eqiad.wmnet |
[production] |
13:12 |
<stevemunene@cumin1001> |
END (PASS) - Cookbook sre.dns.netbox (exit_code=0) |
[production] |
13:12 |
<stevemunene@cumin1001> |
END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: analytics1065.eqiad.wmnet decommissioned, removing all IPs except the asset tag one - stevemunene@cumin1001" |
[production] |
13:10 |
<btullis@cumin1001> |
END (PASS) - Cookbook sre.kafka.roll-restart-brokers (exit_code=0) for Kafka A:kafka-test-eqiad cluster: Roll restart of jvm daemons. |
[production] |
13:10 |
<stevemunene@cumin1001> |
START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: analytics1065.eqiad.wmnet decommissioned, removing all IPs except the asset tag one - stevemunene@cumin1001" |
[production] |
13:10 |
<urbanecm@deploy1002> |
urbanecm: Backport for [[gerrit:935815|Enable global abuse filters on almost all projects (T341159)]] synced to the testservers: mwdebug2001.codfw.wmnet, mwdebug2002.codfw.wmnet, mwdebug1002.eqiad.wmnet, mwdebug1001.eqiad.wmnet |
[production] |
13:08 |
<urbanecm@deploy1002> |
Started scap: Backport for [[gerrit:935815|Enable global abuse filters on almost all projects (T341159)]] |
[production] |
13:08 |
<stevemunene@cumin1001> |
START - Cookbook sre.dns.netbox |
[production] |
13:02 |
<stevemunene@cumin1001> |
START - Cookbook sre.hosts.decommission for hosts analytics1065.eqiad.wmnet |
[production] |
13:00 |
<aborrero@cumin1001> |
END (ERROR) - Cookbook sre.hosts.reimage (exit_code=97) for host cloudlb1001.eqiad.wmnet with OS bullseye |
[production] |
12:58 |
<elukey@cumin1001> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on zookeeper-test1002.eqiad.wmnet with reason: host reimage |
[production] |
12:58 |
<stevemunene@cumin1001> |
END (PASS) - Cookbook sre.hosts.decommission (exit_code=0) for hosts analytics1064.eqiad.wmnet |
[production] |
12:58 |
<stevemunene@cumin1001> |
END (PASS) - Cookbook sre.dns.netbox (exit_code=0) |
[production] |
12:58 |
<stevemunene@cumin1001> |
END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: analytics1064.eqiad.wmnet decommissioned, removing all IPs except the asset tag one - stevemunene@cumin1001" |
[production] |
12:56 |
<elukey@cumin1001> |
START - Cookbook sre.hosts.downtime for 2:00:00 on zookeeper-test1002.eqiad.wmnet with reason: host reimage |
[production] |
12:43 |
<stevemunene@cumin1001> |
START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: analytics1064.eqiad.wmnet decommissioned, removing all IPs except the asset tag one - stevemunene@cumin1001" |
[production] |
12:42 |
<elukey@cumin1001> |
START - Cookbook sre.hosts.reimage for host zookeeper-test1002.eqiad.wmnet with OS bookworm |
[production] |
12:40 |
<stevemunene@cumin1001> |
START - Cookbook sre.dns.netbox |
[production] |
12:35 |
<stevemunene@cumin1001> |
START - Cookbook sre.hosts.decommission for hosts analytics1064.eqiad.wmnet |
[production] |
12:32 |
<samtar@deploy1002> |
Finished scap: Backport for [[gerrit:935854|Revert "Add tag when reference added to the page" (T341202)]] (duration: 24m 04s) |
[production] |