| 
      
        2023-07-10
      
      §
     | 
  
    
  | 13:21 | 
  <btullis@cumin1001> | 
  START - Cookbook sre.dns.wipe-cache karapace1002.eqiad.wmnet on all recursors | 
  [production] | 
            
  | 13:21 | 
  <btullis@cumin1001> | 
  END (PASS) - Cookbook sre.dns.netbox (exit_code=0) | 
  [production] | 
            
  | 13:21 | 
  <btullis@cumin1001> | 
  END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Add records for VM karapace1002.eqiad.wmnet - btullis@cumin1001" | 
  [production] | 
            
  | 13:20 | 
  <btullis@cumin1001> | 
  START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Add records for VM karapace1002.eqiad.wmnet - btullis@cumin1001" | 
  [production] | 
            
  | 13:20 | 
  <ladsgroup@deploy1002> | 
  isaranto and ladsgroup: Backport for [[gerrit:935743|ores extension: deploy LiftWing usage on testwiki (T319170)]] synced to the testservers: mwdebug1002.eqiad.wmnet, mwdebug1001.eqiad.wmnet, mwdebug2001.codfw.wmnet, mwdebug2002.codfw.wmnet | 
  [production] | 
            
  | 13:18 | 
  <ladsgroup@deploy1002> | 
  Started scap: Backport for [[gerrit:935743|ores extension: deploy LiftWing usage on testwiki (T319170)]] | 
  [production] | 
            
  | 13:16 | 
  <lucaswerkmeister-wmde@deploy1002> | 
  Finished scap: Backport for [[gerrit:936322|Disable wgParserEnableLegacyMediaDOM on group2 wikis (T314318)]] (duration: 10m 26s) | 
  [production] | 
            
  | 13:16 | 
  <btullis@cumin1001> | 
  START - Cookbook sre.dns.netbox | 
  [production] | 
            
  | 13:16 | 
  <btullis@cumin1001> | 
  START - Cookbook sre.ganeti.makevm for new host karapace1002.eqiad.wmnet | 
  [production] | 
            
  | 13:07 | 
  <lucaswerkmeister-wmde@deploy1002> | 
  lucaswerkmeister-wmde and arlolra: Backport for [[gerrit:936322|Disable wgParserEnableLegacyMediaDOM on group2 wikis (T314318)]] synced to the testservers: mwdebug1002.eqiad.wmnet, mwdebug2002.codfw.wmnet, mwdebug1001.eqiad.wmnet, mwdebug2001.codfw.wmnet | 
  [production] | 
            
  | 13:05 | 
  <lucaswerkmeister-wmde@deploy1002> | 
  Started scap: Backport for [[gerrit:936322|Disable wgParserEnableLegacyMediaDOM on group2 wikis (T314318)]] | 
  [production] | 
            
  | 12:34 | 
  <claime> | 
  Running puppet on cp-text hosts - T341463 | 
  [production] | 
            
  | 12:33 | 
  <claime> | 
  Sending 1% of global traffic to mw-on-k8s - T341463 | 
  [production] | 
            
  | 12:04 | 
  <moritzm> | 
  failover ganeti masters in drmrs | 
  [production] | 
            
  | 12:02 | 
  <jmm@cumin2002> | 
  END (PASS) - Cookbook sre.ganeti.drain-node (exit_code=0) for draining ganeti node ganeti6004.drmrs.wmnet | 
  [production] | 
            
  | 12:02 | 
  <jmm@cumin2002> | 
  END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ganeti6004.drmrs.wmnet | 
  [production] | 
            
  | 11:55 | 
  <jmm@cumin2002> | 
  START - Cookbook sre.hosts.reboot-single for host ganeti6004.drmrs.wmnet | 
  [production] | 
            
  | 11:55 | 
  <moritzm> | 
  installing avahi security updates | 
  [production] | 
            
  | 11:52 | 
  <vgutierrez> | 
  repool cp2037 (debugging finished) - T320967 | 
  [production] | 
            
  | 11:42 | 
  <jmm@cumin2002> | 
  START - Cookbook sre.ganeti.drain-node for draining ganeti node ganeti6004.drmrs.wmnet | 
  [production] | 
            
  | 11:36 | 
  <jmm@cumin2002> | 
  END (PASS) - Cookbook sre.ganeti.drain-node (exit_code=0) for draining ganeti node ganeti6003.drmrs.wmnet | 
  [production] | 
            
  | 11:35 | 
  <jmm@cumin2002> | 
  END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ganeti6003.drmrs.wmnet | 
  [production] | 
            
  | 11:34 | 
  <btullis@deploy1002> | 
  helmfile [staging] DONE helmfile.d/services/datahub: sync on main | 
  [production] | 
            
  | 11:30 | 
  <btullis@deploy1002> | 
  helmfile [staging] START helmfile.d/services/datahub: apply on main | 
  [production] | 
            
  | 11:29 | 
  <jmm@cumin2002> | 
  START - Cookbook sre.hosts.reboot-single for host ganeti6003.drmrs.wmnet | 
  [production] | 
            
  | 11:28 | 
  <jmm@cumin2002> | 
  START - Cookbook sre.ganeti.drain-node for draining ganeti node ganeti6003.drmrs.wmnet | 
  [production] | 
            
  | 11:28 | 
  <btullis@deploy1002> | 
  helmfile [staging] START helmfile.d/services/datahub: apply on main | 
  [production] | 
            
  | 11:23 | 
  <btullis@deploy1002> | 
  helmfile [staging] DONE helmfile.d/services/datahub: sync on main | 
  [production] | 
            
  | 11:15 | 
  <jmm@cumin2002> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 28 days, 0:00:00 on debmonitor2003.codfw.wmnet with reason: WIP | 
  [production] | 
            
  | 11:15 | 
  <jmm@cumin2002> | 
  START - Cookbook sre.hosts.downtime for 28 days, 0:00:00 on debmonitor2003.codfw.wmnet with reason: WIP | 
  [production] | 
            
  | 11:14 | 
  <moritzm> | 
  remove unused VM netflow6002 T330884 | 
  [production] | 
            
  | 11:11 | 
  <btullis@deploy1002> | 
  helmfile [staging] START helmfile.d/services/datahub: apply on main | 
  [production] | 
            
  | 11:11 | 
  <jmm@cumin2002> | 
  END (FAIL) - Cookbook sre.ganeti.drain-node (exit_code=99) for draining ganeti node ganeti6003.drmrs.wmnet | 
  [production] | 
            
  | 11:05 | 
  <jmm@cumin2002> | 
  START - Cookbook sre.ganeti.drain-node for draining ganeti node ganeti6003.drmrs.wmnet | 
  [production] | 
            
  | 10:55 | 
  <moritzm> | 
  failover ganeti master in eqiad to ganeti1029 | 
  [production] | 
            
  | 10:53 | 
  <jmm@cumin2002> | 
  END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ganeti1034.eqiad.wmnet | 
  [production] | 
            
  | 10:50 | 
  <elukey@deploy1002> | 
  helmfile [codfw] DONE helmfile.d/services/eventgate-main: sync | 
  [production] | 
            
  | 10:50 | 
  <elukey@deploy1002> | 
  helmfile [codfw] START helmfile.d/services/eventgate-main: sync | 
  [production] | 
            
  | 10:49 | 
  <aborrero@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host cloudlb1002.eqiad.wmnet with OS bullseye | 
  [production] | 
            
  | 10:46 | 
  <jmm@cumin2002> | 
  START - Cookbook sre.hosts.reboot-single for host ganeti1034.eqiad.wmnet | 
  [production] | 
            
  | 10:45 | 
  <btullis@deploy1002> | 
  helmfile [staging] DONE helmfile.d/services/datahub: sync on main | 
  [production] | 
            
  | 10:44 | 
  <elukey@deploy1002> | 
  helmfile [staging] DONE helmfile.d/services/eventgate-main: sync | 
  [production] | 
            
  | 10:44 | 
  <elukey@deploy1002> | 
  helmfile [staging] START helmfile.d/services/eventgate-main: sync | 
  [production] | 
            
  | 10:43 | 
  <vgutierrez@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.remove-downtime (exit_code=0) for cp2037.codfw.wmnet | 
  [production] | 
            
  | 10:43 | 
  <vgutierrez@cumin1001> | 
  START - Cookbook sre.hosts.remove-downtime for cp2037.codfw.wmnet | 
  [production] | 
            
  | 10:34 | 
  <btullis@deploy1002> | 
  helmfile [staging] START helmfile.d/services/datahub: apply on main | 
  [production] | 
            
  | 10:28 | 
  <aborrero@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on cloudlb1002.eqiad.wmnet with reason: host reimage | 
  [production] | 
            
  | 10:26 | 
  <jmm@cumin2002> | 
  START - Cookbook sre.ganeti.drain-node for draining ganeti node ganeti1034.eqiad.wmnet | 
  [production] | 
            
  | 10:25 | 
  <aborrero@cumin1001> | 
  START - Cookbook sre.hosts.downtime for 2:00:00 on cloudlb1002.eqiad.wmnet with reason: host reimage | 
  [production] | 
            
  | 10:21 | 
  <jmm@cumin2002> | 
  END (PASS) - Cookbook sre.ganeti.drain-node (exit_code=0) for draining ganeti node ganeti1033.eqiad.wmnet | 
  [production] |