| 
      
        2023-11-06
      
      §
     | 
  
    
  | 17:46 | 
  <bking@deploy2002> | 
  helmfile [staging] DONE helmfile.d/services/rdf-streaming-updater: apply | 
  [production] | 
            
  | 17:46 | 
  <bking@deploy2002> | 
  helmfile [staging] START helmfile.d/services/rdf-streaming-updater: apply | 
  [production] | 
            
  | 17:46 | 
  <jclark@cumin1001> | 
  START - Cookbook sre.hardware.upgrade-firmware upgrade firmware for hosts ['cloudrabbit1003'] | 
  [production] | 
            
  | 17:41 | 
  <otto@deploy2002> | 
  helmfile [staging] DONE helmfile.d/services/eventgate-analytics: apply | 
  [production] | 
            
  | 17:41 | 
  <otto@deploy2002> | 
  helmfile [staging] START helmfile.d/services/eventgate-analytics: apply | 
  [production] | 
            
  | 17:35 | 
  <andrew@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host cloudrabbit1002.wikimedia.org with OS bookworm | 
  [production] | 
            
  | 17:24 | 
  <jynus@cumin2002> | 
  END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host backup2011.codfw.wmnet with OS bookworm | 
  [production] | 
            
  | 17:19 | 
  <andrew@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on cloudrabbit1002.wikimedia.org with reason: host reimage | 
  [production] | 
            
  | 17:15 | 
  <andrew@cumin1001> | 
  START - Cookbook sre.hosts.downtime for 2:00:00 on cloudrabbit1002.wikimedia.org with reason: host reimage | 
  [production] | 
            
  | 17:07 | 
  <jynus@cumin2002> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on backup2011.codfw.wmnet with reason: host reimage | 
  [production] | 
            
  | 17:05 | 
  <otto@deploy2002> | 
  helmfile [eqiad] DONE helmfile.d/services/eventgate-analytics: apply | 
  [production] | 
            
  | 17:03 | 
  <jynus@cumin2002> | 
  START - Cookbook sre.hosts.downtime for 2:00:00 on backup2011.codfw.wmnet with reason: host reimage | 
  [production] | 
            
  | 17:03 | 
  <andrew@cumin1001> | 
  START - Cookbook sre.hosts.reimage for host cloudrabbit1002.wikimedia.org with OS bookworm | 
  [production] | 
            
  | 17:03 | 
  <andrew@cumin1001> | 
  START - Cookbook sre.hosts.reimage for host cloudrabbit1003.wikimedia.org with OS bookworm | 
  [production] | 
            
  | 17:01 | 
  <sukhe@cumin2002> | 
  END (ERROR) - Cookbook sre.hosts.reimage (exit_code=97) for host cp4052.ulsfo.wmnet with OS bookworm | 
  [production] | 
            
  | 16:56 | 
  <sukhe@cumin2002> | 
  START - Cookbook sre.hosts.reimage for host cp4052.ulsfo.wmnet with OS bookworm | 
  [production] | 
            
  | 16:56 | 
  <sukhe@cumin2002> | 
  END (ERROR) - Cookbook sre.hosts.reimage (exit_code=97) for host cp4052.ulsfo.wmnet with OS bookworm | 
  [production] | 
            
  | 16:55 | 
  <jdrewniak@deploy2002> | 
  Synchronized portals: Wikimedia Portals Update: [[gerrit:971991| Bumping portals to master (T128546)]] (duration: 05m 34s) | 
  [production] | 
            
  | 16:49 | 
  <otto@deploy2002> | 
  helmfile [eqiad] START helmfile.d/services/eventgate-analytics: apply | 
  [production] | 
            
  | 16:49 | 
  <jdrewniak@deploy2002> | 
  Synchronized portals/wikipedia.org/assets: Wikimedia Portals Update: [[gerrit:971991| Bumping portals to master (T128546)]] (duration: 05m 53s) | 
  [production] | 
            
  | 16:49 | 
  <sukhe@cumin2002> | 
  START - Cookbook sre.hosts.reimage for host cp4052.ulsfo.wmnet with OS bookworm | 
  [production] | 
            
  | 16:49 | 
  <sukhe@cumin2002> | 
  END (ERROR) - Cookbook sre.hosts.reimage (exit_code=97) for host cp4052.ulsfo.wmnet with OS bookworm | 
  [production] | 
            
  | 16:48 | 
  <otto@deploy2002> | 
  helmfile [staging] DONE helmfile.d/services/eventgate-analytics: apply | 
  [production] | 
            
  | 16:48 | 
  <otto@deploy2002> | 
  helmfile [staging] START helmfile.d/services/eventgate-analytics: apply | 
  [production] | 
            
  | 16:45 | 
  <otto@deploy2002> | 
  helmfile [codfw] DONE helmfile.d/services/eventgate-logging-external: apply | 
  [production] | 
            
  | 16:44 | 
  <otto@deploy2002> | 
  helmfile [codfw] START helmfile.d/services/eventgate-logging-external: apply | 
  [production] | 
            
  | 16:44 | 
  <sukhe@cumin2002> | 
  START - Cookbook sre.hosts.reimage for host cp4052.ulsfo.wmnet with OS bookworm | 
  [production] | 
            
  | 16:43 | 
  <otto@deploy2002> | 
  helmfile [eqiad] DONE helmfile.d/services/eventgate-logging-external: apply | 
  [production] | 
            
  | 16:43 | 
  <otto@deploy2002> | 
  helmfile [eqiad] START helmfile.d/services/eventgate-logging-external: apply | 
  [production] | 
            
  | 16:41 | 
  <otto@deploy2002> | 
  helmfile [staging] DONE helmfile.d/services/eventgate-logging-external: apply | 
  [production] | 
            
  | 16:41 | 
  <otto@deploy2002> | 
  helmfile [staging] START helmfile.d/services/eventgate-logging-external: apply | 
  [production] | 
            
  | 16:41 | 
  <ottomata> | 
  beginning deployments of eventgate clusters: mesh and cert chart updates, as well as sleep timeout values for graceful envoy+eventgate container termination - T349823 T300033 T346638 | 
  [production] | 
            
  | 16:33 | 
  <bking@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host wdqs1014.eqiad.wmnet | 
  [production] | 
            
  | 16:29 | 
  <btullis@cumin1001> | 
  END (FAIL) - Cookbook sre.wikireplicas.add-wiki (exit_code=99) | 
  [production] | 
            
  | 16:29 | 
  <btullis@cumin1001> | 
  START - Cookbook sre.wikireplicas.add-wiki | 
  [production] | 
            
  | 16:28 | 
  <jynus@cumin2002> | 
  START - Cookbook sre.hosts.reimage for host backup2011.codfw.wmnet with OS bookworm | 
  [production] | 
            
  | 16:26 | 
  <bking@cumin1001> | 
  START - Cookbook sre.hosts.reboot-single for host wdqs1014.eqiad.wmnet | 
  [production] | 
            
  | 16:10 | 
  <bking@deploy2002> | 
  helmfile [staging] DONE helmfile.d/services/rdf-streaming-updater: apply | 
  [production] | 
            
  | 16:10 | 
  <bking@deploy2002> | 
  helmfile [staging] START helmfile.d/services/rdf-streaming-updater: apply | 
  [production] | 
            
  | 16:09 | 
  <marostegui@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host pc1016.eqiad.wmnet with OS bookworm | 
  [production] | 
            
  | 16:08 | 
  <marostegui@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host pc2016.codfw.wmnet with OS bookworm | 
  [production] | 
            
  | 16:02 | 
  <fnegri@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host cloudrabbit1001.wikimedia.org with OS bookworm | 
  [production] | 
            
  | 15:54 | 
  <marostegui@cumin1001> | 
  END (ERROR) - Cookbook sre.hosts.downtime (exit_code=97) for 2:00:00 on pc1016.eqiad.wmnet with reason: host reimage | 
  [production] | 
            
  | 15:52 | 
  <marostegui@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on pc2016.codfw.wmnet with reason: host reimage | 
  [production] | 
            
  | 15:50 | 
  <marostegui@cumin1001> | 
  START - Cookbook sre.hosts.downtime for 2:00:00 on pc1016.eqiad.wmnet with reason: host reimage | 
  [production] | 
            
  | 15:50 | 
  <marostegui@cumin1001> | 
  START - Cookbook sre.hosts.downtime for 2:00:00 on pc2016.codfw.wmnet with reason: host reimage | 
  [production] | 
            
  | 15:46 | 
  <fnegri@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on cloudrabbit1001.wikimedia.org with reason: host reimage | 
  [production] | 
            
  | 15:45 | 
  <bking@deploy2002> | 
  helmfile [staging] DONE helmfile.d/services/rdf-streaming-updater: apply | 
  [production] | 
            
  | 15:45 | 
  <marostegui@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 3:00:00 on pc2015.codfw.wmnet,pc1015.eqiad.wmnet with reason: Upgrade | 
  [production] | 
            
  | 15:44 | 
  <marostegui@cumin1001> | 
  START - Cookbook sre.hosts.downtime for 3:00:00 on pc2015.codfw.wmnet,pc1015.eqiad.wmnet with reason: Upgrade | 
  [production] |