| 2024-06-19
      
      § | 
    
  | 14:37 | <taavi@cumin1002> | END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on cloudvirt1043.eqiad.wmnet with reason: host reimage | [production] | 
            
  | 14:36 | <taavi@cumin1002> | START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.hosts.reimage: Host reimage - taavi@cumin1002" | [production] | 
            
  | 14:35 | <taavi@cloudcumin1001> | END (PASS) - Cookbook wmcs.openstack.cloudvirt.lib.ensure_canary (exit_code=0) on eqiad1, with recreate True, for hosts list: ['cloudvirt1042'] | [cloudvirt-canary] | 
            
  | 14:35 | <moritzm> | installing nano security updates | [production] | 
            
  | 14:35 | <taavi@cloudcumin1001> | START - Cookbook wmcs.openstack.cloudvirt.lib.ensure_canary on eqiad1, with recreate True, for hosts list: ['cloudvirt1042'] | [cloudvirt-canary] | 
            
  | 14:35 | <taavi@cloudcumin1001> | START - Cookbook wmcs.openstack.cloudvirt.lib.ensure_canary on eqiad1, with recreate True, for hosts list: ['cloudvirt1043'] | [cloudvirt-canary] | 
            
  | 14:34 | <taavi@cumin1002> | START - Cookbook sre.hosts.downtime for 2:00:00 on cloudvirt1043.eqiad.wmnet with reason: host reimage | [production] | 
            
  | 14:24 | <moritzm> | installing libvpx security updates | [production] | 
            
  | 14:23 | <moritzm> | installing pymysql security updates | [production] | 
            
  | 14:19 | <brouberol@deploy1002> | helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s_services/services/datahub: sync on production | [production] | 
            
  | 14:19 | <taavi@cumin1002> | START - Cookbook sre.hosts.reimage for host cloudvirt1043.eqiad.wmnet with OS bookworm | [production] | 
            
  | 14:17 | <brouberol@deploy1002> | helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s_services/services/datahub: apply on production | [production] | 
            
  | 14:14 | <brouberol@deploy1002> | helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s_services/services/datahub-next: sync on staging | [production] | 
            
  | 14:12 | <brouberol@deploy1002> | helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s_services/services/datahub-next: apply on staging | [production] | 
            
  | 14:11 | <taavi@cumin1002> | END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on cloudvirt1042.eqiad.wmnet with reason: host reimage | [production] | 
            
  | 14:11 | <taavi@cumin2002> | END (FAIL) - Cookbook sre.hardware.upgrade-firmware (exit_code=1) upgrade firmware for hosts ['cloudvirt1043.eqiad.wmnet'] | [production] | 
            
  | 14:10 | <klausman@cumin2002> | END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host ml-staging2003.codfw.wmnet with OS bookworm | [production] | 
            
  | 14:10 | <klausman@cumin2002> | END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.hosts.reimage: Host reimage - klausman@cumin2002" | [production] | 
            
  | 14:09 | <taavi@cumin2002> | START - Cookbook sre.hardware.upgrade-firmware upgrade firmware for hosts ['cloudvirt1043.eqiad.wmnet'] | [production] | 
            
  | 14:09 | <klausman@cumin2002> | START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.hosts.reimage: Host reimage - klausman@cumin2002" | [production] | 
            
  | 14:09 | <taavi@cumin2002> | END (FAIL) - Cookbook sre.hardware.upgrade-firmware (exit_code=1) upgrade firmware for hosts ['cloudvirt1043.eqiad.wmnet'] | [production] | 
            
  | 14:08 | <taavi@cumin1002> | START - Cookbook sre.hosts.downtime for 2:00:00 on cloudvirt1042.eqiad.wmnet with reason: host reimage | [production] | 
            
  | 14:08 | <taavi@cumin2002> | START - Cookbook sre.hardware.upgrade-firmware upgrade firmware for hosts ['cloudvirt1043.eqiad.wmnet'] | [production] | 
            
  | 14:07 | <taavi@cumin2002> | END (ERROR) - Cookbook sre.hardware.upgrade-firmware (exit_code=97) upgrade firmware for hosts ['cloudvirt1043.eqiad.wmnet'] | [production] | 
            
  | 14:07 | <taavi@cumin2002> | START - Cookbook sre.hardware.upgrade-firmware upgrade firmware for hosts ['cloudvirt1043.eqiad.wmnet'] | [production] | 
            
  | 14:01 | <taavi@cumin1002> | END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host cloudvirt1044.eqiad.wmnet with OS bookworm | [production] | 
            
  | 14:00 | <taavi@cloudcumin1001> | END (PASS) - Cookbook wmcs.openstack.cloudvirt.lib.ensure_canary (exit_code=0) on eqiad1, with recreate True, for hosts list: ['cloudvirt1044'] | [cloudvirt-canary] | 
            
  | 14:00 | <taavi@cloudcumin1001> | START - Cookbook wmcs.openstack.cloudvirt.lib.ensure_canary on eqiad1, with recreate True, for hosts list: ['cloudvirt1044'] | [cloudvirt-canary] | 
            
  | 13:57 | <klausman@cumin2002> | END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on ml-staging2003.codfw.wmnet with reason: host reimage | [production] | 
            
  | 13:54 | <klausman@cumin2002> | START - Cookbook sre.hosts.downtime for 2:00:00 on ml-staging2003.codfw.wmnet with reason: host reimage | [production] | 
            
  | 13:53 | <taavi@cumin1002> | START - Cookbook sre.hosts.reimage for host cloudvirt1042.eqiad.wmnet with OS bookworm | [production] | 
            
  | 13:53 | <taavi@cumin1002> | END (ERROR) - Cookbook sre.hosts.reimage (exit_code=97) for host cloudvirt1042.eqiad.wmnet with OS bookworm | [production] | 
            
  | 13:51 | <klausman@cumin2002> | END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Trying to fix Puppet error on ml-staging2003 - klausman@cumin2002" | [production] | 
            
  | 13:50 | <klausman@cumin2002> | START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Trying to fix Puppet error on ml-staging2003 - klausman@cumin2002" | [production] | 
            
  | 13:49 | <klausman@cumin2002> | END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Trying to fix Puppet error on ml-staging2003 - klausman@cumin2002" | [production] | 
            
  | 13:48 | <klausman@cumin2002> | START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Trying to fix Puppet error on ml-staging2003 - klausman@cumin2002" | [production] | 
            
  | 13:43 | <taavi@cumin1002> | START - Cookbook sre.hosts.reimage for host cloudvirt1042.eqiad.wmnet with OS bookworm | [production] | 
            
  | 13:42 | <klausman@cumin2002> | END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Trying to fix Puppet error on ml-staging2003 - klausman@cumin2002" | [production] | 
            
  | 13:41 | <taavi@cumin2002> | END (FAIL) - Cookbook sre.hardware.upgrade-firmware (exit_code=99) upgrade firmware for hosts ['cloudvirt1042.eqiad.wmnet'] | [production] | 
            
  | 13:41 | <klausman@cumin2002> | START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Trying to fix Puppet error on ml-staging2003 - klausman@cumin2002" | [production] | 
            
  | 13:35 | <fabfur@cumin1002> | conftool action : set/pooled=yes; selector: name=cp5017.eqsin.wmnet | [production] | 
            
  | 13:35 | <taavi@cumin1002> | END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on cloudvirt1044.eqiad.wmnet with reason: host reimage | [production] | 
            
  | 13:35 | <taavi@cumin1002> | END (FAIL) - Cookbook sre.hosts.reimage (exit_code=99) for host cloudvirt1043.eqiad.wmnet with OS bookworm | [production] | 
            
  | 13:35 | <fabfur@cumin1002> | END (PASS) - Cookbook sre.cdn.roll-upgrade-haproxy (exit_code=0) rolling upgrade of HAProxy on P{cp5017.*} and A:cp | [production] | 
            
  | 13:32 | <fabfur@cumin1002> | START - Cookbook sre.cdn.roll-upgrade-haproxy rolling upgrade of HAProxy on P{cp5017.*} and A:cp | [production] | 
            
  | 13:32 | <taavi@cumin1002> | START - Cookbook sre.hosts.downtime for 2:00:00 on cloudvirt1044.eqiad.wmnet with reason: host reimage | [production] | 
            
  | 13:32 | <sukhe@puppetmaster1001> | conftool action : set/pooled=yes; selector: name=dns6001.wikimedia.org,service=ntp-a | [production] | 
            
  | 13:31 | <fabfur@cumin1002> | conftool action : set/pooled=no; selector: name=cp5017.eqsin.wmnet | [production] | 
            
  | 13:31 | <taavi@cumin2002> | START - Cookbook sre.hardware.upgrade-firmware upgrade firmware for hosts ['cloudvirt1042.eqiad.wmnet'] | [production] | 
            
  | 13:28 | <sukhe> | enable puppet on dns6001 to test CR 1046685 | [production] |