| 
      
        2024-09-04
      
      §
     | 
  
    
  | 15:59 | 
  <cmooney@cumin1002> | 
  START - Cookbook sre.hosts.downtime for 0:30:00 on 27 hosts with reason: Move server uplinks codfw racks C1 | 
  [production] | 
            
  | 15:58 | 
  <elukey@cumin2002> | 
  START - Cookbook sre.hosts.provision for host ml-lab1001.mgmt.eqiad.wmnet with chassis set policy FORCE_RESTART | 
  [production] | 
            
  | 15:56 | 
  <hnowlan@cumin1002> | 
  START - Cookbook sre.dns.netbox | 
  [production] | 
            
  | 15:56 | 
  <hnowlan@cumin1002> | 
  START - Cookbook sre.hosts.move-vlan for host wikikube-worker2083 | 
  [production] | 
            
  | 15:56 | 
  <hnowlan@cumin1002> | 
  START - Cookbook sre.hosts.reimage for host wikikube-worker2083.codfw.wmnet with OS bullseye | 
  [production] | 
            
  | 15:56 | 
  <hnowlan@cumin1002> | 
  START - Cookbook sre.k8s.renumber-node Renumbering for host wikikube-worker2083.codfw.wmnet | 
  [production] | 
            
  | 15:56 | 
  <arnaudb@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 0:30:00 on 10 hosts with reason: network maintenance T370852 | 
  [production] | 
            
  | 15:55 | 
  <arnaudb@cumin1002> | 
  START - Cookbook sre.hosts.downtime for 0:30:00 on 10 hosts with reason: network maintenance T370852 | 
  [production] | 
            
  | 15:55 | 
  <arnaudb@cumin1002> | 
  dbctl commit (dc=all): 'depool db2125 db2138 db2149 db2190 db2206 db2207 es2031 es2032 es2036 - T370852', diff saved to https://phabricator.wikimedia.org/P68650 and previous config saved to /var/cache/conftool/dbconfig/20240904-155459-arnaudb.json | 
  [production] | 
            
  | 15:53 | 
  <ladsgroup@deploy1003> | 
  Finished scap sync-world: Backport for [[gerrit:1070324|Fix bug causing review form to disappear on unreviewed pages (T373582)]] (duration: 10m 31s) | 
  [production] | 
            
  | 15:53 | 
  <swfrench@cumin2002> | 
  START - Cookbook sre.hosts.decommission for hosts mw[2260,2267].codfw.wmnet | 
  [production] | 
            
  | 15:48 | 
  <ladsgroup@deploy1003> | 
  ladsgroup: Continuing with sync | 
  [production] | 
            
  | 15:47 | 
  <ladsgroup@deploy1003> | 
  ladsgroup: Backport for [[gerrit:1070324|Fix bug causing review form to disappear on unreviewed pages (T373582)]] synced to the testservers (https://wikitech.wikimedia.org/wiki/Mwdebug) | 
  [production] | 
            
  | 15:46 | 
  <bking@cumin2002> | 
  END (FAIL) - Cookbook sre.wdqs.restart (exit_code=99) | 
  [production] | 
            
  | 15:43 | 
  <aqu@deploy1003> | 
  Finished deploy [airflow-dags/analytics@3b0d8ba]: Regular analytics weekly train [airflow-dags@3b0d8ba1] (duration: 00m 48s) | 
  [production] | 
            
  | 15:43 | 
  <topranks> | 
  configure lsw1-c1-codfw interfaces for servers in advance of move T373095 | 
  [production] | 
            
  | 15:43 | 
  <ladsgroup@deploy1003> | 
  Started scap sync-world: Backport for [[gerrit:1070324|Fix bug causing review form to disappear on unreviewed pages (T373582)]] | 
  [production] | 
            
  | 15:42 | 
  <aqu@deploy1003> | 
  Started deploy [airflow-dags/analytics@3b0d8ba]: Regular analytics weekly train [airflow-dags@3b0d8ba1] | 
  [production] | 
            
  | 15:25 | 
  <swfrench@cumin2002> | 
  END (PASS) - Cookbook sre.k8s.pool-depool-node (exit_code=0) depool for host mw2267.codfw.wmnet | 
  [production] | 
            
  | 15:24 | 
  <swfrench@cumin2002> | 
  START - Cookbook sre.k8s.pool-depool-node depool for host mw2267.codfw.wmnet | 
  [production] | 
            
  | 15:21 | 
  <hnowlan@cumin1002> | 
  END (PASS) - Cookbook sre.k8s.pool-depool-node (exit_code=0) pool for host wikikube-worker2081.codfw.wmnet | 
  [production] | 
            
  | 15:20 | 
  <hnowlan@cumin1002> | 
  START - Cookbook sre.k8s.pool-depool-node pool for host wikikube-worker2081.codfw.wmnet | 
  [production] | 
            
  | 15:15 | 
  <vgutierrez@cumin1002> | 
  conftool action : set/pooled=yes; selector: name=cp7015.magru.wmnet | 
  [production] | 
            
  | 15:14 | 
  <elukey@cumin2002> | 
  END (PASS) - Cookbook sre.hosts.provision (exit_code=0) for host ml-lab1001.mgmt.eqiad.wmnet with chassis set policy FORCE_RESTART | 
  [production] | 
            
  | 15:13 | 
  <vgutierrez@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.remove-downtime (exit_code=0) for cp7015.magru.wmnet | 
  [production] | 
            
  | 15:13 | 
  <vgutierrez@cumin1002> | 
  START - Cookbook sre.hosts.remove-downtime for cp7015.magru.wmnet | 
  [production] | 
            
  | 15:12 | 
  <jclark@cumin1002> | 
  START - Cookbook sre.hosts.reimage for host phab1005.eqiad.wmnet with OS bookworm | 
  [production] | 
            
  | 15:12 | 
  <jclark@cumin1002> | 
  END (FAIL) - Cookbook sre.hosts.reimage (exit_code=99) for host phab1005.eqiad.wmnet with OS bookworm | 
  [production] | 
            
  | 15:11 | 
  <elukey@cumin2002> | 
  START - Cookbook sre.hosts.provision for host ml-lab1001.mgmt.eqiad.wmnet with chassis set policy FORCE_RESTART | 
  [production] | 
            
  | 15:09 | 
  <hashar@deploy1003> | 
  Finished scap sync-world: Backport for [[gerrit:1070548|ParserOutput::collectMetadata: Log if given value is non-numeric and also non-string, for easier debugging, and don't fatal (T373920)]] (duration: 08m 37s) | 
  [production] | 
            
  | 15:06 | 
  <elukey@cumin2002> | 
  END (FAIL) - Cookbook sre.hosts.provision (exit_code=99) for host ml-lab1001.mgmt.eqiad.wmnet with chassis set policy FORCE_RESTART | 
  [production] | 
            
  | 15:06 | 
  <cgoubert@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on wikikube-worker2036.codfw.wmnet with reason: host reimage | 
  [production] | 
            
  | 15:05 | 
  <jclark@cumin1002> | 
  START - Cookbook sre.hosts.reimage for host ml-lab1001.eqiad.wmnet with OS bookworm | 
  [production] | 
            
  | 15:04 | 
  <hashar@deploy1003> | 
  hashar: Continuing with sync | 
  [production] | 
            
  | 15:04 | 
  <hashar@deploy1003> | 
  hashar: Backport for [[gerrit:1070548|ParserOutput::collectMetadata: Log if given value is non-numeric and also non-string, for easier debugging, and don't fatal (T373920)]] synced to the testservers (https://wikitech.wikimedia.org/wiki/Mwdebug) | 
  [production] | 
            
  | 15:02 | 
  <cgoubert@cumin1002> | 
  START - Cookbook sre.hosts.downtime for 2:00:00 on wikikube-worker2036.codfw.wmnet with reason: host reimage | 
  [production] | 
            
  | 15:02 | 
  <elukey@cumin2002> | 
  START - Cookbook sre.hosts.provision for host ml-lab1001.mgmt.eqiad.wmnet with chassis set policy FORCE_RESTART | 
  [production] | 
            
  | 15:00 | 
  <hashar@deploy1003> | 
  Started scap sync-world: Backport for [[gerrit:1070548|ParserOutput::collectMetadata: Log if given value is non-numeric and also non-string, for easier debugging, and don't fatal (T373920)]] | 
  [production] | 
            
  | 14:49 | 
  <claime> | 
  homer cr*codfw* commit 'T372878' | 
  [production] | 
            
  | 14:44 | 
  <cgoubert@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.move-vlan (exit_code=0) for host wikikube-worker2036 | 
  [production] | 
            
  | 14:44 | 
  <cgoubert@cumin1002> | 
  END (PASS) - Cookbook sre.network.configure-switch-interfaces (exit_code=0) for host wikikube-worker2036 | 
  [production] | 
            
  | 14:44 | 
  <cgoubert@cumin1002> | 
  START - Cookbook sre.network.configure-switch-interfaces for host wikikube-worker2036 | 
  [production] | 
            
  | 14:44 | 
  <cgoubert@cumin1002> | 
  END (PASS) - Cookbook sre.dns.wipe-cache (exit_code=0) wikikube-worker2036.codfw.wmnet 121.16.192.10.in-addr.arpa 1.2.1.0.6.1.0.0.2.9.1.0.0.1.0.0.2.0.1.0.0.6.8.0.0.0.0.0.0.2.6.2.ip6.arpa on all recursors | 
  [production] | 
            
  | 14:44 | 
  <cgoubert@cumin1002> | 
  START - Cookbook sre.dns.wipe-cache wikikube-worker2036.codfw.wmnet 121.16.192.10.in-addr.arpa 1.2.1.0.6.1.0.0.2.9.1.0.0.1.0.0.2.0.1.0.0.6.8.0.0.0.0.0.0.2.6.2.ip6.arpa on all recursors | 
  [production] | 
            
  | 14:44 | 
  <cgoubert@cumin1002> | 
  END (PASS) - Cookbook sre.dns.netbox (exit_code=0) | 
  [production] | 
            
  | 14:44 | 
  <cgoubert@cumin1002> | 
  END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Update records for host wikikube-worker2036 - cgoubert@cumin1002" | 
  [production] | 
            
  | 14:44 | 
  <cgoubert@cumin1002> | 
  START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Update records for host wikikube-worker2036 - cgoubert@cumin1002" | 
  [production] | 
            
  | 14:40 | 
  <stevemunene@deploy1003> | 
  helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s-services/airflow-test-k8s: apply | 
  [production] | 
            
  | 14:40 | 
  <cgoubert@cumin1002> | 
  START - Cookbook sre.dns.netbox | 
  [production] | 
            
  | 14:40 | 
  <bking@cumin2002> | 
  START - Cookbook sre.wdqs.restart | 
  [production] |