| 
      
        2025-01-15
      
      §
     | 
  
    
  | 13:44 | 
  <jelto@cumin1002> | 
  START - Cookbook sre.dns.netbox | 
  [production] | 
            
  | 13:43 | 
  <jelto@cumin1002> | 
  START - Cookbook sre.hosts.move-vlan for host wikikube-worker2224 | 
  [production] | 
            
  | 13:43 | 
  <jelto@cumin1002> | 
  START - Cookbook sre.hosts.reimage for host wikikube-worker2224.codfw.wmnet with OS bookworm | 
  [production] | 
            
  | 13:40 | 
  <jelto@cumin1002> | 
  END (PASS) - Cookbook sre.dns.wipe-cache (exit_code=0) wikikube-worker2224.codfw.wmnet wikikube-worker2225.codfw.wmnet wikikube-worker2226.codfw.wmnet wikikube-worker2227.codfw.wmnet on all recursors | 
  [production] | 
            
  | 13:40 | 
  <jelto@cumin1002> | 
  START - Cookbook sre.dns.wipe-cache wikikube-worker2224.codfw.wmnet wikikube-worker2225.codfw.wmnet wikikube-worker2226.codfw.wmnet wikikube-worker2227.codfw.wmnet on all recursors | 
  [production] | 
            
  | 13:39 | 
  <dcausse> | 
  errata: depooling wdqs1013 (high lag) | 
  [production] | 
            
  | 13:39 | 
  <dcausse> | 
  depooling wdqs1003 (high lag) | 
  [production] | 
            
  | 13:36 | 
  <moritzm> | 
  imported firmware-amd-graphics 20230210-5~bpo11+1 into component/amd-gpu-firmware for bullseye-wikimedia T383557 | 
  [production] | 
            
  | 13:31 | 
  <jynus@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on dbprov1004.eqiad.wmnet with reason: os upgrade | 
  [production] | 
            
  | 13:30 | 
  <jynus@cumin1002> | 
  START - Cookbook sre.hosts.downtime for 2:00:00 on dbprov1004.eqiad.wmnet with reason: os upgrade | 
  [production] | 
            
  | 13:30 | 
  <jelto@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.rename (exit_code=0) from mw2368 to wikikube-worker2227 | 
  [production] | 
            
  | 13:30 | 
  <jelto@cumin1002> | 
  END (PASS) - Cookbook sre.network.configure-switch-interfaces (exit_code=0) for host wikikube-worker2227 | 
  [production] | 
            
  | 13:29 | 
  <jelto@cumin1002> | 
  START - Cookbook sre.network.configure-switch-interfaces for host wikikube-worker2227 | 
  [production] | 
            
  | 13:29 | 
  <jelto@cumin1002> | 
  END (PASS) - Cookbook sre.dns.netbox (exit_code=0) | 
  [production] | 
            
  | 13:29 | 
  <jelto@cumin1002> | 
  END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Renaming mw2368 to wikikube-worker2227 - jelto@cumin1002" | 
  [production] | 
            
  | 13:22 | 
  <hnowlan@deploy1003> | 
  helmfile [codfw] DONE helmfile.d/services/shellbox-video: apply | 
  [production] | 
            
  | 13:22 | 
  <hnowlan@deploy1003> | 
  helmfile [codfw] START helmfile.d/services/shellbox-video: apply | 
  [production] | 
            
  | 13:21 | 
  <hnowlan@deploy1003> | 
  helmfile [eqiad] DONE helmfile.d/services/shellbox-video: apply | 
  [production] | 
            
  | 13:21 | 
  <hnowlan@deploy1003> | 
  helmfile [eqiad] START helmfile.d/services/shellbox-video: apply | 
  [production] | 
            
  | 13:14 | 
  <marostegui@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on db1163.eqiad.wmnet with reason: maintenance | 
  [production] | 
            
  | 13:14 | 
  <marostegui@cumin1002> | 
  START - Cookbook sre.hosts.downtime for 1 day, 0:00:00 on db1163.eqiad.wmnet with reason: maintenance | 
  [production] | 
            
  | 13:09 | 
  <elukey> | 
  restart wdqs-blazegraph.service on wdqs1013 - failed http probes | 
  [production] | 
            
  | 13:06 | 
  <elukey> | 
  `elukey@puppetmaster1001:~$ sudo puppet cert destroy graphite.discovery.wmnet` | 
  [production] | 
            
  | 13:05 | 
  <marostegui@cumin1002> | 
  dbctl commit (dc=all): 'Depool db1163 T383689', diff saved to https://phabricator.wikimedia.org/P72073 and previous config saved to /var/cache/conftool/dbconfig/20250115-130511-marostegui.json | 
  [production] | 
            
  | 13:03 | 
  <marostegui@cumin1002> | 
  dbctl commit (dc=all): 'Promote db1184 to s1 primary T383689', diff saved to https://phabricator.wikimedia.org/P72072 and previous config saved to /var/cache/conftool/dbconfig/20250115-130354-root.json | 
  [production] | 
            
  | 13:03 | 
  <jelto@cumin1002> | 
  START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Renaming mw2368 to wikikube-worker2227 - jelto@cumin1002" | 
  [production] | 
            
  | 13:03 | 
  <marostegui> | 
  Starting s1 eqiad failover from db1163 to db1184 - T383689 | 
  [production] | 
            
  | 12:59 | 
  <jelto@cumin1002> | 
  START - Cookbook sre.dns.netbox | 
  [production] | 
            
  | 12:58 | 
  <jelto@cumin1002> | 
  START - Cookbook sre.hosts.rename from mw2368 to wikikube-worker2227 | 
  [production] | 
            
  | 12:58 | 
  <marostegui@cumin1002> | 
  dbctl commit (dc=all): 'Remove db1184 from API T383689', diff saved to https://phabricator.wikimedia.org/P72071 and previous config saved to /var/cache/conftool/dbconfig/20250115-125818-root.json | 
  [production] | 
            
  | 12:58 | 
  <jelto@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.rename (exit_code=0) from mw2367 to wikikube-worker2226 | 
  [production] | 
            
  | 12:57 | 
  <marostegui@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1:00:00 on 34 hosts with reason: Primary switchover s1 T383689 | 
  [production] | 
            
  | 12:57 | 
  <jelto@cumin1002> | 
  END (PASS) - Cookbook sre.network.configure-switch-interfaces (exit_code=0) for host wikikube-worker2226 | 
  [production] | 
            
  | 12:57 | 
  <marostegui@cumin1002> | 
  dbctl commit (dc=all): 'Set db1184 with weight 0 T383689', diff saved to https://phabricator.wikimedia.org/P72070 and previous config saved to /var/cache/conftool/dbconfig/20250115-125732-root.json | 
  [production] | 
            
  | 12:57 | 
  <jelto@cumin1002> | 
  START - Cookbook sre.network.configure-switch-interfaces for host wikikube-worker2226 | 
  [production] | 
            
  | 12:57 | 
  <jelto@cumin1002> | 
  END (PASS) - Cookbook sre.dns.netbox (exit_code=0) | 
  [production] | 
            
  | 12:57 | 
  <jelto@cumin1002> | 
  END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Renaming mw2367 to wikikube-worker2226 - jelto@cumin1002" | 
  [production] | 
            
  | 12:57 | 
  <marostegui@cumin1002> | 
  START - Cookbook sre.hosts.downtime for 1:00:00 on 34 hosts with reason: Primary switchover s1 T383689 | 
  [production] | 
            
  | 12:57 | 
  <jelto@cumin1002> | 
  START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Renaming mw2367 to wikikube-worker2226 - jelto@cumin1002" | 
  [production] | 
            
  | 12:53 | 
  <jelto@cumin1002> | 
  START - Cookbook sre.dns.netbox | 
  [production] | 
            
  | 12:53 | 
  <jelto@cumin1002> | 
  START - Cookbook sre.hosts.rename from mw2367 to wikikube-worker2226 | 
  [production] | 
            
  | 12:52 | 
  <jelto@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.rename (exit_code=0) from mw2366 to wikikube-worker2225 | 
  [production] | 
            
  | 12:51 | 
  <jelto@cumin1002> | 
  END (PASS) - Cookbook sre.network.configure-switch-interfaces (exit_code=0) for host wikikube-worker2225 | 
  [production] | 
            
  | 12:51 | 
  <jelto@cumin1002> | 
  START - Cookbook sre.network.configure-switch-interfaces for host wikikube-worker2225 | 
  [production] | 
            
  | 12:51 | 
  <jelto@cumin1002> | 
  END (PASS) - Cookbook sre.dns.netbox (exit_code=0) | 
  [production] | 
            
  | 12:51 | 
  <jelto@cumin1002> | 
  END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Renaming mw2366 to wikikube-worker2225 - jelto@cumin1002" | 
  [production] | 
            
  | 12:50 | 
  <jelto@cumin1002> | 
  START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Renaming mw2366 to wikikube-worker2225 - jelto@cumin1002" | 
  [production] | 
            
  | 12:46 | 
  <jelto@cumin1002> | 
  START - Cookbook sre.dns.netbox | 
  [production] | 
            
  | 12:46 | 
  <jelto@cumin1002> | 
  START - Cookbook sre.hosts.rename from mw2366 to wikikube-worker2225 | 
  [production] | 
            
  | 12:45 | 
  <jelto@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.rename (exit_code=0) from mw2359 to wikikube-worker2224 | 
  [production] |