| 
      
        2022-08-10
      
      §
     | 
  
    
  | 15:46 | 
  <btullis@cumin1001> | 
  START - Cookbook sre.hosts.downtime for 3 days, 0:00:00 on aqs2011.codfw.wmnet with reason: btullis codfw maintenance | 
  [production] | 
            
  | 15:45 | 
  <btullis@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 3 days, 0:00:00 on aqs2010.codfw.wmnet with reason: btullis codfw maintenance | 
  [production] | 
            
  | 15:45 | 
  <btullis@cumin1001> | 
  START - Cookbook sre.hosts.downtime for 3 days, 0:00:00 on aqs2010.codfw.wmnet with reason: btullis codfw maintenance | 
  [production] | 
            
  | 15:45 | 
  <btullis@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 3 days, 0:00:00 on aqs2009.codfw.wmnet with reason: btullis codfw maintenance | 
  [production] | 
            
  | 15:45 | 
  <btullis@cumin1001> | 
  START - Cookbook sre.hosts.downtime for 3 days, 0:00:00 on aqs2009.codfw.wmnet with reason: btullis codfw maintenance | 
  [production] | 
            
  | 15:37 | 
  <urandom> | 
  (ephemerally) increasing hinted hand-off delivery rate limit to 16KB, RESTBase eqiad nodes  -- T314941 | 
  [production] | 
            
  | 15:34 | 
  <jbond> | 
  remove puppetmaster[12]002 from production | 
  [production] | 
            
  | 15:30 | 
  <jelto@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.remove-downtime (exit_code=0) for kafka-main2004.codfw.wmnet | 
  [production] | 
            
  | 15:30 | 
  <jelto@cumin1001> | 
  START - Cookbook sre.hosts.remove-downtime for kafka-main2004.codfw.wmnet | 
  [production] | 
            
  | 15:20 | 
  <jelto@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.remove-downtime (exit_code=0) for mc[2051-2052].codfw.wmnet | 
  [production] | 
            
  | 15:20 | 
  <jelto@cumin1001> | 
  START - Cookbook sre.hosts.remove-downtime for mc[2051-2052].codfw.wmnet | 
  [production] | 
            
  | 15:17 | 
  <jelto@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.remove-downtime (exit_code=0) for mc-gp2003.codfw.wmnet | 
  [production] | 
            
  | 15:17 | 
  <jelto@cumin1001> | 
  START - Cookbook sre.hosts.remove-downtime for mc-gp2003.codfw.wmnet | 
  [production] | 
            
  | 15:16 | 
  <jelto@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.remove-downtime (exit_code=0) for mc2033.codfw.wmnet | 
  [production] | 
            
  | 15:16 | 
  <jelto@cumin1001> | 
  START - Cookbook sre.hosts.remove-downtime for mc2033.codfw.wmnet | 
  [production] | 
            
  | 15:14 | 
  <_joe_> | 
  power off krb2002 | 
  [production] | 
            
  | 15:14 | 
  <elukey@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on krb2002.codfw.wmnet with reason: PDU maintenance | 
  [production] | 
            
  | 15:13 | 
  <elukey@cumin1001> | 
  START - Cookbook sre.hosts.downtime for 2:00:00 on krb2002.codfw.wmnet with reason: PDU maintenance | 
  [production] | 
            
  | 15:13 | 
  <_joe_> | 
  shutting down rdb2010,puppetmaster2002 for d5 maintenance | 
  [production] | 
            
  | 15:02 | 
  <jelto> | 
  power off mc2035 | 
  [production] | 
            
  | 15:01 | 
  <jelto> | 
  power off mc2034 | 
  [production] | 
            
  | 15:01 | 
  <jelto@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 4:00:00 on mc2035.codfw.wmnet with reason: PDU swap | 
  [production] | 
            
  | 15:01 | 
  <jelto@cumin1001> | 
  START - Cookbook sre.hosts.downtime for 4:00:00 on mc2035.codfw.wmnet with reason: PDU swap | 
  [production] | 
            
  | 15:01 | 
  <jelto@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 4:00:00 on mc2034.codfw.wmnet with reason: PDU swap | 
  [production] | 
            
  | 15:01 | 
  <jelto@cumin1001> | 
  START - Cookbook sre.hosts.downtime for 4:00:00 on mc2034.codfw.wmnet with reason: PDU swap | 
  [production] | 
            
  | 14:43 | 
  <ladsgroup@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on db2094.codfw.wmnet with reason: PDU Maint (T310146) | 
  [production] | 
            
  | 14:43 | 
  <ladsgroup@cumin1001> | 
  START - Cookbook sre.hosts.downtime for 1 day, 0:00:00 on db2094.codfw.wmnet with reason: PDU Maint (T310146) | 
  [production] | 
            
  | 14:38 | 
  <urandom> | 
  disabling reserved space on eqiad nodes (RESTBase), /dev/md2 (aka /srv/cassandra/instance-data) -- T314941 | 
  [production] | 
            
  | 14:28 | 
  <jelto> | 
  power off kafka-main2004 gracefully | 
  [production] | 
            
  | 14:28 | 
  <hnowlan> | 
  shutting down sessionstore2003 | 
  [production] | 
            
  | 14:27 | 
  <hnowlan@puppetmaster1001> | 
  conftool action : set/pooled=no; selector: name=sessionstore2003.codfw.wmnet | 
  [production] | 
            
  | 14:27 | 
  <sukhe> | 
  power off cp2039, cp2040 for PDU upgrade: rack D | 
  [production] | 
            
  | 14:27 | 
  <hnowlan@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on sessionstore2003.codfw.wmnet with reason: PDU maintenance | 
  [production] | 
            
  | 14:27 | 
  <hnowlan@cumin1001> | 
  START - Cookbook sre.hosts.downtime for 2:00:00 on sessionstore2003.codfw.wmnet with reason: PDU maintenance | 
  [production] | 
            
  | 14:25 | 
  <jelto> | 
  power off mc-gp2003 | 
  [production] | 
            
  | 14:25 | 
  <jelto> | 
  power off mc2033 | 
  [production] | 
            
  | 14:24 | 
  <jelto@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 4:30:00 on kafka-main2004.codfw.wmnet with reason: PDU swap | 
  [production] | 
            
  | 14:23 | 
  <jelto@cumin1001> | 
  START - Cookbook sre.hosts.downtime for 4:30:00 on kafka-main2004.codfw.wmnet with reason: PDU swap | 
  [production] | 
            
  | 14:23 | 
  <sukhe> | 
  depool codfw for PDU upgrade: rack D | 
  [production] | 
            
  | 14:23 | 
  <jelto@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 4:30:00 on mc-gp2003.codfw.wmnet with reason: PDU swap | 
  [production] | 
            
  | 14:23 | 
  <jelto@cumin1001> | 
  START - Cookbook sre.hosts.downtime for 4:30:00 on mc-gp2003.codfw.wmnet with reason: PDU swap | 
  [production] | 
            
  | 14:23 | 
  <jelto@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 4:30:00 on mc2033.codfw.wmnet with reason: PDU swap | 
  [production] | 
            
  | 14:23 | 
  <jelto@cumin1001> | 
  START - Cookbook sre.hosts.downtime for 4:30:00 on mc2033.codfw.wmnet with reason: PDU swap | 
  [production] | 
            
  | 14:15 | 
  <sukhe@puppetmaster1001> | 
  conftool action : set/pooled=no; selector: name=cp20[39|40]\.codfw\.wmnet,service=ats-tls | 
  [production] | 
            
  | 14:13 | 
  <sukhe@cumin2002> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 3:00:00 on cp[2039-2040].codfw.wmnet with reason: shutdown for PDU upgrade: rack D4 | 
  [production] | 
            
  | 14:13 | 
  <urandom> | 
  flushing Cassandra tables, restbase1030 | 
  [production] | 
            
  | 14:13 | 
  <sukhe@cumin2002> | 
  START - Cookbook sre.hosts.downtime for 3:00:00 on cp[2039-2040].codfw.wmnet with reason: shutdown for PDU upgrade: rack D4 | 
  [production] | 
            
  | 14:13 | 
  <urandom> | 
  flushing Cassandra tables, restbase1019 | 
  [production] | 
            
  | 14:12 | 
  <sukhe@cumin2002> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 3:00:00 on dns2002.wikimedia.org with reason: shutdown for PDU upgrade: rack D4 | 
  [production] | 
            
  | 14:12 | 
  <sukhe@cumin2002> | 
  START - Cookbook sre.hosts.downtime for 3:00:00 on dns2002.wikimedia.org with reason: shutdown for PDU upgrade: rack D4 | 
  [production] |