| 
      
        2022-04-21
      
      §
     | 
  
    
  | 14:26 | 
  <ladsgroup@cumin1001> | 
  dbctl commit (dc=all): 'Repooling after maintenance db1179', diff saved to https://phabricator.wikimedia.org/P25975 and previous config saved to /var/cache/conftool/dbconfig/20220421-142631-ladsgroup.json | 
  [production] | 
            
  | 14:26 | 
  <jmm@cumin2002> | 
  END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host thumbor1005.eqiad.wmnet | 
  [production] | 
            
  | 14:25 | 
  <kormat@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1:30:00 on db1117.eqiad.wmnet with reason: Rebooting for T303174 | 
  [production] | 
            
  | 14:25 | 
  <kormat@cumin1001> | 
  START - Cookbook sre.hosts.downtime for 1:30:00 on db1117.eqiad.wmnet with reason: Rebooting for T303174 | 
  [production] | 
            
  | 14:24 | 
  <ladsgroup@cumin1001> | 
  dbctl commit (dc=all): 'Repooling after maintenance db1144:3315 (T298565)', diff saved to https://phabricator.wikimedia.org/P25974 and previous config saved to /var/cache/conftool/dbconfig/20220421-142413-ladsgroup.json | 
  [production] | 
            
  | 14:22 | 
  <kormat@cumin1001> | 
  dbctl commit (dc=all): 'db1152 (re)pooling @ 50%: Reboot T303174', diff saved to https://phabricator.wikimedia.org/P25973 and previous config saved to /var/cache/conftool/dbconfig/20220421-142223-kormat.json | 
  [production] | 
            
  | 14:17 | 
  <ladsgroup@cumin1001> | 
  dbctl commit (dc=all): 'Depooling db1144:3315 (T298565)', diff saved to https://phabricator.wikimedia.org/P25972 and previous config saved to /var/cache/conftool/dbconfig/20220421-141727-ladsgroup.json | 
  [production] | 
            
  | 14:17 | 
  <ladsgroup@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 6:00:00 on db1144.eqiad.wmnet with reason: Maintenance | 
  [production] | 
            
  | 14:17 | 
  <ladsgroup@cumin1001> | 
  START - Cookbook sre.hosts.downtime for 6:00:00 on db1144.eqiad.wmnet with reason: Maintenance | 
  [production] | 
            
  | 14:16 | 
  <jmm@cumin2002> | 
  START - Cookbook sre.hosts.reboot-single for host thumbor1005.eqiad.wmnet | 
  [production] | 
            
  | 14:15 | 
  <jmm@cumin2002> | 
  END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host thumbor1002.eqiad.wmnet | 
  [production] | 
            
  | 14:11 | 
  <ladsgroup@cumin1001> | 
  dbctl commit (dc=all): 'Repooling after maintenance db1179', diff saved to https://phabricator.wikimedia.org/P25971 and previous config saved to /var/cache/conftool/dbconfig/20220421-141126-ladsgroup.json | 
  [production] | 
            
  | 14:10 | 
  <cmjohnson@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.provision (exit_code=0) for host parse1019.mgmt.eqiad.wmnet with reboot policy FORCED | 
  [production] | 
            
  | 14:10 | 
  <cmjohnson@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.provision (exit_code=0) for host parse1020.mgmt.eqiad.wmnet with reboot policy FORCED | 
  [production] | 
            
  | 14:09 | 
  <mwdebug-deploy@deploy1002> | 
  helmfile [codfw] DONE helmfile.d/services/mwdebug: apply | 
  [production] | 
            
  | 14:09 | 
  <mwdebug-deploy@deploy1002> | 
  helmfile [codfw] START helmfile.d/services/mwdebug: apply | 
  [production] | 
            
  | 14:09 | 
  <mwdebug-deploy@deploy1002> | 
  helmfile [eqiad] DONE helmfile.d/services/mwdebug: apply | 
  [production] | 
            
  | 14:09 | 
  <mwdebug-deploy@deploy1002> | 
  helmfile [eqiad] START helmfile.d/services/mwdebug: apply | 
  [production] | 
            
  | 14:07 | 
  <kormat@cumin1001> | 
  dbctl commit (dc=all): 'db1152 (re)pooling @ 25%: Reboot T303174', diff saved to https://phabricator.wikimedia.org/P25969 and previous config saved to /var/cache/conftool/dbconfig/20220421-140719-kormat.json | 
  [production] | 
            
  | 14:05 | 
  <jmm@cumin2002> | 
  START - Cookbook sre.hosts.reboot-single for host thumbor1002.eqiad.wmnet | 
  [production] | 
            
  | 14:03 | 
  <kormat@cumin1001> | 
  dbctl commit (dc=all): 'db1152 depooling: Rebooting for T303174', diff saved to https://phabricator.wikimedia.org/P25968 and previous config saved to /var/cache/conftool/dbconfig/20220421-140309-kormat.json | 
  [production] | 
            
  | 14:03 | 
  <kormat@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1:30:00 on db1152.eqiad.wmnet with reason: Rebooting for T303174 | 
  [production] | 
            
  | 14:03 | 
  <kormat@cumin1001> | 
  START - Cookbook sre.hosts.downtime for 1:30:00 on db1152.eqiad.wmnet with reason: Rebooting for T303174 | 
  [production] | 
            
  | 14:02 | 
  <jmm@cumin2002> | 
  END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host thumbor1001.eqiad.wmnet | 
  [production] | 
            
  | 13:58 | 
  <kormat@cumin1001> | 
  dbctl commit (dc=all): 'db1120 depooling: Rebooting for T303174', diff saved to https://phabricator.wikimedia.org/P25967 and previous config saved to /var/cache/conftool/dbconfig/20220421-135831-kormat.json | 
  [production] | 
            
  | 13:58 | 
  <kormat@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1:30:00 on db1120.eqiad.wmnet with reason: Rebooting for T303174 | 
  [production] | 
            
  | 13:58 | 
  <kormat@cumin1001> | 
  START - Cookbook sre.hosts.downtime for 1:30:00 on db1120.eqiad.wmnet with reason: Rebooting for T303174 | 
  [production] | 
            
  | 13:56 | 
  <ladsgroup@cumin1001> | 
  dbctl commit (dc=all): 'Repooling after maintenance db1179 (T298565)', diff saved to https://phabricator.wikimedia.org/P25966 and previous config saved to /var/cache/conftool/dbconfig/20220421-135621-ladsgroup.json | 
  [production] | 
            
  | 13:55 | 
  <cmjohnson@cumin1001> | 
  START - Cookbook sre.hosts.provision for host parse1020.mgmt.eqiad.wmnet with reboot policy FORCED | 
  [production] | 
            
  | 13:55 | 
  <cmjohnson@cumin1001> | 
  START - Cookbook sre.hosts.provision for host parse1019.mgmt.eqiad.wmnet with reboot policy FORCED | 
  [production] | 
            
  | 13:54 | 
  <moritzm> | 
  powercycling thumbor1001, stuck on reboot | 
  [production] | 
            
  | 13:45 | 
  <jmm@cumin2002> | 
  START - Cookbook sre.hosts.reboot-single for host thumbor1001.eqiad.wmnet | 
  [production] | 
            
  | 13:34 | 
  <mwdebug-deploy@deploy1002> | 
  helmfile [codfw] DONE helmfile.d/services/mwdebug: apply | 
  [production] | 
            
  | 13:34 | 
  <mwdebug-deploy@deploy1002> | 
  helmfile [codfw] START helmfile.d/services/mwdebug: apply | 
  [production] | 
            
  | 13:34 | 
  <mwdebug-deploy@deploy1002> | 
  helmfile [eqiad] DONE helmfile.d/services/mwdebug: apply | 
  [production] | 
            
  | 13:34 | 
  <mwdebug-deploy@deploy1002> | 
  helmfile [eqiad] START helmfile.d/services/mwdebug: apply | 
  [production] | 
            
  | 13:32 | 
  <ladsgroup@cumin1001> | 
  dbctl commit (dc=all): 'Repooling after maintenance db1130 (T298565)', diff saved to https://phabricator.wikimedia.org/P25965 and previous config saved to /var/cache/conftool/dbconfig/20220421-133204-ladsgroup.json | 
  [production] | 
            
  | 13:31 | 
  <taavi@deploy1002> | 
  Synchronized wmf-config/interwiki.php: Config: [[gerrit:785157|Update interwiki cache]] (duration: 00m 51s) | 
  [production] | 
            
  | 13:29 | 
  <ladsgroup@cumin1001> | 
  dbctl commit (dc=all): 'Depooling db1130 (T298565)', diff saved to https://phabricator.wikimedia.org/P25964 and previous config saved to /var/cache/conftool/dbconfig/20220421-132935-ladsgroup.json | 
  [production] | 
            
  | 13:29 | 
  <ladsgroup@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 6:00:00 on db1130.eqiad.wmnet with reason: Maintenance | 
  [production] | 
            
  | 13:29 | 
  <ladsgroup@cumin1001> | 
  START - Cookbook sre.hosts.downtime for 6:00:00 on db1130.eqiad.wmnet with reason: Maintenance | 
  [production] | 
            
  | 13:25 | 
  <ladsgroup@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 6:00:00 on dbstore1003.eqiad.wmnet with reason: Maintenance | 
  [production] | 
            
  | 13:25 | 
  <ladsgroup@cumin1001> | 
  START - Cookbook sre.hosts.downtime for 6:00:00 on dbstore1003.eqiad.wmnet with reason: Maintenance | 
  [production] | 
            
  | 13:23 | 
  <ladsgroup@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 12:00:00 on 8 hosts with reason: Maintenance | 
  [production] | 
            
  | 13:23 | 
  <ladsgroup@cumin1001> | 
  START - Cookbook sre.hosts.downtime for 12:00:00 on 8 hosts with reason: Maintenance | 
  [production] | 
            
  | 13:23 | 
  <ladsgroup@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 6:00:00 on db2123.codfw.wmnet with reason: Maintenance | 
  [production] | 
            
  | 13:23 | 
  <ladsgroup@cumin1001> | 
  START - Cookbook sre.hosts.downtime for 6:00:00 on db2123.codfw.wmnet with reason: Maintenance | 
  [production] | 
            
  | 13:19 | 
  <jmm@cumin2002> | 
  END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host thumbor2006.codfw.wmnet | 
  [production] | 
            
  | 13:19 | 
  <ladsgroup@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 6:00:00 on db1150.eqiad.wmnet with reason: Maintenance | 
  [production] | 
            
  | 13:19 | 
  <ladsgroup@cumin1001> | 
  START - Cookbook sre.hosts.downtime for 6:00:00 on db1150.eqiad.wmnet with reason: Maintenance | 
  [production] |