| 
      
        2020-09-08
      
      §
     | 
  
    
  | 13:18 | 
  <akosiaris@deploy1001> | 
  helmfile [eqiad] Ran 'sync' command on namespace 'mobileapps' for release 'staging' . | 
  [production] | 
            
  | 13:18 | 
  <akosiaris@deploy1001> | 
  helmfile [eqiad] Ran 'sync' command on namespace 'mobileapps' for release 'production' . | 
  [production] | 
            
  | 13:17 | 
  <akosiaris@deploy1001> | 
  helmfile [eqiad] Ran 'sync' command on namespace 'mathoid' for release 'staging' . | 
  [production] | 
            
  | 13:17 | 
  <akosiaris@deploy1001> | 
  helmfile [eqiad] Ran 'sync' command on namespace 'mathoid' for release 'production' . | 
  [production] | 
            
  | 13:16 | 
  <akosiaris@deploy1001> | 
  helmfile [eqiad] Ran 'sync' command on namespace 'eventgate-analytics' for release 'canary' . | 
  [production] | 
            
  | 13:16 | 
  <akosiaris@deploy1001> | 
  helmfile [eqiad] Ran 'sync' command on namespace 'eventgate-analytics' for release 'production' . | 
  [production] | 
            
  | 13:16 | 
  <akosiaris@deploy1001> | 
  helmfile [eqiad] Ran 'sync' command on namespace 'eventgate-analytics-external' for release 'canary' . | 
  [production] | 
            
  | 13:16 | 
  <akosiaris@deploy1001> | 
  helmfile [eqiad] Ran 'sync' command on namespace 'eventgate-analytics-external' for release 'production' . | 
  [production] | 
            
  | 13:16 | 
  <akosiaris@deploy1001> | 
  helmfile [eqiad] Ran 'sync' command on namespace 'echostore' for release 'production' . | 
  [production] | 
            
  | 13:16 | 
  <akosiaris@deploy1001> | 
  helmfile [eqiad] Ran 'sync' command on namespace 'echostore' for release 'staging' . | 
  [production] | 
            
  | 13:14 | 
  <elukey@cumin1001> | 
  END (FAIL) - Cookbook sre.hadoop.roll-restart-masters (exit_code=99) | 
  [production] | 
            
  | 13:14 | 
  <elukey@cumin1001> | 
  START - Cookbook sre.hadoop.roll-restart-masters | 
  [production] | 
            
  | 13:13 | 
  <akosiaris@deploy1001> | 
  helmfile [eqiad] Ran 'sync' command on namespace 'changeprop-jobqueue' for release 'production' . | 
  [production] | 
            
  | 13:12 | 
  <akosiaris@deploy1001> | 
  helmfile [eqiad] Ran 'sync' command on namespace 'changeprop' for release 'production' . | 
  [production] | 
            
  | 13:09 | 
  <akosiaris@deploy1001> | 
  helmfile [eqiad] Ran 'sync' command on namespace 'cxserver' for release 'staging' . | 
  [production] | 
            
  | 13:09 | 
  <akosiaris@deploy1001> | 
  helmfile [eqiad] Ran 'sync' command on namespace 'cxserver' for release 'production' . | 
  [production] | 
            
  | 13:08 | 
  <akosiaris@deploy1001> | 
  helmfile [eqiad] Ran 'sync' command on namespace 'citoid' for release 'production' . | 
  [production] | 
            
  | 13:08 | 
  <akosiaris@deploy1001> | 
  helmfile [eqiad] Ran 'sync' command on namespace 'citoid' for release 'staging' . | 
  [production] | 
            
  | 13:04 | 
  <akosiaris@deploy1001> | 
  helmfile [eqiad] Ran 'sync' command on namespace 'blubberoid' for release 'production' . | 
  [production] | 
            
  | 13:04 | 
  <akosiaris@deploy1001> | 
  helmfile [eqiad] Ran 'sync' command on namespace 'blubberoid' for release 'staging' . | 
  [production] | 
            
  | 12:47 | 
  <oblivian@deploy1001> | 
  helmfile [staging] Ran 'sync' command on namespace 'mobileapps' for release 'staging' . | 
  [production] | 
            
  | 12:35 | 
  <kormat@cumin1001> | 
  dbctl commit (dc=all): 'Repooling after reboot. T261389', diff saved to https://phabricator.wikimedia.org/P12523 and previous config saved to /var/cache/conftool/dbconfig/20200908-123546-kormat.json | 
  [production] | 
            
  | 12:34 | 
  <oblivian@deploy1001> | 
  helmfile [staging] Ran 'sync' command on namespace 'mobileapps' for release 'staging' . | 
  [production] | 
            
  | 12:27 | 
  <kormat@cumin1001> | 
  dbctl commit (dc=all): 'Rebooting for T261389', diff saved to https://phabricator.wikimedia.org/P12522 and previous config saved to /var/cache/conftool/dbconfig/20200908-122702-kormat.json | 
  [production] | 
            
  | 12:27 | 
  <kormat@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) | 
  [production] | 
            
  | 12:27 | 
  <kormat@cumin1001> | 
  START - Cookbook sre.hosts.downtime | 
  [production] | 
            
  | 12:11 | 
  <kormat@cumin1001> | 
  dbctl commit (dc=all): 'Repooling after reboot. T261389', diff saved to https://phabricator.wikimedia.org/P12521 and previous config saved to /var/cache/conftool/dbconfig/20200908-121139-kormat.json | 
  [production] | 
            
  | 12:04 | 
  <kormat@cumin1001> | 
  dbctl commit (dc=all): 'Rebooting for T261389', diff saved to https://phabricator.wikimedia.org/P12520 and previous config saved to /var/cache/conftool/dbconfig/20200908-120419-kormat.json | 
  [production] | 
            
  | 12:04 | 
  <kormat@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) | 
  [production] | 
            
  | 12:04 | 
  <kormat@cumin1001> | 
  START - Cookbook sre.hosts.downtime | 
  [production] | 
            
  | 11:34 | 
  <akosiaris@deploy1001> | 
  helmfile [eqiad] Ran 'sync' command on namespace 'kube-system' for release 'calico-policy-controller' . | 
  [production] | 
            
  | 11:33 | 
  <akosiaris@deploy1001> | 
  helmfile [eqiad] Ran 'sync' command on namespace 'kube-system' for release 'coredns' . | 
  [production] | 
            
  | 11:33 | 
  <akosiaris@deploy1001> | 
  helmfile [eqiad] Ran 'sync' command on namespace 'kube-system' for release 'rbac-deploy-clusterrole' . | 
  [production] | 
            
  | 11:18 | 
  <jynus@cumin1001> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) | 
  [production] | 
            
  | 11:15 | 
  <jynus@cumin1001> | 
  START - Cookbook sre.hosts.downtime | 
  [production] | 
            
  | 10:53 | 
  <akosiaris@deploy1001> | 
  helmfile [eqiad] Ran 'sync' command on namespace 'kube-system' for release 'calico-policy-controller' . | 
  [production] | 
            
  | 10:53 | 
  <marostegui> | 
  Deploy schema change on s3 eqiad master - T253276 | 
  [production] | 
            
  | 10:53 | 
  <akosiaris@deploy1001> | 
  helmfile [eqiad] Ran 'sync' command on namespace 'kube-system' for release 'coredns' . | 
  [production] | 
            
  | 10:53 | 
  <akosiaris@deploy1001> | 
  helmfile [eqiad] Ran 'sync' command on namespace 'kube-system' for release 'rbac-deploy-clusterrole' . | 
  [production] | 
            
  | 10:20 | 
  <marostegui> | 
  Deploy schema change on s4 eqiad master - T253276 | 
  [production] | 
            
  | 10:14 | 
  <jmm@cumin2001> | 
  END (FAIL) - Cookbook sre.hosts.reboot-single (exit_code=99) | 
  [production] | 
            
  | 10:14 | 
  <jmm@cumin2001> | 
  START - Cookbook sre.hosts.reboot-single | 
  [production] | 
            
  | 10:11 | 
  <jmm@cumin2001> | 
  END (FAIL) - Cookbook sre.hosts.reboot-single (exit_code=99) | 
  [production] | 
            
  | 10:11 | 
  <jmm@cumin2001> | 
  START - Cookbook sre.hosts.reboot-single | 
  [production] | 
            
  | 10:08 | 
  <kormat@cumin1001> | 
  dbctl commit (dc=all): 'Repooling after reboot. T261389', diff saved to https://phabricator.wikimedia.org/P12519 and previous config saved to /var/cache/conftool/dbconfig/20200908-100852-kormat.json | 
  [production] | 
            
  | 09:52 | 
  <akosiaris> | 
  enable puppet, run it on all k8s eqiad nodes and double check that calico-node is fine T239835 | 
  [production] | 
            
  | 09:43 | 
  <akosiaris> | 
  stopped calico-node and kube-apiserver on k8s nodes/masters T239835 | 
  [production] | 
            
  | 09:43 | 
  <marostegui> | 
  Stop mysql on es2014 to clone es2026 T261717 | 
  [production] | 
            
  | 09:39 | 
  <marostegui@cumin1001> | 
  dbctl commit (dc=all): 'Depool es2014 - T261717', diff saved to https://phabricator.wikimedia.org/P12517 and previous config saved to /var/cache/conftool/dbconfig/20200908-093957-marostegui.json | 
  [production] | 
            
  | 09:37 | 
  <volans> | 
  running homer 'cr*eqiad*' commit "Update debmonitor IPs (#2), T261489" | 
  [production] |