2021-06-15
§
|
17:46 |
<razzi> |
remove hdfs namenode backup on stat1004 |
[analytics] |
17:45 |
<razzi> |
enable puppet on an-launcher |
[analytics] |
17:45 |
<razzi> |
sudo -u yarn kerberos-run-command yarn yarn rmadmin -refreshQueues |
[analytics] |
16:55 |
<razzi> |
sudo -i wmf-auto-reimage-host -p T278423 an-master1002.eqiad.wmnet |
[analytics] |
16:53 |
<razzi> |
run uid script on an-master1002 |
[analytics] |
16:33 |
<elukey> |
restart hadoop-yarn-resourcemanager on an-master1001 |
[analytics] |
16:16 |
<razzi> |
sudo systemctl stop 'hadoop-*' on an-master1002 |
[analytics] |
16:14 |
<razzi> |
sudo systemctl stop hadoop-* on an-master1001, then realized I meant to do this on an-master1002, so started hadoop-* again on an-master1001 |
[analytics] |
16:11 |
<razzi> |
downtime an-master1002 |
[analytics] |
15:55 |
<razzi> |
sudo transfer.py an-master1001.eqiad.wmnet:/srv/hadoop/backup/hdfs-namenode-snapshot-buster-reimage-2021-06-15.tar.gz stat1004.eqiad.wmnet:/home/razzi/hdfs-namenode-fsimage |
[analytics] |
15:42 |
<razzi> |
tar -czf /srv/hadoop/backup/hdfs-namenode-snapshot-buster-reimage-$(date --iso-8601).tar.gz current on an-master1001 |
[analytics] |
15:38 |
<razzi> |
back up /srv/hadoop/name/current to /home/razzi/hdfs-namenode-snapshot-buster-reimage-2021-06-15.tar.gz on an-master1001 |
[analytics] |
15:33 |
<razzi> |
sudo -u hdfs kerberos-run-command hdfs hdfs dfsadmin -saveNamespace |
[analytics] |