hadoop-zookeeper配置YARN-HA集群

1.原版yarn-site.xml




 
  
  <?xml version="1.0"?>
  <!--
    Licensed under the Apache License, Version
  2.0 (the "License");
    you may not use this file except in
  compliance with the License.
    You may obtain a copy of the License at
   
     
  http://www.apache.org/licenses/LICENSE-2.0
   
    Unless required by applicable law or agreed
  to in writing, software
    distributed under the License is
  distributed on an "AS IS" BASIS,
    WITHOUT WARRANTIES OR CONDITIONS OF ANY
  KIND, either express or implied.
    See the License for the specific language
  governing permissions and
    limitations under the License. See accompanying
  LICENSE file.
  -->
  <configuration>
   
  <!-- Site
  specific YARN configuration properties -->
  <!-- reducer获取数据的方式 -->
      <property>
         
  <name>yarn.nodemanager.aux-services</name>
          <value>mapreduce_shuffle</value>
      </property>
   
  <!-- 指定YARN的ResourceManager的地址 -->
          <property>
                 
  <name>yarn.resourcemanager.hostname</name>
                 
  <value>hadoop203.cevent.com</value>
          </property>
   
   
  </configuration>
  ~
  
 


2.修改版yarn-site.xml




 
  
  [cevent@hadoop202
  hadoop-2.7.2]$ vim etc/hadoop/yarn-site.xml
   
  <configuration>
   
  <!-- Site
  specific YARN configuration properties -->
  <!-- reducer获取数据的方式 -->
      <property>
         
  <name>yarn.nodemanager.aux-services</name>
         
  <value>mapreduce_shuffle</value>
      </property>
   
      <!-- 日志聚集功能  -->
          <property>
                 
  <name>yarn.log-aggregation-enable</name>
                 
  <value>true</value>
          </property>
      <!-- 日志保留时间设置为7天（单位：秒，604800秒） -->
          <property>
                 
  <name>yarn.log-aggregation.retain-seconds</name>
                  <value>604800</value>
          </property>
   
      <!--启用resourcemanager ha-->
      <property>
         
  <name>yarn.resourcemanager.ha.enabled</name>
          <value>true</value>
      </property>
   
      <!--声明两台resourcemanager的地址-->
      <property>
          <name>yarn.resourcemanager.cluster-id</name>
         
  <value>cluster-yarn1</value>
      </property>
   
      <property>
         
  <name>yarn.resourcemanager.ha.rm-ids</name>
          <value>rm1,rm2</value>
      </property>
   
      <property>
         
  <name>yarn.resourcemanager.hostname.rm1</name>
         
  <value>hadoop202.cevent.com</value>
      </property>
   
      <property>
         
  <name>yarn.resourcemanager.hostname.rm2</name>
         
  <value>hadoop203.cevent.com</value>
      </property>
   
      <!--指定zookeeper集群的地址-->
      <property>
          <name>yarn.resourcemanager.zk-address</name>
         
  <value>hadoop202.cevent.com:2181,hadoop203.cevent.com:2181,hadoop204.cevent.com:2181</value>
      </property>
   
      <!--启用自动恢复-->
      <property>
         
  <name>yarn.resourcemanager.recovery.enabled</name>
          <value>true</value>
      </property>
   
      <!--指定resourcemanager的状态信息存储在zookeeper集群-->
      <property>
         
  <name>yarn.resourcemanager.store.class</name>     
         
  <value>org.apache.hadoop.yarn.server.resourcemanager.recovery.ZKRMStateStore</value>
      </property>
   
  </configuration>
   
  
 


3.hadoop202分发yarn-site




 
  
  [cevent@hadoop202
  hadoop-2.7.2]$ xsync etc/hadoop/yarn-site.xml 
  fname=yarn-site.xml
  pdir=/opt/module/hadoop-HA/hadoop-2.7.2/etc/hadoop
  ---------------
  hadoop203.cevent.com ----------------
  sending incremental
  file list
  yarn-site.xml
   
  sent 1840
  bytes  received 43 bytes  3766.00 bytes/sec
  total size is
  2457  speedup is 1.30
  ---------------
  hadoop204.cevent.com ----------------
  sending
  incremental file list
  yarn-site.xml
   
  sent 1840
  bytes  received 43 bytes  3766.00 bytes/sec
  total size is
  2457  speedup is 1.30
  
 


4.在hadoop203上查看分发结果




 
  
   
      <!--指定zookeeper集群的地址--> 
      <property>
         
  <name>yarn.resourcemanager.zk-address</name>
         
  <value>hadoop202.cevent.com:2181,hadoop203.cevent.com:2181,hadoop204.cevent.com:2181</value>
      </property>
   
      <!--启用自动恢复--> 
      <property>
         
  <name>yarn.resourcemanager.recovery.enabled</name>
          <value>true</value>
      </property>
   
      <!--指定resourcemanager的状态信息存储在zookeeper集群--> 
      <property>
          <name>yarn.resourcemanager.store.class</name>    
         
  <value>org.apache.hadoop.yarn.server.resourcemanager.recovery.ZKRMStateStore</value>
      </property>
   
   
   
  </configuration>
  You have new
  mail in /var/spool/mail/root
  [cevent@hadoop203
  hadoop-2.7.2]$
  
 


5.在hadoop202上启动hdfs：启动journalnode(sbin/hadoop-daemon.sh)并格式化namenode(bin/hdfs namenode -format)




 
  
  [cevent@hadoop202
  hadoop-2.7.2]$ sbin/hadoop-daemon.sh start
  journalnode  启动journalnode
  starting
  journalnode, logging to
  /opt/module/hadoop-HA/hadoop-2.7.2/logs/hadoop-cevent-journalnode-hadoop202.cevent.com.out
  You
  have new mail in /var/spool/mail/root
  [cevent@hadoop202
  hadoop-2.7.2]$ bin/hdfs namenode -format   格式化namenode
  20/04/23
  20:53:20 INFO namenode.NameNode: STARTUP_MSG: 
  /************************************************************
  STARTUP_MSG:
  Starting NameNode
  STARTUP_MSG:   host = hadoop202.cevent.com/192.168.1.202
  STARTUP_MSG:   args = [-format]
  STARTUP_MSG:  
  version = 2.7.2
  …….
  Re-format filesystem in
  Storage Directory /opt/module/hadoop-HA/hadoop-2.7.2/data/tmp/dfs/name ? (Y
  or N) y
  Re-format filesystem in QJM to
  [192.168.1.202:8485, 192.168.1.203:8485, 192.168.1.204:8485] ? (Y or N) y
  20/04/23
  20:53:36 INFO namenode.FSImage: Allocated new BlockPoolId:
  BP-1726989784-192.168.1.202-1587646416928
  20/04/23
  20:53:36 INFO common.Storage: Storage directory
  /opt/module/hadoop-HA/hadoop-2.7.2/data/tmp/dfs/name has been successfully
  formatted.
  20/04/23
  20:53:37 INFO namenode.NNStorageRetentionManager: Going to retain 1 images
  with txid >= 0
  20/04/23
  20:53:37 INFO util.ExitUtil: Exiting with status 0
  20/04/23
  20:53:37 INFO namenode.NameNode: SHUTDOWN_MSG: 
  /************************************************************
  SHUTDOWN_MSG: Shutting down
  NameNode at hadoop202.cevent.com/192.168.1.202
  ************************************************************/
  [cevent@hadoop202
  hadoop-2.7.2]$ sbin/hadoop-daemon.sh start
  namenode  启动namenode
  starting
  namenode, logging to
  /opt/module/hadoop-HA/hadoop-2.7.2/logs/hadoop-cevent-namenode-hadoop202.cevent.com.out
  [cevent@hadoop202
  hadoop-2.7.2]$ jps
  3742
  Jps
  3666
  NameNode
      3532 JournalNode
   
  
 


6.启动Hadoop203的备用namenode(nn2，该节点同时也是resourcemanager2)




 
  
  [cevent@hadoop203 hadoop-2.7.2]$ bin/hdfs namenode -bootstrapStandby   同步nn1的元数据
  20/04/23
  20:59:10 INFO namenode.NameNode: STARTUP_MSG: 
  /************************************************************
  STARTUP_MSG:
  Starting NameNode
  STARTUP_MSG:   host = hadoop203.cevent.com/192.168.1.203
  STARTUP_MSG:   args = [-bootstrapStandby]
  STARTUP_MSG:  
  version = 2.7.2
  20/04/23
  20:59:14 WARN common.Util: Path
  /opt/module/hadoop-HA/hadoop-2.7.2/data/tmp/dfs/name should be specified as a
  URI in configuration files. Please update hdfs configuration.
  =====================================================
  About to bootstrap Standby ID
  nn2 from:
             Nameservice ID: ceventcluster
          Other Namenode ID: nn1
    Other NN's HTTP address:
  http://hadoop202.cevent.com:50070
    Other NN's IPC  address: hadoop202.cevent.com/192.168.1.202:9000
               Namespace ID: 324046010
              Block pool ID:
  BP-1726989784-192.168.1.202-1587646416928
                 Cluster ID:
  CID-8c5b68c3-24a2-46c1-949b-391664f18d84
             Layout version: -63
         isUpgradeFinalized: true
  =====================================================
  Re-format filesystem in
  Storage Directory /opt/module/hadoop-HA/hadoop-2.7.2/data/tmp/dfs/name ? (Y
  or N) y
  20/04/23
  20:59:24 INFO common.Storage: Storage directory /opt/module/hadoop-HA/hadoop-2.7.2/data/tmp/dfs/name
  has been successfully formatted.
  20/04/23
  20:59:24 WARN common.Util: Path
  /opt/module/hadoop-HA/hadoop-2.7.2/data/tmp/dfs/name should be specified as a
  URI in configuration files. Please update hdfs configuration.
  20/04/23
  20:59:24 WARN common.Util: Path /opt/module/hadoop-HA/hadoop-2.7.2/data/tmp/dfs/name
  should be specified as a URI in configuration files. Please update hdfs
  configuration.
  20/04/23
  20:59:26 INFO namenode.TransferFsImage: Opening connection to
  http://hadoop202.cevent.com:50070/imagetransfer?getimage=1&txid=0&storageInfo=-63:324046010:0:CID-8c5b68c3-24a2-46c1-949b-391664f18d84
  20/04/23
  20:59:26 INFO namenode.TransferFsImage: Image Transfer timeout configured to
  60000 milliseconds
  20/04/23
  20:59:26 INFO namenode.TransferFsImage: Transfer took 0.00s at 0.00 KB/s
  20/04/23
  20:59:26 INFO namenode.TransferFsImage: Downloaded file
  fsimage.ckpt_0000000000000000000 size 353 bytes.
  20/04/23
  20:59:26 INFO util.ExitUtil: Exiting with status 0
  20/04/23
  20:59:26 INFO namenode.NameNode: SHUTDOWN_MSG: 
  /************************************************************
  SHUTDOWN_MSG:
  Shutting down NameNode at hadoop203.cevent.com/192.168.1.203
  ************************************************************/
  [cevent@hadoop203
  hadoop-2.7.2]$ sbin/hadoop-daemon.sh start
  namenode 启动namenode
  starting namenode, logging to
  /opt/module/hadoop-HA/hadoop-2.7.2/logs/hadoop-cevent-namenode-hadoop203.cevent.com.out
   
  
 


7.Hadoop202启动datanode(这里遇到脑裂split-brain警告，使用--forcemanual强制激活解决)




 
  
  [cevent@hadoop202 hadoop-2.7.2]$ sbin/hadoop-daemons.sh start datanode  这里必须使用hadoop-daemons.sh(带s)，才能在所有节点上启动datanode
  hadoop204.cevent.com:
  starting datanode, logging to
  /opt/module/hadoop-HA/hadoop-2.7.2/logs/hadoop-cevent-datanode-hadoop204.cevent.com.out
  hadoop203.cevent.com:
  starting datanode, logging to /opt/module/hadoop-HA/hadoop-2.7.2/logs/hadoop-cevent-datanode-hadoop203.cevent.com.out
  hadoop202.cevent.com:
  starting datanode, logging to
  /opt/module/hadoop-HA/hadoop-2.7.2/logs/hadoop-cevent-datanode-hadoop202.cevent.com.out
  hadoop205.cevent.com:
  ssh: connect to host hadoop205.cevent.com port 22: No route to host
  [cevent@hadoop202
  hadoop-2.7.2]$ jps
  3936 DataNode
  3666 NameNode
  3532 JournalNode
  4009 Jps
  【遇到脑裂(split-brain)警告】
  [cevent@hadoop202 hadoop-2.7.2]$ bin/hdfs haadmin -transitionToActive nn1   将hadoop202(nn1)切换为active
  Automatic
  failover is enabled for NameNode at hadoop203.cevent.com/192.168.1.203:9000
  Refusing
  to manually manage HA state, since it may cause
  a split-brain scenario or
  other incorrect state.
  If you are very sure you know what you are doing, please
  specify the --forcemanual flag.   提示必须加上--forcemanual标识才能手动切换
  [cevent@hadoop202
  hadoop-2.7.2]$ jps
  4564
  Jps
  3666
  NameNode
  3532 JournalNode
  [cevent@hadoop202 hadoop-2.7.2]$ bin/hdfs haadmin -transitionToActive --forcemanual nn1   加上--forcemanual强制将nn1切换为active
  You
  have specified the --forcemanual flag. This flag is dangerous, as it can
  induce a split-brain scenario that WILL CORRUPT your HDFS namespace, possibly
  irrecoverably.
   
  It is
  recommended not to use this flag, but instead to shut down the cluster and
  disable automatic failover if you prefer to manually manage your HA state.
   
  You
  may abort safely by answering 'n' or hitting ^C now.
   
  Are you sure you want to continue?
  (Y or N) y
  20/04/23
  21:24:11 WARN ha.HAAdmin: Proceeding with manual HA state management even
  though
  automatic
  failover is enabled for NameNode at hadoop203.cevent.com/192.168.1.203:9000
  20/04/23
  21:24:11 WARN ha.HAAdmin: Proceeding with manual HA state management even
  though
  automatic
  failover is enabled for NameNode at hadoop202.cevent.com/192.168.1.202:9000
  [cevent@hadoop202
  hadoop-2.7.2]$ jps
  4691
  Jps
  3666
  NameNode
  3532 JournalNode
  
 


8.启动成功

激活hadoop202

9.启动yarn




 
  
  [cevent@hadoop202
  hadoop-2.7.2]$ sbin/start-yarn.sh 启动yarn
  starting
  yarn daemons
  starting
  resourcemanager, logging to
  /opt/module/hadoop-HA/hadoop-2.7.2/logs/yarn-cevent-resourcemanager-hadoop202.cevent.com.out
  hadoop205.cevent.com:
  bash: line 0: cd: /opt/module/hadoop-HA/hadoop-2.7.2: 没有那个文件或目录
  hadoop205.cevent.com:
  bash: /opt/module/hadoop-HA/hadoop-2.7.2/sbin/yarn-daemon.sh: 没有那个文件或目录
  hadoop202.cevent.com:
  starting nodemanager, logging to
  /opt/module/hadoop-HA/hadoop-2.7.2/logs/yarn-cevent-nodemanager-hadoop202.cevent.com.out
  hadoop204.cevent.com:
  starting nodemanager, logging to /opt/module/hadoop-HA/hadoop-2.7.2/logs/yarn-cevent-nodemanager-hadoop204.cevent.com.out
  hadoop203.cevent.com:
  starting nodemanager, logging to
  /opt/module/hadoop-HA/hadoop-2.7.2/logs/yarn-cevent-nodemanager-hadoop203.cevent.com.out
  [cevent@hadoop202
  hadoop-2.7.2]$ jps
  4969
  ResourceManager
  5188
  Jps
  3666
  NameNode
  3532
  JournalNode
  5079 NodeManager
  (这里没有datanode是因为之前误将hadoop203的hadoop-daemon.sh单开)
   
  
 


  • 1
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值