yarn启动前需要配置两个文件:mapred-site.xml 和 yarn-site.xml
mapred-site.xml:(master配置即可)
<!-- mapred-site.xml fragment: place inside the file's <configuration> element.
     Selects YARN as the framework that MapReduce jobs are submitted to. -->
<property>
  <name>mapreduce.framework.name</name>
  <value>yarn</value>
</property>
yarn-site.xml:(master 和各 slave 节点都需要配置)
<configuration>
  <!-- Site specific YARN configuration properties -->

  <!-- Host running the ResourceManager. Per the original note, this entry
       only has to be set on master (the ResourceManager node). -->
  <property>
    <name>yarn.resourcemanager.hostname</name>
    <value>master</value>
  </property>

  <!-- NodeManager settings. The original note reports a
       "mapreduce_shuffle does not exist" error that was caused by leaving
       the following two properties out on the slave (NodeManager) nodes. -->
  <property>
    <name>yarn.nodemanager.aux-services</name>
    <value>mapreduce_shuffle</value>
  </property>
  <!-- The key must follow the pattern
       yarn.nodemanager.aux-services.<service-name>.class, where
       <service-name> matches the value declared above (mapreduce_shuffle).
       A misspelled key is silently ignored by Hadoop. -->
  <property>
    <name>yarn.nodemanager.aux-services.mapreduce_shuffle.class</name>
    <value>org.apache.hadoop.mapred.ShuffleHandler</value>
  </property>

  <!-- ResourceManager endpoints. Per the original note, the NodeManagers on
       the slaves only show up in the web UI at <master IP>:8088 once these
       three addresses are configured. -->
  <property>
    <name>yarn.resourcemanager.address</name>
    <value>master:8032</value>
  </property>
  <property>
    <name>yarn.resourcemanager.scheduler.address</name>
    <value>master:8030</value>
  </property>
  <property>
    <name>yarn.resourcemanager.resource-tracker.address</name>
    <value>master:8031</value>
  </property>
</configuration>
然后执行 start-yarn.sh 启动 YARN:
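运行自带的 wordcount 计算(示例命令,输入/输出目录请替换为实际的 HDFS 路径):hadoop jar $HADOOP_HOME/share/hadoop/mapreduce/hadoop-mapreduce-examples-*.jar wordcount <HDFS输入目录> <HDFS输出目录>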
查看运行结果: