
| $ tar -zxvf hadoop-2.7.3.tar.gz -C /opt/app/ $ cd /opt/app/hadoop-2.7.3 $ mkdir -p hdfs/{datanode,namenode} tmpdata $ cd /opt/app/hadoop-2.7.3/etc/hadoop
$ cp hadoop-env.sh hadoop-env.sh.bak $ vim hadoop-env.sh export JAVA_HOME=/opt/app/jdk1.8.0_212
$ cp yarn-env.sh yarn-env.sh.bak $ vim yarn-env.sh export JAVA_HOME=/opt/app/jdk1.8.0_212
$ cp hdfs-site.xml hdfs-site.xml.bak $ vim hdfs-site.xml <configuration> <property> <name>dfs.namenode.name.dir</name> <value>/opt/app/hadoop-2.7.3/hdfs/namenode</value> </property> <property> <name>dfs.datanode.data.dir</name> <value>/opt/app/hadoop-2.7.3/hdfs/datanode</value> </property> <property> <name>dfs.namenode.http-address</name> <value>debian120:50070</value> </property> <property> <name>dfs.namenode.secondary.http-address</name> <value>debian121:50090</value> </property> <property> <name>dfs.replication</name> <value>2</value> </property> <property> <name>dfs.permissions.enabled</name> <value>false</value> </property> <property> <name>dfs.webhdfs.enabled</name> <value>true</value> </property> </configuration>
$ cp yarn-site.xml yarn-site.xml.bak $ vim yarn-site.xml <configuration> <property> <name>yarn.nodemanager.aux-services</name> <value>mapreduce_shuffle</value> </property> <property> <name>yarn.nodemanager.aux-services.mapreduce_shuffle.class</name> <value>org.apache.hadoop.mapred.ShuffleHandler</value> </property> <property> <name>yarn.resourcemanager.address</name> <value>debian122:8025</value> </property> <property> <name>yarn.resourcemanager.admin.address</name> <value>debian122:8030</value> </property> <property> <name>yarn.resourcemanager.scheduler.address</name> <value>debian122:8050</value> </property> <property> <name>yarn.resourcemanager.resource-tracker.address</name> <value>debian122:8033</value> </property> <property> <name>yarn.resourcemanager.webapp.address</name> <value>debian122:8088</value> </property> </configuration>
$ cp core-site.xml core-site.xml.bak $ vim core-site.xml <configuration> <property> <name>fs.defaultFS</name> <value>hdfs://debian120:9000</value> </property> <property> <name>hadoop.tmp.dir</name> <value>/opt/app/hadoop-2.7.3/tmpdata</value> </property> <property> <name>io.file.buffer.size</name> <value>10240</value> </property> <property> <name>ha.zookeeper.quorum</name> <value>debian120:2181,debian121:2181,debian122:2181</value> </property> <property> <name>ha.zookeeper.session-timeout.ms</name> <value>1000</value> </property> <property> <name>hadoop.proxyuser.hadoop.hosts</name> <value>*</value> </property> <property> <name>hadoop.proxyuser.hadoop.groups</name> <value>*</value> </property> </configuration>
$ cp mapred-site.xml.template mapred-site.xml $ vim mapred-site.xml <configuration> <property> <name>mapreduce.framework.name</name> <value>yarn</value> </property> </configuration>
$ cp slaves slaves.bak $ vim slaves debian120 debian121 debian122
$ sudo vim /etc/profile.d/my.sh export HADOOP_HOME=/opt/app/hadoop-2.7.3 export PATH=$PATH:$HADOOP_HOME/bin:$HADOOP_HOME/sbin
debian120$ hdfs namenode -format
debian120$ start-dfs.sh Starting namenodes on [debian120] debian120: starting namenode, logging to /opt/app/hadoop-2.7.3/logs/hadoop-liubin-namenode-debian120.out debian120: starting datanode, logging to /opt/app/hadoop-2.7.3/logs/hadoop-liubin-datanode-debian120.out debian121: starting datanode, logging to /opt/app/hadoop-2.7.3/logs/hadoop-liubin-datanode-debian121.out debian122: starting datanode, logging to /opt/app/hadoop-2.7.3/logs/hadoop-liubin-datanode-debian122.out Starting secondary namenodes [debian121] debian121: starting secondarynamenode, logging to /opt/app/hadoop-2.7.3/logs/hadoop-liubin-secondarynamenode-debian121.out
debian122$ start-yarn.sh starting yarn daemons resourcemanager running as process 1562. Stop it first. debian121: starting nodemanager, logging to /opt/app/hadoop-2.7.3/logs/yarn-liubin-nodemanager-debian121.out debian120: starting nodemanager, logging to /opt/app/hadoop-2.7.3/logs/yarn-liubin-nodemanager-debian120.out debian122: starting nodemanager, logging to /opt/app/hadoop-2.7.3/logs/yarn-liubin-nodemanager-debian122.out
debian120$ jps 3840 Jps 2026 QuorumPeerMain 3483 DataNode 3741 NodeManager 3373 NameNode debian121$ jps 1523 DataNode 1720 NodeManager 1611 SecondaryNameNode 1196 QuorumPeerMain 1821 Jps debian122$ jps 2017 NodeManager 2116 Jps 1399 DataNode 1176 QuorumPeerMain 1562 ResourceManager
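$ hdfs namenode -format   # one-time step on the NameNode host (debian120) before the first start-dfs.sh; do not re-run on a cluster that already holds data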
|