Steps to install Hadoop 3.4.
1. Open terminal
2. ./login.sh
/* It will ask for the username and password that Bennett
provided to you for internet access. */
4. sudo apt-get install ssh
/* Skip this step if ssh is already installed */
5. sudo apt-get install default-jdk
/*Install Java*/
6. update-alternatives --config java
/* Check your JDK directory */
7. The JDK directory is, for example: /usr/lib/jvm/java-8-openjdk-amd64
/* Use the path actually reported by the previous command on your machine */
8. wget https://archive.apache.org/dist/hadoop/core/hadoop-3.4.0/hadoop-3.4.0.tar.gz
/*download hadoop tar file*/
9. tar xvzf hadoop-3.4.0.tar.gz
/*Unzip hadoop tar file*/
10. cd /home/hadoop-3.4.0/etc/hadoop
/* Browse to this location */ (Note: this path can vary from user
to user; check accordingly)
11. nano hadoop-env.sh
12. export JAVA_HOME=/usr/lib/jvm/java-8-openjdk-amd64
/* set to the root of your Java installation*/
13. export HADOOP_PREFIX=/home/hadoop-3.4.0
/* Assuming your installation directory is /home/hadoop-3.4.0 */
14. cd /home/hadoop-3.4.0/etc/hadoop
/* To configure core-site.xml */
15. nano core-site.xml
<configuration>
<property>
<name>fs.defaultFS</name>
<value>hdfs://localhost:9000</value>
</property>
</configuration>
/* The <configuration> element is already present in the file, so copy
only the <property> part and paste it inside <configuration>. */
/* Ctrl+O to save, then press Enter */ /* Ctrl+X to exit */
16. cd /home/hadoop-3.4.0/etc/hadoop
/* To configure hdfs-site.xml */
17. nano hdfs-site.xml
<configuration>
<property>
<name>dfs.replication</name>
<value>1</value>
</property>
</configuration>
/* The <configuration> element is already present in the file, so copy
only the <property> part and paste it inside <configuration>. */
/* Ctrl+O to save, then press Enter */ /* Ctrl+X to exit */
18. cd /home/hadoop-3.4.0/etc/hadoop
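19. cp mapred-site.xml.template mapred-site.xml
/* Note: Hadoop 3.x normally ships mapred-site.xml directly. If
mapred-site.xml.template does not exist, skip this step. */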
20. nano mapred-site.xml
/* To configure mapred-site.xml */
<configuration>
<property>
<name>mapreduce.framework.name</name>
<value>yarn</value>
</property>
</configuration>
/* The <configuration> element is already present in the file, so copy
only the <property> part and paste it inside <configuration>. */
/* Ctrl+O to save, then press Enter */ /* Ctrl+X to exit */
21. nano yarn-site.xml
<configuration>
<property>
<name>yarn.nodemanager.aux-services</name>
<value>mapreduce_shuffle</value>
</property>
</configuration>
/* To configure yarn-site.xml */
/* The <configuration> element is already present in the file, so copy
only the <property> part and paste it inside <configuration>. */
/* Ctrl+O to save, then press Enter */ /* Ctrl+X to exit */
22. cd /home/hadoop-3.4.0
23. bin/hdfs namenode -format
/* After the above step, look for the message "Storage directory
/tmp/hadoop-username/dfs/name has been successfully formatted" */
24. sbin/start-all.sh
25. /* Enter the password you set each time you are
prompted for it */
26. jps
/* Check that the output lists the following: Jps
NodeManager
NameNode
SecondaryNameNode
DataNode
ResourceManager */
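27. To verify that the NameNode and Hadoop are installed correctly,
open this URL in your browser:
http://your_ip_address:9870
/* your_ip_address is the IP address of the VM assigned to you.
Hadoop 3.x serves the NameNode web UI on port 9870 by default
(port 50070 was the Hadoop 2.x default). */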
-----------------------------------------------------------------------------
-------------------