Hadoop and Hive Installation

#Update the package index and install Java 11 for Hadoop

sudo apt update

#Check whether Java is already installed
java -version

sudo apt install openjdk-11-jdk -y

#Verify the compiler is available
javac -version

#Command to Find Java Location

dirname $(dirname $(readlink -f $(which java)))
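
#On a default Ubuntu install of OpenJDK 11, the command above typically prints
#a path like the following (your path may differ):

/usr/lib/jvm/java-11-openjdk-amd64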

#Download the Hadoop 3.4.0 release tarball

wget https://dlcdn.apache.org/hadoop/common/hadoop-3.4.0/hadoop-3.4.0.tar.gz

#Extract the archive using tar

tar xzf hadoop-3.4.0.tar.gz

#Move the extracted folder to the home directory, renaming it to ~/hadoop

mv hadoop-3.4.0 ~/hadoop

#Create datanode and namenode directories inside hadoop
#(wide-open permissions are acceptable here only because this is a single-node test setup)

cd ~/hadoop
mkdir -p dfsdata/{datanode,namenode}
chmod -R 777 dfsdata
#Edit the Config Files in ~/hadoop/etc/hadoop/

# For core-site.xml
<property>
  <name>fs.defaultFS</name>
  <value>hdfs://localhost:9000</value>
</property>

# For hdfs-site.xml (a replication factor of 1 suits a single-node setup;
# dfs.name.dir/dfs.data.dir are deprecated in Hadoop 3, so use the names below)
<property>
  <name>dfs.replication</name>
  <value>1</value>
</property>
<property>
  <name>dfs.namenode.name.dir</name>
  <value>/home/ubuntu/hadoop/dfsdata/namenode</value>
</property>
<property>
  <name>dfs.datanode.data.dir</name>
  <value>/home/ubuntu/hadoop/dfsdata/datanode</value>
</property>
# For mapred-site.xml
<property>
  <name>mapreduce.framework.name</name>
  <value>yarn</value>
</property>

# For yarn-site.xml
<property>
  <name>yarn.nodemanager.aux-services</name>
  <value>mapreduce_shuffle</value>
</property>
<property>
  <name>yarn.nodemanager.aux-services.mapreduce_shuffle.class</name>
  <value>org.apache.hadoop.mapred.ShuffleHandler</value>
</property>
#Update hadoop-env.sh

export JAVA_HOME=/usr/lib/jvm/java-11-openjdk-amd64

#Update the environment variables (replace the paths to match your system)


# update ~/.bashrc add the below at the end of the file
export JAVA_HOME=/usr/lib/jvm/java-11-openjdk-amd64
export HADOOP_HOME=/home/ubuntu/hadoop
export HADOOP_INSTALL=$HADOOP_HOME
export HADOOP_MAPRED_HOME=$HADOOP_HOME
export HADOOP_COMMON_HOME=$HADOOP_HOME
export HADOOP_HDFS_HOME=$HADOOP_HOME
export HADOOP_YARN_HOME=$HADOOP_HOME
export HADOOP_COMMON_LIB_NATIVE_DIR=$HADOOP_HOME/lib/native
export PATH=$PATH:$HADOOP_HOME/bin:$HADOOP_HOME/sbin
export HADOOP_OPTS="-Djava.library.path=$HADOOP_HOME/lib/native"

#Activate the Environment Variables


source ~/.bashrc
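
#Sanity check: confirm the PATH update works by printing the Hadoop version

hadoop version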
#Configure SSH Server to Create PasswordLess SSH Login
sudo apt install openssh-server openssh-client -y
ssh-keygen -t rsa
cat ~/.ssh/id_rsa.pub >> ~/.ssh/authorized_keys
chmod 640 ~/.ssh/authorized_keys
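
#Optional: the key can also be generated non-interactively (empty passphrase),
#which is equivalent for this single-node setup:

ssh-keygen -t rsa -P '' -f ~/.ssh/id_rsa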

#Test the SSH login to localhost (answer "yes" to the host-key prompt, then type exit)

ssh localhost
exit
#Initialize (or reset) HDFS by formatting the NameNode; this clears the
#NameNode's metadata, prepares the filesystem for use, and erases all stored data

hdfs namenode -format


#Start the HDFS daemons (NameNode, DataNode, and Secondary NameNode)

start-dfs.sh

#Start the YARN daemons (ResourceManager and NodeManager)

start-yarn.sh

#Check whether all services are running using the jps command

jps
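
#If everything started cleanly, jps should list daemons similar to the
#following (process IDs will differ):

NameNode
DataNode
SecondaryNameNode
ResourceManager
NodeManager
Jps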
#Test the web UIs: http://localhost:9870 (NameNode), http://localhost:9864 (DataNode), http://localhost:8088 (YARN ResourceManager)


*****************************************************************************************************

stop-yarn.sh

stop-dfs.sh

INSTALL HIVE 4.0.0 ALONGSIDE HADOOP 3.4.0

#Hive needs Java 8, so install it alongside Java 11

sudo apt install openjdk-8-jdk -y

#Modify the Java path from 11 to 8 in both of these files:

/home/ubuntu/hadoop/etc/hadoop/hadoop-env.sh
/home/ubuntu/.bashrc

export JAVA_HOME=/usr/lib/jvm/java-8-openjdk-amd64

#Rebuild the Environment Variables

source ~/.bashrc
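
#Confirm the switch: JAVA_HOME should now point at Java 8 (note that plain
#"java -version" may still report 11 unless update-alternatives is changed)

echo $JAVA_HOME
$JAVA_HOME/bin/java -version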

#Test that Hadoop is working (with start-all.sh)

start-all.sh
#Update ~/hadoop/etc/hadoop/mapred-site.xml and add the following properties

<property>
  <name>yarn.app.mapreduce.am.env</name>
  <value>HADOOP_MAPRED_HOME=${HADOOP_HOME}</value>
</property>
<property>
  <name>mapreduce.map.env</name>
  <value>HADOOP_MAPRED_HOME=${HADOOP_HOME}</value>
</property>
<property>
  <name>mapreduce.reduce.env</name>
  <value>HADOOP_MAPRED_HOME=${HADOOP_HOME}</value>
</property>

#Restart hadoop

stop-all.sh

start-all.sh
#Test mapreduce with a sample job

yarn jar $HADOOP_HOME/share/hadoop/mapreduce/hadoop-mapreduce-examples-3.4.0.jar pi 10 100
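
#The job should finish with a line similar to the following (the exact
#estimate depends on the map and sample counts):

Estimated value of Pi is 3.14...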

#Download apache-hive-4.0.0-bin.tar.gz (e.g. from https://dlcdn.apache.org/hive/hive-4.0.0/) and extract it
tar xzf apache-hive-4.0.0-bin.tar.gz

#Rename the extracted folder to hive and keep it in the home directory

mv apache-hive-4.0.0-bin ~/hive

#Create hive-env.sh and hive-site.xml using template


cd /home/ubuntu/hive/conf/

cp hive-env.sh.template hive-env.sh

cp hive-default.xml.template hive-site.xml
#Edit hive-site.xml and add the below 2 properties at the beginning
<property>
  <name>system:java.io.tmpdir</name>
  <value>/tmp/hive/java</value>
</property>
<property>
  <name>system:user.name</name>
  <value>${user.name}</value>
</property>
#Edit hive-site.xml: search for the text below and remove the invalid control
#character (&#8;) that sits between the words "for" and "transactional"
*******************************************************************************************************
Ensures commands with OVERWRITE (such as INSERT OVERWRITE) acquire Exclusive
locks

#Update the ~/.bashrc file

export HIVE_HOME=/home/ubuntu/hive
export HIVE_CONF_DIR=$HIVE_HOME/conf
export PATH=$PATH:$HIVE_HOME/bin
export CLASSPATH=$CLASSPATH:$HADOOP_HOME/lib/*:.
export CLASSPATH=$CLASSPATH:$HIVE_HOME/lib/*:.

#Rebuild the Environment Variable

source ~/.bashrc
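
#Sanity check: confirm Hive is now on the PATH

hive --version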
#Create hdfs directories and give the corresponding permissions
hdfs dfs -ls /
hdfs dfs -rm -r /user
hdfs dfs -ls /
hdfs dfs -mkdir -p /user/hive/warehouse

hdfs dfs -chmod g+wx /user
hdfs dfs -chmod g+wx /tmp
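
#Verify the warehouse directory exists with the expected permissions

hdfs dfs -ls /user/hive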

#Edit ~/hive/conf/hive-env.sh: uncomment the HADOOP_HOME line and set it to

HADOOP_HOME=/home/ubuntu/hadoop
#Replace Hive's bundled guava jar with the newer one shipped with Hadoop

rm /home/ubuntu/hive/lib/guava-*.jar

cp /home/ubuntu/hadoop/share/hadoop/common/lib/guava-27.0-jre.jar /home/ubuntu/hive/lib

#Edit the Derby schema file below and comment out the first 2 queries of the
#DDL statements for functions with -- (search for "DDL Statements for Function")

/home/ubuntu/hive/scripts/metastore/upgrade/derby/hive-schema-4.0.0.derby.sql
#Initialize Hive Metastore

schematool -dbType derby -initSchema
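
#Optionally verify the metastore schema was created (prints the schema version)

schematool -dbType derby -info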

# Launch Hive to check

hive

!quit
# For a better interactive experience, use Beeline
------------------------------------

beeline -u jdbc:hive2://

show databases;

create database college;

use college;

CREATE TABLE employee (id INT, name STRING, salary FLOAT)
ROW FORMAT DELIMITED FIELDS TERMINATED BY ','
STORED AS TEXTFILE;

SHOW TABLES;

INSERT INTO employee VALUES (1, 'John Doe', 50000.0);

SELECT * FROM employee;
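
-- Because the table is comma-delimited text, a local CSV can also be bulk
-- loaded; the file path below is hypothetical:
LOAD DATA LOCAL INPATH '/home/ubuntu/employees.csv' INTO TABLE employee;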

!quit
