Skip to content

Instantly share code, notes, and snippets.

Forked from nipra/notes.txt
Created August 9, 2013 07:15
Show Gist options
  • Save sankars/6191725 to your computer and use it in GitHub Desktop.
Save sankars/6191725 to your computer and use it in GitHub Desktop.
# Installing CDH4 on a Single Linux Node in Pseudo-distributed Mode
# Installing CDH4 with MRv1 on a Single Linux Node in Pseudo-distributed mode
# On Ubuntu and other Debian systems
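# NOTE: the download URL is missing from these notes; use the link to
# cdh4-repository_1.0_all.deb given in Cloudera's CDH4 installation guide.
nipra@lambda:Downloads$ wget -cv <URL of cdh4-repository_1.0_all.deb>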
nipra@lambda:Downloads$ sudo dpkg -i cdh4-repository_1.0_all.deb # Adds /etc/apt/sources.list.d/cloudera-cdh4.list ??
nipra@lambda:Downloads$ dpkg -L cdh4-repository # To view the files on Ubuntu systems
# Install CDH4
# For Ubuntu Precise systems
# nipra@lambda:~$ lsb_release -c
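# NOTE: the key URL is missing from these notes; use the repository GPG key
# link for your release given in Cloudera's CDH4 installation guide.
$ curl -s <URL of Cloudera's repository GPG key> | sudo apt-key add -
# Install the pseudo-distributed MRv1 configuration package (this step is
# missing from the original notes; the package name is the one inspected
# with dpkg -L below).
$ sudo apt-get update
$ sudo apt-get install hadoop-0.20-conf-pseudo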
# To view the files on Ubuntu systems
$ dpkg -L hadoop-0.20-conf-pseudo
# Step 1: Format the NameNode.
# Got the error: Error: JAVA_HOME is not set and could not be found.
# Even though ~/.bashrc has ``export JAVA_HOME=/usr/lib/jvm/jdk1.7.0''
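# FIX: sudo resets the environment by default, so JAVA_HOME never reaches the
# command run as hdfs. Tell sudo to keep it: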
# $ sudo visudo
# Add ``Defaults env_keep+=JAVA_HOME''
$ sudo -u hdfs hdfs namenode -format
# Step 2: Start HDFS
# http://localhost:50070/
$ for service in /etc/init.d/hadoop-hdfs-*
> do
> sudo $service start
> done
# Step 3: Create the /tmp Directory
$ sudo -u hdfs hadoop fs -mkdir /tmp
$ sudo -u hdfs hadoop fs -chmod -R 1777 /tmp
# Step 4: Create the MapReduce system directories
sudo -u hdfs hadoop fs -mkdir /var
sudo -u hdfs hadoop fs -mkdir /var/lib
sudo -u hdfs hadoop fs -mkdir /var/lib/hadoop-hdfs
sudo -u hdfs hadoop fs -mkdir /var/lib/hadoop-hdfs/cache
sudo -u hdfs hadoop fs -mkdir /var/lib/hadoop-hdfs/cache/mapred
sudo -u hdfs hadoop fs -mkdir /var/lib/hadoop-hdfs/cache/mapred/mapred
sudo -u hdfs hadoop fs -mkdir /var/lib/hadoop-hdfs/cache/mapred/mapred/staging
sudo -u hdfs hadoop fs -chmod 1777 /var/lib/hadoop-hdfs/cache/mapred/mapred/staging
sudo -u hdfs hadoop fs -chown -R mapred /var/lib/hadoop-hdfs/cache/mapred
# Step 5: Verify the HDFS File Structure
$ sudo -u hdfs hadoop fs -ls -R /
# Step 6: Start MapReduce
# http://localhost:50030/
$ for service in /etc/init.d/hadoop-0.20-mapreduce-*
> do
> sudo $service start
> done
# Step 7: Create User Directories
$ sudo -u hdfs hadoop fs -mkdir /user/<user>
$ sudo -u hdfs hadoop fs -chown <user> /user/<user>
# where <user> is the Linux username of each user.
# For the current user:
sudo -u hdfs hadoop fs -mkdir /user/$USER
sudo -u hdfs hadoop fs -chown $USER /user/$USER
# For stopping daemons
$ for service in /etc/init.d/hadoop-hdfs-* /etc/init.d/hadoop-0.20-mapreduce-*
> do
> sudo $service stop
> done
# HBase
nipra@lambda:~$ sudo apt-get install hbase
nipra@lambda:~$ sudo apt-get install hbase-master
nipra@lambda:~$ sudo jps
nipra@lambda:~$ sudo /etc/init.d/hbase-master stop
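# To enable pseudo-distributed mode, you must first make some configuration
# changes. Open /etc/hbase/conf/hbase-site.xml and set
#   hbase.cluster.distributed = true
#   hbase.rootdir             = the HDFS URI of the /hbase directory
#                               (e.g. hdfs://localhost:8020/hbase -- confirm the
#                               host and port against the NameNode address in
#                               core-site.xml)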
# Creating the /hbase Directory in HDFS
$ sudo -u hdfs hadoop fs -mkdir /hbase
$ sudo -u hdfs hadoop fs -chown hbase /hbase
# Installing and Starting ZooKeeper Server
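# Installing the package tries to start the server right away, which fails
# with the following output because the data directory has not been
# initialized yet. Run `init' once before `start'.
#   Using config: /etc/zookeeper/conf/zoo.cfg
#   ZooKeeper data directory is missing at /var/lib/zookeeper fix the path or run initialize
#   invoke-rc.d: initscript zookeeper-server, action "start" failed.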
sudo apt-get install zookeeper-server
nipra@lambda:~$ sudo /etc/init.d/zookeeper-server init
nipra@lambda:~$ sudo /etc/init.d/zookeeper-server start
nipra@lambda:~$ sudo /etc/init.d/hbase-master start
# To enable the HBase Region Server on Ubuntu and Debian systems
$ sudo apt-get install hbase-regionserver
# Installing and Starting the HBase Thrift Server
sudo apt-get install hbase-thrift
# Installing and Configuring REST
sudo apt-get install hbase-rest
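# ~/bin/  (script file name missing from these notes)
# Start the HDFS daemons, then the MapReduce daemons.
for service in /etc/init.d/hadoop-hdfs-* /etc/init.d/hadoop-0.20-mapreduce-*
do
    sudo $service start
done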
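# ~/bin/  (script file name missing from these notes)
# Start ZooKeeper first, then the HBase master, region server, REST and Thrift servers.
for service in /etc/init.d/zookeeper-server /etc/init.d/hbase-master /etc/init.d/hbase-regionserver /etc/init.d/hbase-rest /etc/init.d/hbase-thrift
do
    sudo $service start
done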
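# ~/bin/  (script file name missing from these notes)
# Stop the HBase services in the reverse of their start order, ZooKeeper last.
for service in /etc/init.d/hbase-thrift /etc/init.d/hbase-rest /etc/init.d/hbase-regionserver /etc/init.d/hbase-master /etc/init.d/zookeeper-server
do
    sudo $service stop
done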
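# ~/bin/  (script file name missing from these notes)
# Stop the MapReduce daemons, then the HDFS daemons.
for service in /etc/init.d/hadoop-0.20-mapreduce-* /etc/init.d/hadoop-hdfs-*
do
    sudo $service stop
done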
# ~/bin/
# ~/bin/
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment