This project is a proof of concept for running the Wortschatz project on HBase.
Resource: https://www.digitalocean.com/community/tutorials/how-to-install-hadoop-on-ubuntu-13-10
- Primary Namenode: nemo.tm.informatik.uni-leipzig.de
- YARN Master: nemo.tm.informatik.uni-leipzig.de
- Datanodes: nemo.tm.informatik.uni-leipzig.de, arielle.tm.informatik.uni-leipzig.de, atlantis.tm.informatik.uni-leipzig.de
wget http://artfiles.org/apache.org/hadoop/common/hadoop-2.6.0/hadoop-2.6.0.tar.gz
tar xfz hadoop-2.6.0.tar.gz
mv hadoop-2.6.0 hadoop
vim .bashrc
##HADOOP VARIABLES START
#export JAVA_HOME=/usr/lib/jvm/java/
#export HADOOP_INSTALL=/disk/localhome/hadoop/hadoop
#export PATH=$PATH:$HADOOP_INSTALL/bin
#export PATH=$PATH:$HADOOP_INSTALL/sbin
#export HADOOP_MAPRED_HOME=$HADOOP_INSTALL
#export HADOOP_COMMON_HOME=$HADOOP_INSTALL
#export HADOOP_HDFS_HOME=$HADOOP_INSTALL
#export YARN_HOME=$HADOOP_INSTALL
#export HADOOP_COMMON_LIB_NATIVE_DIR=$HADOOP_INSTALL/lib/native
#export HADOOP_OPTS="-Djava.library.path=$HADOOP_INSTALL/lib"
##HADOOP VARIABLES END
source ~/.bashrc
cd hadoop
vim etc/hadoop/hadoop-env.sh
#export JAVA_HOME=/usr/lib/jvm/java/
vim etc/hadoop/core-site.xml
#<configuration>
# <property>
# <name>fs.default.name</name>
# <value>hdfs://nemo.tm.informatik.uni-leipzig.de:54310</value>
# <description>The name of the default file system. A URI whose
# scheme and authority determine the FileSystem implementation. The
# uri's scheme determines the config property (fs.SCHEME.impl) naming
# the FileSystem implementation class. The uri's authority is used to
# determine the host, port, etc. for a filesystem.</description>
# </property>
#
# <property>
# <name>hadoop.tmp.dir</name>
# <value>/disk/data/hadoop/tmp</value>
# <description>A base for other temporary directories.</description>
# </property>
#</configuration>
vim etc/hadoop/yarn-site.xml
#<configuration>
# <property>
# <name>yarn.nodemanager.aux-services</name>
# <value>mapreduce_shuffle</value>
# </property>
# <property>
# <name>yarn.nodemanager.aux-services.mapreduce_shuffle.class</name>
# <value>org.apache.hadoop.mapred.ShuffleHandler</value>
# </property>
#</configuration>
cp etc/hadoop/mapred-site.xml.template etc/hadoop/mapred-site.xml
vim etc/hadoop/mapred-site.xml
#<configuration>
# <property>
# <name>mapreduce.framework.name</name>
# <value>yarn</value>
# </property>
#</configuration>
mkdir -p /disk/data/hadoop/hdfs/namenode
mkdir -p /disk/data/hadoop/hdfs/datanode
mkdir -p /disk/data/hadoop/tmp
vim etc/hadoop/hdfs-site.xml
#<configuration>
# <property>
# <name>dfs.replication</name>
# <value>1</value>
# </property>
# <property>
# <name>dfs.namenode.name.dir</name>
# <value>file:/disk/data/hadoop/hdfs/namenode</value>
# </property>
# <property>
# <name>dfs.datanode.data.dir</name>
# <value>file:/disk/data/hadoop/hdfs/datanode</value>
# </property>
#</configuration>
#(MASTER ONLY (nemo))
vim etc/hadoop/slaves
#nemo.tm.informatik.uni-leipzig.de
#arielle.tm.informatik.uni-leipzig.de
#atlantis.tm.informatik.uni-leipzig.de
To start Hadoop, on nemo.tm.informatik.uni-leipzig.de:
start-dfs.sh
start-yarn.sh
Check status at: http://nemo.tm.informatik.uni-leipzig.de:50070
To stop Hadoop, on nemo.tm.informatik.uni-leipzig.de:
stop-yarn.sh
stop-dfs.sh
Resource: https://hbase.apache.org/book.html
- Master: arielle.tm.informatik.uni-leipzig.de
- Zookeeper Server: nemo.tm.informatik.uni-leipzig.de, arielle.tm.informatik.uni-leipzig.de, atlantis.tm.informatik.uni-leipzig.de
- Regionserver: nemo.tm.informatik.uni-leipzig.de, arielle.tm.informatik.uni-leipzig.de, atlantis.tm.informatik.uni-leipzig.de
wget http://mirror.serversupportforum.de/apache/hbase/stable/hbase-1.0.0-bin.tar.gz
tar xvzf hbase-1.0.0-bin.tar.gz
mv hbase-1.0.0 hbase
cd hbase
vim conf/hbase-env.sh
#export JAVA_HOME=/usr/lib/jvm/java/
vim conf/hbase-site.xml
#<configuration>
# <property>
# <name>hbase.rootdir</name>
# <value>hdfs://nemo.tm.informatik.uni-leipzig.de:54310/hbase</value>
# </property>
# <property>
# <name>hbase.zookeeper.property.dataDir</name>
# <value>/disk/data/hadoop/zookeeper</value>
# </property>
# <property>
# <name>hbase.cluster.distributed</name>
# <value>true</value>
# </property>
# <property>
# <name>hbase.zookeeper.quorum</name>
# <value>arielle.tm.informatik.uni-leipzig.de,nemo.tm.informatik.uni-leipzig.de,atlantis.tm.informatik.uni-leipzig.de</value>
# </property>
#</configuration>
vim conf/regionservers
#arielle.tm.informatik.uni-leipzig.de
#atlantis.tm.informatik.uni-leipzig.de
#nemo.tm.informatik.uni-leipzig.de
To start HBase, on arielle.tm.informatik.uni-leipzig.de:
hbase/bin/start-hbase.sh
To start additional regionservers, run
hbase/bin/local-regionservers.sh start x y z ...
where x y z ... are port offsets.
To stop HBase, on nemo.tm.informatik.uni-leipzig.de:
hbase/bin/stop-hbase.sh