整体的配置表如下:
机器是从仓库里整理出来的箱底机器,已经属于淘汰货了。
总体来说,将198号机器作为主机(master.hadoop),其它机器全部作为从机(slaver1-slaver5.hadoop)。
设置每台机器的BIOS的电源管理,将其全部设置为上电开机。
操作系统采用的是centos 6.5 32bit
软件的版本如下:
jdk1.8.0_45
hadoop-2.2.0
zookeeper-3.4.5
hbase-0.98.8-hadoop2
apache-hive-0.14.0-bin
apache-mahout-1.0-bin
######################## master 198 ###########################
[root@localhost ~]# ifconfig eth0
eth0 Link encap:Ethernet HWaddr 00:23:54:2B:9D:2D
inet addr:10.18.11.198 Bcast:10.18.11.255 Mask:255.255.255.0
inet6 addr: fdd8:8f0:124b:0:223:54ff:fe2b:9d2d/64 Scope:Global
inet6 addr: fe80::223:54ff:fe2b:9d2d/64 Scope:Link
UP BROADCAST RUNNING MULTICAST MTU:1500 Metric:1
RX packets:93982 errors:0 dropped:0 overruns:0 frame:0
TX packets:1684 errors:0 dropped:0 overruns:0 carrier:0
collisions:0 txqueuelen:1000
RX bytes:8404629 (8.0 MiB) TX bytes:165374 (161.4 KiB)
Interrupt:16
## 修改本地域名及IP地址
[root@localhost ~]# vi /etc/hosts
[root@localhost ~]# vi /etc/sysconfig/network
[root@localhost ~]# cat /etc/hosts
127.0.0.1 localhost localhost.localdomain localhost4 localhost4.localdomain4
::1 localhost localhost.localdomain localhost6 localhost6.localdomain6
10.18.11.198 master.hadoop
10.18.11.199 slaver1.hadoop
10.18.11.201 slaver2.hadoop
10.18.11.202 slaver3.hadoop
10.18.11.203 slaver4.hadoop
10.18.11.204 slaver5.hadoop
[root@localhost ~]# cat /etc/sysconfig/network
NETWORKING=yes
NETWORKING_IPV6=no
HOSTNAME=master.hadoop
[root@localhost ~]# reboot
## 禁用IPv6
[root@master ~]# vim /etc/modprobe.d/anaconda.conf
[root@master ~]# cat /etc/modprobe.d/anaconda.conf
# Module options and blacklists written by anaconda
install ipv6 /bin/true
[root@master ~]# lsmod |grep -i ipv6
nf_conntrack_ipv6 7207 2
nf_defrag_ipv6 8897 1 nf_conntrack_ipv6
nf_conntrack 65661 3 nf_conntrack_ipv4,nf_conntrack_ipv6,xt_state
ipv6 261089 35 ip6t_REJECT,nf_conntrack_ipv6,nf_defrag_ipv6
[root@master modprobe.d]# reboot
[root@master ~]# lsmod |grep -i ipv6
[root@master ~]# ifconfig | grep -i inet6
## 禁用iptables防火墙
[root@master ~]# /etc/init.d/iptables stop
iptables: Setting chains to policy ACCEPT: filter [ OK ]
iptables: Flushing firewall rules: [ OK ]
iptables: Unloading modules: [ OK ]
[root@master ~]# chkconfig --list |grep iptables
iptables 0:off 1:off 2:on 3:on 4:on 5:on 6:off
[root@master ~]# chkconfig iptables off
[root@master ~]# chkconfig --list |grep iptables
iptables 0:off 1:off 2:off 3:off 4:off 5:off 6:off
## 建立用户和组
[root@master ~]# groupadd hadoop
[root@master ~]# useradd -g hadoop hduser
[root@master ~]# passwd hduser
Changing password for user hduser.
New password:
BAD PASSWORD: it is based on a dictionary word
Retype new password:
passwd: all authentication tokens updated successfully.
## 提升hduser的sudo权限
[root@master ~]# su - hduser
[hduser@master ~]$ ls
[hduser@master ~]$
[hduser@master ~]$
[hduser@master ~]$ sudo -i
We trust you have received the usual lecture from the local System
Administrator. It usually boils down to these three things:
#1) Respect the privacy of others.
#2) Think before you type.
#3) With great power comes great responsibility.
[sudo] password for hduser:
hduser is not in the sudoers file. This incident will be reported.
[root@master ~]# cat /etc/sudoers |grep -v "#" |grep -v "^$"
Defaults requiretty
Defaults !visiblepw
Defaults always_set_home
Defaults env_reset
Defaults env_keep = "COLORS DISPLAY HOSTNAME HISTSIZE INPUTRC KDEDIR LS_COLORS"
Defaults env_keep += "MAIL PS1 PS2 QTDIR USERNAME LANG LC_ADDRESS LC_CTYPE"
Defaults env_keep += "LC_COLLATE LC_IDENTIFICATION LC_MEASUREMENT LC_MESSAGES "
Defaults env_keep += "LC_MONETARY LC_NAME LC_NUMERIC LC_PAPER LC_TELEPHONE"
Defaults env_keep += "LC_TIME LC_ALL LANGUAGE LINGUAS _XKB_CHARSET XAUTHORITY "
Defaults secure_path = /sbin:/bin:/usr/sbin:/usr/bin
root ALL=(ALL) ALL
[root@master ~]# vi /etc/sudoers
[root@master ~]# cat /etc/sudoers |grep -v "#" |grep -v "^$"
Defaults requiretty
Defaults !visiblepw
Defaults always_set_home
Defaults env_reset
Defaults env_keep = "COLORS DISPLAY HOSTNAME HISTSIZE INPUTRC KDEDIR LS_COLORS"
Defaults env_keep += "MAIL PS1 PS2 QTDIR USERNAME LANG LC_ADDRESS LC_CTYPE"
Defaults env_keep += "LC_COLLATE LC_IDENTIFICATION LC_MEASUREMENT LC_MESSAGES "
Defaults env_keep += "LC_MONETARY LC_NAME LC_NUMERIC LC_PAPER LC_TELEPHONE"
Defaults env_keep += "LC_TIME LC_ALL LANGUAGE LINGUAS _XKB_CHARSET XAUTHORITY "
Defaults secure_path = /sbin:/bin:/usr/sbin:/usr/bin
root ALL=(ALL) ALL
hduser ALL=(ALL) ALL
[root@master ~]# chmod u-w /etc/sudoers
[root@master ~]# ls -l /etc/sudoers
-r--r-----. 1 root root 4024 Jan 19 11:20 /etc/sudoers
[root@master ~]# su - hduser
[hduser@master ~]$ sudo -i
[sudo] password for hduser:
[root@master ~]# ls
anaconda-ks.cfg install.log install.log.syslog
### 安装openssh-client 客户端
[root@master ~]# yum install -y openssh-clients
### 用户的无密码登陆
login as: hduser
hduser@10.18.11.198's password:
[hduser@master ~]$
[hduser@master ~]$
[hduser@master ~]$
[hduser@master ~]$ ssh-keygen -t rsa -P ""
Generating public/private rsa key pair.
Enter file in which to save the key (/home/hduser/.ssh/id_rsa):
Created directory '/home/hduser/.ssh'.
Your identification has been saved in /home/hduser/.ssh/id_rsa.
Your public key has been saved in /home/hduser/.ssh/id_rsa.pub.
The key fingerprint is:
aa:cc:b1:86:6a:c9:3d:e2:52:15:b6:ae:cf:4b:ad:3a hduser@master.hadoop
The key's randomart image is:
+--[ RSA 2048]----+
| |
| o |
| . o |
| o |
| o S |
| . .. . |
|..ooo o |
|.=EB.= |
|=oo=@. |
+-----------------+
[hduser@master ~]$ cat ~/.ssh/id_rsa.pub >> ~/.ssh/authorized_keys
[hduser@master ~]$ ssh localhost
The authenticity of host 'localhost (127.0.0.1)' can't be established.
RSA key fingerprint is 6c:58:b9:5b:c6:a3:35:4f:49:cf:8b:10:0d:93:ae:81.
Are you sure you want to continue connecting (yes/no)? yes
Warning: Permanently added 'localhost' (RSA) to the list of known hosts.
Last login: Tue Jan 19 11:24:05 2016 from 10.17.74.212
[hduser@master ~]$ exit
logout
Connection to localhost closed.
[hduser@master ~]$ ssh master.hadoop
The authenticity of host 'master.hadoop (10.18.11.198)' can't be established.
RSA key fingerprint is 6c:58:b9:5b:c6:a3:35:4f:49:cf:8b:10:0d:93:ae:81.
Are you sure you want to continue connecting (yes/no)? yes
Warning: Permanently added 'master.hadoop,10.18.11.198' (RSA) to the list of known hosts.
Last login: Tue Jan 19 11:27:12 2016 from localhost
[hduser@master ~]$ exit
logout
Connection to master.hadoop closed.
###将master上hduser的authorized_keys复制到slaver1-slaver5各自hduser用户的~/.ssh目录下
scp /home/hduser/.ssh/authorized_keys hduser@slaver1.hadoop:/home/hduser/.ssh/
scp /home/hduser/.ssh/authorized_keys hduser@slaver2.hadoop:/home/hduser/.ssh/
scp /home/hduser/.ssh/authorized_keys hduser@slaver3.hadoop:/home/hduser/.ssh/
scp /home/hduser/.ssh/authorized_keys hduser@slaver4.hadoop:/home/hduser/.ssh/
scp /home/hduser/.ssh/authorized_keys hduser@slaver5.hadoop:/home/hduser/.ssh/
#如果拷贝不成功,请检查slaver上是否存在/home/hduser/.ssh目录;如果不存在,请在该slaver上建立hduser用户后,以hduser身份执行一次ssh localhost,该目录即会自动创建。
[hduser@master ~]$ ssh slaver1.hadoop
Last login: Fri Sep 23 15:03:21 2016 from master.hadoop
[hduser@slaver1 ~]$ exit
logout
Connection to slaver1.hadoop closed.
[hduser@master ~]$ ssh slaver2.hadoop
Last login: Fri Sep 23 23:03:55 2016 from localhost
[hduser@slaver2 ~]$ exit
logout
Connection to slaver2.hadoop closed.
[hduser@master ~]$ ssh slaver3.hadoop
Last login: Fri Sep 23 23:04:31 2016 from localhost
[hduser@slaver3 ~]$ exit
logout
Connection to slaver3.hadoop closed.
[hduser@master ~]$ ssh slaver4.hadoop
The authenticity of host 'slaver4.hadoop (10.18.11.203)' can't be established.
RSA key fingerprint is bf:89:d8:50:4b:11:db:91:ca:f7:fd:2a:68:7d:07:74.
Are you sure you want to continue connecting (yes/no)? yes
Warning: Permanently added 'slaver4.hadoop' (RSA) to the list of known hosts.
Last login: Fri Sep 23 23:02:22 2016 from localhost
[hduser@slaver4 ~]$ exit
logout
Connection to slaver4.hadoop closed.
[hduser@master ~]$ ssh slaver5.hadoop
The authenticity of host 'slaver5.hadoop (10.18.11.204)' can't be established.
RSA key fingerprint is a3:b2:b1:2f:76:d7:c4:39:32:3c:ca:b7:c8:54:6d:17.
Are you sure you want to continue connecting (yes/no)? yes
Warning: Permanently added 'slaver5.hadoop' (RSA) to the list of known hosts.
Last login: Fri Sep 23 22:51:19 2016 from localhost
[hduser@slaver5 ~]$ exit
logout
Connection to slaver5.hadoop closed.
### 安装jdk
[hduser@master ~]$ ls -l
total 170892
-rw-r--r--. 1 hduser hadoop 174985642 Jul 13 2015 jdk-8u45-linux-i586.tar.gz
[hduser@master ~]$ tar zxvf jdk-8u45-linux-i586.tar.gz
[hduser@master ~]$ sudo mv jdk1.8.0_45 /usr/local/
[sudo] password for hduser:
[hduser@master ~]$ sudo vim /etc/profile
[hduser@master ~]$ tail -n 4 /etc/profile
export JAVA_HOME=/usr/local/jdk1.8.0_45
export CLASSPATH=$CLASSPATH:$JAVA_HOME/lib:$JAVA_HOME/jre/lib
export HADOOP_HOME=/usr/local/hadoop-2.2.0
export PATH=$JAVA_HOME/bin:$HADOOP_HOME/bin:$HADOOP_HOME/sbin:$PATH
[hduser@master ~]$ source /etc/profile
[hduser@master ~]$ java -version
java version "1.8.0_45"
Java(TM) SE Runtime Environment (build 1.8.0_45-b14)
Java HotSpot(TM) Client VM (build 25.45-b02, mixed mode)
### 建立目录
[hduser@master ~]$ sudo mkdir -p /usr/local/app/hadoop
[sudo] password for hduser:
[hduser@master ~]$ sudo chown -R hduser:hadoop /usr/local/app/hadoop
[hduser@master ~]$ mkdir -p /usr/local/app/hadoop/dfs/name
[hduser@master ~]$ mkdir -p /usr/local/app/hadoop/dfs/data
[hduser@master ~]$ mkdir -p /usr/local/app/hadoop/tmp/node
[hduser@master ~]$ mkdir -p /usr/local/app/hadoop/tmp/app-logs
[hduser@master ~]$ chmod 750 -R /usr/local/app/hadoop/dfs
[hduser@master ~]$ chmod 750 -R /usr/local/app/hadoop/tmp
[hduser@master ~]$ ls -ld /usr/local/app/hadoop/tmp/
drwxr-x---. 4 hduser hadoop 4096 Jan 19 11:56 /usr/local/app/hadoop/tmp/
[hduser@master ~]$ chmod -R 750 /usr/local/app/hadoop/dfs/
[hduser@master ~]$ ls -dl /usr/local/app/hadoop/dfs
drwxr-x---. 4 hduser hadoop 4096 Jan 19 11:53 /usr/local/app/hadoop/dfs
[root@master hadoop]# ls -l dfs/
total 8
drwxr-x---. 2 hduser hadoop 4096 Jan 19 11:53 data
drwxr-x---. 2 hduser hadoop 4096 Jan 19 11:53 name
[root@master hadoop]# ls -l tmp/
total 8
drwxr-x---. 2 hduser hadoop 4096 Jan 19 11:53 app-logs
drwxr-x---. 2 hduser hadoop 4096 Jan 19 11:53 node
### 安装hadoop
[hduser@master ~]$ ls
hadoop-2.2.0-32bit.tar.gz jdk-8u45-linux-i586.tar.gz
[hduser@master ~]$ tar zxvf hadoop-2.2.0-32bit.tar.gz
[hduser@master ~]$ sudo mv hadoop-2.2.0 /usr/local/
[sudo] password for hduser:
[hduser@master ~]$ sudo chown -R hduser:hadoop /usr/local/hadoop-2.2.0
### 配置hadoop环境
[hduser@master ~]$ vi /usr/local/hadoop-2.2.0/etc/hadoop/hadoop-env.sh
[hduser@master ~]$ cat /usr/local/hadoop-2.2.0/etc/hadoop/hadoop-env.sh | grep -rni "JAVA_HOME"
21:# The only required environment variable is JAVA_HOME. All others are
23:# set JAVA_HOME in this file, so that it is correctly defined on
27:#export JAVA_HOME=${JAVA_HOME}
28:export JAVA_HOME=/usr/local/jdk1.8.0_45
[hduser@master ~]$ cat /usr/local/hadoop-2.2.0/etc/hadoop/hadoop-env.sh | grep -rni "HADOOP_HEAPSIZE"
45:#export HADOOP_HEAPSIZE=
46:export HADOOP_HEAPSIZE=100
[hduser@master ~]$ vi /usr/local/hadoop-2.2.0/etc/hadoop/yarn-env.sh
[hduser@master ~]$ cat /usr/local/hadoop-2.2.0/etc/hadoop/yarn-env.sh | grep -rni "JAVA_HOME"
23:# export JAVA_HOME=/home/y/libexec/jdk1.6.0/
24:export JAVA_HOME=/usr/local/jdk1.8.0_45
25:if [ "$JAVA_HOME" != "" ]; then
26: #echo "run java in $JAVA_HOME"
27: JAVA_HOME=$JAVA_HOME
30:if [ "$JAVA_HOME" = "" ]; then
31: echo "Error: JAVA_HOME is not set."
35:JAVA=$JAVA_HOME/bin/java
[hduser@master ~]$ vi /usr/local/hadoop-2.2.0/etc/hadoop/mapred-env.sh
[hduser@master ~]$ cat /usr/local/hadoop-2.2.0/etc/hadoop/mapred-env.sh | grep -rni "JAVA_HOME"
16:# export JAVA_HOME=/home/y/libexec/jdk1.6.0/
17:export JAVA_HOME=/usr/local/jdk1.8.0_45
### 主要修改以下的几个xml档
[hduser@master ~]$ ls -l /usr/local/hadoop-2.2.0/etc/hadoop/*.xml*
-rw-r--r--. 1 hduser hadoop 3560 Oct 7 2013 /usr/local/hadoop-2.2.0/etc/hadoop/capacity-scheduler.xml
-rw-r--r--. 1 hduser hadoop 774 Oct 7 2013 /usr/local/hadoop-2.2.0/etc/hadoop/core-site.xml -----modify
-rw-r--r--. 1 hduser hadoop 9257 Oct 7 2013 /usr/local/hadoop-2.2.0/etc/hadoop/hadoop-policy.xml
-rw-r--r--. 1 hduser hadoop 775 Oct 7 2013 /usr/local/hadoop-2.2.0/etc/hadoop/hdfs-site.xml -----modify
-rw-r--r--. 1 hduser hadoop 620 Oct 7 2013 /usr/local/hadoop-2.2.0/etc/hadoop/httpfs-site.xml
-rw-r--r--. 1 hduser hadoop 4113 Oct 7 2013 /usr/local/hadoop-2.2.0/etc/hadoop/mapred-queues.xml.template
-rw-r--r--. 1 hduser hadoop 758 Oct 7 2013 /usr/local/hadoop-2.2.0/etc/hadoop/mapred-site.xml.template -----modify
-rw-r--r--. 1 hduser hadoop 2316 Oct 7 2013 /usr/local/hadoop-2.2.0/etc/hadoop/ssl-client.xml.example
-rw-r--r--. 1 hduser hadoop 2251 Oct 7 2013 /usr/local/hadoop-2.2.0/etc/hadoop/ssl-server.xml.example
-rw-r--r--. 1 hduser hadoop 690 Oct 7 2013 /usr/local/hadoop-2.2.0/etc/hadoop/yarn-site.xml -----modify
[hduser@master ~]$ vim /usr/local/hadoop-2.2.0/etc/hadoop/core-site.xml
[hduser@master ~]$ cat /usr/local/hadoop-2.2.0/etc/hadoop/core-site.xml
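<configuration>
  <property>
    <name>hadoop.tmp.dir</name>
    <value>/usr/local/app/hadoop/tmp</value>
  </property>
  <property>
    <name>fs.defaultFS</name>
    <value>hdfs://master.hadoop:9000</value>
  </property>
  <property>
    <name>io.file.buffer.size</name>
    <value>131072</value>
  </property>
  <property>
    <name>hadoop.proxyuser.hduser.hosts</name>
    <value>*</value>
  </property>
  <property>
    <name>hadoop.proxyuser.hduser.groups</name>
    <value>*</value>
  </property>
</configuration>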
[hduser@master ~]$ cp /usr/local/hadoop-2.2.0/etc/hadoop/hdfs-site.xml /usr/local/hadoop-2.2.0/etc/hadoop/hdfs-site.xml.old
[hduser@master ~]$ vim /usr/local/hadoop-2.2.0/etc/hadoop/hdfs-site.xml
[hduser@master ~]$ cat /usr/local/hadoop-2.2.0/etc/hadoop/hdfs-site.xml
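<configuration>
  <property>
    <name>dfs.namenode.secondary.http-address</name>
    <value>master.hadoop:50060</value>
  </property>
  <property>
    <name>dfs.namenode.name.dir</name>
    <value>file:/usr/local/app/hadoop/dfs/name</value>
  </property>
  <property>
    <name>dfs.datanode.data.dir</name>
    <value>file:/usr/local/app/hadoop/dfs/data</value>
  </property>
  <property>
    <name>dfs.http.address</name>
    <value>master.hadoop:50070</value>
  </property>
  <property>
    <name>dfs.webhdfs.enabled</name>
    <value>true</value>
  </property>
  <property>
    <name>dfs.datanode.du.reserved</name>
    <value>1073741824</value>
  </property>
  <property>
    <name>dfs.permissions</name>
    <value>false</value>
  </property>
  <property>
    <name>dfs.replication</name>
    <value>3</value>
    <description>Default block replication.
    The actual number of replications can be specified when the file is created.
    The default is used if replication is not specified in create time.
    </description>
  </property>
</configuration>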
[hduser@master ~]$ cp /usr/local/hadoop-2.2.0/etc/hadoop/mapred-site.xml.template /usr/local/hadoop-2.2.0/etc/hadoop/mapred-site.xml
[hduser@master ~]$ vim /usr/local/hadoop-2.2.0/etc/hadoop/mapred-site.xml
[hduser@master ~]$ cat /usr/local/hadoop-2.2.0/etc/hadoop/mapred-site.xml
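<configuration>
  <property>
    <name>mapreduce.framework.name</name>
    <value>yarn</value>
  </property>
  <property>
    <name>mapreduce.jobhistory.address</name>
    <value>master.hadoop:9020</value>
  </property>
  <property>
    <name>mapreduce.jobhistory.webapp.address</name>
    <value>master.hadoop:9888</value>
  </property>
</configuration>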
[hduser@master ~]$ cp /usr/local/hadoop-2.2.0/etc/hadoop/yarn-site.xml /usr/local/hadoop-2.2.0/etc/hadoop/yarn-site.xml.old
[hduser@master ~]$ vim /usr/local/hadoop-2.2.0/etc/hadoop/yarn-site.xml
[hduser@master ~]$ cat /usr/local/hadoop-2.2.0/etc/hadoop/yarn-site.xml
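<configuration>
  <property>
    <name>yarn.resourcemanager.address</name>
    <value>master.hadoop:9001</value>
  </property>
  <property>
    <name>yarn.resourcemanager.scheduler.address</name>
    <value>master.hadoop:9030</value>
  </property>
  <property>
    <name>yarn.resourcemanager.webapp.address</name>
    <value>master.hadoop:9088</value>
  </property>
  <property>
    <name>yarn.resourcemanager.resource-tracker.address</name>
    <value>master.hadoop:9025</value>
  </property>
  <property>
    <name>yarn.resourcemanager.admin.address</name>
    <value>master.hadoop:9040</value>
  </property>
  <property>
    <name>yarn.nodemanager.aux-services</name>
    <value>mapreduce_shuffle</value>
  </property>
  <property>
    <name>yarn.nodemanager.aux-services.mapreduce.shuffle.class</name>
    <value>org.apache.hadoop.mapred.ShuffleHandler</value>
  </property>
</configuration>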
[hduser@master ~]$ vim /usr/local/hadoop-2.2.0/etc/hadoop/slaves
[hduser@master ~]$ cat /usr/local/hadoop-2.2.0/etc/hadoop/slaves
slaver1.hadoop
slaver2.hadoop
slaver3.hadoop
slaver4.hadoop
slaver5.hadoop
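###将配置好的/usr/local/hadoop-2.2.0目录打包为hadoop-2.2.0.tar.gz(例如:cd /usr/local && tar zcvf hadoop-2.2.0.tar.gz hadoop-2.2.0),再分别拷贝到各slaver(slaver1-slaver5)的硬盘中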
[root@master ~]# scp /usr/local/hadoop-2.2.0.tar.gz root@slaver1.hadoop:/root/
root@slaver1.hadoop's password:
hadoop-2.2.0.tar.gz 100% 104MB 11.6MB/s 00:09
[root@master ~]# scp /usr/local/hadoop-2.2.0.tar.gz root@slaver2.hadoop:/root/
root@slaver2.hadoop's password:
hadoop-2.2.0.tar.gz 100% 104MB 11.6MB/s 00:09
[root@master ~]# scp /usr/local/hadoop-2.2.0.tar.gz root@slaver3.hadoop:/root/
root@slaver3.hadoop's password:
hadoop-2.2.0.tar.gz 100% 104MB 11.6MB/s 00:09
[root@master ~]# scp /usr/local/hadoop-2.2.0.tar.gz root@slaver4.hadoop:/root/
root@slaver4.hadoop's password:
hadoop-2.2.0.tar.gz 100% 104MB 10.4MB/s 00:10
slaver的配置仿照master的配置,具体过程如下(以slaver1为例,其余slaver相同):
######################## slaver1 #######################
###禁用IPV6
[root@slaver1 ~]# echo "install ipv6 /bin/true" >> /etc/modprobe.d/anaconda.conf
[root@slaver1 ~]# vim /etc/modprobe.d/anaconda.conf
[root@slaver1 ~]# lsmod |grep -i ipv6
nf_conntrack_ipv6 7207 2
nf_defrag_ipv6 8897 1 nf_conntrack_ipv6
nf_conntrack 65661 3 nf_conntrack_ipv4,nf_conntrack_ipv6,xt_state
ipv6 261089 35 ip6t_REJECT,nf_conntrack_ipv6,nf_defrag_ipv6
[root@slaver1 ~]# ifconfig |grep -i inet6
inet6 addr: fdd8:8f0:124b:0:201:6cff:fe45:6728/64 Scope:Global
inet6 addr: fe80::201:6cff:fe45:6728/64 Scope:Link
inet6 addr: ::1/128 Scope:Host
[root@slaver1 ~]# reboot
### 禁用防火墙
[root@slaver1 ~]# chkconfig --list |grep iptables
iptables 0:off 1:off 2:on 3:on 4:on 5:on 6:off
[root@slaver1 ~]# chkconfig iptables off
[root@slaver1 ~]# /etc/init.d/iptables stop
iptables: Setting chains to policy ACCEPT: filter [ OK ]
iptables: Flushing firewall rules: [ OK ]
iptables: Unloading modules: [ OK ]
[root@slaver1 ~]# ls
anaconda-ks.cfg hadoop-2.2.0.tar.gz install.log install.log.syslog jdk-8u45-linux-i586.tar.gz
### 安装jdk
[root@slaver1 ~]# tar zxvf jdk-8u45-linux-i586.tar.gz -C /usr/local/
[root@slaver1 ~]# tail -n 4 /etc/profile
export JAVA_HOME=/usr/local/jdk1.8.0_45
export CLASSPATH=$CLASSPATH:$JAVA_HOME/lib:$JAVA_HOME/jre/lib
export HADOOP_HOME=/usr/local/hadoop-2.2.0
export PATH=$JAVA_HOME/bin:$HADOOP_HOME/bin:$HADOOP_HOME/sbin:$PATH
[root@slaver1 ~]# source /etc/profile
[root@slaver1 ~]# java -version
java version "1.8.0_45"
Java(TM) SE Runtime Environment (build 1.8.0_45-b14)
Java HotSpot(TM) Server VM (build 25.45-b02, mixed mode)
### 建立组及安装openssh-client
[root@slaver1 ~]# groupadd hadoop
[root@slaver1 ~]# useradd -g hadoop hduser
[root@slaver1 ~]# passwd hduser
Changing password for user hduser.
New password:
BAD PASSWORD: it is based on a dictionary word
Retype new password:
passwd: all authentication tokens updated successfully.
[root@slaver1 ~]# chmod u+w /etc/sudoers
[root@slaver1 ~]# vi /etc/sudoers
[root@slaver1 ~]# chmod u-w /etc/sudoers
[root@slaver1 ~]# yum install -y openssh-clients
### hduser 登陆
login as: hduser
hduser@10.18.11.199's password:
[hduser@slaver1 ~]$ ls
[hduser@slaver1 ~]$ sudo -i
We trust you have received the usual lecture from the local System
Administrator. It usually boils down to these three things:
#1) Respect the privacy of others.
#2) Think before you type.
#3) With great power comes great responsibility.
[sudo] password for hduser:
[root@slaver1 ~]# exit
logout
[hduser@slaver1 ~]$ sudo -i
[root@slaver1 ~]# exit
logout
### 创建目录
[hduser@slaver1 ~]$ sudo mkdir -p /usr/local/app/hadoop
[hduser@slaver1 ~]$ sudo chown -R hduser:hadoop /usr/local/app/hadoop
[hduser@slaver1 ~]$ mkdir -p /usr/local/app/hadoop/dfs/name
[hduser@slaver1 ~]$ mkdir -p /usr/local/app/hadoop/dfs/data
[hduser@slaver1 ~]$ mkdir -p /usr/local/app/hadoop/tmp/node
[hduser@slaver1 ~]$ mkdir -p /usr/local/app/hadoop/tmp/app-logs
[hduser@slaver1 ~]$ chmod 750 -R /usr/local/app/hadoop/dfs
[hduser@slaver1 ~]$ chmod 750 -R /usr/local/app/hadoop/tmp
[hduser@slaver1 ~]$ ls -ld /usr/local/app/hadoop/tmp/app-logs
drwxr-x---. 2 hduser hadoop 4096 Sep 23 13:25 /usr/local/app/hadoop/tmp/app-logs
[hduser@slaver1 ~]$ ls -l /usr/local/app/hadoop/dfs/
total 8
drwxr-x---. 2 hduser hadoop 4096 Sep 23 13:24 data
drwxr-x---. 2 hduser hadoop 4096 Sep 23 13:24 name
[hduser@slaver1 ~]$ ls -l /usr/local/app/hadoop/tmp/
total 8
drwxr-x---. 2 hduser hadoop 4096 Sep 23 13:25 app-logs
drwxr-x---. 2 hduser hadoop 4096 Sep 23 13:25 node
### 安装和配置hadoop
[hduser@slaver1 ~]$ tar zxvf hadoop-2.2.0.tar.gz -C /usr/local/ <---此包配置文件已经做过修改,无需再次配置
[hduser@slaver1 ~]$ sudo chown -R hduser:hadoop /usr/local/hadoop-2.2.0
[sudo] password for hduser:
######## master hdfs格式化
[hduser@master ~]$ hdfs namenode -format
16/01/19 16:43:15 INFO namenode.NameNode: STARTUP_MSG:
/************************************************************
STARTUP_MSG: Starting NameNode
STARTUP_MSG: host = master.hadoop/10.18.11.198
STARTUP_MSG: args = [-format]
STARTUP_MSG: version = 2.2.0
STARTUP_MSG: classpath = /usr/local/hadoop-2.2.0/etc/hadoop:/usr/local/hadoop-2.2.0/share/hadoop/common/lib/commons-compress-1.4.1.jar:/usr/local/hadoop-2.2.0 /share/hadoop/common/lib/stax-api-1.0.1.jar:/usr/local/hadoop-2.2.0/share/hadoop /common/lib/log4j-1.2.17.jar:/usr/local/hadoop-2.2.0/share/hadoop/common/lib/jsp -api-2.1.jar:/usr/local/hadoop-2.2.0/share/hadoop/common/lib/commons-el-1.0.jar: /usr/local/hadoop-2.2.0/share/hadoop/common/lib/mockito-all-1.8.5.jar:/usr/local /hadoop-2.2.0/share/hadoop/common/lib/jackson-core-asl-1.8.8.jar:/usr/local/hado op-2.2.0/share/hadoop/common/lib/commons-beanutils-core-1.8.0.jar:/usr/local/had oop-2.2.0/share/hadoop/common/lib/commons-httpclient-3.1.jar:/usr/local/hadoop-2 .2.0/share/hadoop/common/lib/servlet-api-2.5.jar:/usr/local/hadoop-2.2.0/share/h adoop/common/lib/jersey-json-1.9.jar:/usr/local/hadoop-2.2.0/share/hadoop/common /lib/activation-1.1.jar:/usr/local/hadoop-2.2.0/share/hadoop/common/lib/commons- logging-1.1.1.jar:/usr/local/hadoop-2.2.0/share/hadoop/common/lib/commons-net-3. 
1.jar:/usr/local/hadoop-2.2.0/share/hadoop/common/lib/jetty-6.1.26.jar:/usr/loca l/hadoop-2.2.0/share/hadoop/common/lib/commons-digester-1.8.jar:/usr/local/hadoo p-2.2.0/share/hadoop/common/lib/jackson-mapper-asl-1.8.8.jar:/usr/local/hadoop-2 .2.0/share/hadoop/common/lib/asm-3.2.jar:/usr/local/hadoop-2.2.0/share/hadoop/co mmon/lib/jets3t-0.6.1.jar:/usr/local/hadoop-2.2.0/share/hadoop/common/lib/jetty- util-6.1.26.jar:/usr/local/hadoop-2.2.0/share/hadoop/common/lib/jettison-1.1.jar :/usr/local/hadoop-2.2.0/share/hadoop/common/lib/jersey-server-1.9.jar:/usr/loca l/hadoop-2.2.0/share/hadoop/common/lib/commons-beanutils-1.7.0.jar:/usr/local/ha doop-2.2.0/share/hadoop/common/lib/xz-1.0.jar:/usr/local/hadoop-2.2.0/share/hado op/common/lib/paranamer-2.3.jar:/usr/local/hadoop-2.2.0/share/hadoop/common/lib/ commons-collections-3.2.1.jar:/usr/local/hadoop-2.2.0/share/hadoop/common/lib/js ch-0.1.42.jar:/usr/local/hadoop-2.2.0/share/hadoop/common/lib/commons-cli-1.2.ja r:/usr/local/hadoop-2.2.0/share/hadoop/common/lib/hadoop-annotations-2.2.0.jar:/ usr/local/hadoop-2.2.0/share/hadoop/common/lib/hadoop-auth-2.2.0.jar:/usr/local/ hadoop-2.2.0/share/hadoop/common/lib/jackson-jaxrs-1.8.8.jar:/usr/local/hadoop-2 .2.0/share/hadoop/common/lib/jersey-core-1.9.jar:/usr/local/hadoop-2.2.0/share/h adoop/common/lib/commons-codec-1.4.jar:/usr/local/hadoop-2.2.0/share/hadoop/comm on/lib/jaxb-impl-2.2.3-1.jar:/usr/local/hadoop-2.2.0/share/hadoop/common/lib/jun it-4.8.2.jar:/usr/local/hadoop-2.2.0/share/hadoop/common/lib/commons-lang-2.5.ja r:/usr/local/hadoop-2.2.0/share/hadoop/common/lib/commons-math-2.1.jar:/usr/loca l/hadoop-2.2.0/share/hadoop/common/lib/jaxb-api-2.2.2.jar:/usr/local/hadoop-2.2. 
0/share/hadoop/common/lib/avro-1.7.4.jar:/usr/local/hadoop-2.2.0/share/hadoop/co mmon/lib/commons-io-2.1.jar:/usr/local/hadoop-2.2.0/share/hadoop/common/lib/jasp er-runtime-5.5.23.jar:/usr/local/hadoop-2.2.0/share/hadoop/common/lib/xmlenc-0.5 2.jar:/usr/local/hadoop-2.2.0/share/hadoop/common/lib/zookeeper-3.4.5.jar:/usr/l ocal/hadoop-2.2.0/share/hadoop/common/lib/netty-3.6.2.Final.jar:/usr/local/hadoo p-2.2.0/share/hadoop/common/lib/jackson-xc-1.8.8.jar:/usr/local/hadoop-2.2.0/sha re/hadoop/common/lib/snappy-java-1.0.4.1.jar:/usr/local/hadoop-2.2.0/share/hadoo p/common/lib/jsr305-1.3.9.jar:/usr/local/hadoop-2.2.0/share/hadoop/common/lib/pr otobuf-java-2.5.0.jar:/usr/local/hadoop-2.2.0/share/hadoop/common/lib/jasper-com piler-5.5.23.jar:/usr/local/hadoop-2.2.0/share/hadoop/common/lib/commons-configu ration-1.6.jar:/usr/local/hadoop-2.2.0/share/hadoop/common/lib/guava-11.0.2.jar: /usr/local/hadoop-2.2.0/share/hadoop/common/lib/slf4j-api-1.7.5.jar:/usr/local/h adoop-2.2.0/share/hadoop/common/lib/slf4j-log4j12-1.7.5.jar:/usr/local/hadoop-2. 
2.0/share/hadoop/common/hadoop-nfs-2.2.0.jar:/usr/local/hadoop-2.2.0/share/hadoo p/common/hadoop-common-2.2.0-tests.jar:/usr/local/hadoop-2.2.0/share/hadoop/comm on/hadoop-common-2.2.0.jar:/usr/local/hadoop-2.2.0/share/hadoop/hdfs:/usr/local/ hadoop-2.2.0/share/hadoop/hdfs/lib/log4j-1.2.17.jar:/usr/local/hadoop-2.2.0/shar e/hadoop/hdfs/lib/jsp-api-2.1.jar:/usr/local/hadoop-2.2.0/share/hadoop/hdfs/lib/ commons-el-1.0.jar:/usr/local/hadoop-2.2.0/share/hadoop/hdfs/lib/jackson-core-as l-1.8.8.jar:/usr/local/hadoop-2.2.0/share/hadoop/hdfs/lib/servlet-api-2.5.jar:/u sr/local/hadoop-2.2.0/share/hadoop/hdfs/lib/commons-logging-1.1.1.jar:/usr/local /hadoop-2.2.0/share/hadoop/hdfs/lib/jetty-6.1.26.jar:/usr/local/hadoop-2.2.0/sha re/hadoop/hdfs/lib/jackson-mapper-asl-1.8.8.jar:/usr/local/hadoop-2.2.0/share/ha doop/hdfs/lib/asm-3.2.jar:/usr/local/hadoop-2.2.0/share/hadoop/hdfs/lib/jetty-ut il-6.1.26.jar:/usr/local/hadoop-2.2.0/share/hadoop/hdfs/lib/jersey-server-1.9.ja r:/usr/local/hadoop-2.2.0/share/hadoop/hdfs/lib/commons-cli-1.2.jar:/usr/local/h adoop-2.2.0/share/hadoop/hdfs/lib/commons-daemon-1.0.13.jar:/usr/local/hadoop-2. 2.0/share/hadoop/hdfs/lib/jersey-core-1.9.jar:/usr/local/hadoop-2.2.0/share/hado op/hdfs/lib/commons-codec-1.4.jar:/usr/local/hadoop-2.2.0/share/hadoop/hdfs/lib/ commons-lang-2.5.jar:/usr/local/hadoop-2.2.0/share/hadoop/hdfs/lib/commons-io-2. 1.jar:/usr/local/hadoop-2.2.0/share/hadoop/hdfs/lib/jasper-runtime-5.5.23.jar:/u sr/local/hadoop-2.2.0/share/hadoop/hdfs/lib/xmlenc-0.52.jar:/usr/local/hadoop-2. 2.0/share/hadoop/hdfs/lib/netty-3.6.2.Final.jar:/usr/local/hadoop-2.2.0/share/ha doop/hdfs/lib/jsr305-1.3.9.jar:/usr/local/hadoop-2.2.0/share/hadoop/hdfs/lib/pro tobuf-java-2.5.0.jar:/usr/local/hadoop-2.2.0/share/hadoop/hdfs/lib/guava-11.0.2. 
jar:/usr/local/hadoop-2.2.0/share/hadoop/hdfs/hadoop-hdfs-nfs-2.2.0.jar:/usr/loc al/hadoop-2.2.0/share/hadoop/hdfs/hadoop-hdfs-2.2.0.jar:/usr/local/hadoop-2.2.0/ share/hadoop/hdfs/hadoop-hdfs-2.2.0-tests.jar:/usr/local/hadoop-2.2.0/share/hado op/yarn/lib/commons-compress-1.4.1.jar:/usr/local/hadoop-2.2.0/share/hadoop/yarn /lib/junit-4.10.jar:/usr/local/hadoop-2.2.0/share/hadoop/yarn/lib/guice-3.0.jar: /usr/local/hadoop-2.2.0/share/hadoop/yarn/lib/hamcrest-core-1.1.jar:/usr/local/h adoop-2.2.0/share/hadoop/yarn/lib/log4j-1.2.17.jar:/usr/local/hadoop-2.2.0/share /hadoop/yarn/lib/jackson-core-asl-1.8.8.jar:/usr/local/hadoop-2.2.0/share/hadoop /yarn/lib/guice-servlet-3.0.jar:/usr/local/hadoop-2.2.0/share/hadoop/yarn/lib/ja ckson-mapper-asl-1.8.8.jar:/usr/local/hadoop-2.2.0/share/hadoop/yarn/lib/asm-3.2 .jar:/usr/local/hadoop-2.2.0/share/hadoop/yarn/lib/jersey-server-1.9.jar:/usr/lo cal/hadoop-2.2.0/share/hadoop/yarn/lib/xz-1.0.jar:/usr/local/hadoop-2.2.0/share/ hadoop/yarn/lib/paranamer-2.3.jar:/usr/local/hadoop-2.2.0/share/hadoop/yarn/lib/ javax.inject-1.jar:/usr/local/hadoop-2.2.0/share/hadoop/yarn/lib/hadoop-annotati ons-2.2.0.jar:/usr/local/hadoop-2.2.0/share/hadoop/yarn/lib/jersey-guice-1.9.jar :/usr/local/hadoop-2.2.0/share/hadoop/yarn/lib/jersey-core-1.9.jar:/usr/local/ha doop-2.2.0/share/hadoop/yarn/lib/avro-1.7.4.jar:/usr/local/hadoop-2.2.0/share/ha doop/yarn/lib/commons-io-2.1.jar:/usr/local/hadoop-2.2.0/share/hadoop/yarn/lib/a opalliance-1.0.jar:/usr/local/hadoop-2.2.0/share/hadoop/yarn/lib/netty-3.6.2.Fin al.jar:/usr/local/hadoop-2.2.0/share/hadoop/yarn/lib/snappy-java-1.0.4.1.jar:/us r/local/hadoop-2.2.0/share/hadoop/yarn/lib/protobuf-java-2.5.0.jar:/usr/local/ha doop-2.2.0/share/hadoop/yarn/hadoop-yarn-applications-distributedshell-2.2.0.jar :/usr/local/hadoop-2.2.0/share/hadoop/yarn/hadoop-yarn-server-nodemanager-2.2.0. 
jar:/usr/local/hadoop-2.2.0/share/hadoop/yarn/hadoop-yarn-server-common-2.2.0.ja r:/usr/local/hadoop-2.2.0/share/hadoop/yarn/hadoop-yarn-common-2.2.0.jar:/usr/lo cal/hadoop-2.2.0/share/hadoop/yarn/hadoop-yarn-api-2.2.0.jar:/usr/local/hadoop-2 .2.0/share/hadoop/yarn/hadoop-yarn-server-web-proxy-2.2.0.jar:/usr/local/hadoop- 2.2.0/share/hadoop/yarn/hadoop-yarn-server-tests-2.2.0.jar:/usr/local/hadoop-2.2 .0/share/hadoop/yarn/hadoop-yarn-client-2.2.0.jar:/usr/local/hadoop-2.2.0/share/ hadoop/yarn/hadoop-yarn-applications-unmanaged-am-launcher-2.2.0.jar:/usr/local/ hadoop-2.2.0/share/hadoop/yarn/hadoop-yarn-server-resourcemanager-2.2.0.jar:/usr /local/hadoop-2.2.0/share/hadoop/yarn/hadoop-yarn-site-2.2.0.jar:/usr/local/hado op-2.2.0/share/hadoop/mapreduce/lib/commons-compress-1.4.1.jar:/usr/local/hadoop -2.2.0/share/hadoop/mapreduce/lib/junit-4.10.jar:/usr/local/hadoop-2.2.0/share/h adoop/mapreduce/lib/guice-3.0.jar:/usr/local/hadoop-2.2.0/share/hadoop/mapreduce /lib/hamcrest-core-1.1.jar:/usr/local/hadoop-2.2.0/share/hadoop/mapreduce/lib/lo g4j-1.2.17.jar:/usr/local/hadoop-2.2.0/share/hadoop/mapreduce/lib/jackson-core-a sl-1.8.8.jar:/usr/local/hadoop-2.2.0/share/hadoop/mapreduce/lib/guice-servlet-3. 0.jar:/usr/local/hadoop-2.2.0/share/hadoop/mapreduce/lib/jackson-mapper-asl-1.8. 8.jar:/usr/local/hadoop-2.2.0/share/hadoop/mapreduce/lib/asm-3.2.jar:/usr/local/ hadoop-2.2.0/share/hadoop/mapreduce/lib/jersey-server-1.9.jar:/usr/local/hadoop- 2.2.0/share/hadoop/mapreduce/lib/xz-1.0.jar:/usr/local/hadoop-2.2.0/share/hadoop /mapreduce/lib/paranamer-2.3.jar:/usr/local/hadoop-2.2.0/share/hadoop/mapreduce/ lib/javax.inject-1.jar:/usr/local/hadoop-2.2.0/share/hadoop/mapreduce/lib/hadoop -annotations-2.2.0.jar:/usr/local/hadoop-2.2.0/share/hadoop/mapreduce/lib/jersey -guice-1.9.jar:/usr/local/hadoop-2.2.0/share/hadoop/mapreduce/lib/jersey-core-1. 
9.jar:/usr/local/hadoop-2.2.0/share/hadoop/mapreduce/lib/avro-1.7.4.jar:/usr/loc al/hadoop-2.2.0/share/hadoop/mapreduce/lib/commons-io-2.1.jar:/usr/local/hadoop- 2.2.0/share/hadoop/mapreduce/lib/aopalliance-1.0.jar:/usr/local/hadoop-2.2.0/sha re/hadoop/mapreduce/lib/netty-3.6.2.Final.jar:/usr/local/hadoop-2.2.0/share/hado op/mapreduce/lib/snappy-java-1.0.4.1.jar:/usr/local/hadoop-2.2.0/share/hadoop/ma preduce/lib/protobuf-java-2.5.0.jar:/usr/local/hadoop-2.2.0/share/hadoop/mapredu ce/hadoop-mapreduce-examples-2.2.0.jar:/usr/local/hadoop-2.2.0/share/hadoop/mapr educe/hadoop-mapreduce-client-app-2.2.0.jar:/usr/local/hadoop-2.2.0/share/hadoop /mapreduce/hadoop-mapreduce-client-shuffle-2.2.0.jar:/usr/local/hadoop-2.2.0/sha re/hadoop/mapreduce/hadoop-mapreduce-client-core-2.2.0.jar:/usr/local/hadoop-2.2 .0/share/hadoop/mapreduce/hadoop-mapreduce-client-jobclient-2.2.0-tests.jar:/usr /local/hadoop-2.2.0/share/hadoop/mapreduce/hadoop-mapreduce-client-common-2.2.0. jar:/usr/local/hadoop-2.2.0/share/hadoop/mapreduce/hadoop-mapreduce-client-hs-2. 2.0.jar:/usr/local/hadoop-2.2.0/share/hadoop/mapreduce/hadoop-mapreduce-client-h s-plugins-2.2.0.jar:/usr/local/hadoop-2.2.0/share/hadoop/mapreduce/hadoop-mapred uce-client-jobclient-2.2.0.jar:/usr/local/hadoop-2.2.0/contrib/capacity-schedule r/*.jar
STARTUP_MSG: build = https://svn.apache.org/repos/asf/hadoop/common -r 1529768; compiled by 'hortonmu' on 2013-10-07T06:28Z
STARTUP_MSG: java = 1.8.0_45
************************************************************/
16/01/19 16:43:15 INFO namenode.NameNode: registered UNIX signal handlers for [TERM, HUP, INT]
16/01/19 16:43:16 INFO namenode.FSNamesystem: HA Enabled: false
16/01/19 16:43:16 INFO namenode.FSNamesystem: Append Enabled: true
16/01/19 16:43:17 INFO util.GSet: Computing capacity for map INodeMap
16/01/19 16:43:17 INFO util.GSet: VM type = 32-bit
16/01/19 16:43:17 INFO util.GSet: 1.0% max memory = 96.7 MB
16/01/19 16:43:17 INFO util.GSet: capacity = 2^18 = 262144 entries
16/01/19 16:43:17 INFO namenode.NameNode: Caching file names occuring more than 10 times
。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。。
16/01/19 16:43:17 INFO util.GSet: capacity = 2^13 = 8192 entries
16/01/19 16:43:17 INFO common.Storage: Storage directory /usr/local/app/hadoop/dfs/name has been successfully formatted.
16/01/19 16:43:17 INFO util.ExitUtil: Exiting with status 0
16/01/19 16:43:17 INFO namenode.NameNode: SHUTDOWN_MSG:
/************************************************************
SHUTDOWN_MSG: Shutting down NameNode at master.hadoop/10.18.11.198
************************************************************/
[hduser@master ~]$ start-dfs.sh
Starting namenodes on [master.hadoop]
master.hadoop: namenode running as process 3395. Stop it first.
slaver1.hadoop: starting datanode, logging to /usr/local/hadoop-2.2.0/logs/hadoop-hduser-datanode-slaver1.hadoop.out
slaver5.hadoop: starting datanode, logging to /usr/local/hadoop-2.2.0/logs/hadoop-hduser-datanode-slaver5.hadoop.out
slaver3.hadoop: starting datanode, logging to /usr/local/hadoop-2.2.0/logs/hadoop-hduser-datanode-slaver3.hadoop.out
slaver4.hadoop: starting datanode, logging to /usr/local/hadoop-2.2.0/logs/hadoop-hduser-datanode-slaver4.hadoop.out
slaver2.hadoop: starting datanode, logging to /usr/local/hadoop-2.2.0/logs/hadoop-hduser-datanode-slaver2.hadoop.out
Starting secondary namenodes [master.hadoop]
master.hadoop: starting secondarynamenode, logging to /usr/local/hadoop-2.2.0/logs/hadoop-hduser-secondarynamenode-master.hadoop.out
[hduser@master ~]$ jps
3395 NameNode
3863 SecondaryNameNode
3960 Jps
[hduser@slaver2 ~]$ jps
2023 DataNode
2092 Jps
[hduser@slaver3 ~]$ jps
1841 Jps
1774 DataNode
[hduser@master ~]$ stop-all.sh
This script is Deprecated. Instead use stop-dfs.sh and stop-yarn.sh
Stopping namenodes on [master.hadoop]
master.hadoop: stopping namenode
slaver3.hadoop: stopping datanode
slaver4.hadoop: stopping datanode
slaver5.hadoop: stopping datanode
slaver1.hadoop: stopping datanode
slaver2.hadoop: stopping datanode
Stopping secondary namenodes [master.hadoop]
master.hadoop: stopping secondarynamenode
stopping yarn daemons
no resourcemanager to stop
slaver1.hadoop: no nodemanager to stop
slaver5.hadoop: no nodemanager to stop
slaver4.hadoop: no nodemanager to stop
slaver3.hadoop: no nodemanager to stop
slaver2.hadoop: no nodemanager to stop
no proxyserver to stop
[hduser@master ~]$ start-all.sh
This script is Deprecated. Instead use start-dfs.sh and start-yarn.sh
Starting namenodes on [master.hadoop]
master.hadoop: starting namenode, logging to /usr/local/hadoop-2.2.0/logs/hadoop-hduser-namenode-master.hadoop.out
slaver5.hadoop: starting datanode, logging to /usr/local/hadoop-2.2.0/logs/hadoop-hduser-datanode-slaver5.hadoop.out
slaver3.hadoop: starting datanode, logging to /usr/local/hadoop-2.2.0/logs/hadoop-hduser-datanode-slaver3.hadoop.out
slaver4.hadoop: starting datanode, logging to /usr/local/hadoop-2.2.0/logs/hadoop-hduser-datanode-slaver4.hadoop.out
slaver1.hadoop: starting datanode, logging to /usr/local/hadoop-2.2.0/logs/hadoop-hduser-datanode-slaver1.hadoop.out
slaver2.hadoop: starting datanode, logging to /usr/local/hadoop-2.2.0/logs/hadoop-hduser-datanode-slaver2.hadoop.out
Starting secondary namenodes [master.hadoop]
master.hadoop: starting secondarynamenode, logging to /usr/local/hadoop-2.2.0/logs/hadoop-hduser-secondarynamenode-master.hadoop.out
starting yarn daemons
starting resourcemanager, logging to /usr/local/hadoop-2.2.0/logs/yarn-hduser-resourcemanager-master.hadoop.out
slaver3.hadoop: starting nodemanager, logging to /usr/local/hadoop-2.2.0/logs/yarn-hduser-nodemanager-slaver3.hadoop.out
slaver4.hadoop: starting nodemanager, logging to /usr/local/hadoop-2.2.0/logs/yarn-hduser-nodemanager-slaver4.hadoop.out
slaver5.hadoop: starting nodemanager, logging to /usr/local/hadoop-2.2.0/logs/yarn-hduser-nodemanager-slaver5.hadoop.out
slaver1.hadoop: starting nodemanager, logging to /usr/local/hadoop-2.2.0/logs/yarn-hduser-nodemanager-slaver1.hadoop.out
slaver2.hadoop: starting nodemanager, logging to /usr/local/hadoop-2.2.0/logs/yarn-hduser-nodemanager-slaver2.hadoop.out
在Windows上通过做如下的修改就可以进行查看了。
########################
修改windows 系统下的hosts文件:
C:\Windows\System32\drivers\etc\hosts
在最后面添加如下的几行
10.18.11.198 master.hadoop
10.18.11.199 slaver1.hadoop
10.18.11.201 slaver2.hadoop
10.18.11.202 slaver3.hadoop
10.18.11.203 slaver4.hadoop
10.18.11.204 slaver5.hadoop
查看Hadoop资源管理器
http://master.hadoop:50070/
http://master.hadoop:50060/
http://master.hadoop:9088/cluster
下面在此基础上进行ZooKeeper的部署
[hduser@master ~]$ sudo tar zxvf zookeeper-3.4.5.tar.gz -C /usr/local/
[sudo] password for hduser:
[hduser@master ~]$ sudo vim /etc/profile
# set jdk and hadoop environment
export JAVA_HOME=/usr/local/jdk1.8.0_45
export CLASSPATH=$CLASSPATH:$JAVA_HOME/lib:$JAVA_HOME/jre/lib
export HADOOP_HOME=/usr/local/hadoop-2.2.0
# set zookeeper environment
export ZOOKEEPER_HOME=/usr/local/zookeeper-3.4.5
export CLASSPATH=$CLASSPATH:$ZOOKEEPER_HOME/lib
export PATH=$JAVA_HOME/bin:$HADOOP_HOME/bin:$HADOOP_HOME/sbin:$ZOOKEEPER_HOME/bin:$PATH
[hduser@master ~]$ source /etc/profile
[hduser@master ~]$ echo $ZOOKEEPER_HOME
/usr/local/zookeeper-3.4.5
[hduser@master ~]$ ls /usr/local/app/hadoop/ -l
total 8
drwxr-x---. 4 hduser hadoop 4096 Jan 19 11:53 dfs
drwxr-x---. 5 hduser hadoop 4096 Jan 19 17:07 tmp
[hduser@master ~]$ mkdir /usr/local/app/hadoop/zookeeper
[hduser@master ~]$ cp /usr/local/zookeeper-3.4.5/conf/zoo_sample.cfg /usr/local/zookeeper-3.4.5/conf/zoo.cfg
[hduser@master ~]$ cat /usr/local/zookeeper-3.4.5/conf/zoo.cfg |grep -v "#"
tickTime=2000
initLimit=10
syncLimit=5
dataDir=/usr/local/app/hadoop/zookeeper
clientPort=2181
server.0=10.18.11.199:2888:3888
server.1=10.18.11.201:2888:3888
server.2=10.18.11.202:2888:3888
server.3=10.18.11.203:2888:3888
server.4=10.18.11.204:2888:3888
[hduser@slaver1 ~]$ sudo vi /etc/profile
[sudo] password for hduser:
[hduser@slaver1 ~]$ tail -n 10 /etc/profile
# set jdk and hadoop environment
export JAVA_HOME=/usr/local/jdk1.8.0_45
export CLASSPATH=$CLASSPATH:$JAVA_HOME/lib:$JAVA_HOME/jre/lib
export HADOOP_HOME=/usr/local/hadoop-2.2.0
# set zookeeper environment
export ZOOKEEPER_HOME=/usr/local/zookeeper-3.4.5
export CLASSPATH=$CLASSPATH:$ZOOKEEPER_HOME/lib
export PATH=$JAVA_HOME/bin:$HADOOP_HOME/bin:$HADOOP_HOME/sbin:$ZOOKEEPER_HOME/bin:$PATH
[hduser@slaver1 ~]$ sudo chown -R hduser:hadoop /usr/local/zookeeper-3.4.5
[sudo] password for hduser:
[hduser@slaver1 ~]$ mkdir /usr/local/app/hadoop/zookeeper
[hduser@slaver1 ~]$ ls -ld /usr/local/app/hadoop/zookeeper
drwxr-xr-x. 2 hduser hadoop 4096 Sep 23 16:19 /usr/local/app/hadoop/zookeeper
[hduser@slaver1 ~]$ vi /usr/local/app/hadoop/zookeeper/myid
[hduser@slaver1 ~]$ cat /usr/local/app/hadoop/zookeeper/myid
0
[hduser@slaver2 ~]$ sudo vi /etc/profile
[sudo] password for hduser:
[hduser@slaver2 ~]$ tail -n 10 /etc/profile
# set jdk and hadoop environment
export JAVA_HOME=/usr/local/jdk1.8.0_45
export CLASSPATH=$CLASSPATH:$JAVA_HOME/lib:$JAVA_HOME/jre/lib
export HADOOP_HOME=/usr/local/hadoop-2.2.0
# set zookeeper environment
export ZOOKEEPER_HOME=/usr/local/zookeeper-3.4.5
export CLASSPATH=$CLASSPATH:$ZOOKEEPER_HOME/lib
export PATH=$JAVA_HOME/bin:$HADOOP_HOME/bin:$HADOOP_HOME/sbin:$ZOOKEEPER_HOME/bin:$PATH
[hduser@slaver2 ~]$ mkdir /usr/local/app/hadoop/zookeeper
[hduser@slaver2 ~]$ vi /usr/local/app/hadoop/zookeeper/myid
[hduser@slaver2 ~]$ cat /usr/local/app/hadoop/zookeeper/myid
1
[hduser@slaver3 ~]$ sudo vi /etc/profile
[sudo] password for hduser:
[hduser@slaver3 ~]$ tail -n 10 /etc/profile
# set jdk and hadoop environment
export JAVA_HOME=/usr/local/jdk1.8.0_45
export CLASSPATH=$CLASSPATH:$JAVA_HOME/lib:$JAVA_HOME/jre/lib
export HADOOP_HOME=/usr/local/hadoop-2.2.0
# set zookeeper environment
export ZOOKEEPER_HOME=/usr/local/zookeeper-3.4.5
export CLASSPATH=$CLASSPATH:$ZOOKEEPER_HOME/lib
export PATH=$JAVA_HOME/bin:$HADOOP_HOME/bin:$HADOOP_HOME/sbin:$ZOOKEEPER_HOME/bin:$PATH
[hduser@slaver3 ~]$ sudo chown -R hduser:hadoop /usr/local/zookeeper-3.4.5
[sudo] password for hduser:
[hduser@slaver3 ~]$ mkdir /usr/local/app/hadoop/zookeeper
[hduser@slaver3 ~]$ ls -ld /usr/local/app/hadoop/zookeeper
drwxr-xr-x. 2 hduser hadoop 4096 Sep 24 00:26 /usr/local/app/hadoop/zookeeper
[hduser@slaver3 ~]$ echo '2' >/usr/local/app/hadoop/zookeeper/myid
[hduser@slaver3 ~]$ cat /usr/local/app/hadoop/zookeeper/myid
2
[hduser@slaver4 ~]$ sudo vi /etc/profile
[sudo] password for hduser:
[hduser@slaver4 ~]$ tail -n 10 /etc/profile
# set jdk and hadoop environment
export JAVA_HOME=/usr/local/jdk1.8.0_45
export CLASSPATH=$CLASSPATH:$JAVA_HOME/lib:$JAVA_HOME/jre/lib
export HADOOP_HOME=/usr/local/hadoop-2.2.0
# set zookeeper environment
export ZOOKEEPER_HOME=/usr/local/zookeeper-3.4.5
export CLASSPATH=$CLASSPATH:$ZOOKEEPER_HOME/lib
export PATH=$JAVA_HOME/bin:$HADOOP_HOME/bin:$HADOOP_HOME/sbin:$ZOOKEEPER_HOME/bin:$PATH
[hduser@slaver4 ~]$ sudo chown -R hduser:hadoop /usr/local/zookeeper-3.4.5
[sudo] password for hduser:
[hduser@slaver4 ~]$ mkdir /usr/local/app/hadoop/zookeeper
[hduser@slaver4 ~]$ echo '3' >/usr/local/app/hadoop/zookeeper/myid
[hduser@slaver4 ~]$ cat /usr/local/app/hadoop/zookeeper/myid
3
[hduser@master ~]$ ssh slaver5.hadoop
Last login: Fri Sep 23 22:56:41 2016 from master.hadoop
[hduser@slaver5 ~]$ sudo vi /etc/profile
[sudo] password for hduser:
[hduser@slaver5 ~]$ tail -n 10 /etc/profile
# set jdk and hadoop environment
export JAVA_HOME=/usr/local/jdk1.8.0_45
export CLASSPATH=$CLASSPATH:$JAVA_HOME/lib:$JAVA_HOME/jre/lib
export HADOOP_HOME=/usr/local/hadoop-2.2.0
# set zookeeper environment
export ZOOKEEPER_HOME=/usr/local/zookeeper-3.4.5
export CLASSPATH=$CLASSPATH:$ZOOKEEPER_HOME/lib
export PATH=$JAVA_HOME/bin:$HADOOP_HOME/bin:$HADOOP_HOME/sbin:$ZOOKEEPER_HOME/bin:$PATH
[hduser@slaver5 ~]$ sudo chown -R hduser:hadoop /usr/local/zookeeper-3.4.5
[sudo] password for hduser:
[hduser@slaver5 ~]$ mkdir /usr/local/app/hadoop/zookeeper
[hduser@slaver5 ~]$ echo '4' >/usr/local/app/hadoop/zookeeper/myid
#### 直接启动,日志在后台显示
[hduser@slaver1 ~]$ zkServer.sh start
[hduser@slaver2 ~]$ zkServer.sh start
[hduser@slaver3 ~]$ zkServer.sh start
[hduser@slaver4 ~]$ zkServer.sh start
[hduser@slaver5 ~]$ zkServer.sh start
#### 日志在前台显示的启动方式
[hduser@slaver1 ~]$ zkServer.sh start-foreground
[hduser@slaver2 ~]$ zkServer.sh start-foreground
[hduser@slaver3 ~]$ zkServer.sh start-foreground
[hduser@slaver4 ~]$ zkServer.sh start-foreground
[hduser@slaver5 ~]$ zkServer.sh start-foreground
##### 问题##########
启动时报错:
Error contacting service. It is probably not running.
####查看zookeeper的运行状态
login as: hduser
[email protected]'s password:
Last login: Tue Jan 19 18:41:13 2016 from 10.17.74.212
[hduser@master ~]$ ssh slaver2.hadoop
Last login: Sat Sep 24 00:42:57 2016 from master.hadoop
[hduser@slaver2 ~]$ zkServer.sh status
JMX enabled by default
Using config: /usr/local/zookeeper-3.4.5/bin/../conf/zoo.cfg
Mode: follower
[hduser@slaver2 ~]$ exit
logout
Connection to slaver2.hadoop closed.
[hduser@master ~]$ ssh slaver3.hadoop
Last login: Sat Sep 24 00:43:33 2016 from master.hadoop
[hduser@slaver3 ~]$ zkServer.sh status
JMX enabled by default
Using config: /usr/local/zookeeper-3.4.5/bin/../conf/zoo.cfg
Mode: leader
[hduser@slaver3 ~]$ exit
logout
Connection to slaver3.hadoop closed.
[hduser@master ~]$ ssh slaver4.hadoop
Last login: Sat Sep 24 00:42:07 2016 from master.hadoop
[hduser@slaver4 ~]$ zkServer.sh status
JMX enabled by default
Using config: /usr/local/zookeeper-3.4.5/bin/../conf/zoo.cfg
Mode: follower
[hduser@slaver4 ~]$ exit
logout
Connection to slaver4.hadoop closed.
[hduser@master ~]$ ssh slaver5.hadoop
Last login: Sat Sep 24 00:31:02 2016 from master.hadoop
[hduser@slaver5 ~]$ zkServer.sh status
JMX enabled by default
Using config: /usr/local/zookeeper-3.4.5/bin/../conf/zoo.cfg
Mode: follower
[hduser@slaver5 ~]$ exit
logout
Connection to slaver5.hadoop closed.
[hduser@master ~]$ ssh slaver1.hadoop
Last login: Fri Sep 23 16:39:16 2016 from master.hadoop
[hduser@slaver1 ~]$ zkServer.sh status
JMX enabled by default
Using config: /usr/local/zookeeper-3.4.5/bin/../conf/zoo.cfg
Mode: follower
###关闭slaver3.hadoop后,重新查看运行状态
[hduser@master ~]$ ssh slaver1.hadoop
Last login: Fri Sep 23 16:39:16 2016 from master.hadoop
[hduser@slaver1 ~]$ zkServer.sh status
JMX enabled by default
Using config: /usr/local/zookeeper-3.4.5/bin/../conf/zoo.cfg
Mode: follower
[hduser@slaver1 ~]$ zkServer.sh status
JMX enabled by default
Using config: /usr/local/zookeeper-3.4.5/bin/../conf/zoo.cfg
Mode: follower
[hduser@slaver1 ~]$ exit
logout
Connection to slaver1.hadoop closed.
[hduser@master ~]$ ssh slaver5.hadoop
Last login: Sat Sep 24 00:32:16 2016 from master.hadoop
[hduser@slaver5 ~]$ zkServer.sh status
JMX enabled by default
Using config: /usr/local/zookeeper-3.4.5/bin/../conf/zoo.cfg
Mode: leader
下面开始HBase集群部署
[hduser@master ~]$ ls
hadoop-2.2.0-32bit.tar.gz hbase-0.98.8-hadoop2-bin.tar.gz jdk-8u45-linux-i586.tar.gz zookeeper-3.4.5.tar.gz
[hduser@master ~]$ tar zxvf hbase-0.98.8-hadoop2-bin.tar.gz
[hduser@master ~]$ sudo mv hbase-0.98.8-hadoop2
hbase-0.98.8-hadoop2/ hbase-0.98.8-hadoop2-bin.tar.gz
[hduser@master ~]$ sudo mv hbase-0.98.8-hadoop2 /usr/local/
[sudo] password for hduser:
[hduser@master ~]$ sudo chown -R hduser:hadoop /usr/local/hbase-0.98.8-hadoop2/
[hduser@master ~]$ vim /usr/local/hbase-0.98.8-hadoop2/conf/hbase-env.sh
[hduser@master ~]$ vim /usr/local/hbase-0.98.8-hadoop2/conf/hbase-env.sh
[hduser@master ~]$ cat /usr/local/hbase-0.98.8-hadoop2/conf/hbase-env.sh | grep -v "#"|grep -v "^$"
export JAVA_HOME=/usr/local/jdk1.8.0_45
export HBASE_CLASSPATH=/usr/local/hadoop-2.2.0/etc/hadoop
export HBASE_OPTS="-XX:+UseConcMarkSweepGC"
export HBASE_PID_DIR=/usr/local/app/hadoop/hbase/tmp
export HBASE_MANAGES_ZK=false
[hduser@master ~]$ mkdir -p /usr/local/app/hadoop/hbase/tmp
[hduser@master ~]$ ls -ld /usr/local/app/hadoop/hbase
drwxr-xr-x. 3 hduser hadoop 4096 Jan 19 19:10 /usr/local/app/hadoop/hbase
[hduser@master ~]$ ls -l /usr/local/app/hadoop/hbase
total 4
drwxr-xr-x. 2 hduser hadoop 4096 Jan 19 19:10 tmp
[hduser@master ~]$ hdfs dfs -mkdir /hbase
[hduser@master ~]$ vim /usr/local/hbase-0.98.8-hadoop2/conf/hbase-site.xml
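<configuration>
  <property>
    <name>hbase.master</name>
    <value>master.hadoop:60000</value>
  </property>
  <property>
    <name>hbase.master.maxclockskew</name>
    <value>180000</value>
  </property>
  <property>
    <name>hbase.rootdir</name>
    <value>hdfs://master.hadoop:9000/hbase</value>
  </property>
  <property>
    <name>hbase.cluster.distributed</name>
    <value>true</value>
  </property>
  <property>
    <name>hbase.zookeeper.quorum</name>
    <value>slaver1.hadoop,slaver2.hadoop,slaver3.hadoop,slaver4.hadoop,slaver5.hadoop</value>
  </property>
  <property>
    <name>hbase.zookeeper.property.dataDir</name>
    <value>/usr/local/app/hadoop/zookeeper</value>
  </property>
  <property>
    <name>hbase.tmp.dir</name>
    <value>/usr/local/app/hadoop/hbase/tmp</value>
  </property>
  <property>
    <name>hbase.zookeeper.property.clientPort</name>
    <value>2181</value>
  </property>
  <property>
    <name>hbase.defaults.for.version</name>
    <value>0.98.8-hadoop2</value>
  </property>
</configuration>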
[hduser@master ~]$ vim /usr/local/hbase-0.98.8-hadoop2/conf/regionservers
[hduser@master ~]$ cat /usr/local/hbase-0.98.8-hadoop2/conf/regionservers
slaver1.hadoop
slaver2.hadoop
slaver3.hadoop
slaver4.hadoop
slaver5.hadoop
### 配置HBase的环境变量
[hduser@master ~]$ sudo vim /etc/profile
[sudo] password for hduser:
[hduser@master ~]$ cat /etc/profile |tail -n 12
# set jdk and hadoop environment
export JAVA_HOME=/usr/local/jdk1.8.0_45
export CLASSPATH=$CLASSPATH:$JAVA_HOME/lib:$JAVA_HOME/jre/lib
export HADOOP_HOME=/usr/local/hadoop-2.2.0
# set zookeeper environment
export ZOOKEEPER_HOME=/usr/local/zookeeper-3.4.5
export CLASSPATH=$CLASSPATH:$ZOOKEEPER_HOME/lib
# set hbase environment
export HBASE_HOME=/usr/local/hbase-0.98.8-hadoop2
export PATH=$JAVA_HOME/bin:$HADOOP_HOME/bin:$HADOOP_HOME/sbin:$ZOOKEEPER_HOME/bin:$HBASE_HOME/bin:$PATH
### 将配置好的HBase目录复制到其它的slaver1-slaver5上
[hduser@master ~]$ cd /usr/local
[hduser@master local]$ sudo tar zcvf hbase-0.98.8-hadoop2-to-hbasenode.tar.gz hbase-0.98.8-hadoop2/
[hduser@master local]$ scp hbase-0.98.8-hadoop2-to-hbasenode.tar.gz slaver1.hadoop:/home/hduser/
hbase-0.98.8-hadoop2-to-hbasenode.tar.gz 100% 104MB 11.6MB/s 00:09
[hduser@master local]$ scp hbase-0.98.8-hadoop2-to-hbasenode.tar.gz slaver2.hadoop:/home/hduser/
hbase-0.98.8-hadoop2-to-hbasenode.tar.gz 100% 104MB 11.6MB/s 00:09
[hduser@master local]$ scp hbase-0.98.8-hadoop2-to-hbasenode.tar.gz slaver3.hadoop:/home/hduser/
hbase-0.98.8-hadoop2-to-hbasenode.tar.gz 100% 104MB 11.6MB/s 00:09
[hduser@master local]$ scp hbase-0.98.8-hadoop2-to-hbasenode.tar.gz slaver4.hadoop:/home/hduser/
hbase-0.98.8-hadoop2-to-hbasenode.tar.gz 100% 104MB 11.6MB/s 00:09
[hduser@master local]$ scp hbase-0.98.8-hadoop2-to-hbasenode.tar.gz slaver5.hadoop:/home/hduser/
hbase-0.98.8-hadoop2-to-hbasenode.tar.gz 100% 104MB 11.6MB/s 00:09
### 解压并复制到对应目录,并赋予权限,其它的从节点都可以仿照如下的配置
[hduser@slaver1 ~]$ tar zxvf hbase-0.98.8-hadoop2-to-hbasenode.tar.gz
[hduser@slaver1 ~]$ sudo mv hbase-0.98.8-hadoop2 /usr/local/
[hduser@slaver1 ~]$ sudo chown -R hduser:hadoop /usr/local/hbase-0.98.8-hadoop2
[hduser@slaver1 ~]$ mkdir -p /usr/local/app/hadoop/hbase/tmp
[hduser@slaver1 ~]$ sudo vim /etc/profile
[hduser@slaver1 ~]$ source /etc/profile
[hduser@slaver1 ~]$ cat /etc/profile |tail -n 12
# set jdk and hadoop environment
export JAVA_HOME=/usr/local/jdk1.8.0_45
export CLASSPATH=$CLASSPATH:$JAVA_HOME/lib:$JAVA_HOME/jre/lib
export HADOOP_HOME=/usr/local/hadoop-2.2.0
# set zookeeper environment
export ZOOKEEPER_HOME=/usr/local/zookeeper-3.4.5
export CLASSPATH=$CLASSPATH:$ZOOKEEPER_HOME/lib
# set hbase environment
export HBASE_HOME=/usr/local/hbase-0.98.8-hadoop2
export PATH=$JAVA_HOME/bin:$HADOOP_HOME/bin:$HADOOP_HOME/sbin:$ZOOKEEPER_HOME/bin:$HBASE_HOME/bin:$PATH
### 启动hadoop、zookeeper、hbase应用
hadoop、zookeeper、hbase三者的启动顺序如下:先启动hadoop,再启动zookeeper,最后启动hbase。
1、登录slaver1-slaver5并启动对应的zookeeper进程
[hduser@master ~]$ ssh slaver1.hadoop
Last login: Mon Sep 26 17:26:52 2016 from master.hadoop
[hduser@slaver1 ~]$ jps
2002 DataNode
2105 NodeManager
13051 Jps
[hduser@slaver1 ~]$ zkServer.sh start
JMX enabled by default
Using config: /usr/local/zookeeper-3.4.5/bin/../conf/zoo.cfg
Starting zookeeper ... STARTED
[hduser@slaver1 ~]$ jps
13073 QuorumPeerMain <----ZooKeeper 进程
2002 DataNode
13108 Jps
2105 NodeManager
[hduser@master ~]$ jps
24049 HMaster
4658 SecondaryNameNode
4786 ResourceManager
4475 NameNode
24381 Jps
[hduser@slaver1 ~]$ jps
2967 DataNode
14472 QuorumPeerMain
15786 Jps
3071 NodeManager
[hduser@master ~]$ hdfs dfs -ls /hbase
Found 5 items
drwxr-xr-x - hduser supergroup 0 2016-01-22 12:05 /hbase/.tmp
drwxr-xr-x - hduser supergroup 0 2016-01-22 11:52 /hbase/data
-rw-r--r-- 3 hduser supergroup 42 2016-01-22 11:52 /hbase/hbase.id
-rw-r--r-- 3 hduser supergroup 7 2016-01-22 11:52 /hbase/hbase.version
drwxr-xr-x - hduser supergroup 0 2016-01-22 11:52 /hbase/oldWALs
##########故障 ################
hbase数据库的HRegionServer没有启动,检查发现各节点的系统时间不一致:
[hduser@master ~]$ date
Fri Jan 22 14:18:41 CST 2016
[hduser@slaver3 ~]$ date
Mon Sep 26 20:24:00 CST 2016
[hduser@slaver1 ~]$ date
Mon Sep 26 12:25:43 CST 2016
修改所有从节点(slaver1.hadoop-slaver5.hadoop)的系统时间,使各节点时间保持一致
[root@slaver1 ~]# vim /etc/sysconfig/clock
[root@slaver1 ~]# cat /etc/sysconfig/clock
ZONE="Asia/Shanghai"
UTC=false
ARC=false
[root@slaver1 ~]# clock -w
[root@slaver1 ~]# date -s "2016-09-26 12:36:17"
Mon Sep 26 12:36:17 CST 2016
[root@slaver1 ~]# date
Mon Sep 26 12:36:18 CST 2016
###############################
[hduser@master ~]$ start-hbase.sh
starting master, logging to /usr/local/hbase-0.98.8-hadoop2/logs/hbase-hduser-master-master.hadoop.out
slaver3.hadoop: starting regionserver, logging to /usr/local/hbase-0.98.8-hadoop2/bin/../logs/hbase-hduser-regionserver-slaver3.hadoop.out
slaver1.hadoop: starting regionserver, logging to /usr/local/hbase-0.98.8-hadoop2/bin/../logs/hbase-hduser-regionserver-slaver1.hadoop.out
slaver5.hadoop: starting regionserver, logging to /usr/local/hbase-0.98.8-hadoop2/bin/../logs/hbase-hduser-regionserver-slaver5.hadoop.out
slaver4.hadoop: starting regionserver, logging to /usr/local/hbase-0.98.8-hadoop2/bin/../logs/hbase-hduser-regionserver-slaver4.hadoop.out
slaver2.hadoop: starting regionserver, logging to /usr/local/hbase-0.98.8-hadoop2/bin/../logs/hbase-hduser-regionserver-slaver2.hadoop.out
[hduser@master ~]$ jps
28689 NameNode
30515 HMaster
30644 Jps
29016 ResourceManager
28876 SecondaryNameNode
[hduser@slaver1 ~]$ jps
17141 QuorumPeerMain
16984 NodeManager
16874 DataNode
17836 Jps
17597 HRegionServer
##############################################
启动过程
##############################################
[hduser@master ~]$ start-all.sh
This script is Deprecated. Instead use start-dfs.sh and start-yarn.sh
Starting namenodes on [master.hadoop]
master.hadoop: starting namenode, logging to /usr/local/hadoop-2.2.0/logs/hadoop-hduser-namenode-master.hadoop.out
slaver1.hadoop: starting datanode, logging to /usr/local/hadoop-2.2.0/logs/hadoop-hduser-datanode-slaver1.hadoop.out
slaver2.hadoop: starting datanode, logging to /usr/local/hadoop-2.2.0/logs/hadoop-hduser-datanode-slaver2.hadoop.out
slaver3.hadoop: starting datanode, logging to /usr/local/hadoop-2.2.0/logs/hadoop-hduser-datanode-slaver3.hadoop.out
slaver4.hadoop: starting datanode, logging to /usr/local/hadoop-2.2.0/logs/hadoop-hduser-datanode-slaver4.hadoop.out
slaver5.hadoop: starting datanode, logging to /usr/local/hadoop-2.2.0/logs/hadoop-hduser-datanode-slaver5.hadoop.out
Starting secondary namenodes [master.hadoop]
master.hadoop: starting secondarynamenode, logging to /usr/local/hadoop-2.2.0/logs/hadoop-hduser-secondarynamenode-master.hadoop.out
starting yarn daemons
starting resourcemanager, logging to /usr/local/hadoop-2.2.0/logs/yarn-hduser-resourcemanager-master.hadoop.out
slaver5.hadoop: starting nodemanager, logging to /usr/local/hadoop-2.2.0/logs/yarn-hduser-nodemanager-slaver5.hadoop.out
slaver4.hadoop: starting nodemanager, logging to /usr/local/hadoop-2.2.0/logs/yarn-hduser-nodemanager-slaver4.hadoop.out
slaver3.hadoop: starting nodemanager, logging to /usr/local/hadoop-2.2.0/logs/yarn-hduser-nodemanager-slaver3.hadoop.out
slaver1.hadoop: starting nodemanager, logging to /usr/local/hadoop-2.2.0/logs/yarn-hduser-nodemanager-slaver1.hadoop.out
slaver2.hadoop: starting nodemanager, logging to /usr/local/hadoop-2.2.0/logs/yarn-hduser-nodemanager-slaver2.hadoop.out
[hduser@master ~]$ jps
1796 SecondaryNameNode
2187 Jps
1611 NameNode
1932 ResourceManager
########### slaver1.hadoop
[hduser@master ~]$ ssh slaver1.hadoop
Last login: Mon Sep 26 13:45:48 2016 from master.hadoop
[hduser@slaver1 ~]$ jps
1674 NodeManager
1562 DataNode
1820 Jps
[hduser@slaver1 ~]$ zkServer.sh start
JMX enabled by default
Using config: /usr/local/zookeeper-3.4.5/bin/../conf/zoo.cfg
Starting zookeeper ... STARTED
[hduser@slaver1 ~]$ jps
1843 QuorumPeerMain
1674 NodeManager
1866 Jps
1562 DataNode
########### slaver2.hadoop
[hduser@master ~]$ ssh slaver2.hadoop
Last login: Mon Sep 26 13:46:05 2016 from master.hadoop
[hduser@slaver2 ~]$ jps
1831 Jps
1692 NodeManager
1582 DataNode
[hduser@slaver2 ~]$ zkServer.sh start
JMX enabled by default
Using config: /usr/local/zookeeper-3.4.5/bin/../conf/zoo.cfg
Starting zookeeper ... STARTED
[hduser@slaver2 ~]$ jps
1878 Jps
1692 NodeManager
1853 QuorumPeerMain
1582 DataNode
[hduser@master ~]$ ssh slaver3.hadoop
Last login: Mon Sep 26 13:46:17 2016 from master.hadoop
[hduser@slaver3 ~]$ jps
1715 Jps
1573 NodeManager
1464 DataNode
[hduser@slaver3 ~]$ zkServer.sh start
JMX enabled by default
Using config: /usr/local/zookeeper-3.4.5/bin/../conf/zoo.cfg
Starting zookeeper ... already running as process 1504.
[hduser@slaver3 ~]$ zkServer.sh stop
JMX enabled by default
Using config: /usr/local/zookeeper-3.4.5/bin/../conf/zoo.cfg
Stopping zookeeper ... STOPPED
[hduser@slaver3 ~]$ zkServer.sh start
JMX enabled by default
Using config: /usr/local/zookeeper-3.4.5/bin/../conf/zoo.cfg
Starting zookeeper ... STARTED
[hduser@slaver3 ~]$ jps
1573 NodeManager
1757 QuorumPeerMain
1791 Jps
[hduser@master ~]$ ssh slaver4.hadoop
Last login: Mon Sep 26 13:46:26 2016 from master.hadoop
[hduser@slaver4 ~]$ jps
1704 NodeManager
1593 DataNode
1849 Jps
[hduser@slaver4 ~]$ zkServer.sh start
JMX enabled by default
Using config: /usr/local/zookeeper-3.4.5/bin/../conf/zoo.cfg
Starting zookeeper ... STARTED
[hduser@slaver4 ~]$ jps
1904 Jps
1704 NodeManager
1593 DataNode
1871 QuorumPeerMain
[hduser@master ~]$ ssh slaver5.hadoop
Last login: Mon Sep 26 13:46:36 2016 from master.hadoop
[hduser@slaver5 ~]$ jps
1840 Jps
1697 NodeManager
1586 DataNode
[hduser@slaver5 ~]$ zkServer.sh start
JMX enabled by default
Using config: /usr/local/zookeeper-3.4.5/bin/../conf/zoo.cfg
Starting zookeeper ... STARTED
[hduser@slaver5 ~]$ jps
1697 NodeManager
1586 DataNode
1862 QuorumPeerMain
1896 Jps
[hduser@master ~]$ start-hbase.sh
starting master, logging to /usr/local/hbase-0.98.8-hadoop2/logs/hbase-hduser-master-master.hadoop.out
slaver5.hadoop: starting regionserver, logging to /usr/local/hbase-0.98.8-hadoop2/bin/../logs/hbase-hduser-regionserver-slaver5.hadoop.out
slaver2.hadoop: starting regionserver, logging to /usr/local/hbase-0.98.8-hadoop2/bin/../logs/hbase-hduser-regionserver-slaver2.hadoop.out
slaver4.hadoop: starting regionserver, logging to /usr/local/hbase-0.98.8-hadoop2/bin/../logs/hbase-hduser-regionserver-slaver4.hadoop.out
slaver3.hadoop: starting regionserver, logging to /usr/local/hbase-0.98.8-hadoop2/bin/../logs/hbase-hduser-regionserver-slaver3.hadoop.out
slaver1.hadoop: starting regionserver, logging to /usr/local/hbase-0.98.8-hadoop2/bin/../logs/hbase-hduser-regionserver-slaver1.hadoop.out
[hduser@master ~]$ jps
1796 SecondaryNameNode
1611 NameNode
1932 ResourceManager
2349 HMaster
2574 Jps
[hduser@master ~]$ ssh slaver1.hadoop
Last login: Mon Sep 26 13:50:53 2016 from master.hadoop
[hduser@slaver1 ~]$ jps
2131 Jps
1843 QuorumPeerMain
1674 NodeManager
1562 DataNode
1949 HRegionServer
[hduser@slaver1 ~]$ exit
logout
Connection to slaver1.hadoop closed.
[hduser@master ~]$ ssh slaver2.hadoop
Last login: Mon Sep 26 13:51:29 2016 from master.hadoop
[hduser@slaver2 ~]$ jps
2129 Jps
1958 HRegionServer
1692 NodeManager
1853 QuorumPeerMain
1582 DataNode
[hduser@slaver2 ~]$ exit
logout
Connection to slaver2.hadoop closed.
[hduser@master ~]$ ssh slaver3.hadoop
Last login: Mon Sep 26 13:52:20 2016 from master.hadoop
[hduser@slaver3 ~]$ jps
1573 NodeManager
1865 HRegionServer
2027 Jps
1757 QuorumPeerMain
[hduser@slaver3 ~]$ exit
logout
Connection to slaver3.hadoop closed.
[hduser@master ~]$ ssh slaver4.hadoop
Last login: Mon Sep 26 13:53:10 2016 from master.hadoop
[hduser@slaver4 ~]$ jps
2150 Jps
1975 HRegionServer
1704 NodeManager
1593 DataNode
1871 QuorumPeerMain
[hduser@slaver4 ~]$ exit
logout
Connection to slaver4.hadoop closed.
[hduser@master ~]$ ssh slaver5.hadoop
Last login: Mon Sep 26 13:53:35 2016 from master.hadoop
[hduser@slaver5 ~]$ jps
1697 NodeManager
1586 DataNode
1862 QuorumPeerMain
2168 Jps
1966 HRegionServer
[hduser@slaver5 ~]$ exit
logout
Connection to slaver5.hadoop closed.
[hduser@master ~]$ hadoop dfsadmin -report
DEPRECATED: Use of this script to execute hdfs command is deprecated.
Instead use the hdfs command for it.
Configured Capacity: 691105742848 (643.64 GB)
Present Capacity: 647142413354 (602.70 GB)
DFS Remaining: 647141740544 (602.70 GB)
DFS Used: 672810 (657.04 KB)
DFS Used%: 0.00%
Under replicated blocks: 0
Blocks with corrupt replicas: 0
Missing blocks: 0
-------------------------------------------------
Datanodes available: 5 (5 total, 0 dead)
Live datanodes:
Name: 10.18.11.202:50010 (slaver3.hadoop)
Hostname: slaver3.hadoop
Decommission Status : Normal
Configured Capacity: 144660275200 (134.73 GB)
DFS Used: 24576 (24 KB)
Non DFS Used: 9146474496 (8.52 GB)
DFS Remaining: 135513776128 (126.21 GB)
DFS Used%: 0.00%
DFS Remaining%: 93.68%
Last contact: Mon Sep 26 16:09:37 CST 2016
Name: 10.18.11.204:50010 (slaver5.hadoop)
Hostname: slaver5.hadoop
Decommission Status : Normal
Configured Capacity: 51770945536 (48.22 GB)
DFS Used: 167130 (163.21 KB)
Non DFS Used: 4461466406 (4.16 GB)
DFS Remaining: 47309312000 (44.06 GB)
DFS Used%: 0.00%
DFS Remaining%: 91.38%
Last contact: Mon Sep 26 16:09:37 CST 2016
Name: 10.18.11.203:50010 (slaver4.hadoop)
Hostname: slaver4.hadoop
Decommission Status : Normal
Configured Capacity: 51770945536 (48.22 GB)
DFS Used: 168006 (164.07 KB)
Non DFS Used: 4461875130 (4.16 GB)
DFS Remaining: 47308902400 (44.06 GB)
DFS Used%: 0.00%
DFS Remaining%: 91.38%
Last contact: Mon Sep 26 16:09:39 CST 2016
Name: 10.18.11.201:50010 (slaver2.hadoop)
Hostname: slaver2.hadoop
Decommission Status : Normal
Configured Capacity: 391132631040 (364.27 GB)
DFS Used: 166926 (163.01 KB)
Non DFS Used: 21433738226 (19.96 GB)
DFS Remaining: 369698725888 (344.31 GB)
DFS Used%: 0.00%
DFS Remaining%: 94.52%
Last contact: Mon Sep 26 16:09:37 CST 2016
Name: 10.18.11.199:50010 (slaver1.hadoop)
Hostname: slaver1.hadoop
Decommission Status : Normal
Configured Capacity: 51770945536 (48.22 GB)
DFS Used: 146172 (142.75 KB)
Non DFS Used: 4459775236 (4.15 GB)
DFS Remaining: 47311024128 (44.06 GB)
DFS Used%: 0.00%
DFS Remaining%: 91.39%
Last contact: Mon Sep 26 16:09:37 CST 2016
#########################
如果nodejs需要调用hbase,那么需要开启hbase.rest.port
具体配置如下:
[hduser@master ~]$ sed -n '60,63p' /usr/local/hbase-0.98.8-hadoop2/conf/hbase-site.xml
<property>
<name>hbase.rest.port</name>
<value>8090</value>
</property>
查看是否已经开启对应的rest.port:
[hduser@master conf]$ netstat -atn |grep 8090
开启方式如下:
[hduser@master conf]$ hbase-daemon.sh start rest
starting rest, logging to /usr/local/hbase-0.98.8-hadoop2/logs/hbase-hduser-rest-master.hadoop.out
[hduser@master conf]$ netstat -atn |grep 8090
tcp 0 0 0.0.0.0:8090 0.0.0.0:* LISTEN
##########################
HBase无法停止时的做法
##########################
当运行./stop-hbase.sh时,如果一直输出stopping hbase..........(不停地打点)而无法结束,可以先运行./start-hbase.sh,
这时候会提示hbase的各个组件正在运行,
并且给出这些进程的pid,运行kill -9 pid来终止hbase的进程,
此时hbase就停止了,再运行./start-hbase.sh来重启hbase
#### 查看hdfs的目录下的文件
[hduser@master ~]$ hdfs dfs -ls /
Found 1 items
drwxr-xr-x - hduser supergroup 0 2016-09-26 17:08 /hbase
[hduser@master ~]$ hdfs dfs -ls /hbase
Found 8 items
drwxr-xr-x - hduser supergroup 0 2016-09-26 16:07 /hbase/.tmp
drwxr-xr-x - hduser supergroup 0 2016-09-26 16:07 /hbase/WALs
drwxr-xr-x - hduser supergroup 0 2016-09-26 17:13 /hbase/archive
drwxr-xr-x - hduser supergroup 0 2016-09-26 13:54 /hbase/corrupt
drwxr-xr-x - hduser supergroup 0 2016-09-26 12:39 /hbase/data
-rw-r--r-- 3 hduser supergroup 42 2016-01-22 11:52 /hbase/hbase.id
-rw-r--r-- 3 hduser supergroup 7 2016-01-22 11:52 /hbase/hbase.version
drwxr-xr-x - hduser supergroup 0 2016-09-27 15:18 /hbase/oldWALs
############hive的安装
[hduser@master ~]$ sudo mv apache-hive-0.14.0-bin /usr/local/
[sudo] password for hduser:
[hduser@master ~]$ sudo chown -R hduser:hadoop /usr/local/apache-hive-0.14.0-bin
[hduser@master ~]$ tar zxvf apache-hive-0.14.0-src.tar.gz
[hduser@master ~]$ jar cvfM0 hive-hwi-0.14.0.war -C apache-hive-0.14.0-src/hwi/web .
[hduser@master ~]$ ls -l hive-hwi-0.14.0.war
-rw-r--r--. 1 hduser hadoop 151343 Sep 28 09:08 hive-hwi-0.14.0.war
[hduser@master ~]$ mv hive-hwi-0.14.0.war /usr/local/apache-hive-0.14.0-bin/lib/
[hduser@master ~]$ sudo vim /etc/profile
[hduser@master ~]$ source /etc/profile
[hduser@master ~]$ tail -n 18 /etc/profile
# set jdk and hadoop environment
export JAVA_HOME=/usr/local/jdk1.8.0_45
export CLASSPATH=$CLASSPATH:$JAVA_HOME/lib:$JAVA_HOME/jre/lib
export HADOOP_HOME=/usr/local/hadoop-2.2.0
# set zookeeper environment
export ZOOKEEPER_HOME=/usr/local/zookeeper-3.4.5
export CLASSPATH=$CLASSPATH:$ZOOKEEPER_HOME/lib
# set hbase environment
export HBASE_HOME=/usr/local/hbase-0.98.8-hadoop2
# set hive environment
export HIVE_HOME=/usr/local/apache-hive-0.14.0-bin
export HCATALOG_HOME=/usr/local/apache-hive-0.14.0-bin/hcatalog
export CLASSPATH=$CLASSPATH:$HIVE_HOME/lib
export PATH=$JAVA_HOME/bin:$HADOOP_HOME/bin:$HADOOP_HOME/sbin:$ZOOKEEPER_HOME/bin:$HBASE_HOME/bin:$HIVE_HOME/bin:$HCATALOG_HOME/bin:$HCATALOG_HOME/sbin:$PATH
[hduser@master ~]$ cp /usr/local/apache-hive-0.14.0-bin/conf/hive-default.xml.template /usr/local/apache-hive-0.14.0-bin/conf/hive-site.xml
[hduser@master ~]$ vim /usr/local/apache-hive-0.14.0-bin/conf/hive-site.xml
[hduser@master ~]$ hdfs dfs -mkdir /tmp
[hduser@master ~]$ hdfs dfs -ls /
Found 2 items
drwxr-xr-x - hduser supergroup 0 2016-09-26 17:08 /hbase
drwxr-xr-x - hduser supergroup 0 2016-09-27 15:42 /tmp
[hduser@master ~]$ hdfs dfs -mkdir -p /user/hive/warehouse
[hduser@master ~]$ hdfs dfs -chmod g+w /tmp
[hduser@master ~]$ hdfs dfs -chmod g+w /user/hive/warehouse
[hduser@master ~]$ hdfs dfs -ls /
Found 3 items
drwxr-xr-x - hduser supergroup 0 2016-09-26 17:08 /hbase
drwxrwxr-x - hduser supergroup 0 2016-09-27 15:42 /tmp
drwxr-xr-x - hduser supergroup 0 2016-09-27 15:42 /user
[hduser@master ~]$ hdfs dfs -ls -R /user
drwxr-xr-x - hduser supergroup 0 2016-09-28 09:18 /user/hive
drwxrwxr-x - hduser supergroup 0 2016-09-28 09:18 /user/hive/warehouse
[hduser@master ~]$ vim /usr/local/apache-hive-0.14.0-bin/conf/hive-site.xml
[hduser@master ~]$ cp /usr/local/apache-hive-0.14.0-bin/conf/hive-log4j.properties.template /usr/local/apache-hive-0.14.0-bin/conf/hive-log4j.properties
[hduser@master ~]$ vim /usr/local/apache-hive-0.14.0-bin/conf/hive-log4j.properties
[hduser@master ~]$ mkdir /usr/local/apache-hive-0.14.0-bin/hcatalog/logs
[hduser@master ~]$ vim /usr/local/apache-hive-0.14.0-bin/hcatalog/sbin/hcat_server.sh
[hduser@master ~]$ grep HCAT_LOG_DIR /usr/local/apache-hive-0.14.0-bin/hcatalog/sbin/hcat_server.sh
HCAT_LOG_DIR=/usr/local/apache-hive-0.14.0-bin/hcatalog/logs
HCAT_PID_DIR=${HCAT_PID_DIR:-$HCAT_LOG_DIR}
export HADOOP_OPTS="${HADOOP_OPTS} -server -XX:+UseConcMarkSweepGC -XX:ErrorFile=${HCAT_LOG_DIR}/hcat_err_pid%p.log -Xloggc:${HCAT_LOG_DIR}/hcat_gc.log-`date +'%Y%m%d%H%M'` -verbose:gc -XX:+PrintGCDetails -XX:+PrintGCTimeStamps -XX:+PrintGCDateStamps"
nohup ${HIVE_HOME}/bin/hive --service metastore >${HCAT_LOG_DIR}/hcat.out 2>${HCAT_LOG_DIR}/hcat.err &
echo "Metastore startup failed, see ${HCAT_LOG_DIR}/hcat.err"
echo "Metastore startup failed, see ${HCAT_LOG_DIR}/hcat.err"
[hduser@master ~]$ vimdiff /usr/local/apache-hive-0.14.0-bin/conf/hive-default.xml.template /usr/local/apache-hive-0.14.0-bin/conf/hive-site.xml
|
|
hive.hwi.war.file | hive.hwi.war.file
${env:HWI_WAR_FILE} |
----------------------------------------------------------------------------| lib/hive-hwi-0.14.0.war
This sets the path to the HWI war file, relative to ${HIVE_| This sets the path to the HWI war file, relative to ${HIVE_
|
|
hive.mapred.local.mem | hive.mapred.local.mem
0 | 0
mapper/reducer memory in local mode | mapper/reducer memory in local mode
+ +--2178 lines: --------------------------------------------------|+ +--2178 lines: --------------------------------------------------
##################error#######################
[hduser@master ~]$ hive
16/09/28 09:30:12 INFO Configuration.deprecation: mapred.max.split.size is deprecated. Instead, use mapreduce.input.fileinputformat.split.maxsize
16/09/28 09:30:12 INFO Configuration.deprecation: mapred.reduce.tasks.speculative.execution is deprecated. Instead, use mapreduce.reduce.speculative
16/09/28 09:30:12 INFO Configuration.deprecation: mapred.committer.job.setup.cleanup.needed is deprecated. Instead, use mapreduce.job.committer.setup.cleanup.needed
16/09/28 09:30:12 INFO Configuration.deprecation: mapred.min.split.size.per.rack is deprecated. Instead, use mapreduce.input.fileinputformat.split.minsize.per.rack
16/09/28 09:30:12 INFO Configuration.deprecation: mapred.min.split.size is deprecated. Instead, use mapreduce.input.fileinputformat.split.minsize
16/09/28 09:30:12 INFO Configuration.deprecation: mapred.min.split.size.per.node is deprecated. Instead, use mapreduce.input.fileinputformat.split.minsize.per.node
16/09/28 09:30:12 INFO Configuration.deprecation: mapred.reduce.tasks is deprecated. Instead, use mapreduce.job.reduces
16/09/28 09:30:12 INFO Configuration.deprecation: mapred.input.dir.recursive is deprecated. Instead, use mapreduce.input.fileinputformat.input.dir.recursive
Logging initialized using configuration in file:/usr/local/apache-hive-0.14.0-bin/conf/hive-log4j.properties
SLF4J: Class path contains multiple SLF4J bindings.
SLF4J: Found binding in [jar:file:/usr/local/hadoop-2.2.0/share/hadoop/common/lib/slf4j-log4j12-1.7.5.jar!/org/slf4j/impl/StaticLoggerBinder.class]
SLF4J: Found binding in [jar:file:/usr/local/apache-hive-0.14.0-bin/lib/hive-jdbc-0.14.0-standalone.jar!/org/slf4j/impl/StaticLoggerBinder.class]
SLF4J: See http://www.slf4j.org/codes.html#multiple_bindings for an explanation.
SLF4J: Actual binding is of type [org.slf4j.impl.Log4jLoggerFactory]
Exception in thread "main" java.lang.RuntimeException: java.lang.IllegalArgumentException: java.net.URISyntaxException: Relative path in absolute URI: ${system:java.io.tmpdir%7D/$%7Bsystem:user.name%7D
at org.apache.hadoop.hive.ql.session.SessionState.start(SessionState.java:444)
at org.apache.hadoop.hive.cli.CliDriver.run(CliDriver.java:672)
at org.apache.hadoop.hive.cli.CliDriver.main(CliDriver.java:616)
at sun.reflect.NativeMethodAccessorImpl.invoke0(Native Method)
at sun.reflect.NativeMethodAccessorImpl.invoke(NativeMethodAccessorImpl.java:62)
at sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43)
at java.lang.reflect.Method.invoke(Method.java:497)
at org.apache.hadoop.util.RunJar.main(RunJar.java:212)
Caused by: java.lang.IllegalArgumentException: java.net.URISyntaxException: Relative path in absolute URI: ${system:java.io.tmpdir%7D/$%7Bsystem:user.name%7D
at org.apache.hadoop.fs.Path.initialize(Path.java:206)
at org.apache.hadoop.fs.Path.<init>(Path.java:172)
at org.apache.hadoop.hive.ql.session.SessionState.createSessionDirs(SessionState.java:487)
at org.apache.hadoop.hive.ql.session.SessionState.start(SessionState.java:430)
... 7 more
Caused by: java.net.URISyntaxException: Relative path in absolute URI: ${system:java.io.tmpdir%7D/$%7Bsystem:user.name%7D
at java.net.URI.checkPath(URI.java:1823)
at java.net.URI.<init>(URI.java:745)
at org.apache.hadoop.fs.Path.initialize(Path.java:203)
... 10 more
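[hduser@master ~]$ vim /usr/local/apache-hive-0.14.0-bin/conf/hive-site.xml
[hduser@master ~]$ vimdiff /usr/local/apache-hive-0.14.0-bin/conf/hive-site.xml /usr/local/apache-hive-0.14.0-bin/conf/hive-default.xml.template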
+-- 43 lines: --------|+ +-- 43 lines: --------
hive.exec.scratchdir | hive.exec.scratchdir
/tmp/hive | /tmp/hive
HDFS root scratch dir for Hive jobs which gets created with| HDFS root scratch dir for Hive jobs which gets created with
|
|
hive.exec.local.scratchdir | hive.exec.local.scratchdir
/tmp/hive/local | ${system:java.io.tmpdir}/${system:user.name}
Local scratch space for Hive jobs | Local scratch space for Hive jobs
|
|
hive.downloaded.resources.dir | hive.downloaded.resources.dir
/tmp/hive/resources | ${system:java.io.tmpdir}/${hive.session.id}_resources
Temporary local directory for added resources in the remote| Temporary local directory for added resources in the remote
|
|
hive.scratch.dir.permission | hive.scratch.dir.permission
700 | 700
The permission for the user specific scratch directories th| The permission for the user specific scratch directories th
+ +--1144 lines: --------------------------------------------------|+ +--1144 lines: --------------------------------------------------
hive.hwi.listen.port | hive.hwi.listen.port
9999 | 9999
This is the port the Hive Web Interface will listen on | This is the port the Hive Web Interface will listen on
|
hive.hwi.war.file | hive.hwi.war.file
| ${env:HWI_WAR_FILE}
lib/hive-hwi-0.14.0.war | ----------------------------------------------------------------------------
This sets the path to the HWI war file, relative to ${HIVE_| This sets the path to the HWI war file, relative to ${HIVE_
|
|
hive.mapred.local.mem | hive.mapred.local.mem
0 | 0
mapper/reducer memory in local mode | mapper/reducer memory in local mode
+ +--2178 lines: --------------------------------------------------|+ +--2178 lines: --------------------------------------------------
[hduser@master ~]$ hive
16/09/28 09:41:30 INFO Configuration.deprecation: mapred.max.split.size is deprecated. Instead, use mapreduce.input.fileinputformat.split.maxsize
16/09/28 09:41:30 INFO Configuration.deprecation: mapred.reduce.tasks.speculative.execution is deprecated. Instead, use mapreduce.reduce.speculative
16/09/28 09:41:30 INFO Configuration.deprecation: mapred.committer.job.setup.cleanup.needed is deprecated. Instead, use mapreduce.job.committer.setup.cleanup.needed
16/09/28 09:41:30 INFO Configuration.deprecation: mapred.min.split.size.per.rack is deprecated. Instead, use mapreduce.input.fileinputformat.split.minsize.per.rack
16/09/28 09:41:30 INFO Configuration.deprecation: mapred.min.split.size is deprecated. Instead, use mapreduce.input.fileinputformat.split.minsize
16/09/28 09:41:30 INFO Configuration.deprecation: mapred.min.split.size.per.node is deprecated. Instead, use mapreduce.input.fileinputformat.split.minsize.per.node
16/09/28 09:41:30 INFO Configuration.deprecation: mapred.reduce.tasks is deprecated. Instead, use mapreduce.job.reduces
16/09/28 09:41:30 INFO Configuration.deprecation: mapred.input.dir.recursive is deprecated. Instead, use mapreduce.input.fileinputformat.input.dir.recursive
Logging initialized using configuration in file:/usr/local/apache-hive-0.14.0-bin/conf/hive-log4j.properties
SLF4J: Class path contains multiple SLF4J bindings.
SLF4J: Found binding in [jar:file:/usr/local/hadoop-2.2.0/share/hadoop/common/lib/slf4j-log4j12-1.7.5.jar!/org/slf4j/impl/StaticLoggerBinder.class]
SLF4J: Found binding in [jar:file:/usr/local/apache-hive-0.14.0-bin/lib/hive-jdbc-0.14.0-standalone.jar!/org/slf4j/impl/StaticLoggerBinder.class]
SLF4J: See http://www.slf4j.org/codes.html#multiple_bindings for an explanation.
SLF4J: Actual binding is of type [org.slf4j.impl.Log4jLoggerFactory]
hive>
hive> CREATE TABLE pokes (foo INT, bar STRING);
OK
Time taken: 1.448 seconds
hive> SHOW TABLES;
OK
pokes
Time taken: 0.077 seconds, Fetched: 1 row(s)
hive> DESCRIBE pokes;
OK
foo int
bar string
Time taken: 0.418 seconds, Fetched: 2 row(s)
hive> ALTER TABLE pokes ADD COLUMNS (new_col INT);
OK
Time taken: 0.231 seconds
hive> DESCRIBE pokes;
OK
foo int
bar string
new_col int
Time taken: 0.096 seconds, Fetched: 3 row(s)
hive> DROP TABLE pokes;
OK
Time taken: 4.451 seconds
hive> quit;
[hduser@master ~]$ hcat
16/09/28 09:47:32 INFO Configuration.deprecation: mapred.max.split.size is deprecated. Instead, use mapreduce.input.fileinputformat.split.maxsize
16/09/28 09:47:32 INFO Configuration.deprecation: mapred.reduce.tasks.speculative.execution is deprecated. Instead, use mapreduce.reduce.speculative
16/09/28 09:47:32 INFO Configuration.deprecation: mapred.committer.job.setup.cleanup.needed is deprecated. Instead, use mapreduce.job.committer.setup.cleanup.needed
16/09/28 09:47:32 INFO Configuration.deprecation: mapred.min.split.size.per.rack is deprecated. Instead, use mapreduce.input.fileinputformat.split.minsize.per.rack
16/09/28 09:47:32 INFO Configuration.deprecation: mapred.min.split.size is deprecated. Instead, use mapreduce.input.fileinputformat.split.minsize
16/09/28 09:47:32 INFO Configuration.deprecation: mapred.min.split.size.per.node is deprecated. Instead, use mapreduce.input.fileinputformat.split.minsize.per.node
16/09/28 09:47:32 INFO Configuration.deprecation: mapred.reduce.tasks is deprecated. Instead, use mapreduce.job.reduces
16/09/28 09:47:32 INFO Configuration.deprecation: mapred.input.dir.recursive is deprecated. Instead, use mapreduce.input.fileinputformat.input.dir.recursive
SLF4J: Class path contains multiple SLF4J bindings.
SLF4J: Found binding in [jar:file:/usr/local/hadoop-2.2.0/share/hadoop/common/lib/slf4j-log4j12-1.7.5.jar!/org/slf4j/impl/StaticLoggerBinder.class]
SLF4J: Found binding in [jar:file:/usr/local/apache-hive-0.14.0-bin/lib/hive-jdbc-0.14.0-standalone.jar!/org/slf4j/impl/StaticLoggerBinder.class]
SLF4J: Found binding in [jar:file:/usr/local/hbase-0.98.8-hadoop2/lib/slf4j-log4j12-1.6.4.jar!/org/slf4j/impl/StaticLoggerBinder.class]
SLF4J: See http://www.slf4j.org/codes.html#multiple_bindings for an explanation.
SLF4J: Actual binding is of type [org.slf4j.impl.Log4jLoggerFactory]
usage: hcat { -e "<query>" | -f "<filepath>" } [ -g "<group>" ] [ -p "<perms>" ] [ -D"<name>=<value>" ]
-D <property=value> use hadoop value for given property
-e <exec> hcat command given from command line
-f <file> hcat commands in file
-g <group> group for the db/table specified in CREATE statement
-h,--help Print help information
-p <perms> permissions for the db/table specified in CREATE statement
#################启动hive服务###########
## hwi service
[hduser@master ~]$ nohup hive --service hwi > /dev/null 2> /dev/null &
## hcatalog service
[hduser@master ~]$ hcat_server.sh start
## webhcat service
[hduser@master ~]$ webhcat_server.sh start
###对应的三个进程号
[hduser@master ~]$ ps -ef |grep hive
hduser 22254 20439 1 10:30 pts/0 00:00:02 /usr/local/jdk1.8.0_45/bin/java -Xmx100m -Djava.net.preferIPv4Stack=true -Dhadoop.log.dir=/usr/local/hadoop-2.2.0/logs -Dhadoop.log.file=hadoop.log -Dhadoop.home.dir=/usr/local/hadoop-2.2.0 -Dhadoop.id.str=hduser -Dhadoop.root.logger=INFO,console -Djava.library.path=/usr/local/hadoop-2.2.0/lib/native -Dhadoop.policy.file=hadoop-policy.xml -Djava.net.preferIPv4Stack=true -Xmx512m -Dhadoop.security.logger=INFO,NullAppender org.apache.hadoop.util.RunJar /usr/local/apache-hive-0.14.0-bin/lib/hive-hwi-0.14.0.jar org.apache.hadoop.hive.hwi.HWIServer
hduser 22557 1 7 10:30 pts/0 00:00:18 /usr/local/jdk1.8.0_45/bin/java -Xmx100m -server -XX:+UseConcMarkSweepGC -XX:ErrorFile=/usr/local/apache-hive-0.14.0-bin/hcatalog/logs/hcat_err_pid%p.log -Xloggc:/usr/local/apache-hive-0.14.0-bin/hcatalog/logs/hcat_gc.log-201609281030 -verbose:gc -XX:+PrintGCDetails -XX:+PrintGCTimeStamps -XX:+PrintGCDateStamps -Djava.net.preferIPv4Stack=true -Dhadoop.log.dir=/usr/local/hadoop-2.2.0/logs -Dhadoop.log.file=hadoop.log -Dhadoop.home.dir=/usr/local/hadoop-2.2.0 -Dhadoop.id.str=hduser -Dhadoop.root.logger=INFO,console -Djava.library.path=/usr/local/hadoop-2.2.0/lib/native -Dhadoop.policy.file=hadoop-policy.xml -Djava.net.preferIPv4Stack=true -Xmx512m -Dhadoop.security.logger=INFO,NullAppender org.apache.hadoop.util.RunJar /usr/local/apache-hive-0.14.0-bin/lib/hive-service-0.14.0.jar org.apache.hadoop.hive.metastore.HiveMetaStore
hduser 22788 1 6 10:33 pts/0 00:00:06 /usr/local/jdk1.8.0_45/bin/java -Xmx100m -Dwebhcat.log.dir=. -Dlog4j.configuration=file:///usr/local/apache-hive-0.14.0-bin/hcatalog/sbin/../etc/webhcat/webhcat-log4j.properties -Djava.net.preferIPv4Stack=true -Dhadoop.log.dir=/usr/local/hadoop-2.2.0/logs -Dhadoop.log.file=hadoop.log -Dhadoop.home.dir=/usr/local/hadoop-2.2.0 -Dhadoop.id.str=hduser -Dhadoop.root.logger=INFO,console -Djava.library.path=/usr/local/hadoop-2.2.0/lib/native -Dhadoop.policy.file=hadoop-policy.xml -Djava.net.preferIPv4Stack=true -Xmx512m -Dhadoop.security.logger=INFO,NullAppender org.apache.hadoop.util.RunJar /usr/local/apache-hive-0.14.0-bin/hcatalog/sbin/../share/webhcat/svr/lib/hive-webhcat-0.14.0.jar org.apache.hive.hcatalog.templeton.Main
hduser 22841 20439 0 10:34 pts/0 00:00:00 grep hive
### hive的三种存储方式,请自行百度
########## mahout 集成############
[hduser@master ~]$ tar zxvf apache-mahout-1.0-bin.tar.gz
[hduser@master ~]$ sudo mv apache-mahout-1.0-bin /usr/local/
[sudo] password for hduser:
[hduser@master ~]$ sudo chown -R hduser:hadoop /usr/local/apache-mahout-1.0-bin
[hduser@master ~]$ sudo vim /etc/profile
[hduser@master ~]$ tail -n 22 /etc/profile
# set jdk and hadoop environment
export JAVA_HOME=/usr/local/jdk1.8.0_45
export CLASSPATH=$CLASSPATH:$JAVA_HOME/lib:$JAVA_HOME/jre/lib
export HADOOP_HOME=/usr/local/hadoop-2.2.0
# set zookeeper environment
export ZOOKEEPER_HOME=/usr/local/zookeeper-3.4.5
export CLASSPATH=$CLASSPATH:$ZOOKEEPER_HOME/lib
# set hbase environment
export HBASE_HOME=/usr/local/hbase-0.98.8-hadoop2
# set hive environment
export HIVE_HOME=/usr/local/apache-hive-0.14.0-bin
export HCATALOG_HOME=/usr/local/apache-hive-0.14.0-bin/hcatalog
export CLASSPATH=$CLASSPATH:$HIVE_HOME/lib
# set mahout environment
export MAHOUT_HOME=/usr/local/apache-mahout-1.0-bin
#export MAHOUT_LOCAL=$MAHOUT_HOME
export PATH=$JAVA_HOME/bin:$HADOOP_HOME/bin:$HADOOP_HOME/sbin:$ZOOKEEPER_HOME/bin:$HBASE_HOME/bin:$HIVE_HOME/bin:$HCATALOG_HOME/bin:$HCATALOG_HOME/sbin:$MAHOUT_HOME/bin:$MAHOUT_LOCAL/bin:$PATH
[hduser@master ~]$ source /etc/profile
[hduser@master ~]$ wget -c http://archive.ics.uci.edu/ml/databases/synthetic_control/synthetic_control.data
[hduser@master ~]$ mv synthetic_control.data $MAHOUT_HOME
[hduser@master ~]$ cd $MAHOUT_HOME
[hduser@master apache-mahout-1.0-bin]$ ls synthetic_control.data -l
-rw-r--r--. 1 hduser hadoop 288374 Jun 15 1999 synthetic_control.data
[hduser@master ~]$ mahout --help
Running on hadoop, using /usr/local/hadoop-2.2.0/bin/hadoop and HADOOP_CONF_DIR=
MAHOUT-JOB: /usr/local/apache-mahout-1.0-bin/examples/target/mahout-examples-1.0-SNAPSHOT-job.jar
Unknown program '--help' chosen.
Valid program names are:
arff.vector: : Generate Vectors from an ARFF file or directory
baumwelch: : Baum-Welch algorithm for unsupervised HMM training
buildforest: : Build the random forest classifier
canopy: : Canopy clustering
cat: : Print a file or resource as the logistic regression models would see it
cleansvd: : Cleanup and verification of SVD output
clusterdump: : Dump cluster output to text
clusterpp: : Groups Clustering Output In Clusters
cmdump: : Dump confusion matrix in HTML or text formats
concatmatrices: : Concatenates 2 matrices of same cardinality into a single matrix
cvb: : LDA via Collapsed Variation Bayes (0th deriv. approx)
cvb0_local: : LDA via Collapsed Variation Bayes, in memory locally.
describe: : Describe the fields and target variable in a data set
evaluateFactorization: : compute RMSE and MAE of a rating matrix factorization against probes
fkmeans: : Fuzzy K-means clustering
hmmpredict: : Generate random sequence of observations by given HMM
itemsimilarity: : Compute the item-item-similarities for item-based collaborative filtering
kmeans: : K-means clustering
lucene.vector: : Generate Vectors from a Lucene index
lucene2seq: : Generate Text SequenceFiles from a Lucene index
matrixdump: : Dump matrix in CSV format
matrixmult: : Take the product of two matrices
parallelALS: : ALS-WR factorization of a rating matrix
qualcluster: : Runs clustering experiments and summarizes results in a CSV
recommendfactorized: : Compute recommendations using the factorization of a rating matrix
recommenditembased: : Compute recommendations using item-based collaborative filtering
regexconverter: : Convert text files on a per line basis based on regular expressions
resplit: : Splits a set of SequenceFiles into a number of equal splits
rowid: : Map SequenceFile to {SequenceFile, SequenceFile}
rowsimilarity: : Compute the pairwise similarities of the rows of a matrix
runAdaptiveLogistic: : Score new production data using a probably trained and validated AdaptivelogisticRegression model
runlogistic: : Run a logistic regression model against CSV data
seq2encoded: : Encoded Sparse Vector generation from Text sequence files
seq2sparse: : Sparse Vector generation from Text sequence files
seqdirectory: : Generate sequence files (of Text) from a directory
seqdumper: : Generic Sequence File dumper
seqmailarchives: : Creates SequenceFile from a directory containing gzipped mail archives
seqwiki: : Wikipedia xml dump to sequence file
spectralkmeans: : Spectral k-means clustering
split: : Split Input data into test and train sets
splitDataset: : split a rating dataset into training and probe parts
ssvd: : Stochastic SVD
streamingkmeans: : Streaming k-means clustering
svd: : Lanczos Singular Value Decomposition
testforest: : Test the random forest classifier
testnb: : Test the Vector-based Bayes classifier
trainAdaptiveLogistic: : Train an AdaptivelogisticRegression model
trainlogistic: : Train a logistic regression using stochastic gradient descent
trainnb: : Train the Vector-based Bayes classifier
transpose: : Take the transpose of a matrix
validateAdaptiveLogistic: : Validate an AdaptivelogisticRegression model against hold-out data set
vecdist: : Compute the distances between a set of Vectors (or Cluster or Canopy, they must fit in memory) and a list of Vectors
vectordump: : Dump vectors from a sequence file to text
viterbi: : Viterbi decoding of hidden states from given output states sequence
#### mahout error
[hduser@master ~]$ mahout --help
MAHOUT_LOCAL is set, so we don't add HADOOP_CONF_DIR to classpath.
MAHOUT_LOCAL is set, running locally
Error occurred during initialization of VM
Could not reserve enough space for 3145728KB object heap
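出现上述错误的原因:设置了 MAHOUT_LOCAL 后,mahout 会以本地模式运行,JVM 会申请 3145728KB(3GB)的堆内存,而 32 位系统无法分配这么大的堆。请修改 /etc/profile,不要设置 MAHOUT_LOCAL(将其注释掉或置空),修改后需重新登录或执行 unset MAHOUT_LOCAL 使其生效。修改成如下: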
# set mahout environment
export MAHOUT_HOME=/usr/local/apache-mahout-1.0-bin
#export MAHOUT_LOCAL=$MAHOUT_HOME
export PATH=$JAVA_HOME/bin:$HADOOP_HOME/bin:$HADOOP_HOME/sbin:$ZOOKEEPER_HOME/bin:$HBASE_HOME/bin:$HIVE_HOME/bin:$HCATALOG_HOME/bin:$HCATALOG_HOME/sbin:$MAHOUT_HOME/bin:$MAHOUT_LOCAL/bin:$PATH
###########################################################
#######################################################
########### mahout的使用方法 #######################
#######################################################
[hduser@master ~]$ hdfs dfs -mkdir -p /user/hduser/testdata
[hduser@master ~]$ wget -c http://archive.ics.uci.edu/ml/databases/synthetic_control/synthetic_control.data
## 以下两条 put 命令二选一(数据文件在哪个目录就用哪一条;重复上传同一文件会提示 File exists)
[hduser@master ~]$ hdfs dfs -put ~/synthetic_control.data /user/hduser/testdata
[hduser@master ~]$ hdfs dfs -put /usr/local/apache-mahout-1.0-bin/synthetic_control.data /user/hduser/testdata
[hduser@master ~]$ hdfs dfs -mkdir -p /user/hduser/output
[hduser@master apache-mahout-1.0-bin]$ hadoop fs -ls output
Found 15 items
-rw-r--r-- 3 hduser supergroup 194 2016-09-28 11:32 output/_policy
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:32 output/clusteredPoints
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:28 output/clusters-0
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:28 output/clusters-1
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:32 output/clusters-10-final
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:28 output/clusters-2
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:29 output/clusters-3
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:29 output/clusters-4
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:30 output/clusters-5
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:30 output/clusters-6
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:31 output/clusters-7
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:31 output/clusters-8
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:31 output/clusters-9
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:28 output/data
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:28 output/random-seeds
[hduser@master apache-mahout-1.0-bin]$ hdfs dfs -ls output
Found 15 items
-rw-r--r-- 3 hduser supergroup 194 2016-09-28 11:32 output/_policy
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:32 output/clusteredPoints
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:28 output/clusters-0
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:28 output/clusters-1
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:32 output/clusters-10-final
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:28 output/clusters-2
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:29 output/clusters-3
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:29 output/clusters-4
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:30 output/clusters-5
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:30 output/clusters-6
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:31 output/clusters-7
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:31 output/clusters-8
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:31 output/clusters-9
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:28 output/data
drwxr-xr-x - hduser supergroup 0 2016-09-28 11:28 output/random-seeds
[hduser@master ~]$ mahout -core org.apache.mahout.clustering.syntheticcontrol.kmeans.Job
........................等待几分钟,作业运行结束后,结果位于 HDFS 的 output 目录(即上面 ls 所列出的内容)....................
[hduser@master ~]$ mahout clusterdump --input /user/hduser/output/clusters-10-final --pointsDir /user/hduser/output/clusteredPoints --output /home/hduser/clusteranalyze.txt
Running on hadoop, using /usr/local/hadoop-2.2.0/bin/hadoop and HADOOP_CONF_DIR=
MAHOUT-JOB: /usr/local/apache-mahout-1.0-bin/examples/target/mahout-examples-1.0-SNAPSHOT-job.jar
16/09/28 11:42:23 INFO common.AbstractJob: Command line arguments: {--dictionaryType=[text], --distanceMeasure=[org.apache.mahout.common.distance.SquaredEuclideanDistanceMeasure], --endPhase=[2147483647], --input=[/user/hduser/output/clusters-10-final], --output=[/home/hduser/clusteranalyze.txt], --outputFormat=[TEXT], --pointsDir=[/user/hduser/output/clusteredPoints], --startPhase=[0], --tempDir=[temp]}
16/09/28 11:42:26 INFO clustering.ClusterDumper: Wrote 6 clusters
16/09/28 11:42:26 INFO driver.MahoutDriver: Program took 2365 ms (Minutes: 0.03941666666666667)
[hduser@master ~]$ ls -l clusteranalyze.txt
-rw-r--r--. 1 hduser hadoop 318737 Sep 28 11:42 clusteranalyze.txt
[hduser@master ~]$ ls -lh clusteranalyze.txt
-rw-r--r--. 1 hduser hadoop 312K Sep 28 11:42 clusteranalyze.txt
[hduser@master ~]$ mahout clusterdump -i /user/hduser/output/clusters-10-final -p /user/hduser/output/clusteredPoints -o /home/hduser/clusteranalyze.txt
[hduser@master ~]$ cat clusteranalyze.txt |wc -l
612
[hduser@master ~]$ cat clusteranalyze.txt |more