Hadoop-基础教程

centos7下载 http://cloud.centos.org/centos/7/vagrant/x86_64/images/CentOS-7-x86_64-Vagrant-2002_01.VirtualBox.box

jdk下载 https://www.oracle.com/java/technologies/javase-jdk8-downloads.html

hadoop下载 https://archive.cloudera.com/cdh5/cdh/5/hadoop-2.6.0-cdh5.16.2.tar.gz

hive下载 https://archive.cloudera.com/cdh5/cdh/5/hive-1.1.0-cdh5.16.2.tar.gz
vagrant box add centos7 CentOS-7-x86_64-Vagrant-2002_01.VirtualBox.box
vagrant box list
vagrant init centos7
vagrant up
vagrant ssh
tar zxvf ~/software/jdk-8u241-linux-x64.tar.gz -C ~/app/
tar zxvf ~/software/hadoop-2.6.0-cdh5.16.2.tar.gz -C ~/app/
tar zxvf ~/software/hive-1.1.0-cdh5.16.2.tar.gz -C ~/app/

### 配置ssh
ssh-keygen
cat ~/.ssh/id_rsa.pub >> ~/.ssh/authorized_keys
chmod 0600 ~/.ssh/authorized_keys

### 配置 ~/.bash_profile
#### java环境变量
export JAVA_HOME=~/app/jdk1.8.0_241
export PATH=$JAVA_HOME/bin:$PATH

### 验证
java -version

### hadoop环境变量
export HADOOP_HOME=~/app/hadoop-2.6.0-cdh5.16.2
export PATH=$HADOOP_HOME/bin:$PATH

### 配置 etc/hadoop/hadoop-env.sh
export JAVA_HOME=~/app/jdk1.8.0_241

### 配置 etc/hadoop/core-site.xml:
<configuration>
<property>
<name>fs.defaultFS</name>
<value>hdfs://hadoop001:8020</value>
</property>
<property>
<name>hadoop.tmp.dir</name>
<value>/home/vagrant/app/tmp</value>
</property>
</configuration>

### 配置 etc/hadoop/hdfs-site.xml:
<configuration>
<property>
<name>dfs.replication</name>
<value>1</value>
</property>
</configuration>

### 第一次启动前格式化 NameNode
hdfs namenode -format

### 启动服务
sbin/start-dfs.sh

### 查看服务
jps

### 查看运行状态
http://localhost:50070/

### hadoop 常用命令
hadoop fs -ls /
hadoop fs -put
hadoop fs -copyFromLocal
hadoop fs -moveFromLocal
hadoop fs -cat
hadoop fs -text
hadoop fs -get
hadoop fs -mkdir
hadoop fs -mv
hadoop fs -getmerge
hadoop fs -rm
hadoop fs -rmdir
hadoop fs -rm -r

推送数据到hdfs

hadoop fs -mkdir -p /wordcount/input
hadoop fs -put data/test.txt /wordcount/input

代码

1
2


您的支持将鼓励我继续创作