1.停止防火墙
systemctl stop firewalld.service
systemctl disable firewalld.service
2.selinux改为disable
vi /etc/selinux/config
SELINUX=disabled
3.配置java
另一个博客里
4.修改ip和hostname
另一博客里
5.ssh免密码登录
useradd hadoop
passwd hadoop输入两次密码
vi /etc/sudoers
这样hadoop用户就可以用 sudo 命令
root ALL=(ALL) ALL hadoop ALL=(ALL) NOPASSWD: ALL #加上nopasswd使用sudo时不用密码 hadoop用户
ssh localhost
cd ~
ssh-keygen -t rsa -P '' -f .ssh/id_rsa
cat .ssh/id_rsa.pub >> .ssh/authorized_keys
chmod 600 .ssh/authorized_keys
6.安装伪分布式hadoop
vi /etc/profile
export HADOOP_HOME=/usr/local/hadoop export PATH=$HADOOP_HOME/sbin:$HADOOP_HOME/bin:$PATH cd /usr/local/hadoop
sudo mkdir dfs
cd dfs
sudo mkdir name
sudo mkdir data
cd /usr/local/hadoop/etc/hadoop
6.1添加java_home
在hadoop-env.sh,yarn-env.sh,mapred-env.sh中添加java_home
6.2修改core-site.xml
<configuration> <property> <name>fs.defaultFS</name> <value>hdfs://master:9000</value> </property> <property> <name>hadoop.tmp.dir</name> <value>/usr/local/hadoop/tmp</value> </property> </configuration> 6.3修改hdfs-site.xml
<configuration> <property> <name>dfs.replication</name> <value>1</value> </property> <property> <name>hadoop.namenode.name.dir</name> <value>/usr/local/hadoop/dfs/name</value> </property> <property> <name>hadoop.datanode.data.dir</name> <value>/usr/local/hadoop/dfs/data</value> </property> </configuration> 6.4修改mapred-site.xml
sudo cp mapred-site.xml.template mapred-site.xml
<configuration> <property> <name>mapreduce.framework.name</name> <value>yarn</value> </property> </configuration> 6.5 修改yarn-site.xml<configuration> <!-- Site specific YARN configuration properties --> <property> <name>yarn.resourcemanager.hostname</name> <value>master</value> </property> <property> <name>yarn.nodemanager.aux-services</name> <value>mapreduce_shuffle</value> </property> </configuration> 7格式化hdfs系统
hadoop namenode -format
8.启动hadoop
cd /usr/local/hadoop/sbin
./start-all.sh