Ubuntu與Hadoop的兼容性非常好。Ubuntu是一個廣泛使用的Linux發行版,擁有龐大的用戶社區和豐富的文檔資源,這使得在Ubuntu上安裝和配置Hadoop變得更加容易。以下是關於在Ubuntu上安裝Hadoop的詳細步驟:
在安裝Hadoop之前,需要確保系統滿足以下要求:已安裝Java(OpenJDK 8)和SSH服務,並且當前用戶可以免密碼通過SSH登入本機:
# Install the prerequisites: a Java 8 JDK to run Hadoop, and an SSH server,
# which Hadoop's start-*.sh scripts use to launch the daemons on localhost.
sudo apt update
sudo apt install openjdk-8-jdk
sudo apt install openssh-server

# Set up password-less SSH to localhost. The key must have an empty
# passphrase (-P ''), otherwise the start scripts stop at a prompt.
# An existing key is reused rather than overwritten.
[ -f ~/.ssh/id_rsa ] || ssh-keygen -t rsa -P '' -f ~/.ssh/id_rsa
cat ~/.ssh/id_rsa.pub >> ~/.ssh/authorized_keys
# sshd ignores authorized_keys when it is group/world writable.
chmod 0600 ~/.ssh/authorized_keys

# Download Hadoop 3.3.4 from the Apache archive: mirrors only carry current
# releases, while the archive keeps every published version.
wget https://archive.apache.org/dist/hadoop/common/hadoop-3.3.4/hadoop-3.3.4.tar.gz

# /opt is root-owned, so unpacking needs sudo just like the rename does.
sudo tar -zxvf hadoop-3.3.4.tar.gz -C /opt/
sudo mv /opt/hadoop-3.3.4 /opt/hadoop
# Hand the tree to the current user so the daemons (run as this user, who
# owns the SSH key above) can write their logs and data under /opt/hadoop.
sudo chown -R "$USER" /opt/hadoop

# Make the Hadoop commands available in every new shell, and in this one.
echo 'export HADOOP_HOME=/opt/hadoop' >> ~/.bashrc
echo 'export PATH=$PATH:$HADOOP_HOME/bin:$HADOOP_HOME/sbin' >> ~/.bashrc
source ~/.bashrc

# Set JAVA_HOME inside hadoop-env.sh. Exporting it only in the current shell
# is not enough, because daemons started over SSH do not inherit this
# shell's environment.
echo 'export JAVA_HOME=/usr/lib/jvm/java-8-openjdk-amd64' >> /opt/hadoop/etc/hadoop/hadoop-env.sh
<!-- Presumably the contents of /opt/hadoop/etc/hadoop/core-site.xml
     (standard Hadoop layout; confirm against the Hadoop setup guide).
     fs.defaultFS points clients at the HDFS instance on localhost, port 9000. -->
<configuration>
<property>
<name>fs.defaultFS</name>
<value>hdfs://localhost:9000</value>
</property>
</configuration>
<!-- Presumably the contents of /opt/hadoop/etc/hadoop/hdfs-site.xml
     (standard Hadoop layout; confirm against the Hadoop setup guide).
     dfs.replication is set to 1, i.e. a single copy of each block, which
     fits a one-machine installation. -->
<configuration>
<property>
<name>dfs.replication</name>
<value>1</value>
</property>
</configuration>
<!-- Presumably the contents of /opt/hadoop/etc/hadoop/mapred-site.xml
     (standard Hadoop layout; confirm against the Hadoop setup guide).
     mapreduce.framework.name selects YARN as the MapReduce execution framework. -->
<configuration>
<property>
<name>mapreduce.framework.name</name>
<value>yarn</value>
</property>
</configuration>
<!-- Presumably the contents of /opt/hadoop/etc/hadoop/yarn-site.xml
     (standard Hadoop layout; confirm against the Hadoop setup guide).
     yarn.resourcemanager.hostname places the ResourceManager on localhost.
     NOTE(review): running MapReduce jobs on YARN usually also requires
     yarn.nodemanager.aux-services = mapreduce_shuffle; verify and add if
     jobs are expected to run. -->
<configuration>
<property>
<name>yarn.resourcemanager.hostname</name>
<value>localhost</value>
</property>
</configuration>
# Format the NameNode and start the HDFS and YARN daemons.
#
# Run these as the same user that created the SSH key and the ~/.bashrc
# entries earlier: no separate "hadoop" account is created in these steps,
# and sudo would also drop the PATH/HADOOP_HOME set in ~/.bashrc.
# Absolute paths are used so the commands work from any directory;
# /opt/hadoop is the fallback when HADOOP_HOME is not set in this shell.
#
# Formatting is a first-time step only: re-running it on an existing
# installation discards the current HDFS metadata.
# "hdfs namenode" replaces the deprecated "hadoop namenode" spelling.
"${HADOOP_HOME:-/opt/hadoop}/bin/hdfs" namenode -format
"${HADOOP_HOME:-/opt/hadoop}/sbin/start-dfs.sh"
"${HADOOP_HOME:-/opt/hadoop}/sbin/start-yarn.sh"