Ubuntu Hadoop 网络参数配置
一 基础网络与主机名解析
# Netplan static-address configuration for the master node (192.168.1.100).
# NOTE(review): presumably stored under /etc/netplan/ and applied with
# `sudo netplan apply` - confirm the file name used on the target host.
network:
  version: 2
  ethernets:
    # NOTE(review): interface name kept from the original; many Ubuntu
    # installs use predictable names (ens33, enp0s3, ...) - verify with `ip link`.
    eth0:
      # Static addressing: DHCP for IPv4 is disabled.
      dhcp4: false
      addresses: [192.168.1.100/24]
      # Default route. This replaces the deprecated `gateway4` key.
      # On older netplan releases that do not accept `default`,
      # use `to: 0.0.0.0/0` instead.
      routes:
        - to: default
          via: 192.168.1.1
      nameservers:
        addresses: [8.8.8.8, 1.1.1.1]
# Static name resolution for the three cluster nodes.
# The name `master` is what the Hadoop configuration values refer to.
# NOTE(review): presumably appended to /etc/hosts on every node - confirm.
# NOTE(review): if a node's own host name is also mapped to 127.0.1.1,
# daemons may bind to loopback - verify and remove such a line if present.
192.168.1.100   master
192.168.1.101   slave1
192.168.1.102   slave2
二 Hadoop 关键网络参数配置
core-site.xml
<?xml version="1.0" encoding="UTF-8"?>
<configuration>

  <!-- Default file system URI; either a host name or an IP address works. -->
  <property>
    <name>fs.defaultFS</name>
    <value>hdfs://master:8020</value>
  </property>

</configuration>
hdfs-site.xml
<?xml version="1.0" encoding="UTF-8"?>
<configuration>

  <!-- Replica count; 3 is the usual production value.
       NOTE(review): a replica count of 3 needs at least three DataNodes;
       only slave1 and slave2 appear as workers here - confirm whether
       master also runs a DataNode. -->
  <property>
    <name>dfs.replication</name>
    <value>3</value>
  </property>

  <!-- NameNode RPC address (host name); same host and port as fs.defaultFS. -->
  <property>
    <name>dfs.namenode.rpc-address</name>
    <value>master:8020</value>
  </property>

  <!-- NameNode HTTP UI.
       NOTE(review): 50070, 50010 and 50020 look like the Hadoop 2.x default
       ports; Hadoop 3.x defaults differ (9870, 9866, 9867) - confirm the
       target version. -->
  <property>
    <name>dfs.namenode.http-address</name>
    <value>master:50070</value>
  </property>

  <!-- DataNode data transfer port; listens on all interfaces. -->
  <property>
    <name>dfs.datanode.address</name>
    <value>0.0.0.0:50010</value>
  </property>

  <!-- DataNode IPC; listens on all interfaces. -->
  <property>
    <name>dfs.datanode.ipc.address</name>
    <value>0.0.0.0:50020</value>
  </property>

  <!-- Optional: disable the IP/host name check. Use only when the network
       requires direct IP connections and DNS/hosts entries are inconsistent. -->
  <!-- <property>
    <name>dfs.namenode.datanode.registration.ip-hostname-check</name>
    <value>false</value>
  </property> -->

</configuration>
yarn-site.xml
<?xml version="1.0" encoding="UTF-8"?>
<configuration>

  <!-- Host name of the ResourceManager. -->
  <property>
    <name>yarn.resourcemanager.hostname</name>
    <value>master</value>
  </property>

  <!-- Shuffle service: register the auxiliary service on the NodeManager... -->
  <property>
    <name>yarn.nodemanager.aux-services</name>
    <value>mapreduce_shuffle</value>
  </property>

  <!-- ...and name the class that implements it. -->
  <property>
    <name>yarn.nodemanager.aux-services.mapreduce_shuffle.class</name>
    <value>org.apache.hadoop.mapred.ShuffleHandler</value>
  </property>

</configuration>
mapred-site.xml
<?xml version="1.0" encoding="UTF-8"?>
<configuration>

  <!-- Use YARN as the execution framework. -->
  <property>
    <name>mapreduce.framework.name</name>
    <value>yarn</value>
  </property>

</configuration>
三 系统级网络优化(可选)
# Optional kernel network tuning for the cluster nodes.
# NOTE(review): presumably placed in /etc/sysctl.conf or a drop-in under
# /etc/sysctl.d/ and loaded with `sudo sysctl --system` - confirm.

# Widen the ephemeral (outgoing) port range.
net.ipv4.ip_local_port_range = 1024 65535
# The range above covers the Hadoop listening ports configured in this
# document (8020, 50010, 50020, 50070). Reserve them so an outgoing
# connection cannot occupy one before its daemon binds to it.
# Extend the list with any other fixed ports the cluster listens on
# (for example the YARN daemons).
net.ipv4.ip_local_reserved_ports = 8020,50010,50020,50070

# Upper bound on the accept queue of a listening socket.
# NOTE(review): recent kernels may already default to a higher value than
# 1024 - check `sysctl net.core.somaxconn` before lowering it.
net.core.somaxconn = 1024
# Packets queued per CPU when the interface receives faster than the kernel processes.
net.core.netdev_max_backlog = 1024
# Queue length for connection requests that are not yet acknowledged.
net.ipv4.tcp_max_syn_backlog = 1024
# Fall back to SYN cookies when the SYN backlog overflows.
net.ipv4.tcp_syncookies = 1
# Allow reuse of TIME-WAIT sockets for new outgoing connections.
net.ipv4.tcp_tw_reuse = 1
# Seconds an orphaned connection stays in FIN-WAIT-2.
net.ipv4.tcp_fin_timeout = 30
四 启动与验证