#!/usr/bin/env bash
#
# Sets up a local Hadoop distribution and writes HDFS configuration
# templates (hdfs-site.xml, core-site.xml, mapred-site.xml) into it.
#
# Paths below are relative, so the script has to be run from the directory
# that contains setup.sh.

# -u: unset variables are errors, -e: abort on failure,
# -o pipefail: a pipeline fails if any stage fails.
set -ueo pipefail

# Hadoop release to fetch, its archive name, download URL and expected
# checksum. NOTE(review): the 128-hex-digit value looks like a SHA-512
# digest -- confirm against compare_checksum.
HADOOP_VERSION="2.10.1"
HADOOP_FILE="hadoop-$HADOOP_VERSION.tar.gz"
HADOOP_URL="https://artfiles.org/apache.org/hadoop/common/hadoop-${HADOOP_VERSION}/${HADOOP_FILE}"
HADOOP_FILE_CKSUM="2460e02cd1f80dfed7a8981bbc934c095c0a341435118bec781fd835ec2ebdc5543a03d92d24f2ddeebdfe1c2c460065ba1d394ed9a73cbb2020b40a8d8b5e07"

# Destination files for the generated configuration templates.
HDFS_CONFIG_TEMPLATE="hadoop/etc/hadoop/hdfs-site.xml"
HDFS_CONFIG_TEMPLATE_CORE="hadoop/etc/hadoop/core-site.xml"
HDFS_CONFIG_TEMPLATE_MAPRED="hadoop/etc/hadoop/mapred-site.xml"

# NOTE(review): this value is later passed to write_file as its first
# argument, like the paths above -- confirm that "localhost" is really the
# intended target and not a path inside hadoop/etc/hadoop/.
HDFS_CONFIG_DATANODES="localhost"

# Presence of this file marks Hadoop as already installed.
HDFS_TEST_SUITE_EXECUTABLE="hadoop/bin/hdfs"

# check_dependencies, compare_checksum, extract_archive and write_file are
# not defined in this file; presumably setup.sh provides them.
# shellcheck source=setup.sh
source setup.sh

# External programs this script depends on.
# NOTE(review): presumably read by check_dependencies -- confirm in setup.sh.
# shellcheck disable=SC2034
declare -a DEPS=("java" "ansible-playbook")

#######################################
# Prints the core-site.xml template to stdout.
#
# The {{ ... }} placeholders are emitted literally; they are not expanded
# here (presumably a template engine fills them in later).
#
# The heredoc is streamed with cat instead of `read -r -d '' CONFIG`:
# read always returns non-zero when it hits EOF before the delimiter, which
# aborts the script under `set -e` whenever the function is called outside a
# command substitution, and it also left a global CONFIG behind.
#
# NOTE(review): dfs.journalnode.edits.dir is "/.tmp/hadoop" while
# hdfs-site.xml uses "/tmp/..." paths -- confirm the leading dot is intended.
#
# Globals:   none
# Arguments: none
# Outputs:   the XML document on stdout
# Returns:   0 on success
#######################################
create_hdfs_core_config_template() {
  #printf "Writing HDFS core-site.xml config\n"
  # Quoted delimiter: the body is taken verbatim, no shell expansion.
  cat <<'EOF'
<?xml version="1.0" encoding="UTF-8"?>
<?xml-stylesheet type="text/xsl" href="configuration.xsl"?>
<configuration>
    <property>
        <name>fs.defaultFS</name>
        <value>hdfs://{{ cluster_id }}</value>
    </property>
    <property>
        <name>dfs.journalnode.edits.dir</name>
        <value>/.tmp/hadoop</value>
    </property>
</configuration>
EOF
}

#######################################
# Prints the mapred-site.xml template to stdout.
#
# The {{ ... }} placeholder is emitted literally; it is not expanded here
# (presumably a template engine fills it in later).
#
# The heredoc is streamed with cat instead of `read -r -d '' CONFIG`:
# read always returns non-zero when it hits EOF before the delimiter, which
# aborts the script under `set -e` whenever the function is called outside a
# command substitution, and it also left a global CONFIG behind.
#
# NOTE(review): this template uses {{ cluster_ha_id }} whereas the core and
# hdfs templates use {{ cluster_id }} -- confirm both variables exist.
#
# Globals:   none
# Arguments: none
# Outputs:   the XML document on stdout
# Returns:   0 on success
#######################################
create_hdfs_mapred_config_template() {
  #printf "Writing HDFS mapred-site.xml config\n"
  # Quoted delimiter: the body is taken verbatim, no shell expansion.
  cat <<'EOF'
<?xml version="1.0" encoding="UTF-8"?>
<?xml-stylesheet type="text/xsl" href="configuration.xsl"?>
<configuration>
    <property>
        <name>fs.defaultFS</name>
        <value>hdfs://{{ cluster_ha_id }}</value>
    </property>
</configuration>
EOF
}

#######################################
# Prints the hdfs-site.xml template to stdout.
#
# The template declares one nameservice ({{ cluster_id }}) with two
# namenodes (nn1, nn2), their RPC and HTTP addresses, local storage
# directories, the shared edits directory and the ZooKeeper quorum.
# The {{ ... }} placeholders are emitted literally; they are not expanded
# here (presumably a template engine fills them in later).
#
# The heredoc is streamed with cat instead of `read -r -d '' CONFIG`:
# read always returns non-zero when it hits EOF before the delimiter, which
# aborts the script under `set -e` whenever the function is called outside a
# command substitution, and it also left a global CONFIG behind.
#
# NOTE(review): dfs.namenode.http-address.*.nn1/nn2 are each defined twice
# (ports 50070 and 9870). Both definitions are kept unchanged here -- confirm
# which port is intended for the Hadoop version in use and drop the other.
#
# Globals:   none
# Arguments: none
# Outputs:   the XML document on stdout
# Returns:   0 on success
#######################################
create_hdfs_config_template() {
  #printf "Writing HDFS hdfs-site.xml config\n"
  # Quoted delimiter: the body is taken verbatim, no shell expansion.
  cat <<'EOF'
<?xml version="1.0" encoding="UTF-8"?>
<?xml-stylesheet type="text/xsl" href="configuration.xsl"?>
<configuration>
    <property>
        <name>dfs.nameservices</name>
        <value>{{ cluster_id }}</value>
    </property>
    <property>
        <name>dfs.ha.namenodes.{{ cluster_id }}</name>
        <value>nn1,nn2</value>
    </property>
    <property>
        <name>fs.defaultFS</name>
        <value>hdfs://{{ cluster_id }}</value>
    </property>
    <property>
        <name>dfs.namenode.rpc-address.{{ cluster_id }}.nn1</name>
        <value>{{ namenode_1 }}:8020</value>
    </property>
    <property>
        <name>dfs.namenode.rpc-address.{{ cluster_id }}.nn2</name>
        <value>{{ namenode_2 }}:8020</value>
    </property>
    <property>
        <name>dfs.namenode.http-address.{{ cluster_id }}.nn1</name>
        <value>{{ namenode_1 }}:50070</value>
    </property>
    <property>
        <name>dfs.namenode.http-address.{{ cluster_id }}.nn2</name>
        <value>{{ namenode_2}}:50070</value>
    </property>
    <property>
        <name>dfs.namenode.http-address.{{ cluster_id }}.nn1</name>
        <value>{{ namenode_1 }}:9870</value>
    </property>
    <property>
        <name>dfs.namenode.http-address.{{ cluster_id }}.nn2</name>
        <value>{{ namenode_2 }}:9870</value>
    </property>
    <property>
        <name>dfs.namenode.name.dir</name>
        <value>/tmp/hdfs/namenode</value>
    </property>
    <property>
        <name>dfs.datanode.data.dir</name>
        <value>/tmp/hdfs/datanode</value>
    </property>
    <property>
        <name>dfs.namenode.shared.edits.dir</name>
        <value>file:///tmp/hadoop</value>
    </property>
    <property>
        <name>ha.zookeeper.quorum</name>
        <value>127.0.0.1:2181</value>
    </property>
</configuration>
EOF
}

#######################################
# Moves the unpacked Hadoop release into place.
# Globals:   HADOOP_FILE, HADOOP_VERSION (read)
#######################################
_install_hadoop_archive() {
  extract_archive "$HADOOP_FILE" "$HADOOP_VERSION"
  mv -f "hadoop-$HADOOP_VERSION" hadoop/
}

#######################################
# Reports a checksum mismatch, deletes the bad archive and exits.
# Deleting the archive is what makes "execute script again" work: otherwise
# every rerun would find the same corrupt file and stop here again.
# Globals:   HADOOP_FILE (read)
#######################################
_reject_hadoop_archive() {
  printf "Hadoop archive has wrong checksum (%s)\n" "$HADOOP_FILE" >&2
  rm -f -- "$HADOOP_FILE"
  printf "Execute script again to redownload file\n" >&2
  exit 1
}

#######################################
# Makes sure an unpacked Hadoop distribution is available under hadoop/.
#
# Does nothing when $HDFS_TEST_SUITE_EXECUTABLE already exists. Otherwise it
# uses the local archive $HADOOP_FILE if present, or downloads it from the
# given URL, checks it with compare_checksum, unpacks it with
# extract_archive and moves hadoop-$HADOOP_VERSION to hadoop/.
#
# compare_checksum and extract_archive are not defined in this file;
# compare_checksum is assumed to return 0 when the checksum matches.
#
# Globals:   HDFS_TEST_SUITE_EXECUTABLE, HADOOP_FILE, HADOOP_FILE_CKSUM,
#            HADOOP_VERSION (all read)
# Arguments: $1 - download URL of the Hadoop archive (only needed when the
#                 archive has to be downloaded)
# Outputs:   progress messages on stdout, errors on stderr
# Returns:   0 on success; exits the script with status 1 when the archive
#            fails checksum verification
#######################################
prepare_hadoop() {
  local url=${1-}

  # Already installed: nothing to do.
  if [[ -f "$HDFS_TEST_SUITE_EXECUTABLE" ]]; then
    return 0
  fi

  printf "Setting up Hadoop\n"

  if [[ -f "$HADOOP_FILE" ]]; then
    printf "Hadoop archive exists\n"
  else
    : "${url:?prepare_hadoop: download URL required}"
    printf "Downloading %s\n" "$url"
    # --fail: do not store an HTTP error page as the archive.
    # -o: save under the name the checksum/extract steps expect.
    curl --fail -L -o "$HADOOP_FILE" "$url"
  fi

  # A bad archive is fatal in both cases; previously a mismatch right after
  # the download was silently ignored and the script carried on.
  if ! compare_checksum "$HADOOP_FILE" "$HADOOP_FILE_CKSUM"; then
    _reject_hadoop_archive
  fi

  _install_hadoop_archive
}

# --- Script entry point -----------------------------------------------------
# check_dependencies and write_file are not defined in this file; presumably
# they come from the sourced setup.sh.

check_dependencies
prepare_hadoop "${HADOOP_URL}"

# Render the three templates into variables.
HDFS_CONFIG=$(create_hdfs_config_template)
HDFS_CONFIG_CORE=$(create_hdfs_core_config_template)
HDFS_CONFIG_MAPRED=$(create_hdfs_mapred_config_template)

# Every expansion is quoted so paths and XML content are passed as single
# arguments (no word splitting or globbing).
write_file "${HDFS_CONFIG_TEMPLATE}" "${HDFS_CONFIG}"
write_file "${HDFS_CONFIG_TEMPLATE_CORE}" "${HDFS_CONFIG_CORE}"
write_file "${HDFS_CONFIG_TEMPLATE_MAPRED}" "${HDFS_CONFIG_MAPRED}"

# NOTE(review): HDFS_CONFIG_DATANODES is "localhost", so if write_file takes
# a target path as its first argument this writes a file named "localhost"
# in the current directory -- confirm the intended destination.
write_file "${HDFS_CONFIG_DATANODES}" "localhost"