hbase-exporter/tests/hdfs-setup.sh

150 lines
4.5 KiB
Bash
Raw Normal View History

2021-03-06 22:37:01 +01:00
#!/usr/bin/env bash
#
# Prepares a local Hadoop/HDFS installation for tests: makes sure the Hadoop
# release is unpacked under ./hadoop and writes the configuration templates
# defined further down in this script.
#
# All paths below are relative, so the script has to be started from the
# directory that contains it.
set -ueo pipefail

# Hadoop release to fetch and the archive name it is stored under.
HADOOP_VERSION="2.10.1"
HADOOP_FILE="hadoop-$HADOOP_VERSION.tar.gz"
HADOOP_URL="https://artfiles.org/apache.org/hadoop/common/hadoop-${HADOOP_VERSION}/${HADOOP_FILE}"
# Expected digest of the archive (128 hex digits, i.e. the length of a SHA-512
# sum); it is handed to compare_checksum together with the archive name.
HADOOP_FILE_CKSUM="2460e02cd1f80dfed7a8981bbc934c095c0a341435118bec781fd835ec2ebdc5543a03d92d24f2ddeebdfe1c2c460065ba1d394ed9a73cbb2020b40a8d8b5e07"

# Target paths of the generated configuration templates.
HDFS_CONFIG_TEMPLATE="hadoop/etc/hadoop/hdfs-site.xml"
HDFS_CONFIG_TEMPLATE_CORE="hadoop/etc/hadoop/core-site.xml"
HDFS_CONFIG_TEMPLATE_MAPRED="hadoop/etc/hadoop/mapred-site.xml"
# NOTE(review): despite the name this holds a host name, and it is later
# passed as the first argument of write_file - confirm the intended path.
HDFS_CONFIG_DATANODES="localhost"

# Presence of this file is used as the marker that Hadoop is already unpacked.
HDFS_TEST_SUITE_EXECUTABLE="hadoop/bin/hdfs"

# check_dependencies, compare_checksum, extract_archive and write_file are not
# defined in this script; presumably they are provided by setup.sh.
# shellcheck source=/dev/null
source setup.sh

# Not read anywhere in this script; presumably consumed by check_dependencies
# from setup.sh - TODO confirm.
# shellcheck disable=SC2034
declare -a DEPS=("java" "ansible-playbook")

#######################################
# Emit the core-site.xml template.
# The {{ cluster_id }} placeholder is written out verbatim; substituting it is
# left to whatever processes the template afterwards.
# Globals:   none
# Arguments: none
# Outputs:   the XML document on stdout
# Returns:   0 on success
#######################################
create_hdfs_core_config_template() {
  # The document is printed straight from the here-document. Capturing it with
  # `read -r -d ''` first returns non-zero at end of input, which aborts the
  # script under `set -e` whenever the function is called outside of $(...).
  #
  # NOTE(review): dfs.journalnode.edits.dir points at "/.tmp/hadoop" while
  # hdfs-site.xml uses "/tmp/hadoop" paths - possibly a typo, confirm.
  cat <<'EOF'
<?xml version="1.0" encoding="UTF-8"?>
<?xml-stylesheet type="text/xsl" href="configuration.xsl"?>
<configuration>
  <property>
    <name>fs.defaultFS</name>
    <value>hdfs://{{ cluster_id }}</value>
  </property>
  <property>
    <name>dfs.journalnode.edits.dir</name>
    <value>/.tmp/hadoop</value>
  </property>
</configuration>
EOF
}

#######################################
# Emit the mapred-site.xml template.
# The {{ cluster_ha_id }} placeholder is written out verbatim; substituting it
# is left to whatever processes the template afterwards.
# Globals:   none
# Arguments: none
# Outputs:   the XML document on stdout
# Returns:   0 on success
#######################################
create_hdfs_mapred_config_template() {
  # Printed directly instead of going through `read -r -d ''`, which returns
  # non-zero at end of input and is therefore fragile under `set -e`.
  #
  # NOTE(review): this template uses {{ cluster_ha_id }} whereas the other
  # templates in this script use {{ cluster_id }} - confirm that both
  # variables exist where the template is rendered.
  cat <<'EOF'
<?xml version="1.0" encoding="UTF-8"?>
<?xml-stylesheet type="text/xsl" href="configuration.xsl"?>
<configuration>
  <property>
    <name>fs.defaultFS</name>
    <value>hdfs://{{ cluster_ha_id }}</value>
  </property>
</configuration>
EOF
}

#######################################
# Emit the hdfs-site.xml template describing one nameservice with two
# namenodes (nn1, nn2).
# The {{ cluster_id }}, {{ namenode_1 }} and {{ namenode_2 }} placeholders are
# written out verbatim; substituting them is left to whatever processes the
# template afterwards.
# Globals:   none
# Arguments: none
# Outputs:   the XML document on stdout
# Returns:   0 on success
#######################################
create_hdfs_config_template() {
  # Printed directly instead of going through `read -r -d ''`, which returns
  # non-zero at end of input and is therefore fragile under `set -e`.
  #
  # dfs.namenode.http-address.* used to be listed twice per namenode (port
  # 50070 first, port 9870 second). Hadoop keeps the last definition of a
  # property within a resource, so only the effective 9870 entries are kept.
  cat <<'EOF'
<?xml version="1.0" encoding="UTF-8"?>
<?xml-stylesheet type="text/xsl" href="configuration.xsl"?>
<configuration>
  <property>
    <name>dfs.nameservices</name>
    <value>{{ cluster_id }}</value>
  </property>
  <property>
    <name>dfs.ha.namenodes.{{ cluster_id }}</name>
    <value>nn1,nn2</value>
  </property>
  <property>
    <name>fs.defaultFS</name>
    <value>hdfs://{{ cluster_id }}</value>
  </property>
  <property>
    <name>dfs.namenode.rpc-address.{{ cluster_id }}.nn1</name>
    <value>{{ namenode_1 }}:8020</value>
  </property>
  <property>
    <name>dfs.namenode.rpc-address.{{ cluster_id }}.nn2</name>
    <value>{{ namenode_2 }}:8020</value>
  </property>
  <property>
    <name>dfs.namenode.http-address.{{ cluster_id }}.nn1</name>
    <value>{{ namenode_1 }}:9870</value>
  </property>
  <property>
    <name>dfs.namenode.http-address.{{ cluster_id }}.nn2</name>
    <value>{{ namenode_2 }}:9870</value>
  </property>
  <property>
    <name>dfs.namenode.name.dir</name>
    <value>/tmp/hdfs/namenode</value>
  </property>
  <property>
    <name>dfs.datanode.data.dir</name>
    <value>/tmp/hdfs/datanode</value>
  </property>
  <property>
    <name>dfs.namenode.shared.edits.dir</name>
    <value>file:///tmp/hadoop</value>
  </property>
  <property>
    <name>ha.zookeeper.quorum</name>
    <value>127.0.0.1:2181</value>
  </property>
</configuration>
EOF
}
#######################################
# Make sure an unpacked Hadoop distribution exists under ./hadoop.
#
# Does nothing when HDFS_TEST_SUITE_EXECUTABLE is already present. Otherwise
# an existing archive is reused, or the archive is downloaded, then verified
# with compare_checksum, unpacked with extract_archive and moved to hadoop/.
# An archive that fails verification is deleted so the next run fetches a
# fresh copy.
#
# compare_checksum and extract_archive are defined outside this file;
# extract_archive is assumed to leave a "hadoop-<version>" directory in the
# current directory (the mv below relies on it) - TODO confirm.
#
# Globals:   HDFS_TEST_SUITE_EXECUTABLE, HADOOP_FILE, HADOOP_FILE_CKSUM,
#            HADOOP_VERSION, HADOOP_URL (all read)
# Arguments: $1 - download URL of the archive (defaults to HADOOP_URL)
# Outputs:   progress messages on stdout, errors on stderr
# Returns:   0 on success; exits the shell with status 1 when the download
#            or the checksum verification fails
#######################################
prepare_hadoop() {
  local url="${1:-${HADOOP_URL}}"

  # A previous run already unpacked Hadoop.
  if [[ -f "${HDFS_TEST_SUITE_EXECUTABLE}" ]]; then
    return 0
  fi

  printf "Setting up Hadoop\n"

  if [[ -f "${HADOOP_FILE}" ]]; then
    printf "Hadoop archive exists\n"
    if ! compare_checksum "${HADOOP_FILE}" "${HADOOP_FILE_CKSUM}"; then
      printf "Hadoop archive has wrong checksum (%s)\n" "${HADOOP_FILE}" >&2
      # Without removing the broken file the next run would stop here again
      # instead of downloading a new copy.
      rm -f -- "${HADOOP_FILE:?}"
      printf "Execute script again to redownload file\n" >&2
      exit 1
    fi
  else
    printf "Downloading %s\n" "${url}"
    # --fail: treat HTTP errors as failures instead of saving the error page.
    # -o: store under the name that is verified below, whatever the URL's
    # last path segment is.
    if ! curl -fL -o "${HADOOP_FILE}" "${url}"; then
      printf "Download of %s failed\n" "${url}" >&2
      rm -f -- "${HADOOP_FILE:?}"
      exit 1
    fi
    if ! compare_checksum "${HADOOP_FILE}" "${HADOOP_FILE_CKSUM}"; then
      printf "Downloaded Hadoop archive has wrong checksum (%s)\n" \
        "${HADOOP_FILE}" >&2
      rm -f -- "${HADOOP_FILE:?}"
      exit 1
    fi
  fi

  extract_archive "${HADOOP_FILE}" "${HADOOP_VERSION}"
  mv -f "hadoop-${HADOOP_VERSION}" hadoop/
}
# check_dependencies is defined outside this file (presumably it verifies the
# tools listed in DEPS - TODO confirm).
check_dependencies
prepare_hadoop "${HADOOP_URL}"

# Generate the three configuration templates and store them inside the
# unpacked Hadoop tree. write_file is defined outside this file; it is called
# with the target path first and the content second.
HDFS_CONFIG=$(create_hdfs_config_template)
HDFS_CONFIG_CORE=$(create_hdfs_core_config_template)
HDFS_CONFIG_MAPRED=$(create_hdfs_mapred_config_template)
write_file "${HDFS_CONFIG_TEMPLATE}" "${HDFS_CONFIG}"
write_file "${HDFS_CONFIG_TEMPLATE_CORE}" "${HDFS_CONFIG_CORE}"
write_file "${HDFS_CONFIG_TEMPLATE_MAPRED}" "${HDFS_CONFIG_MAPRED}"

# NOTE(review): HDFS_CONFIG_DATANODES is "localhost", so following the
# argument order of the calls above this targets a file named "localhost" in
# the current directory - confirm whether a datanode list file inside the
# Hadoop tree was intended instead.
write_file "${HDFS_CONFIG_DATANODES}" "localhost"