hadoop-setup-hdfs.sh 4.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157
  1. #!/usr/bin/env bash
  2. # Licensed to the Apache Software Foundation (ASF) under one or more
  3. # contributor license agreements. See the NOTICE file distributed with
  4. # this work for additional information regarding copyright ownership.
  5. # The ASF licenses this file to You under the Apache License, Version 2.0
  6. # (the "License"); you may not use this file except in compliance with
  7. # the License. You may obtain a copy of the License at
  8. #
  9. # http://www.apache.org/licenses/LICENSE-2.0
  10. #
  11. # Unless required by applicable law or agreed to in writing, software
  12. # distributed under the License is distributed on an "AS IS" BASIS,
  13. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  14. # See the License for the specific language governing permissions and
  15. # limitations under the License.
  # Resolve the absolute directory that holds this script. The cd and pwd are
  # chained with && so that a failed cd yields an empty value instead of
  # silently reporting the caller's working directory.
  bin=$(cd -- "$(dirname -- "$0")" >/dev/null && pwd)

  # libexec is expected next to the script's directory unless the caller
  # already exported HADOOP_LIBEXEC_DIR.
  DEFAULT_LIBEXEC_DIR="${bin}/../libexec"
  HADOOP_LIBEXEC_DIR=${HADOOP_LIBEXEC_DIR:-$DEFAULT_LIBEXEC_DIR}

  # Pull in the shared Hadoop shell configuration. The path is quoted so an
  # install location containing whitespace is sourced as a single file.
  # NOTE(review): HADOOP_PREFIX and HADOOP_CONF_DIR, used further down, are not
  # assigned in this script; presumably hadoop-config.sh provides them - confirm.
  . "${HADOOP_LIBEXEC_DIR}/hadoop-config.sh"
  # Print the command-line help on stdout and terminate the script with
  # exit status 1. The text starts and ends with an empty line.
  usage() {
    printf '%s\n' \
      "" \
      "usage: $0 <parameters>" \
      "Optional parameters:" \
      "--format Force namenode format" \
      "--group=hadoop Set Hadoop group" \
      "-h Display this message" \
      "--hdfs-user=hdfs Set HDFS user" \
      "--kerberos-realm=KERBEROS.EXAMPLE.COM Set Kerberos realm" \
      "--hdfs-user-keytab=/home/hdfs/hdfs.keytab Set HDFS user key tab" \
      "--mapreduce-user=mr Set mapreduce user" \
      ""
    exit 1
  }
  # Normalise a command line with getopt(1) and print the result on stdout.
  # Arguments: the raw command-line words.
  # Returns:   getopt's exit status (non-zero for an invalid command line).
  #
  # Every long option that the option loop below understands is declared here.
  # --group and --yarn-user were previously missing, so getopt rejected them
  # before the loop ever saw them. The short-option string is given once; the
  # earlier empty -o '' was superseded by the later -o 'h' anyway.
  hdfs_setup_getopt() {
    getopt \
      -n "$0" \
      -o 'h' \
      -l 'format' \
      -l 'group:' \
      -l 'hdfs-user:' \
      -l 'hdfs-user-keytab:' \
      -l 'mapreduce-user:' \
      -l 'yarn-user:' \
      -l 'kerberos-realm:' \
      -- "$@"
  }

  # usage prints the help text and exits, so nothing below runs on bad input.
  if ! OPTS=$(hdfs_setup_getopt "$@"); then
    usage
  fi
  # Replace the positional parameters with the getopt-normalised command line
  # held in OPTS.
  eval set -- "${OPTS}"

  # Walk the normalised options and record them in global variables.
  # Arguments: the option words, terminated by "--" and followed by operands.
  # Globals written: FORMAT_NAMENODE, HADOOP_GROUP, HADOOP_HDFS_USER,
  #   HADOOP_MR_USER, HADOOP_YARN_USER, HDFS_KEYTAB, KERBEROS_REALM,
  #   AUTOMATED (set to 1 by every value-carrying option and by --format),
  #   HDFS_SETUP_OPERAND_COUNT (number of words left after "--").
  # -h is handled explicitly: getopt accepts it, and without its own arm it
  # fell through to the catch-all and was reported as an unknown option.
  hdfs_setup_apply_options() {
    while [ $# -gt 0 ]; do
      case "$1" in
        --format)
          FORMAT_NAMENODE=1
          AUTOMATED=1
          shift
          ;;
        --group)
          HADOOP_GROUP=$2
          AUTOMATED=1
          shift 2
          ;;
        --hdfs-user)
          HADOOP_HDFS_USER=$2
          AUTOMATED=1
          shift 2
          ;;
        --mapreduce-user)
          HADOOP_MR_USER=$2
          AUTOMATED=1
          shift 2
          ;;
        --yarn-user)
          HADOOP_YARN_USER=$2
          AUTOMATED=1
          shift 2
          ;;
        --hdfs-user-keytab)
          HDFS_KEYTAB=$2
          AUTOMATED=1
          shift 2
          ;;
        --kerberos-realm)
          KERBEROS_REALM=$2
          AUTOMATED=1
          shift 2
          ;;
        -h)
          # usage prints the help text and exits.
          usage
          ;;
        --)
          shift
          break
          ;;
        *)
          echo "Unknown option: $1"
          usage
          exit 1
          ;;
      esac
    done
    HDFS_SETUP_OPERAND_COUNT=$#
  }

  hdfs_setup_apply_options "$@"
  # Drop the consumed option words so that only the operands remain in "$@",
  # exactly as when the loop ran at top level.
  shift $(( $# - HDFS_SETUP_OPERAND_COUNT ))
  # Fill in the stock group and account names for anything that was neither
  # given on the command line nor already present as a non-empty variable.
  : "${HADOOP_GROUP:=hadoop}"
  : "${HADOOP_HDFS_USER:=hdfs}"
  : "${HADOOP_YARN_USER:=yarn}"

  # The --mapreduce-user option is stored in HADOOP_MR_USER; the rest of the
  # script reads HADOOP_MAPREDUCE_USER, which is always (re)assigned here.
  if [ -n "${HADOOP_MR_USER}" ]; then
    HADOOP_MAPREDUCE_USER=${HADOOP_MR_USER}
  else
    HADOOP_MAPREDUCE_USER=mapred
  fi
  # Obtain a Kerberos ticket for the HDFS user from its keytab by running
  # kinit through su as that user.
  # Globals read:    HDFS_KEYTAB, HADOOP_HDFS_USER
  # Globals written: KERBEROS_BIN, kinit_cmd
  # Returns:         the exit status of su.
  hdfs_setup_kinit() {
    # Determine the kerberos location based on the Linux distro: hosts that
    # have /etc/lsb-release use /usr/bin, all others /usr/kerberos/bin.
    if [ -e /etc/lsb-release ]; then
      KERBEROS_BIN=/usr/bin
    else
      KERBEROS_BIN=/usr/kerberos/bin
    fi
    kinit_cmd="${KERBEROS_BIN}/kinit -k -t ${HDFS_KEYTAB} ${HADOOP_HDFS_USER}"
    # The target user is quoted so it always reaches su as exactly one word.
    su -c "${kinit_cmd}" "${HADOOP_HDFS_USER}"
  }

  # Kerberos login is only attempted when a realm was supplied.
  if [ -n "${KERBEROS_REALM}" ]; then
    hdfs_setup_kinit
  fi
  echo "Setup Hadoop Distributed File System"
  echo

  # Format namenode. This only happens when --format was given, which sets
  # FORMAT_NAMENODE to 1. The comparison uses the portable "=" operator.
  if [ "${FORMAT_NAMENODE}" = "1" ]; then
    echo "Formatting namenode"
    echo
    # "Y" is piped into the format command's stdin, presumably to answer its
    # confirmation prompt. The target user is quoted so it always reaches su
    # as exactly one word.
    su -c "echo Y | ${HADOOP_PREFIX}/bin/hadoop --config ${HADOOP_CONF_DIR} namenode -format" "${HADOOP_HDFS_USER}"
    echo
  fi
  # Start namenode process
  echo "Starting namenode process"
  echo

  # Use sbin/hadoop-daemon.sh when it exists and fall back to bin/ otherwise.
  # The tested path is quoted so a HADOOP_PREFIX containing whitespace does
  # not make the test fail with "too many arguments".
  if [ -e "${HADOOP_PREFIX}/sbin/hadoop-daemon.sh" ]; then
    DAEMON_PATH="${HADOOP_PREFIX}/sbin"
  else
    DAEMON_PATH="${HADOOP_PREFIX}/bin"
  fi

  # Launch the namenode as the HDFS user; the user is passed to su as a
  # single quoted word.
  su -c "${DAEMON_PATH}/hadoop-daemon.sh --config ${HADOOP_CONF_DIR} start namenode" "${HADOOP_HDFS_USER}"
  echo
  echo "Initialize HDFS file system: "
  echo

  # Run one "hadoop dfs" sub-command as the HDFS user.
  # Arguments: the dfs sub-command and its operands, e.g. -mkdir /user.
  # Returns:   the exit status of su.
  # The arguments are joined with spaces ("$*") because su -c takes the whole
  # command line as a single string.
  hdfs_setup_dfs() {
    su -c "${HADOOP_PREFIX}/bin/hadoop --config ${HADOOP_CONF_DIR} dfs $*" "${HADOOP_HDFS_USER}"
  }

  # Remember whether any step failed. Previously only the exit status of the
  # final -chown was inspected, so a failed -mkdir or -chmod still ended with
  # "Completed.". Every step is still attempted, as before.
  hdfs_init_status=0

  # create the /user dir
  hdfs_setup_dfs -mkdir /user || hdfs_init_status=1

  # create /tmp and give it 777
  hdfs_setup_dfs -mkdir /tmp || hdfs_init_status=1
  hdfs_setup_dfs -chmod 777 /tmp || hdfs_init_status=1

  # create /mapred, restrict it to its owner and hand it to the mapreduce user
  hdfs_setup_dfs -mkdir /mapred || hdfs_init_status=1
  hdfs_setup_dfs -chmod 700 /mapred || hdfs_init_status=1
  hdfs_setup_dfs -chown "${HADOOP_MAPREDUCE_USER}:system" /mapred || hdfs_init_status=1

  if [ "${hdfs_init_status}" -eq 0 ]; then
    echo "Completed."
  else
    echo "Unknown error occurred, check hadoop logs for details."
  fi
  echo
  echo "Please startup datanode processes: /etc/init.d/hadoop-datanode start"