# Licensed to the Apache Software Foundation (ASF) under one or more
# contributor license agreements. See the NOTICE file distributed with
# this work for additional information regarding copyright ownership.
# The ASF licenses this file to You under the Apache License, Version 2.0
# (the "License"); you may not use this file except in compliance with
# the License. You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

# included in all the hadoop scripts with source command
# should not be executable directly
# also should not be passed any arguments, since we need original $*

# Resolve links ($0 may be a softlink) and convert a relative path
# to an absolute path. NB: The -P option requires bash built-ins
# or POSIX:2001 compliant cd and pwd.
this="${BASH_SOURCE-$0}"
common_bin=$(cd -P -- "$(dirname -- "$this")" && pwd -P)
script="$(basename -- "$this")"
this="$common_bin/$script"

# the root of the Hadoop installation
#TODO: change the env variable when dir structure is changed
export HADOOP_HOME=`dirname "$this"`/..
export HADOOP_COMMON_HOME="${HADOOP_HOME}"
#export HADOOP_HOME=`dirname "$this"`/../..
#export HADOOP_COMMON_HOME="${HADOOP_COMMON_HOME:-`dirname "$this"`/..}"

# check to see if the conf dir is given as an optional argument
if [ $# -gt 1 ]
then
  if [ "--config" = "$1" ]
  then
    shift
    confdir=$1
    shift
    HADOOP_CONF_DIR=$confdir
  fi
fi

# Allow alternate conf dir location.
export HADOOP_CONF_DIR="${HADOOP_CONF_DIR:-$HADOOP_HOME/conf}"
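
# Usage sketch (paths hypothetical): wrappers that source this file forward
# their original arguments, so an invocation such as
#   bin/hadoop --config /etc/hadoop/conf fs -ls /
# arrives here with $1 = --config, leaving HADOOP_CONF_DIR=/etc/hadoop/conf
# set for the remainder of the run.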

# User can specify hostnames or a file where the hostnames are (not both)
if [[ ( "$HADOOP_SLAVES" != '' ) && ( "$HADOOP_SLAVE_NAMES" != '' ) ]] ; then
  echo \
    "Error: Please specify only one of the variables HADOOP_SLAVES and" \
    "HADOOP_SLAVE_NAMES, not both."
  exit 1
fi

# Process command line options that specify hosts or a file with a host
# list
if [ $# -gt 1 ]
then
  if [ "--hosts" = "$1" ]
  then
    shift
    export HADOOP_SLAVES="${HADOOP_CONF_DIR}/$1"
    shift
  elif [ "--hostnames" = "$1" ]
  then
    shift
    export HADOOP_SLAVE_NAMES=$1
    shift
  fi
fi
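
# Illustrative effect of the two options (file and host names hypothetical),
# assuming the caller forwarded its arguments before sourcing this script:
#   --hosts datanodes       -> HADOOP_SLAVES=${HADOOP_CONF_DIR}/datanodes
#   --hostnames "h1 h2 h3"  -> HADOOP_SLAVE_NAMES="h1 h2 h3"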

# User can specify hostnames or a file where the hostnames are (not both)
# (same check as above, but now we know it's the command line options that
# cause the problem)
if [[ ( "$HADOOP_SLAVES" != '' ) && ( "$HADOOP_SLAVE_NAMES" != '' ) ]] ; then
  echo \
    "Error: Please specify only one of the --hosts and --hostnames options, not both."
  exit 1
fi

cygwin=false
case "`uname`" in
CYGWIN*) cygwin=true;;
esac

if [ -f "${HADOOP_CONF_DIR}/hadoop-env.sh" ]; then
  . "${HADOOP_CONF_DIR}/hadoop-env.sh"
fi

# check if net.ipv6.bindv6only is set to 1
bindv6only=$(/sbin/sysctl -n net.ipv6.bindv6only 2> /dev/null)
if [ -n "$bindv6only" ] && [ "$bindv6only" -eq "1" ] && [ "$HADOOP_ALLOW_IPV6" != "yes" ]
then
  echo "Error: \"net.ipv6.bindv6only\" is set to 1 - Java networking could be broken"
  echo "For more info: http://wiki.apache.org/hadoop/HadoopIPv6"
  exit 1
fi
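
# Escape hatch implied by the guard above: a user who has verified that
# their JVM copes with bindv6only=1 can skip the check with
#   export HADOOP_ALLOW_IPV6=yes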

# Newer versions of glibc use an arena memory allocator that causes virtual
# memory usage to explode. This interacts badly with the many threads that
# we use in Hadoop. Tune the variable down to prevent vmem explosion.
export MALLOC_ARENA_MAX=${MALLOC_ARENA_MAX:-4}
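# Rough arithmetic behind the cap (assumes 64-bit glibc >= 2.10 defaults):
# up to 8 arenas per core, each able to reserve 64 MB of address space, so a
# 16-core box could map 16 * 8 * 64 MB = 8 GB of vmem; capping at 4 arenas
# keeps the reservation near 4 * 64 MB = 256 MB.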

# some Java parameters
if [ "$JAVA_HOME" = "" ]; then
  echo "Error: JAVA_HOME is not set."
  exit 1
fi
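
# Typically exported from ${HADOOP_CONF_DIR}/hadoop-env.sh (path below is
# hypothetical):
#   export JAVA_HOME=/usr/lib/jvm/java-6-sun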

JAVA=$JAVA_HOME/bin/java
JAVA_HEAP_MAX=-Xmx1000m

# check envvars which might override default args
if [ "$HADOOP_HEAPSIZE" != "" ]; then
  #echo "run with heapsize $HADOOP_HEAPSIZE"
  JAVA_HEAP_MAX="-Xmx""$HADOOP_HEAPSIZE""m"
  #echo $JAVA_HEAP_MAX
fi
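
# Worked example: HADOOP_HEAPSIZE=2000 (megabytes, usually set in
# hadoop-env.sh) yields JAVA_HEAP_MAX="-Xmx2000m"; when unset, the 1000 MB
# default above stands.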

# CLASSPATH initially contains $HADOOP_CONF_DIR
CLASSPATH="${HADOOP_CONF_DIR}"
CLASSPATH=${CLASSPATH}:$JAVA_HOME/lib/tools.jar

# for developers, add Hadoop classes to CLASSPATH
if [ -d "$HADOOP_COMMON_HOME/build/classes" ]; then
  CLASSPATH=${CLASSPATH}:$HADOOP_COMMON_HOME/build/classes
fi
if [ -d "$HADOOP_COMMON_HOME/build/webapps" ]; then
  CLASSPATH=${CLASSPATH}:$HADOOP_COMMON_HOME/build
fi
if [ -d "$HADOOP_COMMON_HOME/build/test/classes" ]; then
  CLASSPATH=${CLASSPATH}:$HADOOP_COMMON_HOME/build/test/classes
fi
if [ -d "$HADOOP_COMMON_HOME/build/test/core/classes" ]; then
  CLASSPATH=${CLASSPATH}:$HADOOP_COMMON_HOME/build/test/core/classes
fi

# so that filenames w/ spaces are handled correctly in loops below
IFS=
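# With IFS empty, word splitting of unquoted expansions is disabled, so $f
# in the loops below stays a single word even when a jar path contains
# spaces; pathname globbing still expands to one entry per jar.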

# for releases, add core hadoop jar & webapps to CLASSPATH
if [ -d "$HADOOP_COMMON_HOME/webapps" ]; then
  CLASSPATH=${CLASSPATH}:$HADOOP_COMMON_HOME
fi
for f in $HADOOP_COMMON_HOME/hadoop-*.jar; do
  CLASSPATH=${CLASSPATH}:$f;
done

# add libs to CLASSPATH
for f in $HADOOP_COMMON_HOME/lib/*.jar; do
  CLASSPATH=${CLASSPATH}:$f;
done

if [ -d "$HADOOP_COMMON_HOME/build/ivy/lib/Hadoop-Common/common" ]; then
  for f in $HADOOP_COMMON_HOME/build/ivy/lib/Hadoop-Common/common/*.jar; do
    CLASSPATH=${CLASSPATH}:$f;
  done
fi

if [ -d "$HADOOP_COMMON_HOME/build/ivy/lib/Hadoop-Hdfs/common" ]; then
  for f in $HADOOP_COMMON_HOME/build/ivy/lib/Hadoop-Hdfs/common/*.jar; do
    CLASSPATH=${CLASSPATH}:$f;
  done
fi

if [ -d "$HADOOP_COMMON_HOME/build/ivy/lib/Hadoop/common" ]; then
  for f in $HADOOP_COMMON_HOME/build/ivy/lib/Hadoop/common/*.jar; do
    CLASSPATH=${CLASSPATH}:$f;
  done
fi

for f in $HADOOP_COMMON_HOME/lib/jsp-2.1/*.jar; do
  CLASSPATH=${CLASSPATH}:$f;
done

# add user-specified CLASSPATH last
if [ "$HADOOP_CLASSPATH" != "" ]; then
  CLASSPATH=${CLASSPATH}:${HADOOP_CLASSPATH}
fi
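
# Example (paths hypothetical): extra job dependencies can be supplied via
#   export HADOOP_CLASSPATH=/opt/myjars/myjob.jar:/opt/myjars/conf
# before invoking a hadoop script; the entries land after the bundled jars.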

# default log directory & file
if [ "$HADOOP_LOG_DIR" = "" ]; then
  HADOOP_LOG_DIR="$HADOOP_HOME/logs"
fi
if [ "$HADOOP_LOGFILE" = "" ]; then
  HADOOP_LOGFILE='hadoop.log'
fi

# default policy file for service-level authorization
if [ "$HADOOP_POLICYFILE" = "" ]; then
  HADOOP_POLICYFILE="hadoop-policy.xml"
fi

# restore ordinary behaviour
unset IFS

# cygwin path translation
if $cygwin; then
  HADOOP_COMMON_HOME=`cygpath -w "$HADOOP_COMMON_HOME"`
  HADOOP_LOG_DIR=`cygpath -w "$HADOOP_LOG_DIR"`
  JAVA_LIBRARY_PATH=`cygpath -w "$JAVA_LIBRARY_PATH"`
fi

# setup 'java.library.path' for native-hadoop code if necessary
if [ -d "${HADOOP_COMMON_HOME}/build/native" -o -d "${HADOOP_COMMON_HOME}/lib/native" ]; then
  JAVA_PLATFORM=`CLASSPATH=${CLASSPATH} ${JAVA} -Xmx32m ${HADOOP_JAVA_PLATFORM_OPTS} org.apache.hadoop.util.PlatformName | sed -e "s/ /_/g"`

  if [ -d "$HADOOP_COMMON_HOME/build/native" ]; then
    if [ "x$JAVA_LIBRARY_PATH" != "x" ]; then
      JAVA_LIBRARY_PATH=${JAVA_LIBRARY_PATH}:${HADOOP_COMMON_HOME}/build/native/${JAVA_PLATFORM}/lib
    else
      JAVA_LIBRARY_PATH=${HADOOP_COMMON_HOME}/build/native/${JAVA_PLATFORM}/lib
    fi
  fi

  if [ -d "${HADOOP_COMMON_HOME}/lib/native" ]; then
    if [ "x$JAVA_LIBRARY_PATH" != "x" ]; then
      JAVA_LIBRARY_PATH=${JAVA_LIBRARY_PATH}:${HADOOP_COMMON_HOME}/lib/native/${JAVA_PLATFORM}
    else
      JAVA_LIBRARY_PATH=${HADOOP_COMMON_HOME}/lib/native/${JAVA_PLATFORM}
    fi
  fi
fi
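
# Illustrative value (depends on OS and JVM): PlatformName typically prints
# something like "Linux-amd64-64", so the resolved directory becomes e.g.
# ${HADOOP_COMMON_HOME}/lib/native/Linux-amd64-64.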

# cygwin path translation
if $cygwin; then
  JAVA_LIBRARY_PATH=`cygpath -p "$JAVA_LIBRARY_PATH"`
fi

HADOOP_OPTS="$HADOOP_OPTS -Dhadoop.log.dir=$HADOOP_LOG_DIR"
HADOOP_OPTS="$HADOOP_OPTS -Dhadoop.log.file=$HADOOP_LOGFILE"
HADOOP_OPTS="$HADOOP_OPTS -Dhadoop.home.dir=$HADOOP_COMMON_HOME"
HADOOP_OPTS="$HADOOP_OPTS -Dhadoop.id.str=$HADOOP_IDENT_STRING"
HADOOP_OPTS="$HADOOP_OPTS -Dhadoop.root.logger=${HADOOP_ROOT_LOGGER:-INFO,console}"
HADOOP_OPTS="$HADOOP_OPTS -Dhadoop.security.logger=${HADOOP_SECURITY_LOGGER:-INFO,console}"
if [ "x$JAVA_LIBRARY_PATH" != "x" ]; then
  HADOOP_OPTS="$HADOOP_OPTS -Djava.library.path=$JAVA_LIBRARY_PATH"
fi
HADOOP_OPTS="$HADOOP_OPTS -Dhadoop.policy.file=$HADOOP_POLICYFILE"

# Disable IPv6 as it can cause issues
HADOOP_OPTS="$HADOOP_OPTS -Djava.net.preferIPv4Stack=true"

# put hdfs in classpath if present
if [ "$HADOOP_HDFS_HOME" = "" ]; then
  if [ -d "${HADOOP_HOME}/hdfs" ]; then
    HADOOP_HDFS_HOME=$HADOOP_HOME/hdfs
    #echo Found HDFS installed at $HADOOP_HDFS_HOME
  fi
fi

if [ -d "${HADOOP_HDFS_HOME}" ]; then

  if [ -d "$HADOOP_HDFS_HOME/webapps" ]; then
    CLASSPATH=${CLASSPATH}:$HADOOP_HDFS_HOME
  fi

  if [ -d "${HADOOP_HDFS_HOME}/conf" ]; then
    CLASSPATH=${CLASSPATH}:${HADOOP_HDFS_HOME}/conf
  fi

  for f in $HADOOP_HDFS_HOME/hadoop-hdfs-*.jar; do
    CLASSPATH=${CLASSPATH}:$f;
  done

  # add libs to CLASSPATH
  for f in $HADOOP_HDFS_HOME/lib/*.jar; do
    CLASSPATH=${CLASSPATH}:$f;
  done

  if [ -d "$HADOOP_HDFS_HOME/build/classes" ]; then
    CLASSPATH=${CLASSPATH}:$HADOOP_HDFS_HOME/build/classes
  fi
fi
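
# For a split install (path hypothetical), HADOOP_HDFS_HOME can be pointed
# elsewhere before this script is sourced:
#   export HADOOP_HDFS_HOME=/opt/hadoop-hdfs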

# cygwin path translation
if $cygwin; then
  HADOOP_HDFS_HOME=`cygpath -w "$HADOOP_HDFS_HOME"`
fi

# set mapred home if mapred is present
if [ "$HADOOP_MAPRED_HOME" = "" ]; then
  if [ -d "${HADOOP_HOME}/mapred" ]; then
    HADOOP_MAPRED_HOME=$HADOOP_HOME/mapred
    #echo Found MAPRED installed at $HADOOP_MAPRED_HOME
  fi
fi

if [ -d "${HADOOP_MAPRED_HOME}" ]; then

  if [ -d "$HADOOP_MAPRED_HOME/webapps" ]; then
    CLASSPATH=${CLASSPATH}:$HADOOP_MAPRED_HOME
  fi

  if [ -d "${HADOOP_MAPRED_HOME}/conf" ]; then
    CLASSPATH=${CLASSPATH}:${HADOOP_MAPRED_HOME}/conf
  fi

  for f in $HADOOP_MAPRED_HOME/hadoop-mapred-*.jar; do
    CLASSPATH=${CLASSPATH}:$f
  done

  for f in $HADOOP_MAPRED_HOME/lib/*.jar; do
    CLASSPATH=${CLASSPATH}:$f
  done

  if [ -d "$HADOOP_MAPRED_HOME/build/classes" ]; then
    CLASSPATH=${CLASSPATH}:$HADOOP_MAPRED_HOME/build/classes
  fi

  if [ -d "$HADOOP_MAPRED_HOME/build/tools" ]; then
    CLASSPATH=${CLASSPATH}:$HADOOP_MAPRED_HOME/build/tools
  fi

  for f in $HADOOP_MAPRED_HOME/hadoop-mapred-tools-*.jar; do
    TOOL_PATH=${TOOL_PATH}:$f;
  done
  for f in $HADOOP_MAPRED_HOME/build/hadoop-mapred-tools-*.jar; do
    TOOL_PATH=${TOOL_PATH}:$f;
  done
fi

# cygwin path translation
if $cygwin; then
  HADOOP_MAPRED_HOME=`cygpath -w "$HADOOP_MAPRED_HOME"`
  TOOL_PATH=`cygpath -p -w "$TOOL_PATH"`
fi