2012-08-01 16:17:31 -04:00
|
|
|
#!/usr/bin/env bash
|
|
|
|
|
2012-09-25 17:43:40 -04:00
|
|
|
#
|
2012-08-04 20:04:33 -04:00
|
|
|
# Licensed to the Apache Software Foundation (ASF) under one or more
|
|
|
|
# contributor license agreements. See the NOTICE file distributed with
|
|
|
|
# this work for additional information regarding copyright ownership.
|
|
|
|
# The ASF licenses this file to You under the Apache License, Version 2.0
|
|
|
|
# (the "License"); you may not use this file except in compliance with
|
|
|
|
# the License. You may obtain a copy of the License at
|
|
|
|
#
|
2013-07-16 20:21:33 -04:00
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
2012-08-04 20:04:33 -04:00
|
|
|
#
|
|
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
# See the License for the specific language governing permissions and
|
|
|
|
# limitations under the License.
|
2013-07-16 20:21:33 -04:00
|
|
|
#
|
2012-08-04 20:04:33 -04:00
|
|
|
|
2012-08-01 16:17:31 -04:00
|
|
|
# Runs a Spark command as a daemon.
|
|
|
|
#
|
|
|
|
# Environment Variables
|
|
|
|
#
|
2014-10-28 15:29:01 -04:00
|
|
|
# SPARK_CONF_DIR Alternate conf dir. Default is ${SPARK_HOME}/conf.
|
|
|
|
# SPARK_LOG_DIR Where log files are stored. ${SPARK_HOME}/logs by default.
|
2012-08-01 16:17:31 -04:00
|
|
|
# SPARK_MASTER host:path where spark code should be rsync'd from
|
|
|
|
# SPARK_PID_DIR Where the pid files are stored. /tmp by default.
|
|
|
|
# SPARK_IDENT_STRING A string representing this instance of spark. $USER by default
|
|
|
|
# SPARK_NICENESS The scheduling priority for daemons. Defaults to 0.
|
|
|
|
##
|
|
|
|
|
2015-04-13 08:02:55 -04:00
|
|
|
# Usage text printed whenever the command line cannot be interpreted.
# "submit" is listed because the option dispatcher at the bottom of this
# script accepts it alongside start, stop and status.
usage="Usage: spark-daemon.sh [--config <conf-dir>] (start|stop|submit|status) <spark-command> <spark-instance-number> <args...>"

# An option and a Spark command are the bare minimum; with fewer than two
# arguments there is nothing to act on, so show the usage text and fail.
if [ $# -le 1 ]; then
  echo "$usage"
  exit 1
fi
|
|
|
|
|
2014-09-08 13:24:15 -04:00
|
|
|
# Resolve the absolute directory holding this script so that the sibling
# spark-config.sh can be sourced regardless of the caller's working directory.
#   - CDPATH is cleared for the cd so it cannot print a directory name into
#     the captured output.
#   - cd and pwd are chained with && so a failed cd is reported instead of
#     silently yielding the caller's current directory.
sbin="$(CDPATH= cd "$(dirname "$0")" && pwd)" || {
  echo "ERROR : cannot resolve the directory containing $0" >&2
  exit 1
}

. "$sbin/spark-config.sh"
|
2012-08-01 16:17:31 -04:00
|
|
|
|
|
|
|
# get arguments

# --config <conf-dir> is optional and, when present, must be the first
# argument. The value has to be an existing directory; it is then exported
# as SPARK_CONF_DIR. Anything else aborts with the usage text.
if [ "$1" == "--config" ]; then
  shift
  conf_dir="$1"
  if [ ! -d "$conf_dir" ]; then
    echo "ERROR : $conf_dir is not a directory"
    echo "$usage"
    exit 1
  fi
  export SPARK_CONF_DIR="$conf_dir"
  shift
fi

# Remaining positionals, in order: the option to perform, the Spark command
# (passed on as the class to launch) and the instance number. Whatever is
# still left in "$@" afterwards is forwarded to the launched command.
option="$1"
shift
command="$1"
shift
instance="$1"
shift
|
2012-08-01 16:17:31 -04:00
|
|
|
|
|
|
|
#######################################
# Rotate a log file: <log> becomes <log>.1, <log>.1 becomes <log>.2, and so
# on, up to <log>.<num>. Older generations that exist are shifted up first,
# overwriting whatever previously held the highest number.
# Arguments:
#   $1 - path of the log file to rotate
#   $2 - number of generations to keep (optional, defaults to 5)
# Returns:
#   0 when the log file does not exist (nothing to do); otherwise the status
#   of the final mv.
#######################################
spark_rotate_log() {
  # All working variables are local so the caller's globals (notably the
  # script-level "log") are never overwritten.
  local logfile="$1"
  local keep="${2:-5}"
  local prev

  # Nothing to rotate when there is no current log file.
  [ -f "$logfile" ] || return 0

  # Walk from the oldest slot down to slot 2, moving each existing
  # generation one slot up.
  while [ "$keep" -gt 1 ]; do
    prev=$((keep - 1))
    if [ -f "$logfile.$prev" ]; then
      mv "$logfile.$prev" "$logfile.$keep"
    fi
    keep=$prev
  done

  # Finally the live log takes the lowest slot.
  mv "$logfile" "$logfile.$keep"
}
|
|
|
|
|
2014-03-25 01:24:21 -04:00
|
|
|
# Source the environment loader first; the defaults below only apply to
# variables that are still empty afterwards.
. "$SPARK_PREFIX/bin/load-spark-env.sh"

# Identify this Spark instance by the invoking user unless told otherwise.
if [ -z "$SPARK_IDENT_STRING" ]; then
  export SPARK_IDENT_STRING="$USER"
fi

# Exported for the scripts launched later.
# NOTE(review): presumably makes them print the launch command - confirm in spark-class.
export SPARK_PRINT_LAUNCH_COMMAND="1"

# get log directory
if [ -z "$SPARK_LOG_DIR" ]; then
  export SPARK_LOG_DIR="$SPARK_HOME/logs"
fi
mkdir -p "$SPARK_LOG_DIR"

# Probe writability by creating a scratch file. On success the scratch file
# is removed again; on failure ownership of the directory is handed to
# SPARK_IDENT_STRING.
touch "$SPARK_LOG_DIR"/.spark_test > /dev/null 2>&1
TEST_LOG_DIR=$?
if [ "${TEST_LOG_DIR}" -ne 0 ]; then
  chown "$SPARK_IDENT_STRING" "$SPARK_LOG_DIR"
else
  rm -f "$SPARK_LOG_DIR"/.spark_test
fi

# pid files live in /tmp unless SPARK_PID_DIR says otherwise
SPARK_PID_DIR="${SPARK_PID_DIR:-/tmp}"

# some variables
# Both file names embed the ident string, the command and the instance number;
# the log name additionally carries the host name.
log="$SPARK_LOG_DIR/spark-$SPARK_IDENT_STRING-$command-$instance-$HOSTNAME.out"
pid="$SPARK_PID_DIR/spark-$SPARK_IDENT_STRING-$command-$instance.pid"

# Set default scheduling priority
[ -n "$SPARK_NICENESS" ] || export SPARK_NICENESS=0
|
|
|
|
|
2015-03-11 04:03:01 -04:00
|
|
|
#######################################
# Launch "$command" in the background through spark-class or spark-submit,
# record its process id in "$pid" and report an early failure.
# Globals read:
#   command, pid, log, SPARK_PID_DIR, SPARK_MASTER, SPARK_HOME, SPARK_PREFIX,
#   SPARK_NICENESS
# Arguments:
#   $1  - launch mode: "class" (bin/spark-class) or "submit" (bin/spark-submit)
#   $2+ - arguments forwarded unchanged to the launched command
# Outputs:
#   Progress and error messages on stdout; the launched process appends its
#   stdout and stderr to "$log".
# Exits:
#   1 when the mode is unknown, or when the pid file names a process whose
#   command name contains "java".
#######################################
run_command() {
  local mode="$1"
  shift

  local TARGET_ID newpid
  local -a launcher

  # Pick the launcher first so an unknown mode is rejected before the pid
  # directory, rsync or the log files are touched. The command is passed as
  # a single quoted word.
  case "$mode" in
    (class)
      launcher=("$SPARK_PREFIX"/bin/spark-class "$command")
      ;;

    (submit)
      launcher=("$SPARK_PREFIX"/bin/spark-submit --class "$command")
      ;;

    (*)
      echo "unknown mode: $mode"
      exit 1
      ;;
  esac

  mkdir -p "$SPARK_PID_DIR"

  # Refuse to start a second copy: the pid file counts as live only when the
  # recorded process still exists and its command name contains "java".
  if [ -f "$pid" ]; then
    TARGET_ID="$(cat "$pid")"
    if [[ $(ps -p "$TARGET_ID" -o comm=) =~ "java" ]]; then
      echo "$command running as process $TARGET_ID. Stop it first."
      exit 1
    fi
  fi

  # Optionally refresh the local installation from SPARK_MASTER.
  if [ "$SPARK_MASTER" != "" ]; then
    echo rsync from "$SPARK_MASTER"
    rsync -a -e ssh --delete --exclude=.svn --exclude='logs/*' --exclude='contrib/hod/logs/*' "$SPARK_MASTER/" "$SPARK_HOME"
  fi

  spark_rotate_log "$log"
  echo "starting $command, logging to $log"

  # Detach from the terminal: nohup, no stdin, all output appended to the log.
  nohup nice -n "$SPARK_NICENESS" "${launcher[@]}" "$@" >> "$log" 2>&1 < /dev/null &
  newpid="$!"

  echo "$newpid" > "$pid"
  sleep 2
  # Check if the process has died; in that case we'll tail the log so the user can see
  if [[ ! $(ps -p "$newpid" -o comm=) =~ "java" ]]; then
    echo "failed to launch $command:"
    tail -2 "$log" | sed 's/^/ /'
    echo "full log in $log"
  fi
}
|
2012-08-01 16:17:31 -04:00
|
|
|
|
2015-03-11 04:03:01 -04:00
|
|
|
# Dispatch on the requested option.
#   submit - launch the command through spark-submit
#   start  - launch the command through spark-class
#   stop   - kill the recorded process and remove the pid file
#   status - exit 0 if running, 1 if a pid file exists but the process is
#            not running, 2 if there is no pid file
# Anything else prints the usage text and exits 1.
# A recorded process counts as running only when ps still lists it and its
# command name contains "java".
case "$option" in

  (submit)
    run_command submit "$@"
    ;;

  (start)
    run_command class "$@"
    ;;

  (stop)
    if [ -f "$pid" ]; then
      TARGET_ID="$(cat "$pid")"
      if [[ $(ps -p "$TARGET_ID" -o comm=) =~ "java" ]]; then
        echo "stopping $command"
        # Keep the pid file when the signal could not be delivered.
        kill "$TARGET_ID" && rm -f "$pid"
      else
        echo "no $command to stop"
      fi
    else
      echo "no $command to stop"
    fi
    ;;

  (status)
    if [ -f "$pid" ]; then
      TARGET_ID="$(cat "$pid")"
      if [[ $(ps -p "$TARGET_ID" -o comm=) =~ "java" ]]; then
        echo "$command is running."
        exit 0
      else
        echo "$pid file is present but $command not running"
        exit 1
      fi
    else
      echo "$command not running."
      exit 2
    fi
    ;;

  (*)
    echo "$usage"
    exit 1
    ;;

esac
|
|
|
|
|
|
|
|
|