Commit b731636

Merge pull request #2 from riptano/DSP-5892-2
Jobserver Integration with DSE
2 parents (e160404 + a8405dd), commit b731636

7 files changed (+185, -15 lines)


bin/kill-process-tree.sh

Lines changed: 60 additions & 0 deletions
@@ -0,0 +1,60 @@
+#!/bin/bash
+
+if [ "$(which pgrep)" == "" ]; then
+  echo "pgrep is not available" >&2
+  exit 1
+fi
+
+if [ "$#" != "2" ]; then
+  echo "Syntax error, the expected usage is: kill-process-tree <signal> <process_id>" >&2
+  exit 1
+fi
+
+# This simple script kills a whole process tree. The first argument is a signal and the second
+# is the root process.
+parent=$2
+signal=$1
+
+# A string which will be populated with the descendant process ids
+pids="$parent"
+
+# Kills the given process if it is running. It also checks whether the given parameter contains a process ID.
+function kill_if_running() {
+  if [[ "$1" =~ [0-9]+ ]]; then
+    ps -e -o pid= | grep $1 > /dev/null
+    if [ $? -eq 0 ]; then
+      kill "-$signal" "$1"
+      return 0
+    else
+      return 1
+    fi
+  fi
+}
+
+# Populates pids with the descendant process ids
+function get_descendants_pids() {
+  for cpid in $(pgrep -P $1);
+  do
+    pids="$cpid $pids"
+    get_descendants_pids $cpid
+  done
+}
+
+get_descendants_pids $parent
+
+for pid in $pids
+do
+  if [ "$signal" == "" ]; then
+    echo "$pid"
+  else
+    kill_if_running $pid
+    if [ $? -eq 0 ]; then
+      # If the process has really been killed, wait for 3 seconds before going to the next
+      # process. In most cases, where there is a script execution hierarchy with a Java process
+      # at the bottom, it is sufficient to kill that Java process and the scripts will just exit
+      # in a natural way.
+      echo "Sent $signal to $pid, sleeping for 3 seconds"
+      sleep 3s
+    fi
+  fi
+done
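
Taken on its own, the new helper can be driven in two ways: an empty signal argument only prints the tree, anything else signals every process in it. A minimal usage sketch (the PID 12345 is purely illustrative):

# Print the PIDs of process 12345 and all of its descendants without signalling them
bin/kill-process-tree.sh "" 12345

# Send SIGTERM (signal 15) to 12345 and its whole descendant tree,
# sleeping 3 seconds after each process that was actually signalled
bin/kill-process-tree.sh 15 12345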

bin/server_package.sh

Lines changed: 2 additions & 1 deletion
@@ -44,8 +44,9 @@ fi
 FILES="job-server-extras/target/scala-$majorVersion/spark-job-server.jar
 bin/server_start.sh
 bin/server_stop.sh
+bin/kill-process-tree.sh
 $CONFIG_DIR/$ENV.conf
-config/log4j-server.properties"
+config/logback-server.xml"

 rm -rf $WORK_DIR
 mkdir -p $WORK_DIR

bin/server_start.sh

Lines changed: 11 additions & 9 deletions
@@ -6,7 +6,7 @@ set -e

 get_abs_script_path() {
   pushd . >/dev/null
-  cd $(dirname $0)
+  cd "$(dirname "$0")"
   appdir=$(pwd)
   popd >/dev/null
 }

@@ -26,14 +26,14 @@ JAVA_OPTS="-XX:MaxDirectMemorySize=512M

 MAIN="spark.jobserver.JobServer"

-conffile=$(ls -1 $appdir/*.conf | head -1)
+conffile="$(ls -1 "$appdir"/*.conf | head -1)"
 if [ -z "$conffile" ]; then
   echo "No configuration file found"
   exit 1
 fi

 if [ -f "$appdir/settings.sh" ]; then
-  . $appdir/settings.sh
+  . "$appdir/settings.sh"
 else
   echo "Missing $appdir/settings.sh, exiting"
   exit 1

@@ -46,7 +46,7 @@ fi

 pidFilePath=$appdir/$PIDFILE

-if [ -f "$pidFilePath" ] && kill -0 $(cat "$pidFilePath"); then
+if [ -f "$pidFilePath" ] && kill -0 "$(cat "$pidFilePath")"; then
   echo 'Job server is already running'
   exit 1
 fi

@@ -57,8 +57,9 @@ if [ -z "$LOG_DIR" ]; then
 fi
 mkdir -p $LOG_DIR

-LOGGING_OPTS="-Dlog4j.configuration=file:$appdir/log4j-server.properties
-  -DLOG_DIR=$LOG_DIR"
+LOGGING_OPTS="-DLOG_DIR=$LOG_DIR"
+
+export SPARK_SUBMIT_LOGBACK_CONF_FILE="$appdir/logback-server.xml"

 # For Mesos
 CONFIG_OVERRIDES=""

@@ -77,8 +78,9 @@ fi
 # This needs to be exported for standalone mode so drivers can connect to the Spark cluster
 export SPARK_HOME

-$SPARK_HOME/bin/spark-submit --class $MAIN --driver-memory $DRIVER_MEMORY \
+# DSE_BIN is set in settings.sh
+"$DSE_HOME/bin/dse" spark-submit --class "$MAIN" --driver-memory 5G \
   --conf "spark.executor.extraJavaOptions=$LOGGING_OPTS" \
   --driver-java-options "$GC_OPTS $JAVA_OPTS $LOGGING_OPTS $CONFIG_OVERRIDES" \
-  $@ $appdir/spark-job-server.jar $conffile 2>&1 &
-echo $! > $pidFilePath
+  "$@" "$appdir/spark-job-server.jar" "$conffile" 2>&1 &
+echo "$!" > "$pidFilePath"
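
Because the rewritten launch line places "$@" directly before the application jar, any extra arguments handed to server_start.sh are forwarded to dse spark-submit as submit options. A small sketch of that, run from the deployed directory; the option and value are only examples:

# Forward an extra spark-submit option through server_start.sh (2G is illustrative)
./server_start.sh --conf spark.executor.memory=2G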

bin/server_stop.sh

Lines changed: 8 additions & 4 deletions
@@ -3,26 +3,30 @@

 get_abs_script_path() {
   pushd . >/dev/null
-  cd $(dirname $0)
+  cd "$(dirname "$0")"
   appdir=$(pwd)
   popd >/dev/null
 }

 get_abs_script_path

 if [ -f "$appdir/settings.sh" ]; then
-  . $appdir/settings.sh
+  . "$appdir/settings.sh"
 else
   echo "Missing $appdir/settings.sh, exiting"
   exit 1
 fi

 pidFilePath=$appdir/$PIDFILE

-if [ ! -f "$pidFilePath" ] || ! kill -0 $(cat "$pidFilePath"); then
+if [ ! -f "$pidFilePath" ] || ! kill -0 "$(cat "$pidFilePath")"; then
   echo 'Job server not running'
 else
   echo 'Stopping job server...'
-  kill -15 $(cat "$pidFilePath") && rm -f "$pidFilePath"
+  PID="$(cat "$pidFilePath")"
+  "$(dirname "$0")"/kill-process-tree.sh 15 $PID && rm "$pidFilePath"
   echo '...job server stopped'
 fi
+
+
+

job-server/config/dse.conf

Lines changed: 58 additions & 0 deletions
@@ -0,0 +1,58 @@
+# Template for a Spark Job Server configuration file
+# When deployed, these settings are loaded when the job server starts
+#
+# Spark Cluster / Job Server configuration
+spark {
+  # The Spark master will be learned automatically via DSE
+  # spark.master will be passed to each job's JobContext
+  # master = "local[4]"
+  # master = "mesos://vm28-hulk-pub:5050"
+  # master = "yarn-client"
+
+  # Default # of CPUs for jobs to use for Spark standalone cluster
+  job-number-cpus = 4
+
+  jobserver {
+    port = 8090
+    jar-store-rootdir = /tmp/jobserver/jars
+
+    jobdao = spark.jobserver.io.JobFileDAO
+
+    filedao {
+      rootdir = /tmp/spark-job-server/filedao/data
+    }
+  }
+
+  # predefined Spark contexts
+  # contexts {
+  #   my-low-latency-context {
+  #     num-cpu-cores = 1           # Number of cores to allocate. Required.
+  #     memory-per-node = 512m      # Executor memory per node, -Xmx style, e.g. 512m, 1G, etc.
+  #   }
+  #   # define additional contexts here
+  # }
+
+  # Universal context configuration. These settings can be overridden, see README.md
+  context-settings {
+    num-cpu-cores = 2           # Number of cores to allocate. Required.
+    memory-per-node = 512m      # Executor memory per node, -Xmx style, e.g. 512m, 1G, etc.
+
+    # in case the Spark distribution should be accessed from HDFS (as opposed to being installed on every Mesos slave)
+    # spark.executor.uri = "hdfs://namenode:8020/apps/spark/spark.tgz"
+
+    # URIs of jars to be loaded into the classpath for this context. Either a string list, or a string separated by commas ','
+    # dependent-jar-uris = ["file:///some/path/present/in/each/mesos/slave/somepackage.jar"]
+
+    # If you wish to pass any settings directly to the sparkConf as-is, add them here in passthrough,
+    # such as hadoop connection settings that don't use the "spark." prefix
+    passthrough {
+      #es.nodes = "192.1.1.1"
+    }
+  }
+
+  # This needs to match SPARK_HOME for cluster SparkContexts to be created successfully
+  # home = "/home/spark/spark"
+}
+
+# Note that you can use this file to define settings not only for the job server,
+# but for your Spark jobs as well. Spark job configuration merges with this configuration file as defaults.
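
With port = 8090 from the template above, the deployed job server should answer on the standard spark-jobserver REST endpoints. A hedged interaction sketch, assuming the upstream /jars and /jobs routes; the jar file, app name, and job class below are placeholders:

# Upload an application jar under the app name "example"
curl --data-binary @my-job.jar http://localhost:8090/jars/example

# Start a job from that jar; com.example.WordCount stands in for a real job class
curl -d "" "http://localhost:8090/jobs?appName=example&classPath=com.example.WordCount"

# List the jobs the server knows about
curl http://localhost:8090/jobs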

job-server/config/dse.sh

Lines changed: 45 additions & 0 deletions
@@ -0,0 +1,45 @@
+# DataStax Distribution Config
+# Environment and deploy file
+# For use with bin/server_deploy, bin/server_package etc.
+
+APP_USER=cassandra
+APP_GROUP=cassandra
+
+# Check the home directory,
+# the relative tar location, and
+# the package location for dse-env.sh to get environment variables
+if [ -z "$DSE_ENV" ]; then
+  for include in "$HOME/.dse-env.sh" \
+                 "`dirname "$0"`/../../../bin/dse-env.sh" \
+                 "/etc/dse/dse-env.sh"; do
+    if [ -r "$include" ]; then
+      DSE_ENV="$include"
+      break
+    fi
+  done
+fi
+
+# ENV is set by the build script server_package. If it isn't set, then we need
+# to be able to read DSE_ENV to set the Spark env variables
+if [ -z "$DSE_ENV" ] && [ -z "$ENV" ]; then
+  echo "DSE_ENV could not be determined."
+  exit 1
+elif [ -r "$DSE_ENV" ]; then
+  . "$DSE_ENV"
+elif [ -z "$ENV" ]; then
+  echo "Location pointed by DSE_ENV not readable: $DSE_ENV"
+  exit 1
+fi
+
+SPARK_VERSION=1.3.1.0 # Last digit is DSE specific
+
+DEPLOY_HOSTS="localhost"
+
+INSTALL_DIR="$DSE_COMPONENTS_ROOT/spark/spark-jobserver"
+LOG_DIR=/var/log/spark/job-server
+
+PIDFILE=spark-jobserver.pid
+
+SPARK_CONF_DIR=${SPARK_CONF_DIR:-"$SPARK_HOME/conf"}
+
+SCALA_VERSION=2.10.5 # or 2.11.6
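
The dse.sh / dse.conf pair follows the job server's convention of one <environment>.sh plus <environment>.conf per deployment (server_package.sh above copies "$CONFIG_DIR/$ENV.conf" into the tarball), so building the DSE package amounts to selecting that environment. A sketch, assuming server_package.sh keeps the stock spark-jobserver calling convention of taking the environment name as its argument:

# Package the job server for DSE; "dse" selects config/dse.sh and config/dse.conf
# (argument convention assumed from upstream spark-jobserver)
bin/server_package.sh dse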

version.sbt

Lines changed: 1 addition & 1 deletion
@@ -1 +1 @@
-version in ThisBuild := "0.5.2-SNAPSHOT"
+version in ThisBuild := "0.5.1.155"
