
Commit 3749a9e

derSascha authored and velvia committed
feat(jobmanager): Add cluster support and transfer context conf via akka (spark-jobserver#927)
context config
The job manager is now initialized with the cluster address and actor name as arguments. After joining the cluster, the context config is transferred via akka and the context is initialized. This fixes spark-jobserver#915.

spark master
The following config options can be set and will be used by spark-submit too:
- spark.master can be local[...], yarn, spark://... or mesos://...
- spark.submit.deployMode can be client or cluster

spark standalone cluster mode
Spark does not transfer your job server config, jar and log4j config. You need to copy them to each host, or add them to e.g. HDFS, and then set the following variable in your settings.sh: REMOTE_JOBSERVER_DIR. If you don't set the remote dir, files are transferred via spark-submit --files ... (this works fine with e.g. YARN).

embedded H2 database
Job server can now host the database instance for you:
- set spark.jobserver.startH2Server to true
- set spark.jobserver.sqldao.jdbc.url to "jdbc:h2:tcp://CLUSTER-IP:9092/h2-db;AUTO_RECONNECT=TRUE"

Akka interface
To run akka in a cluster (to interact with the remote job manager) add the following config:

    akka {
      remote.netty.tcp {
        hostname = "FRONT-END-IP"
      }
    }

This config ensures that akka binds to the right interface. The hostname option will be removed in the job manager config, and the job then detects the right interface.

Remote data files and jars
PR spark-jobserver#924 contains a solution to access files uploaded via the data API (/data). Jars and other binaries are already transferred via the SQL backend.

logging
Same behavior as before in client mode. Cluster mode uses log4j-cluster.properties (same config as the server options, but with log output to stderr instead of a logfile). This works well with YARN and spark standalone containers.

Other information:
Tested on a virtual cluster with YARN and spark standalone. Might work with Mesos too. This PR changes many files (constructor changes...). Code, test and doc changes are in their own commits to reduce the review complexity. Comments are welcome.

* cleanup(config): remove default broadcast factory (TorrentBroadcastFactory is already the default since Spark 1.2)
* feat(h2server): add embedded h2 server
* tests(streaming): handle interrupted exception
  * stop context after each test
  * handle interrupted exception (thrown at context stop)
* feat(deploy): context via akka and cluster mode. Refactor deploy mode configuration:
  * use spark.master and spark.submit.deployMode config everywhere
  * provide context config via akka
  * support cluster deployment
  * add config files to spark-submit
  * add master and deploy mode from config to spark-submit
  * output log to stderr in cluster container
  * support remote job server dir
* tests(deploy): context via akka and cluster mode
* misc(codecov): ignore test jobs in coverage report
* doc(cluster): add cluster deploy doc
* tests(jobmanager): add job manager tests
  * move actor tests from JobManagerSpec into JobManagerActorSpecs
  * add job manager tests in JobManagerSpec
* tests(jobserver): add job server tests
1 parent 8646810 commit 3749a9e

35 files changed: +927 -598 lines
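Before the per-file diffs, here is a minimal job server config sketch that only collects the cluster-mode options described in the commit message above. It is illustrative, not part of the commit: `CLUSTER-IP` and `FRONT-END-IP` are placeholders for your own database host and frontend interface, and whether you enable the embedded H2 server is a deployment-specific choice.

    spark {
      # spark.master may be local[...], yarn, spark://... or mesos://...
      master = yarn
      submit.deployMode = cluster

      jobserver {
        # optional: let the job server host the H2 instance (see "embedded H2 database" above)
        startH2Server = true
        sqldao.jdbc.url = "jdbc:h2:tcp://CLUSTER-IP:9092/h2-db;AUTO_RECONNECT=TRUE"
      }
    }

    # bind akka to an interface reachable from the cluster
    akka {
      remote.netty.tcp {
        hostname = "FRONT-END-IP"
      }
    }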

README.md

Lines changed: 4 additions & 4 deletions
@@ -6,7 +6,7 @@ spark-jobserver provides a RESTful interface for submitting and managing [Apache
 This repo contains the complete Spark job server project, including unit tests and deploy scripts.
 It was originally started at [Ooyala](http://www.ooyala.com), but this is now the main development repo.
 
-Other useful links: [Troubleshooting Tips](doc/troubleshooting.md), [Yarn tips](doc/yarn.md), [Mesos tips](doc/mesos.md), [JMX tips](doc/jmx.md).
+Other useful links: [Troubleshooting](doc/troubleshooting.md), [cluster](doc/cluster.md), [YARN client](doc/yarn.md), [YARN on EMR](doc/EMR.md), [Mesos](doc/mesos.md), [JMX tips](doc/jmx.md).
 
 Also see [Chinese docs / 中文](doc/chinese/job-server.md).
 
@@ -103,7 +103,7 @@ Spark Job Server is now included in Datastax Enterprise 4.8!
 - Kill running jobs via stop context and delete job
 - Separate jar uploading step for faster job startup
 - Asynchronous and synchronous job API. Synchronous API is great for low latency jobs!
-- Works with Standalone Spark as well as Mesos and yarn-client
+- Works with Standalone Spark as well as on [cluster](doc/cluster.md), [Mesos](doc/mesos.md), YARN [client](doc/yarn.md) and [on EMR](doc/EMR.md)
 - Job and jar info is persisted via a pluggable DAO interface
 - Named Objects (such as RDDs or DataFrames) to cache and retrieve RDDs or DataFrames by name, improving object sharing and reuse among jobs.
 - Supports Scala 2.10 and 2.11
@@ -568,6 +568,8 @@ curl -k --basic --user 'user:pw' https://localhost:8090/contexts
 
 ## Deployment
 
+See also running on [cluster](doc/cluster.md), [YARN client](doc/yarn.md), on [EMR](doc/EMR.md) and running on [Mesos](doc/mesos.md).
+
 ### Manual steps
 
 1. Copy `config/local.sh.template` to `<environment>.sh` and edit as appropriate. NOTE: be sure to set SPARK_VERSION if you need to compile against a different version.
@@ -906,8 +908,6 @@ To add to the underlying Hadoop configuration in a Spark context, add the hadoop
 
 For the exact context configuration parameters, see JobManagerActor docs as well as application.conf.
 
-Also see the [yarn doc](doc/yarn.md) for more tips.
-
 ### Other configuration settings
 
 For all of the Spark Job Server configuration settings, see `job-server/src/main/resources/application.conf`.

bin/manager_start.sh

Lines changed: 40 additions & 24 deletions
@@ -1,6 +1,6 @@
 #!/bin/bash
 # Script to start the job manager
-# args: <work dir for context> <cluster address> [proxy_user]
+# args: <master> <deployMode> <akkaAdress> <actorName> <workDir> [<proxyUser>]
 set -e
 
 get_abs_script_path() {
@@ -13,12 +13,8 @@ get_abs_script_path
 
 . $appdir/setenv.sh
 
-# Override logging options to provide per-context logging
-LOGGING_OPTS="-Dlog4j.configuration=file:$appdir/log4j-server.properties
-              -DLOG_DIR=$2"
-
 GC_OPTS="-XX:+UseConcMarkSweepGC
-         -verbose:gc -XX:+PrintGCTimeStamps -Xloggc:$appdir/gc.out
+         -verbose:gc -XX:+PrintGCTimeStamps
          -XX:MaxPermSize=512m
          -XX:+CMSClassUnloadingEnabled "
 
@@ -27,26 +23,46 @@ JAVA_OPTS="-XX:MaxDirectMemorySize=$MAX_DIRECT_MEMORY
 
 MAIN="spark.jobserver.JobManager"
 
-MESOS_OPTS=""
-if [ $1 == "mesos-cluster" ]; then
-  MESOS_OPTS="--master $MESOS_SPARK_DISPATCHER --deploy-mode cluster"
-  appdir=$REMOTE_JOBSERVER_DIR
-fi
+# copy files via spark-submit and read them from current (container) dir
+if [ $2 = "cluster" -a -z "$REMOTE_JOBSERVER_DIR" ]; then
+  SPARK_SUBMIT_OPTIONS="$SPARK_SUBMIT_OPTIONS
+    --master $1 --deploy-mode cluster
+    --conf spark.yarn.submit.waitAppCompletion=false
+    --files $appdir/log4j-cluster.properties,$conffile"
+  JAR_FILE="$appdir/spark-job-server.jar"
+  CONF_FILE=$(basename $conffile)
+  LOGGING_OPTS="-Dlog4j.configuration=log4j-cluster.properties"
 
-if [ ! -z $5 ]; then
-  cmd='$SPARK_HOME/bin/spark-submit --class $MAIN --driver-memory $JOBSERVER_MEMORY
-    --conf "spark.executor.extraJavaOptions=$LOGGING_OPTS"
-    --proxy-user $5
-    $MESOS_OPTS
-    --driver-java-options "$GC_OPTS $JAVA_OPTS $LOGGING_OPTS $CONFIG_OVERRIDES"
-    $appdir/spark-job-server.jar $2 $3 $4 $conffile'
+# use files in REMOTE_JOBSERVER_DIR
+elif [ $2 == "cluster" ]; then
+  SPARK_SUBMIT_OPTIONS="$SPARK_SUBMIT_OPTIONS
+    --master $1 --deploy-mode cluster
+    --conf spark.yarn.submit.waitAppCompletion=false"
+  JAR_FILE="$REMOTE_JOBSERVER_DIR/spark-job-server.jar"
+  CONF_FILE="$REMOTE_JOBSERVER_DIR/$(basename $conffile)"
+  LOGGING_OPTS="-Dlog4j.configuration=$REMOTE_JOBSERVER_DIR/log4j-cluster.properties"
+
+# client mode, use files from app dir
 else
-  cmd='$SPARK_HOME/bin/spark-submit --class $MAIN --driver-memory $JOBSERVER_MEMORY
-    --conf "spark.executor.extraJavaOptions=$LOGGING_OPTS"
-    --driver-java-options "$GC_OPTS $JAVA_OPTS $LOGGING_OPTS $CONFIG_OVERRIDES"
-    $MESOS_OPTS
-    $appdir/spark-job-server.jar $2 $3 $4 $conffile'
+  JAR_FILE="$appdir/spark-job-server.jar"
+  CONF_FILE="$conffile"
+  LOGGING_OPTS="-Dlog4j.configuration=file:$appdir/log4j-server.properties -DLOG_DIR=$5"
+  GC_OPTS="$GC_OPTS -Xloggc:$5/gc.out"
+fi
+
+if [ -n "$6" ]; then
+  SPARK_SUBMIT_OPTIONS="$SPARK_SUBMIT_OPTIONS --proxy-user $6"
+fi
+
+if [ -n "$JOBSERVER_KEYTAB" ]; then
+  SPARK_SUBMIT_OPTIONS="$SPARK_SUBMIT_OPTIONS --keytab $JOBSERVER_KEYTAB"
 fi
 
-eval $cmd
+cmd='$SPARK_HOME/bin/spark-submit --class $MAIN --driver-memory $JOBSERVER_MEMORY
+  --conf "spark.executor.extraJavaOptions=$LOGGING_OPTS"
+  $SPARK_SUBMIT_OPTIONS
+  --driver-java-options "$GC_OPTS $JAVA_OPTS $LOGGING_OPTS $CONFIG_OVERRIDES $SPARK_SUBMIT_JAVA_OPTIONS"
+  $JAR_FILE $3 $4 $CONF_FILE'
+
+eval $cmd 2>&1 > $5/spark-job-server.out
 
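For orientation, a hypothetical invocation of the reworked script, following the argument order documented in its header comment. The master URL, akka address, actor name, work dir and proxy user below are invented placeholders rather than values from this commit, and the akka address format is an assumption.

```
# hypothetical example: <master> <deployMode> <akkaAdress> <actorName> <workDir> [<proxyUser>]
./manager_start.sh yarn cluster \
    akka.tcp://JobServer@FRONT-END-IP:2552 \
    jobManager-example \
    /tmp/job-server/my-context \
    some-proxy-user
```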

bin/server_package.sh

Lines changed: 1 addition & 0 deletions
@@ -51,6 +51,7 @@ pushd "${bin}/.." > /dev/null
         bin/setenv.sh
         ${CONFIG_DIR}/${ENV}.conf
         config/shiro.ini
+        config/log4j-cluster.properties
         config/log4j-server.properties"
 
 rm -rf $WORK_DIR

build.sbt

Lines changed: 2 additions & 1 deletion
@@ -44,6 +44,7 @@ lazy val jobServerTestJar = Project(id = "job-server-tests", base = file("job-se
   .settings(noPublishSettings)
   .dependsOn(jobServerApi)
   .disablePlugins(SbtScalariform)
+  .disablePlugins(ScoverageSbtPlugin) // do not include in coverage report
 
 lazy val jobServerApi = Project(id = "job-server-api", base = file("job-server-api"))
   .settings(commonSettings)
@@ -274,7 +275,7 @@ lazy val commonSettings = Defaults.coreDefaultSettings ++ dirSettings ++ implici
 
 lazy val scoverageSettings = {
   // Semicolon-separated list of regexs matching classes to exclude
-  coverageExcludedPackages := ".+Benchmark.*"
+  coverageExcludedPackages := ".+Benchmark.*;.+Example.*;.+TestJob"
 }
 
 lazy val publishSettings = Seq(

doc/EMR.md

Lines changed: 2 additions & 0 deletions
@@ -1,5 +1,7 @@
 ## Step by step instruction on how to run Spark Job Server on EMR 4.2.0 (Spark 1.6.0)
 
+See also running in [cluster mode](cluster.md), running [YARN in client mode](yarn.md) and running on [Mesos](Mesos.md).
+
 ### Create EMR 4.2.0 cluster
 
 Create EMR cluster using AWS EMR console or aws cli.

doc/cluster.md

Lines changed: 66 additions & 0 deletions
@@ -0,0 +1,66 @@
+## Configuring Job Server for YARN cluster mode
+
+See also running [YARN in client mode](yarn.md), running [YARN on EMR](EMR.md) and running on [Mesos](mesos.md).
+
+### Job Server configuration
+
+Add the following properties in your job server config file:
+- set `spark.master` property to `yarn`, `spark://...` or `mesos://...`
+- set `spark.submit.deployMode` property to `cluster`
+- set `spark.jobserver.context-per-jvm` to `true`
+- set `akka.remote.netty.tcp.hostname` to the cluster interface of the host running the frontend
+- set `akka.remote.netty.tcp.maximum-frame-size` to support big remote jars fetch
+
+Optional / required in spark standalone mode:
+- set `REMOTE_JOBSERVER_DIR` to `hdfs://...`, `file://...` or `http://...` in your settings `xxx.sh`
+- copy `spark-job-server.jar`, your job server config and `log4j-cluster.properties` file into this location
+
+Example job server config (replace `CLUSTER-IP` with the internal IP of the host running the job server frontend):
+
+    spark {
+      # deploy in yarn cluster mode
+      master = yarn
+      submit.deployMode = cluster
+
+      jobserver {
+        context-per-jvm = true
+
+        # start a H2 DB server, reachable in your cluster
+        sqldao {
+          jdbc {
+            url = "jdbc:h2:tcp://CLUSTER-IP:9092/h2-db;AUTO_RECONNECT=TRUE"
+          }
+        }
+        startH2Server = false
+      }
+    }
+
+    # start akka on this interface, reachable from your cluster
+    akka {
+      remote.netty.tcp {
+        hostname = "CLUSTER-IP"
+
+        # This controls the maximum message size, including job results, that can be sent
+        maximum-frame-size = 100 MiB
+      }
+    }
+
+Note:
+- YARN transfers the files provided via `--files` submit option into the cluster / container. Spark standalone does not support this in cluster mode and you have to transfer them manually.
+- Instead of running a H2 DB instance you can also run a real DB reachable inside your cluster. You can't use the default (host only) H2 configuration in a cluster setup.
+- Akka binds by [default](../job-server/src/main/resources/application.conf) to the local host interface and is not reachable from the cluster. You need to configure the akka hostname to the cluster internal address.
+
+### Reading files uploaded via frontend
+
+Files uploaded via the data API (`/data`) are stored on your job server frontend host.
+Call the [DataFileCache](../job-server-api/src/main/scala/spark/jobserver/api/SparkJobBase.scala) API implemented by the job environment in your spark jobs to access them:
+
+```scala
+object RemoteDriverExample extends NewSparkJob {
+  def runJob(sc: SparkContext, runtime: JobEnvironment, data: JobData): JobOutput =
+    runtime.getDataFile(...)
+```
+
+The job server transfers the files via akka to the host running your driver and caches them there.
+
+Note: Files uploaded via the JAR or binary API are stored and transferred via the Job DB.

doc/mesos.md

Lines changed: 35 additions & 85 deletions
@@ -1,114 +1,64 @@
 ## Configuring Job Server for Mesos
 
+See also running on [cluster](cluster.md), YARN in [client mode](yarn.md) and running on [EMR](EMR.md).
+
 ### Mesos client mode
 
-Configuring job-server for Mesos cluster mode is straight forward. All you need to change is `spark.master` config to
+Configuring job-server for Mesos client mode is straightforward. All you need to change is `spark.master` config to
 point to Mesos master URL in job-server config file.
 
 Example config file (important settings are marked with # important):
 
     spark {
-      master = <mesos master URL here>  # important, example: mesos://mesos-master:5050
-
-      # Default # of CPUs for jobs to use for Spark standalone cluster
-      job-number-cpus = 4
-
-      jobserver {
-        port = 8090
-        jobdao = spark.jobserver.io.JobSqlDAO
-
-        sqldao {
-          # Directory where default H2 driver stores its data. Only needed for H2.
-          rootdir = /database
-
-          # Full JDBC URL / init string. Sorry, needs to match above.
-          # Substitutions may be used to launch job-server, but leave it out here in the default or tests won't pass
-          jdbc.url = "jdbc:h2:file:/database/h2-db"
-        }
-      }
-
-      # universal context configuration. These settings can be overridden, see README.md
-      context-settings {
-        num-cpu-cores = 2        # Number of cores to allocate. Required.
-        memory-per-node = 512m   # Executor memory per node, -Xmx style eg 512m, #1G, etc.
-      }
+      master = <mesos master URL here>  # example: mesos://mesos-master:5050
    }
 
-### Mesos cluster Mode
+### Mesos cluster mode
 
 Configuring job-server for Mesos cluster mode is a bit tricky as compared to client mode.
 
-Here is the checklist for the changes needed for the same:
-
-- You need to start Mesos dispatcher in your cluster by running `./sbin/start-mesos-dispatcher.sh` available in
+You need to start Mesos dispatcher in your cluster by running `./sbin/start-mesos-dispatcher.sh` available in
 spark package. This step is not specific to job-server and as mentioned in [official spark documentation](https://spark.apache.org/docs/latest/running-on-mesos.html#cluster-mode) this is needed
 to submit spark job in Mesos cluster mode.
 
-- Add following config at the end of job-server's settings.sh file:
-
-```
-REMOTE_JOBSERVER_DIR=<path to job-server directory> # copy job-server directory on this location on all mesos agent nodes
-MESOS_SPARK_DISPATCHER=<mesos dispatcher URL> # example: mesos://mesos-dispatcher:7077
-```
-
-- Set `spark.jobserver.driver-mode` property to `mesos-cluster` in job-server config file.
+Add the following config to your job-server config file:
+- set `spark.master` property to mesos dispatcher URL (example: `mesos://mesos-dispatcher:7077`)
+- set `spark.submit.deployMode` property to `cluster`
+- set `spark.jobserver.context-per-jvm` to `true`
+- set `akka.remote.netty.tcp.hostname` to the cluster interface of the host running the frontend
+- set `akka.remote.netty.tcp.maximum-frame-size` to support big remote jars fetch
 
-- Also override akka default configs in job-server config file to support big remote jars fetch, we have to set frame
-size to some large value, for example:
-
-```
-akka.remote.netty.tcp {
-  # use remote IP address to form akka cluster, not 127.0.0.1. This should be the IP of of the machine where the file
-  # resides. That means for each mesos agents (where job-server directory is copied on REMOTE_JOBSERVER_DIR path),
-  # the hostname should be the remote IP of that node.
-  #
-  hostname = "xxxxx"
-  # This controls the maximum message size, including job results, that can be sent
-  maximum-frame-size = 104857600b
-}
-```
-
-- set `spark.master` to Mesos master URL (and not mesos-dispatcher URL).
-
-- set `spark.jobserver.context-per-jvm` to `true` in job-server config file.
-
-Example config file (important settings are marked with # important):
+Example job server config (replace `CLUSTER-IP` with the internal IP of the host running the job server frontend):
 
     spark {
-      master = <mesos master URL here>  # important, example: mesos://mesos-master:5050
-
-      # Default # of CPUs for jobs to use for Spark standalone cluster
-      job-number-cpus = 4
+      master = <mesos dispatcher URL>  # example: mesos://mesos-dispatcher:7077
+      submit.deployMode = cluster
 
      jobserver {
-        port = 8090
-        driver-mode = mesos-cluster #important
-        context-per-jvm = true #important
-        jobdao = spark.jobserver.io.JobSqlDAO
-
-        sqldao {
-          # Directory where default H2 driver stores its data. Only needed for H2.
-          rootdir = /database
+        context-per-jvm = true
 
-          # Full JDBC URL / init string. Sorry, needs to match above.
-          # Substitutions may be used to launch job-server, but leave it out here in the default or tests won't pass
-          jdbc.url = "jdbc:h2:file:/database/h2-db"
+        # start a H2 DB server, reachable in your cluster
+        sqldao {
+          jdbc {
+            url = "jdbc:h2:tcp://CLUSTER-IP:9092/h2-db;AUTO_RECONNECT=TRUE"
+          }
        }
-      }
-
-      # universal context configuration. These settings can be overridden, see README.md
-      context-settings {
-        num-cpu-cores = 2        # Number of cores to allocate. Required.
-        memory-per-node = 512m   # Executor memory per node, -Xmx style eg 512m, #1G, etc.
+        startH2Server = false
      }
    }
 
-    akka.remote.netty.tcp {
-      # use remote IP address to form akka cluster, not 127.0.0.1. This should be the IP of of the machine where the file
-      # resides. That means for each mesos agents (where job-server directory is copied on REMOTE_JOBSERVER_DIR path),
-      # the hostname should be the remote IP of that node.
-      #
-      hostname = "xxxxx" #important
+    # start akka on this interface, reachable from your cluster
+    akka {
+      remote.netty.tcp {
+        hostname = "CLUSTER-IP"
 
        # This controls the maximum message size, including job results, that can be sent
-      maximum-frame-size = 104857600b #important
+        maximum-frame-size = 100 MiB
+      }
    }
+
+- Optional: Add the following config at the end of job-server's settings.sh file:
+
+```
+REMOTE_JOBSERVER_DIR=<path to job-server directory> # copy of job-server directory on all mesos agent nodes
+```

doc/yarn.md

Lines changed: 4 additions & 9 deletions
@@ -1,10 +1,6 @@
-## Configuring Job Server for YARN
+## Configuring Job Server for YARN in client mode with docker
 
-(Looking for contributors for this page)
-
-(I would like to thank Jon Buffington for sharing the config tips below.... @velvia)
-
-Note: This is for yarn with docker. If you are looking to deploy on a yarn cluster via EMR, then this link would be more useful [EMR](https://github.com/spark-jobserver/spark-jobserver/blob/master/doc/EMR.md)
+See also running in [cluster mode](cluster.md), running [YARN on EMR](EMR.md) and running on [Mesos](mesos.md).
 
 ### Configuring the Spark-Jobserver Docker package to run in Yarn-Client Mode
 
@@ -19,11 +15,10 @@ Files we need:
 - dockerfile
 - cluster-config directory with hdfs-site.xml and yarn-site.xml (You should have these files already)
 
-Example docker.conf (important settings are marked with # important):
+Example docker.conf:
 
    spark {
-      master = "yarn-client" # important
-      master = ${?SPARK_MASTER}
+      master = yarn
 
      # Default # of CPUs for jobs to use for Spark standalone cluster
      job-number-cpus = 4
