running-on-yarn.md

layout: global
title: Launching Spark on YARN
SPARK_HADOOP_VERSION=2.0.5-alpha SPARK_YARN=true sbt/sbt assembly
SPARK_JAR=<SPARK_ASSEMBLY_JAR_FILE> ./bin/spark-class org.apache.spark.deploy.yarn.Client \
  --jar <YOUR_APP_JAR_FILE> \
  --class <APP_MAIN_CLASS> \
  --arg <APP_MAIN_ARGUMENT> \
  --num-executors <NUMBER_OF_EXECUTOR_PROCESSES> \
  --driver-memory <MEMORY_FOR_APPLICATION_MASTER> \
  --executor-memory <MEMORY_PER_EXECUTOR> \
  --executor-cores <CORES_PER_EXECUTOR> \
  --name <application_name> \
  --queue <queue_name> \
  --addJars <any_local_files_used_in_SparkContext.addJar> \
  --files <files_for_distributed_cache> \
  --archives <archives_for_distributed_cache>
# Build the Spark assembly JAR and the Spark examples JAR
$ SPARK_HADOOP_VERSION=2.0.5-alpha SPARK_YARN=true sbt/sbt assembly

# Configure logging
$ cp conf/log4j.properties.template conf/log4j.properties

# Submit Spark's ApplicationMaster to YARN's ResourceManager, and instruct Spark to run the SparkPi example
$ SPARK_JAR=./assembly/target/scala-{{site.SCALA_BINARY_VERSION}}/spark-assembly-{{site.SPARK_VERSION}}-hadoop2.0.5-alpha.jar \
    ./bin/spark-class org.apache.spark.deploy.yarn.Client \
      --jar examples/target/scala-{{site.SCALA_BINARY_VERSION}}/spark-examples-assembly-{{site.SPARK_VERSION}}.jar \
      --class org.apache.spark.examples.SparkPi \
      --arg yarn-cluster \
      --arg 5 \
      --num-executors 3 \
      --driver-memory 4g \
      --executor-memory 2g \
      --executor-cores 1