diff --git a/app/com/linkedin/drelephant/spark/fetchers/SparkRestClient.scala b/app/com/linkedin/drelephant/spark/fetchers/SparkRestClient.scala
index 20ec8cbb9..072a0ff8e 100644
--- a/app/com/linkedin/drelephant/spark/fetchers/SparkRestClient.scala
+++ b/app/com/linkedin/drelephant/spark/fetchers/SparkRestClient.scala
@@ -95,13 +95,20 @@ class SparkRestClient(sparkConf: SparkConf) {
           getLogData(attemptTarget)
         }
       } else Future.successful(None)
+      val futureFailedTasks = if (fetchFailedTasks) {
+        Future {
+          getStagesWithFailedTasks(attemptTarget)
+        }
+      } else {
+        Future.successful(Seq.empty)
+      }
       SparkRestDerivedData(
         applicationInfo,
         Await.result(futureJobDatas, DEFAULT_TIMEOUT),
         Await.result(futureStageDatas, DEFAULT_TIMEOUT),
         Await.result(futureExecutorSummaries, Duration(5, SECONDS)),
-        Seq.empty,
+        Await.result(futureFailedTasks, DEFAULT_TIMEOUT),
         Await.result(futureLogData, Duration(5, SECONDS))
       )
@@ -211,7 +218,7 @@ class SparkRestClient(sparkConf: SparkConf) {
   }
   private def getStageDatas(attemptTarget: WebTarget): Seq[StageDataImpl] = {
-    val target = attemptTarget.path("stages")
+    val target = attemptTarget.path("stages/withSummaries")
     try {
       get(target, SparkRestObjectMapper.readValue[Seq[StageDataImpl]])
     } catch {
diff --git a/app/com/linkedin/drelephant/spark/fetchers/statusapiv1/statusapiv1.scala b/app/com/linkedin/drelephant/spark/fetchers/statusapiv1/statusapiv1.scala
index 808a3f4b0..dfd20e43e 100644
--- a/app/com/linkedin/drelephant/spark/fetchers/statusapiv1/statusapiv1.scala
+++ b/app/com/linkedin/drelephant/spark/fetchers/statusapiv1/statusapiv1.scala
@@ -143,11 +143,17 @@ trait StageData{
   def status: StageStatus
   def stageId: Int
   def attemptId: Int
+  def numTasks: Int
   def numActiveTasks: Int
   def numCompleteTasks: Int
   def numFailedTasks: Int
   def executorRunTime: Long
+  def executorCpuTime: Long
+  def submissionTime: Option[Date]
+  def firstTaskLaunchedTime: Option[Date]
+  def completionTime: Option[Date]
+  def failureReason: Option[String]
   def inputBytes: Long
   def inputRecords: Long
@@ -166,7 +172,14 @@ trait StageData{
   def accumulatorUpdates: Seq[AccumulableInfo]
   def tasks: Option[Map[Long, TaskDataImpl]]
-  def executorSummary: Option[Map[String, ExecutorStageSummary]]}
+  def executorSummary: Option[Map[String, ExecutorStageSummary]]
+
+  def peakJvmUsedMemory: Option[Long]
+  def peakExecutionMemory: Option[Long]
+  def peakStorageMemory: Option[Long]
+  def peakUnifiedMemory: Option[Long]
+  def taskSummary : Option[TaskMetricDistributions]
+  def executorMetricsSummary : Option[ExecutorMetricDistributions]}
 trait TaskData{
   def taskId: Long
@@ -219,10 +232,15 @@ trait TaskMetricDistributions{
   def quantiles: IndexedSeq[Double]
   def executorDeserializeTime: IndexedSeq[Double]
+  def executorDeserializeCpuTime: IndexedSeq[Double]
   def executorRunTime: IndexedSeq[Double]
+  def executorCpuTime: IndexedSeq[Double]
   def resultSize: IndexedSeq[Double]
   def jvmGcTime: IndexedSeq[Double]
   def resultSerializationTime: IndexedSeq[Double]
+  def gettingResultTime: IndexedSeq[Double]
+  def schedulerDelay: IndexedSeq[Double]
+  def peakExecutionMemory: IndexedSeq[Double]
   def memoryBytesSpilled: IndexedSeq[Double]
   def diskBytesSpilled: IndexedSeq[Double]
@@ -246,6 +264,7 @@ trait ShuffleReadMetricDistributions{
   def localBlocksFetched: IndexedSeq[Double]
   def fetchWaitTime: IndexedSeq[Double]
   def remoteBytesRead: IndexedSeq[Double]
+  def remoteBytesReadToDisk: IndexedSeq[Double]
   def totalBlocksFetched: IndexedSeq[Double]}
 trait ShuffleWriteMetricDistributions{
@@ -253,6 +272,25 @@ trait ShuffleWriteMetricDistributions{
   def writeRecords: IndexedSeq[Double]
   def writeTime: IndexedSeq[Double]}
+trait ExecutorMetricDistributions{
+  def quantiles: IndexedSeq[Double]
+  def numTasks: IndexedSeq[Double]
+  def inputBytes : IndexedSeq[Double]
+  def inputRecords : IndexedSeq[Double]
+  def outputBytes : IndexedSeq[Double]
+  def outputRecords : IndexedSeq[Double]
+  def shuffleRead : IndexedSeq[Double]
+  def shuffleReadRecords : IndexedSeq[Double]
+  def shuffleWrite : IndexedSeq[Double]
+  def shuffleWriteRecords : IndexedSeq[Double]
+  def memoryBytesSpilled : IndexedSeq[Double]
+  def diskBytesSpilled : IndexedSeq[Double]
+  def peakJvmUsedMemory : IndexedSeq[Double]
+  def peakExecutionMemory : IndexedSeq[Double]
+  def peakStorageMemory : IndexedSeq[Double]
+  def peakUnifiedMemory : IndexedSeq[Double]}
+
 trait AccumulableInfo{
   def id: Long
   def name: String
@@ -353,11 +391,17 @@ class StageDataImpl(
   var status: StageStatus,
   var stageId: Int,
   var attemptId: Int,
+  var numTasks: Int,
   var numActiveTasks: Int,
   var numCompleteTasks: Int,
   var numFailedTasks: Int,
   var executorRunTime: Long,
+  var executorCpuTime: Long,
+  var submissionTime: Option[Date],
+  var firstTaskLaunchedTime: Option[Date],
+  var completionTime: Option[Date],
+  var failureReason: Option[String],
   var inputBytes: Long,
   var inputRecords: Long,
@@ -376,7 +420,13 @@ class StageDataImpl(
   var accumulatorUpdates: Seq[AccumulableInfoImpl],
   var tasks: Option[Map[Long, TaskDataImpl]],
-  var executorSummary: Option[Map[String, ExecutorStageSummaryImpl]]) extends StageData
+  var executorSummary: Option[Map[String, ExecutorStageSummaryImpl]],
+  var peakJvmUsedMemory: Option[Long],
+  var peakExecutionMemory: Option[Long],
+  var peakStorageMemory: Option[Long],
+  var peakUnifiedMemory: Option[Long],
+  var taskSummary : Option[TaskMetricDistributionsImpl],
+  var executorMetricsSummary : Option[ExecutorMetricDistributionsImpl]) extends StageData
 class TaskDataImpl(
   var taskId: Long,
@@ -427,12 +477,16 @@ class ShuffleWriteMetricsImpl(
 class TaskMetricDistributionsImpl(
   var quantiles: IndexedSeq[Double],
-  var executorDeserializeTime: IndexedSeq[Double],
+  var executorDeserializeCpuTime: IndexedSeq[Double],
   var executorRunTime: IndexedSeq[Double],
+  var executorCpuTime: IndexedSeq[Double],
   var resultSize: IndexedSeq[Double],
   var jvmGcTime: IndexedSeq[Double],
   var resultSerializationTime: IndexedSeq[Double],
+  var gettingResultTime: IndexedSeq[Double],
+  var schedulerDelay: IndexedSeq[Double],
+  var peakExecutionMemory: IndexedSeq[Double],
   var memoryBytesSpilled: IndexedSeq[Double],
   var diskBytesSpilled: IndexedSeq[Double],
@@ -456,6 +510,7 @@ class ShuffleReadMetricDistributionsImpl(
   var localBlocksFetched: IndexedSeq[Double],
   var fetchWaitTime: IndexedSeq[Double],
   var remoteBytesRead: IndexedSeq[Double],
+  var remoteBytesReadToDisk: IndexedSeq[Double],
   var totalBlocksFetched: IndexedSeq[Double]) extends ShuffleReadMetricDistributions
 class ShuffleWriteMetricDistributionsImpl(
@@ -468,3 +523,21 @@ class AccumulableInfoImpl(
   var name: String,
   var update: Option[String],
   var value: String) extends AccumulableInfo
+
+class ExecutorMetricDistributionsImpl(
+  var quantiles: IndexedSeq[Double],
+  var numTasks: IndexedSeq[Double],
+  var inputBytes : IndexedSeq[Double],
+  var inputRecords : IndexedSeq[Double],
+  var outputBytes : IndexedSeq[Double],
+  var outputRecords : IndexedSeq[Double],
+  var shuffleRead : IndexedSeq[Double],
+  var shuffleReadRecords : IndexedSeq[Double],
+  var shuffleWrite : IndexedSeq[Double],
+  var shuffleWriteRecords : IndexedSeq[Double],
+  var memoryBytesSpilled : IndexedSeq[Double],
+  var diskBytesSpilled : IndexedSeq[Double],
+  var peakJvmUsedMemory : IndexedSeq[Double],
+  var peakExecutionMemory : IndexedSeq[Double],
+  var peakStorageMemory : IndexedSeq[Double],
+  var peakUnifiedMemory : IndexedSeq[Double]) extends ExecutorMetricDistributions
diff --git a/app/com/linkedin/drelephant/spark/heuristics/ConfigurationParameterAdjustment.scala b/app/com/linkedin/drelephant/spark/heuristics/ConfigurationParameterAdjustment.scala
new file mode 100644
index 000000000..907c7ec72
--- /dev/null
+++ b/app/com/linkedin/drelephant/spark/heuristics/ConfigurationParameterAdjustment.scala
@@ -0,0 +1,67 @@
+package com.linkedin.drelephant.spark.heuristics
+
+/**
+ * Adjustments to configuration parameters for fixing flagged issues.
+ */
+private[heuristics] sealed trait ConfigurationParameterAdjustment[T] {
+
+  /**
+   * Determine if the value should be adjusted.
+   *
+   * @param value the value to adjust.
+   * @return true if the value should be adjusted, false otherwise.
+   */
+  def canAdjust(value: T): Boolean
+
+  /** Adjust the value.
+   *
+   * @param value the value to adjust.
+   * @return the adjusted recommended value.
+   */
+  def adjust(value: T): T
+}
+
+/** If the number of cores is greater than the threshold, then divide by divisor. */
+private[heuristics] case class CoreDivisorAdjustment(
+    threshold: Int,
+    divisor: Double) extends ConfigurationParameterAdjustment[Int] {
+  override def canAdjust(numCores: Int): Boolean = (numCores > threshold)
+  override def adjust(numCores: Int): Int = Math.ceil(numCores / divisor).toInt
+}
+
+/** Set the number of cores to threshold, if the number of cores is greater. */
+private[heuristics] case class CoreSetAdjustment(
+    threshold: Int) extends ConfigurationParameterAdjustment[Int] {
+  override def canAdjust(numCores: Int): Boolean = (numCores > threshold)
+  override def adjust(numCores: Int): Int = threshold
+}
+
+/** If the memory is less than the threshold, then multiply by multiplier. */
+private[heuristics] case class MemoryMultiplierAdjustment(
+    threshold: Long,
+    multiplier: Double) extends ConfigurationParameterAdjustment[Long] {
+  override def canAdjust(memBytes: Long): Boolean = (memBytes < threshold)
+  override def adjust(memBytes: Long): Long = (memBytes * multiplier).toLong
+}
+
+/** If the memory is less than the threshold, then set to the threshold. */
+private[heuristics] case class MemorySetAdjustment(
+    threshold: Long) extends ConfigurationParameterAdjustment[Long] {
+  override def canAdjust(memBytes: Long): Boolean = (memBytes < threshold)
+  override def adjust(memBytes: Long): Long = threshold
+}
+
+/** If the number of partitions is less than the threshold, then multiply by multiplier. */
+private[heuristics] case class PartitionMultiplierAdjustment(
+    threshold: Int,
+    multiplier: Double) extends ConfigurationParameterAdjustment[Int] {
+  override def canAdjust(numPartitions: Int): Boolean = (numPartitions < threshold)
+  override def adjust(numPartitions: Int): Int = (numPartitions * multiplier).toInt
+}
+
+/** If the number of partitions is less than the threshold, then set to threshold. */
+private[heuristics] case class PartitionSetAdjustment(
+    threshold: Int) extends ConfigurationParameterAdjustment[Int] {
+  override def canAdjust(numPartitions: Int): Boolean = (numPartitions < threshold)
+  override def adjust(numPartitions: Int): Int = threshold
+}
diff --git a/app/com/linkedin/drelephant/spark/heuristics/ConfigurationParametersHeuristic.scala b/app/com/linkedin/drelephant/spark/heuristics/ConfigurationParametersHeuristic.scala
new file mode 100644
index 000000000..b791b61bb
--- /dev/null
+++ b/app/com/linkedin/drelephant/spark/heuristics/ConfigurationParametersHeuristic.scala
@@ -0,0 +1,603 @@
+/*
+ * Copyright 2016 LinkedIn Corp.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License"); you may not
+ * use this file except in compliance with the License. You may obtain a copy of
+ * the License at
+ *
+ *    http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
+ * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
+ * License for the specific language governing permissions and limitations under
+ * the License.
+ */
+
+package com.linkedin.drelephant.spark.heuristics
+
+import com.linkedin.drelephant.analysis._
+import com.linkedin.drelephant.configurations.heuristic.HeuristicConfigurationData
+import com.linkedin.drelephant.spark.data.SparkApplicationData
+import com.linkedin.drelephant.spark.fetchers.statusapiv1.{ExecutorSummary, TaskDataImpl}
+
+import scala.collection.JavaConverters
+import scala.collection.mutable.ArrayBuffer
+
+/**
+ * A heuristic for recommending configuration parameter values, based on metrics from the application run.
+ * @param heuristicConfigurationData the configuration data for this heuristic.
+ */
+class ConfigurationParametersHeuristic(private val heuristicConfigurationData: HeuristicConfigurationData)
+  extends Heuristic[SparkApplicationData] {
+
+  import JavaConverters._
+  import ConfigurationParametersHeuristic._
+  import ConfigurationUtils._
+
+  // the maximum number of recommended partitions
+  private val maxRecommendedPartitions = heuristicConfigurationData.getParamMap
+    .getOrDefault(MAX_RECOMMENDED_PARTITIONS_KEY, DEFAULT_MAX_RECOMMENDED_PARTITIONS).toInt
+
+  override def getHeuristicConfData(): HeuristicConfigurationData = heuristicConfigurationData
+
+  override def apply(data: SparkApplicationData): HeuristicResult = {
+
+    lazy val appConfigurationProperties: Map[String, String] =
+      data.appConfigurationProperties
+
+    val evaluator = new Evaluator(this, data)
+
+    // add current configuration parameter values, and recommended parameter values to the result.
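
For illustration only (not part of the patch): the adjustment classes above share a small canAdjust/adjust contract. A minimal usage sketch, with made-up values:

    // doubles any executor memory below the 4GB threshold
    val adjustment = MemoryMultiplierAdjustment(threshold = 4L << 30, multiplier = 2.0)
    val currentMemory = 2L << 30 // 2GB
    // canAdjust is always consulted before adjust is applied
    val recommended =
      if (adjustment.canAdjust(currentMemory)) adjustment.adjust(currentMemory)
      else currentMemory
    // recommended == 4L << 30 (4GB), since 2GB is below the threshold
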
+    var resultDetails = ArrayBuffer(
+      new HeuristicResultDetails("Current spark.executor.memory",
+        bytesToString(evaluator.sparkExecutorMemory)),
+      new HeuristicResultDetails("Current spark.driver.memory",
+        bytesToString(evaluator.sparkDriverMemory)),
+      new HeuristicResultDetails("Current spark.executor.cores", evaluator.sparkExecutorCores.toString),
+      new HeuristicResultDetails("Current spark.driver.cores", evaluator.sparkDriverCores.toString),
+      new HeuristicResultDetails("Current spark.memory.fraction", evaluator.sparkMemoryFraction.toString))
+    evaluator.sparkExecutorInstances.foreach { numExecutors =>
+      resultDetails += new HeuristicResultDetails("Current spark.executor.instances", numExecutors.toString)
+    }
+    evaluator.sparkExecutorMemoryOverhead.foreach { memOverhead =>
+      resultDetails += new HeuristicResultDetails("Current spark.yarn.executor.memoryOverhead",
+        bytesToString(memOverhead))
+    }
+    evaluator.sparkDriverMemoryOverhead.foreach { memOverhead =>
+      resultDetails += new HeuristicResultDetails("Current spark.yarn.driver.memoryOverhead",
+        bytesToString(memOverhead))
+    }
+
+    resultDetails ++= Seq(
+      new HeuristicResultDetails("Current spark.sql.shuffle.partitions", evaluator.sparkSqlShufflePartitions.toString),
+      new HeuristicResultDetails("Recommended spark.executor.cores", evaluator.recommendedExecutorCores.toString),
+      new HeuristicResultDetails("Recommended spark.executor.memory",
+        bytesToString(evaluator.recommendedExecutorMemory)),
+      new HeuristicResultDetails("Recommended spark.memory.fraction", evaluator.recommendedMemoryFraction.toString),
+      new HeuristicResultDetails("Recommended spark.sql.shuffle.partitions", evaluator.recommendedNumPartitions.toString),
+      new HeuristicResultDetails("Recommended spark.driver.cores", evaluator.recommendedDriverCores.toString),
+      new HeuristicResultDetails("Recommended spark.driver.memory",
+        bytesToString(evaluator.recommendedDriverMemory))
+    )
+    evaluator.recommendedExecutorInstances.foreach { numExecutors =>
+      resultDetails += new HeuristicResultDetails("Recommended spark.executor.instances", numExecutors.toString)
+    }
+    evaluator.recommendedExecutorMemoryOverhead.foreach { memoryOverhead =>
+      resultDetails += new HeuristicResultDetails("Recommended spark.yarn.executor.memoryOverhead",
+        bytesToString(memoryOverhead))
+    }
+    evaluator.recommendedDriverMemoryOverhead.foreach { memoryOverhead =>
+      resultDetails += new HeuristicResultDetails("Recommended spark.yarn.driver.memoryOverhead",
+        bytesToString(memoryOverhead))
+    }
+    if (evaluator.stageDetails.getValue.length > 0) {
+      resultDetails += evaluator.stageDetails
+    }
+
+    new HeuristicResult(
+      heuristicConfigurationData.getClassName,
+      heuristicConfigurationData.getHeuristicName,
+      evaluator.severity,
+      evaluator.score,
+      resultDetails.asJava
+    )
+  }
+}
+
+object ConfigurationParametersHeuristic {
+  import ConfigurationUtils._
+
+  /**
+   * Evaluate the metrics for a given Spark application, and determine recommended configuration
+   * parameter values.
+   *
+   * @param configurationParametersHeuristic configuration parameters heuristic
+   * @param data Spark application data
+   */
+  class Evaluator(
+      configurationParametersHeuristic: ConfigurationParametersHeuristic,
+      data: SparkApplicationData) {
+    lazy val appConfigurationProperties: Map[String, String] =
+      data.appConfigurationProperties
+
+    // current configuration parameters
+    lazy val sparkExecutorMemory = stringToBytes(
+      appConfigurationProperties.get(SPARK_EXECUTOR_MEMORY)
+        .getOrElse(SPARK_EXECUTOR_MEMORY_DEFAULT))
+    lazy val sparkDriverMemory = stringToBytes(appConfigurationProperties
+      .get(SPARK_DRIVER_MEMORY).getOrElse(SPARK_DRIVER_MEMORY_DEFAULT))
+    lazy val sparkExecutorCores = appConfigurationProperties
+      .get(SPARK_EXECUTOR_CORES).map(_.toInt).getOrElse(SPARK_EXECUTOR_CORES_DEFAULT)
+    lazy val sparkDriverCores = appConfigurationProperties
+      .get(SPARK_DRIVER_CORES).map(_.toInt).getOrElse(SPARK_DRIVER_CORES_DEFAULT)
+    lazy val sparkMemoryFraction = appConfigurationProperties
+      .get(SPARK_MEMORY_FRACTION).map(_.toDouble).getOrElse(SPARK_MEMORY_FRACTION_DEFAULT)
+    lazy val sparkSqlShufflePartitions = appConfigurationProperties
+      .get(SPARK_SQL_SHUFFLE_PARTITIONS).map(_.toInt).getOrElse(SPARK_SQL_SHUFFLE_PARTITIONS_DEFAULT)
+    lazy val sparkExecutorInstances = appConfigurationProperties
+      .get(SPARK_EXECUTOR_INSTANCES).map(_.toInt)
+    lazy val sparkExecutorMemoryOverhead = appConfigurationProperties
+      .get(SPARK_EXECUTOR_MEMORY_OVERHEAD).map(stringToBytes(_))
+    lazy val sparkDriverMemoryOverhead = appConfigurationProperties
+      .get(SPARK_DRIVER_MEMORY_OVERHEAD).map(stringToBytes(_))
+
+    // from observation of user applications, adjusting spark.memory.fraction has not had
+    // much benefit, so always set to the default value.
+    val recommendedMemoryFraction: Double = SPARK_MEMORY_FRACTION_DEFAULT
+
+    // recommended executor configuration values, whose recommended values will be
+    // adjusted as various metrics are analyzed. Initialize to current values.
+    var recommendedNumPartitions: Int = sparkSqlShufflePartitions
+    var recommendedExecutorMemory: Long = sparkExecutorMemory
+    var recommendedExecutorCores: Int = sparkExecutorCores
+
+    // TODO: adjust when there is more information about total container memory usage
+    val recommendedDriverMemoryOverhead: Option[Long] = sparkDriverMemoryOverhead
+
+    private lazy val executorSummaries: Seq[ExecutorSummary] = data.executorSummaries
+    private lazy val driver: ExecutorSummary = executorSummaries.find(_.id == "driver").getOrElse(null)
+
+    if (driver == null) {
+      throw new Exception("No driver found!")
+    }
+
+    val currentParallelism = sparkExecutorInstances.map(_ * sparkExecutorCores)
+
+    val jvmUsedMemoryHeuristic =
+      new JvmUsedMemoryHeuristic(configurationParametersHeuristic.heuristicConfigurationData)
+    val jvmUsedMemoryEvaluator = new JvmUsedMemoryHeuristic.Evaluator(jvmUsedMemoryHeuristic, data)
+
+    val executorGcHeuristic =
+      new ExecutorGcHeuristic(configurationParametersHeuristic.heuristicConfigurationData)
+    val executorGcEvaluator = new ExecutorGcHeuristic.Evaluator(executorGcHeuristic, data)
+    val executorGcSeverity = executorGcEvaluator.severityTimeA
+
+    val stageAnalyzer =
+      new StagesAnalyzer(configurationParametersHeuristic.heuristicConfigurationData, data)
+    val stageAnalysis = stageAnalyzer.getStageAnalysis()
+
+    // check for long running tasks, and increase number of partitions if applicable
+    adjustParametersForLongTasks()
+
+    // check for execution memory spill for any stages, and adjust memory, cores, and
+    // number of partitions
+    adjustParametersForExecutionMemorySpill()
+
+    // check for too much time in GC or OOM, and adjust memory, cores, number of partitions
+    if (hasOOMorGC()) {
+      adjustParametersForGCandOOM()
+    } else {
+      // check if executor memory can be lowered
+      adjustExecutorMemory()
+    }
+
+    // check to see if the number of executor instances should be adjusted
+    val recommendedExecutorInstances = calculateExecutorInstances()
+
+    // check to see if the executor memory overhead should be adjusted
+    val recommendedExecutorMemoryOverhead = calculateExecutorMemoryOverhead()
+
+    // adjust driver configuration parameters
+    val (recommendedDriverCores, recommendedDriverMemory, driverSeverity, driverScore) =
+      adjustDriverParameters()
+
+    // stage level information and recommendations
+    private val stageDetailsStr = stageAnalysis.flatMap { analysis =>
+      analysis.taskFailureResult.details ++ analysis.stageFailureResult.details ++
+        analysis.taskSkewResult.details ++ analysis.longTaskResult.details ++
+        analysis.executionMemorySpillResult.details ++ analysis.stageGCResult.details
+    }.toArray.mkString("\n")
+    val stageDetails = new HeuristicResultDetails("stage details", stageDetailsStr)
+
+    val score = stageAnalysis.map(_.getStageAnalysisResults.map(_.score).sum).sum +
+      executorGcEvaluator.score + jvmUsedMemoryEvaluator.score + driverScore
+
+    val severity = Severity.max(calculateStageSeverity(stageAnalysis), executorGcSeverity,
+      jvmUsedMemoryEvaluator.severity, driverSeverity)
+
+
+    /**
+     * If there are any long tasks, calculate a good value for the number of partitions
+     * to decrease run time.
+     */
+    private def adjustParametersForLongTasks() = {
+      // Adjusting spark.sql.shuffle.partitions is only useful if a stage with long tasks is
+      // using this value to determine the number of tasks, so check that the number of tasks
+      // matches this value. Also, if the stage is reading input data, the number of tasks will be
+      // determined by DaliSpark.SPLIT_SIZE, so filter out these stages as well.
+      // As part of the stage analysis, information about these special cases is recorded, and
+      // the information can be returned to the user, so that they can modify their application.
+      if (stageAnalysis.exists(analysis => hasSignificantSeverity(analysis.longTaskResult.severity))) {
+        val medianDurations = stageAnalysis.filter { stageInfo =>
+          stageInfo.inputBytes == 0 && stageInfo.numTasks == sparkSqlShufflePartitions
+        }.map(_.medianRunTime.map(_.toLong).getOrElse(0L))
+        val maxMedianDuration = if (medianDurations.size > 0) {
+          medianDurations.max
+        } else {
+          0L
+        }
+        recommendedNumPartitions = Math.max(recommendedNumPartitions,
+          Math.min(DEFAULT_MAX_RECOMMENDED_PARTITIONS.toInt,
+            (sparkSqlShufflePartitions * maxMedianDuration / DEFAULT_TARGET_TASK_DURATION.toLong).toInt))
+      }
+    }
+
+    /**
+     * Examine stages for execution memory spill, and adjust cores, memory and partitions
+     * to try to keep execution memory from spilling.
+     * - Decreasing cores reduces the number of tasks running concurrently on the executor,
+     *   so there is more executor memory available per task.
+     * - Increasing executor memory also proportionally increases the size of the unified
+     *   memory region.
+     * - Increasing the number of partitions divides the total data across more tasks, so that
+     *   there is less data (and memory needed to store it) per task.
+     */
+    private def adjustParametersForExecutionMemorySpill() = {
+
+      // calculate recommended values for num partitions, executor memory and cores to
+      // try to avoid/reduce spill
+      if (stageAnalysis.exists { analysis =>
+        hasSignificantSeverity(analysis.executionMemorySpillResult.severity)
+      }) {
+        // find the stage with the max amount of execution memory spill, that has tasks equal to
+        // spark.sql.shuffle.partitions and no skew.
+        val stagesWithSpill = stageAnalysis.filter { stageInfo =>
+          !hasSignificantSeverity(stageInfo.taskSkewResult.severity) &&
+            stageInfo.numTasks == sparkSqlShufflePartitions
+        }
+        if (stagesWithSpill.size > 0) {
+          val maxSpillStage = stagesWithSpill.maxBy(_.executionMemorySpillResult.memoryBytesSpilled)
+
+          if (maxSpillStage.executionMemorySpillResult.memoryBytesSpilled > 0) {
+            // calculate the total unified memory allocated for all tasks, plus the execution memory
+            // spill -- this is roughly the amount of memory needed to keep execution data in memory.
+            // Note that memoryBytesSpilled is the total amount of execution memory spilled, which could
+            // be sequential, so this calculation could be higher than the actual amount needed.
+            val totalUnifiedMemoryNeeded = maxSpillStage.executionMemorySpillResult.memoryBytesSpilled +
+              calculateTotalUnifiedMemory(sparkExecutorMemory, sparkMemoryFraction,
+                sparkExecutorCores, sparkSqlShufflePartitions)
+
+            // returns true if the unified memory allocated across all tasks with the recommended
+            // values is still less than the calculated amount needed.
+            def checkMem(modified: Boolean): Boolean = {
+              calculateTotalUnifiedMemory(recommendedExecutorMemory, recommendedMemoryFraction,
+                recommendedExecutorCores, recommendedNumPartitions) < totalUnifiedMemoryNeeded
+            }
+            // Try incrementally adjusting the number of cores, memory, and partitions to try
+            // to keep everything (allocated unified memory plus spill) in memory
+            adjustExecutorParameters(STAGE_SPILL_ADJUSTMENTS, checkMem)
+          }
+        }
+      }
+    }
+
+    /** @return true if the application has tasks that failed with OutOfMemory, or spent too much time in GC */
+    private def hasOOMorGC() = {
+      hasSignificantSeverity(executorGcSeverity) ||
+        stageAnalysis.exists(stage => hasSignificantSeverity(stage.taskFailureResult.oomSeverity))
+    }
+
+    /**
+     * Adjust cores, memory and/or partitions to reduce likelihood of OutOfMemory errors or
+     * excessive time in GC.
+     * - Decreasing cores reduces the number of tasks running concurrently on the executor,
+     *   so there is more executor memory available per task.
+     * - Increasing executor memory also proportionally increases memory available per task.
+     * - Increasing the number of partitions divides the total data across more tasks, so that
+     *   there is less data processed (and memory needed to store it) per task.
+     */
+    private def adjustParametersForGCandOOM() = {
+      // check if there are any stages with OOM errors that have a non-default number
+      // of tasks (adjusting the number of partitions won't help in this case)
+      val stageWithNonDefaultPartitionOOM = stageAnalysis.exists { stage =>
+        hasSignificantSeverity(stage.taskFailureResult.oomSeverity) &&
+          stage.numTasks != sparkSqlShufflePartitions
+      }
+
+      // check for stages with GC issues that have a non-default number of tasks.
+      // There is some randomness in when GC is done, but in case of correlation,
+      // avoid trying to adjust the number of partitions to fix.
+      val stagesWithNonDefaultPartitionGC = stageAnalysis.exists { stage =>
+        hasSignificantSeverity(stage.stageGCResult.severity) && stage.numTasks != sparkSqlShufflePartitions
+      }
+
+      // If there are stages with non-default partitions, that have OOM or GC issues,
+      // avoid trying adjustments to the number of partitions, since this will not help
+      // those stages.
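
For illustration only (not part of the patch): the arithmetic behind the checkMem test above, using calculateTotalUnifiedMemory as defined later in this file (300MB of reserved memory is subtracted before applying spark.memory.fraction). The numbers are made up:

    // 4GB executor memory, memory fraction 0.6, 4 cores, 200 partitions:
    //   per-task unified memory ~= (4GB - 300MB) * 0.6 / 4 ~= 569MB
    //   total across all tasks  ~= 569MB * 200 ~= 111GB
    val totalUnifiedMemory = calculateTotalUnifiedMemory(
      executorMemory = 4L << 30, memoryFraction = 0.6, executorCores = 4, numTasks = 200)

While this total (plus the observed spill) exceeds what the recommended settings would allocate, adjustExecutorParameters keeps stepping through STAGE_SPILL_ADJUSTMENTS.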
+      val adjustments = if (stageWithNonDefaultPartitionOOM || stagesWithNonDefaultPartitionGC) {
+        OOM_GC_ADJUSTMENTS.filter { adjustment =>
+          adjustment match {
+            case _: PartitionMultiplierAdjustment => false
+            case _: PartitionSetAdjustment => false
+            case _ => true
+          }
+        }
+      } else {
+        OOM_GC_ADJUSTMENTS
+      }
+
+      if (recommendedNumPartitions <= sparkSqlShufflePartitions &&
+        recommendedExecutorCores >= sparkExecutorCores &&
+        recommendedExecutorMemory <= sparkExecutorMemory) {
+        // Configuration parameters haven't been adjusted for execution memory spill or long tasks.
+        // Adjust them now to try to prevent OOM.
+        adjustExecutorParameters(adjustments, (modified: Boolean) => !modified)
+      }
+    }
+
+    /**
+     * Adjust the executor configuration parameters, according to the passed in
+     * adjustment recommendations.
+     *
+     * @param adjustments the list of adjustments to try.
+     * @param continueFn given whether the last adjustment was applied, returns whether
+     *                   adjustments should continue (true) or terminate (false)
+     */
+    private def adjustExecutorParameters(
+        adjustments: Seq[ConfigurationParameterAdjustment[_ >: Int with Long <: AnyVal]],
+        continueFn: (Boolean) => Boolean) = {
+      var modified = false
+      val iter = adjustments.iterator
+
+      while (iter.hasNext && continueFn(modified)) {
+        iter.next() match {
+          case adjustment: CoreDivisorAdjustment =>
+            if (adjustment.canAdjust(recommendedExecutorCores)) {
+              recommendedExecutorCores = adjustment.adjust(recommendedExecutorCores)
+              modified = true
+            }
+          case adjustment: CoreSetAdjustment =>
+            if (adjustment.canAdjust(recommendedExecutorCores)) {
+              recommendedExecutorCores = adjustment.adjust(recommendedExecutorCores)
+              modified = true
+            }
+          case adjustment: MemoryMultiplierAdjustment =>
+            if (adjustment.canAdjust(recommendedExecutorMemory)) {
+              recommendedExecutorMemory = adjustment.adjust(recommendedExecutorMemory)
+              modified = true
+            }
+          case adjustment: MemorySetAdjustment =>
+            if (adjustment.canAdjust(recommendedExecutorMemory)) {
+              recommendedExecutorMemory = adjustment.adjust(recommendedExecutorMemory)
+              modified = true
+            }
+          case adjustment: PartitionMultiplierAdjustment =>
+            if (adjustment.canAdjust(recommendedNumPartitions)) {
+              recommendedNumPartitions = adjustment.adjust(recommendedNumPartitions)
+              modified = true
+            }
+          case adjustment: PartitionSetAdjustment =>
+            if (adjustment.canAdjust(recommendedNumPartitions)) {
+              recommendedNumPartitions = adjustment.adjust(recommendedNumPartitions)
+              modified = true
+            }
+        }
+      }
+    }
+
+    /**
+     * Check if executor memory has been over allocated, compared to max peak JVM used memory.
+     * If so, either increase cores to make better use of the memory, or decrease executor
+     * memory.
+     */
+    private def adjustExecutorMemory() = {
+      if (((sparkExecutorMemory > SPARK_EXECUTOR_MEMORY_THRESHOLD_LOW &&
+        jvmUsedMemoryEvaluator.severity != Severity.NONE) ||
+        (sparkExecutorMemory > SPARK_EXECUTOR_MEMORY_THRESHOLD_MODERATE &&
+          (jvmUsedMemoryEvaluator.severity != Severity.NONE &&
+            jvmUsedMemoryEvaluator.severity != Severity.LOW)))) {
+        if (sparkExecutorMemory <= SPARK_EXECUTOR_MEMORY_THRESHOLD_INCREASE_CORES &&
+          sparkExecutorCores < MAX_RECOMMENDED_CORES) {
+          // try to increase the number of cores, so that more tasks can run in parallel, and make
+          // use of the allocated memory
+          val possibleCores = ((sparkExecutorMemory - JvmUsedMemoryHeuristic.reservedMemory) /
+            (jvmUsedMemoryEvaluator.maxExecutorPeakJvmUsedMemory * (1 + DEFAULT_MEMORY_BUFFER_PERCENTAGE)
+              / sparkExecutorCores)).toInt
+          recommendedExecutorCores = Math.min(MAX_RECOMMENDED_CORES, possibleCores)
+        }
+
+        // adjust the allocated memory
+        recommendedExecutorMemory = calculateRecommendedMemory(sparkExecutorMemory,
+          jvmUsedMemoryEvaluator.maxExecutorPeakJvmUsedMemory, sparkExecutorCores,
+          recommendedExecutorCores)
+      }
+    }
+
+    /**
+     * If the number of executor instances is explicitly specified, then calculate the
+     * recommended number of executor instances, trying to keep the level of parallelism
+     * the same.
+     * @return the recommended number of executor instances.
+     */
+    private def calculateExecutorInstances(): Option[Int] = {
+      sparkExecutorInstances.map { numExecutors =>
+        Seq(numExecutors * sparkExecutorCores / recommendedExecutorCores,
+          recommendedNumPartitions / recommendedExecutorCores, MAX_RECOMMENDED_NUM_EXECUTORS).min
+      }
+    }
+
+    /**
+     * Adjust memory overhead by increasing it if any containers were killed by YARN
+     * for exceeding memory limits.
+     * TODO: adjust down if current value is too high, need to check historical settings
+     * and/or total container memory usage
+     *
+     * @return the recommended value in bytes for executor memory overhead
+     */
+    private def calculateExecutorMemoryOverhead(): Option[Long] = {
+      val overheadMemoryIncrement = 1L * GB_TO_BYTES
+
+      if (stageAnalysis.exists { stage =>
+        hasSignificantSeverity(stage.taskFailureResult.containerKilledSeverity)
+      }) {
+        val actualMemoryOverhead = sparkExecutorMemoryOverhead.getOrElse {
+          Math.max(SPARK_MEMORY_OVERHEAD_MIN_DEFAULT.toLong,
+            (sparkExecutorMemory * SPARK_MEMORY_OVERHEAD_PCT_DEFAULT).toLong)
+        }
+        Some(actualMemoryOverhead + overheadMemoryIncrement)
+      } else {
+        sparkExecutorMemoryOverhead
+      }
+    }
+
+    /**
+     * Adjust driver configuration parameters, and calculate the severity and score
+     * for driver heuristics.
+     *
+     * @return the recommended values for driver cores, memory, severity and score
+     */
+    private def adjustDriverParameters(): (Int, Long, Severity, Int) = {
+      val driverHeuristic =
+        new DriverHeuristic(configurationParametersHeuristic.heuristicConfigurationData)
+      val driverEvaluator = new DriverHeuristic.Evaluator(driverHeuristic, data)
+
+      val driverCores = Math.min(sparkDriverCores, DEFAULT_MAX_DRIVER_CORES)
+
+      val driverMemory = calculateRecommendedMemory(sparkDriverMemory,
+        driverEvaluator.maxDriverPeakJvmUsedMemory, sparkDriverCores,
+        driverCores)
+
+      val driverSeverity = Severity.max(driverEvaluator.severityJvmUsedMemory,
+        driverEvaluator.severityDriverCores)
+
+      val driverScore = driverEvaluator.severityJvmUsedMemory.getValue +
+        driverEvaluator.severityDriverCores.getValue
+
+      (driverCores, driverMemory, driverSeverity, driverScore)
+    }
+  }
+
+  /**
+   * Calculate the severity for the stage level heuristics.
+   *
+   * @param analyses the analyses for all the stages
+   * @return the stage heuristics severity.
+   */
+  private def calculateStageSeverity(analyses: Seq[StageAnalysis]): Severity = {
+    val stageSeverities = analyses.map(_.getStageAnalysisResults.maxBy(_.severity.getValue).severity)
+    if (stageSeverities.size > 0) {
+      stageSeverities.maxBy(_.getValue)
+    } else {
+      Severity.NONE
+    }
+  }
+
+  /**
+   * Calculate the recommended amount of memory, based on how much was used, and if there
+   * are changes to the number of cores (assume memory used is proportional to number of cores).
+   *
+   * @param allocatedMemory allocated memory
+   * @param jvmUsedMemory max JVM used memory
+   * @param numCores current number of cores
+   * @param recommendedCores recommended number of cores
+   * @return the recommended memory in bytes.
+   */
+  private def calculateRecommendedMemory(
+      allocatedMemory: Long,
+      jvmUsedMemory: Long,
+      numCores: Int,
+      recommendedCores: Int): Long = {
+    val calculatedMem = (jvmUsedMemory * Math.ceil(recommendedCores / numCores.toDouble) *
+      (1 + DEFAULT_MEMORY_BUFFER_PERCENTAGE) + JvmUsedMemoryHeuristic.reservedMemory).toLong
+    Math.min(Math.max(DEFAULT_MIN_MEMORY, calculatedMem), allocatedMemory)
+  }
+
+  /** If the severity is significant (not NONE or LOW). */
+  private def hasSignificantSeverity(severity: Severity): Boolean = {
+    severity != Severity.NONE && severity != Severity.LOW
+  }
+
+  /**
+   * Calculate the total amount of unified memory allocated across all tasks for
+   * the stage.
+   *
+   * @param executorMemory executor memory in bytes
+   * @param memoryFraction spark.memory.fraction
+   * @param executorCores number of executor cores
+   * @param numTasks number of tasks/partitions
+   * @return the total unified memory in bytes across all tasks.
+   */
+  private def calculateTotalUnifiedMemory(
+      executorMemory: Long,
+      memoryFraction: Double,
+      executorCores: Int,
+      numTasks: Int): Long = {
+    // amount of unified memory available for each task
+    val unifiedMemPerTask = (executorMemory - SPARK_RESERVED_MEMORY) * memoryFraction /
+      executorCores
+    (unifiedMemPerTask * numTasks).toLong
+  }
+
+  private val REGEX_MATCHER = raw"(\d+)((?:[TGMK])?B?)?".r
+
+  /**
+   * Given a memory value in bytes, convert it to a string with a unit that rounds to a >0 integer part.
+   *
+   * @param size The memory value in long bytes
+   * @return The formatted string.
+   */
+  private def bytesToString(size: Long): String = {
+    val (value, unit) = {
+      if (size >= 2L * GB_TO_BYTES) {
+        (size.asInstanceOf[Double] / GB_TO_BYTES, "GB")
+      } else {
+        (size.asInstanceOf[Double] / MB_TO_BYTES, "MB")
+      }
+    }
+    s"${Math.ceil(value).toInt}${unit}"
+  }
+
+  /**
+   * Convert a formatted string into a long value in bytes. If no units
+   * are specified, then the default is MB.
+   *
+   * @param formattedString The string to convert
+   * @return The bytes value
+   */
+  private def stringToBytes(formattedString: String): Long = {
+    if (formattedString == null || formattedString.isEmpty) {
+      return 0L
+    }
+    // handle strings with commas, e.g. "1,000MB"
+    val regularizedString = formattedString.replace(",", "").toUpperCase
+    regularizedString match {
+      case REGEX_MATCHER(value, unit) =>
+        val num = value.toLong
+        if (unit.length == 0) {
+          num * MB_TO_BYTES
+        } else {
+          unit.charAt(0) match {
+            case 'T' => num * TB_TO_BYTES
+            case 'G' => num * GB_TO_BYTES
+            case 'M' => num * MB_TO_BYTES
+            case 'K' => num * KB_TO_BYTES
+            case 'B' => num
+          }
+        }
+      case _ =>
+        throw new IllegalArgumentException(s"Unable to parse memory size from formatted string [${formattedString}].")
+    }
+  }
+}
\ No newline at end of file
diff --git a/app/com/linkedin/drelephant/spark/heuristics/ConfigurationUtils.scala b/app/com/linkedin/drelephant/spark/heuristics/ConfigurationUtils.scala
new file mode 100644
index 000000000..8d7b785c2
--- /dev/null
+++ b/app/com/linkedin/drelephant/spark/heuristics/ConfigurationUtils.scala
@@ -0,0 +1,186 @@
+package com.linkedin.drelephant.spark.heuristics
+
+import com.linkedin.drelephant.analysis.SeverityThresholds
+
+object ConfigurationUtils {
+  val JVM_USED_MEMORY = "jvmUsedMemory"
+
+  // Spark configuration parameters
+  val SPARK_EXECUTOR_MEMORY = "spark.executor.memory"
+  val SPARK_DRIVER_MEMORY = "spark.driver.memory"
+  val SPARK_EXECUTOR_MEMORY_OVERHEAD = "spark.yarn.executor.memoryOverhead"
+  val SPARK_DRIVER_MEMORY_OVERHEAD = "spark.yarn.driver.memoryOverhead"
+  val SPARK_EXECUTOR_CORES = "spark.executor.cores"
+  val SPARK_DRIVER_CORES = "spark.driver.cores"
+  val SPARK_EXECUTOR_INSTANCES = "spark.executor.instances"
+  val SPARK_SQL_SHUFFLE_PARTITIONS = "spark.sql.shuffle.partitions"
+  val SPARK_MEMORY_FRACTION = "spark.memory.fraction"
+
+  // Spark default configuration values
+  val SPARK_EXECUTOR_MEMORY_DEFAULT = "1g"
+  val SPARK_DRIVER_MEMORY_DEFAULT = "1g"
+  val SPARK_EXECUTOR_CORES_DEFAULT = 1
+  val SPARK_DRIVER_CORES_DEFAULT = 1
+  val SPARK_SQL_SHUFFLE_PARTITIONS_DEFAULT = 200
+  val SPARK_MEMORY_FRACTION_DEFAULT = 0.6
+
+  // if the overhead memory is not explicitly specified by the user, the default amount is
+  // max(0.1 * spark.executor.memory, 384MB)
+  val SPARK_MEMORY_OVERHEAD_PCT_DEFAULT = 0.1
+
+  // the minimum amount of overhead memory
+  val SPARK_MEMORY_OVERHEAD_MIN_DEFAULT = 384L << 20 // 384MB
+
+  // the amount of Spark reserved memory (300MB)
+  val SPARK_RESERVED_MEMORY = 300L << 20
+
+  // number of milliseconds in a minute
+  val MILLIS_PER_MIN = 1000D * 60.0D
+
+  // the index for the median value for executor and task metrics distributions
+  val DISTRIBUTION_MEDIAN_IDX = 2
+
+  // the index for the max value for executor and task metrics distributions
+  val DISTRIBUTION_MAX_IDX = 4
+
+  // keys for finding Dr. Elephant configuration parameter values
+  val SPARK_STAGE_EXECUTION_MEMORY_SPILL_THRESHOLD_KEY = "spark_stage_execution_memory_spill_threshold"
+  val SPARK_STAGE_TASK_SKEW_THRESHOLD_KEY = "spark_stage_task_skew_threshold"
+  val SPARK_STAGE_TASK_DURATION_THRESHOLD_KEY = "spark_stage_task_duration_threshold"
+  val SPARK_STAGE_MAX_DATA_PROCESSED_THRESHOLD_KEY = "spark_stage_max_data_processed_threshold"
+  val TASK_FAILURE_RATE_SEVERITY_THRESHOLDS_KEY = "stage_task_failure_rate_severity_threshold"
+  val MAX_DATA_PROCESSED_THRESHOLD_KEY = "execution_memory_spill_max_data_threshold"
+  val LONG_TASK_TO_STAGE_DURATION_RATIO_KEY = "task_skew_task_to_stage_duration_ratio"
+  val TASK_SKEW_TASK_DURATION_MIN_THRESHOLD_KEY = "task_skew_task_duration_threshold"
+  val MAX_RECOMMENDED_PARTITIONS_KEY = "max_recommended_partitions"
+
+  // keys for finding specific recommendations
+  val EXECUTION_MEMORY_SPILL_LARGE_DATA_RECOMMENDATION_KEY = "execution_memory_spill_large_data_recommendation"
+  val TASK_SKEW_INPUT_DATA_RECOMMENDATION_KEY = "task_skew_input_data_recommendation"
+  val TASK_SKEW_GENERIC_RECOMMENDATION_KEY = "task_skew_generic_recommendation"
+  val LONG_TASKS_LARGE_DATA_RECOMMENDATION_KEY = "long_tasks_large_data_recommendation"
+  val SLOW_TASKS_RECOMMENDATION_KEY = "slow_tasks_recommendation"
+  val LONG_TASKS_FEW_PARTITIONS_RECOMMENDATION_KEY = "long tasks_few_partitions"
+  val LONG_TASKS_FEW_INPUT_PARTITIONS_RECOMMENDATION_KEY = "long tasks_few_input_partitions"
+
+  // default recommendations
+  val DEFAULT_EXECUTION_MEMORY_SPILL_LARGE_DATA_RECOMMENDATION = "a large amount of data is being processed. " +
+    "Examine the application to see if this can be reduced"
+  val DEFAULT_TASK_SKEW_INPUT_DATA_RECOMMENDATION = "please try to modify the application to make the input partitions more even"
+  val DEFAULT_TASK_SKEW_GENERIC_RECOMMENDATION = "please try to modify the application to make the partitions more even"
+  val DEFAULT_LONG_TASKS_LARGE_DATA_RECOMMENDATION = "please try to reduce the amount of data being processed"
+  val DEFAULT_SLOW_TASKS_RECOMMENDATION = "please optimize the code to improve performance"
+  val DEFAULT_LONG_TASKS_FEW_PARTITIONS_RECOMMENDATION = "please increase the number of partitions"
+  val DEFAULT_LONG_TASKS_FEW_INPUT_PARTITIONS_RECOMMENDATION = "please increase the number of partitions for reading data"
+
+  // Severity thresholds for task duration in minutes, when checking to see if the median task
+  // run time is too long for a stage.
+  val DEFAULT_TASK_DURATION_THRESHOLDS =
+    SeverityThresholds(low = 2.5D * MILLIS_PER_MIN, moderate = 5.0D * MILLIS_PER_MIN,
+      severe = 10.0D * MILLIS_PER_MIN, critical = 15.0D * MILLIS_PER_MIN, ascending = true)
+
+  // Severity thresholds for checking task skew, ratio of maximum to median task run times.
+  val DEFAULT_TASK_SKEW_THRESHOLDS =
+    SeverityThresholds(low = 2, moderate = 4, severe = 8, critical = 16, ascending = true)
+
+  // Severity thresholds for checking execution memory spill, ratio of execution spill compared
+  // to the maximum amount of data (input, output, shuffle read, or shuffle write) processed.
+  val DEFAULT_EXECUTION_MEMORY_SPILL_THRESHOLDS =
+    SeverityThresholds(low = 0.01D, moderate = 0.1D, severe = 0.25D, critical = 0.5D, ascending = true)
+
+  // The ascending severity thresholds for the ratio of JVM GC time and task run time,
+  // checking if too much time is being spent in GC.
+  val DEFAULT_GC_SEVERITY_A_THRESHOLDS =
+    SeverityThresholds(low = 0.08D, moderate = 0.09D, severe = 0.1D, critical = 0.15D, ascending = true)
+
+  /** The default severity thresholds for the rate of a stage's tasks failing. */
+  val DEFAULT_TASK_FAILURE_RATE_SEVERITY_THRESHOLDS =
+    SeverityThresholds(low = 0.05D, moderate = 0.1D, severe = 0.15D, critical = 0.2D, ascending = true)
+
+  // The default threshold (3TB) for checking for maximum amount of data processed, for which to
+  // alert for execution memory spill. Tasks processing more data would be expected to have some
+  // amount of spill, due to the large amount of data processed.
+  // Estimating the size based on some reasonable values for configuration parameters (and how
+  // much data could be kept in unified memory given these values):
+  //   spark.executor.memory / spark.executor.cores * spark.memory.fraction *
+  //     (1 - spark.memory.storageFraction) * spark.sql.shuffle.partitions
+  //   = 5GB / 2 * 0.6 * (1 - 0.5) * 4000
+  val DEFAULT_MAX_DATA_PROCESSED_THRESHOLD = "3TB"
+
+  // The default threshold for the ratio of the time for the longest running task for a stage to
+  // the stage duration. With Spark, some amount of task skew may be OK, since executors can process
+  // multiple tasks, so one executor could process multiple shorter tasks, while another executor
+  // processes a longer task. However, if the length of the long task is a large fraction of the
+  // stage duration, then it is likely contributing to the overall stage duration.
+  val DEFAULT_LONG_TASK_TO_STAGE_DURATION_RATIO = "0.75"
+
+  // Some task skew is also tolerable if the tasks are short (2.5 minutes or less).
+  val DEFAULT_TASK_SKEW_TASK_DURATION_MIN_THRESHOLD = "150000"
+
+  // The target task duration (2.5 minutes). This is the same as the idle executor timeout.
+  val DEFAULT_TARGET_TASK_DURATION = "150000"
+
+  // The default maximum number of partitions that would be recommended. More partitions means
+  // less data per partition, so shorter tasks and less memory needed per task. However more
+  // partitions also increases the amount of overhead for shuffle.
+  val DEFAULT_MAX_RECOMMENDED_PARTITIONS = "4000"
+
+  // Default maximum number of cores for the driver.
+  val DEFAULT_MAX_DRIVER_CORES = 2
+
+  // Default minimum executor memory (640MB for executor memory, and 384MB for overhead
+  // memory, summing to 1GB total memory).
+  val DEFAULT_MIN_MEMORY = 640L << 20
+
+  // Default maximum recommended number of cores.
+  val MAX_RECOMMENDED_CORES = 4
+
+  // Default maximum recommended number of executors.
+  val MAX_RECOMMENDED_NUM_EXECUTORS = 500
+
+  // Executor memory threshold for increasing number of cores, if JVM used memory
+  // is flagged as MODERATE or higher
+  val SPARK_EXECUTOR_MEMORY_THRESHOLD_MODERATE = 2L << 30
+
+  // Executor memory threshold for increasing number of cores, if JVM used memory
+  // is flagged as LOW or higher
+  val SPARK_EXECUTOR_MEMORY_THRESHOLD_LOW = 4L << 30
+
+  // Max amount of executor memory, for which increasing the number of cores is
+  // considered, if there is extra unused executor memory.
+  val SPARK_EXECUTOR_MEMORY_THRESHOLD_INCREASE_CORES = 8L << 30
+
+  // Default buffer (over max used JVM memory), when calculating executor memory.
+  val DEFAULT_MEMORY_BUFFER_PERCENTAGE = 0.25
+
+  // Adjustments to try for avoiding execution memory spill.
+  // This will try incrementally:
+  // - increasing the number of partitions, so that there is less data per partition,
+  //   to reduce the likelihood of execution memory spill.
+  // - increasing overall executor memory, so that there is also more space in the
+  //   unified memory region
+  // - reducing the number of cores, since executor memory is divided across the number
+  //   of tasks running in parallel, so if there are fewer concurrent tasks, then there
+  //   is more memory for each task.
+  val STAGE_SPILL_ADJUSTMENTS =
+    Seq(PartitionSetAdjustment(400), MemorySetAdjustment(4L << 30), CoreSetAdjustment(4),
+      PartitionSetAdjustment(1000), MemorySetAdjustment(6L << 30), CoreSetAdjustment(3),
+      PartitionSetAdjustment(2000), MemorySetAdjustment(8L << 30), CoreSetAdjustment(2),
+      PartitionSetAdjustment(4000), MemorySetAdjustment(10L << 30))
+
+  // Adjustments to try for avoiding OOM or GC issues.
+  // Try reducing cores, increasing memory, or increasing partitions
+  val OOM_GC_ADJUSTMENTS = Seq(
+    CoreDivisorAdjustment(MAX_RECOMMENDED_CORES, 2.0),
+    MemoryMultiplierAdjustment(4L << 30, 2.0),
+    MemoryMultiplierAdjustment(8L << 30, 1.5),
+    PartitionMultiplierAdjustment(DEFAULT_MAX_RECOMMENDED_PARTITIONS.toInt / 2, 2.0),
+    CoreSetAdjustment(2),
+    MemoryMultiplierAdjustment(16L << 30, 1.25)
+  )
+
+  val TB_TO_BYTES = 1L << 40
+  val GB_TO_BYTES = 1L << 30
+  val MB_TO_BYTES = 1L << 20
+  val KB_TO_BYTES = 1L << 10
+}
\ No newline at end of file
diff --git a/app/com/linkedin/drelephant/spark/heuristics/StageAnalysisResult.scala b/app/com/linkedin/drelephant/spark/heuristics/StageAnalysisResult.scala
new file mode 100644
index 000000000..3a9f3f402
--- /dev/null
+++ b/app/com/linkedin/drelephant/spark/heuristics/StageAnalysisResult.scala
@@ -0,0 +1,78 @@
+package com.linkedin.drelephant.spark.heuristics
+
+import com.linkedin.drelephant.analysis.Severity
+
+/** Stage analysis result. */
+private[heuristics] sealed trait StageAnalysisResult {
+
+  // the severity for the stage and heuristic evaluated
+  val severity: Severity
+
+  // the heuristics score for the stage and heuristic evaluated
+  val score: Int
+
+  // information, details and advice from the analysis
+  val details: Seq[String]
+}
+
+/** Simple stage analysis result, with the severity, score, and details. */
+private[heuristics] case class SimpleStageAnalysisResult(
+    severity: Severity,
+    score: Int,
+    details: Seq[String]) extends StageAnalysisResult
+
+/**
+ * Stage analysis result for examining the stage for task skew.
+ *
+ * @param severity task skew severity.
+ * @param score heuristics score for task skew.
+ * @param details information and recommendations from analysis for task skew.
+ * @param rawSeverity severity based only on task skew, and not considering other thresholds
+ *                    (task duration or ratio of task duration to stage duration).
+ */
+private[heuristics] case class TaskSkewResult(
+    severity: Severity,
+    score: Int,
+    details: Seq[String],
+    rawSeverity: Severity) extends StageAnalysisResult
+
+/**
+ * Stage analysis result for examining the stage for execution memory spill.
+ *
+ * @param severity execution memory spill severity.
+ * @param score heuristics score for execution memory spill.
+ * @param details information and recommendations from analysis for execution memory spill.
+ * @param rawSeverity severity based only on execution memory spill, and not considering other
+ *                    thresholds (max amount of data processed for the stage).
+ * @param memoryBytesSpilled the total amount of execution memory bytes spilled for the stage.
+ * @param maxTaskBytesSpilled the maximum number of bytes spilled by a task.
+ */ +private[heuristics] case class ExecutionMemorySpillResult( + severity: Severity, + score: Int, + details: Seq[String], + rawSeverity: Severity, + memoryBytesSpilled: Long, + maxTaskBytesSpilled: Long) extends StageAnalysisResult + +/** + * Stage analysis result for examining the stage for task failures. + * + * @param severity task failure severity. + * @param score heuristic score for task failures. + * @param details information and recommendations from analysis for task failures. + * @param oomSeverity severity for task failures due to OutOfMemory errors. + * @param containerKilledSeverity severity for task failures due to container killed by YARN. + * @param numFailures number of task failures for the stage. + * @param numOOM number of tasks which failed to to OutOfMemory errors. + * @param numContainerKilled number of tasks which failed due to container killed by YARN. + */ +private[heuristics] case class TaskFailureResult( + severity: Severity, + score: Int, + details: Seq[String], + oomSeverity: Severity, + containerKilledSeverity: Severity, + numFailures: Int, + numOOM: Int, + numContainerKilled: Int) extends StageAnalysisResult diff --git a/app/com/linkedin/drelephant/spark/heuristics/StagesAnalyzer.scala b/app/com/linkedin/drelephant/spark/heuristics/StagesAnalyzer.scala new file mode 100644 index 000000000..e4d4a4a7d --- /dev/null +++ b/app/com/linkedin/drelephant/spark/heuristics/StagesAnalyzer.scala @@ -0,0 +1,532 @@ +package com.linkedin.drelephant.spark.heuristics + +import scala.collection.mutable.ArrayBuffer +import com.linkedin.drelephant.analysis.{Severity, SeverityThresholds} +import com.linkedin.drelephant.configurations.heuristic.HeuristicConfigurationData +import com.linkedin.drelephant.spark.data.SparkApplicationData +import com.linkedin.drelephant.spark.fetchers.statusapiv1.{StageData, StageStatus, TaskDataImpl} +import com.linkedin.drelephant.util.{MemoryFormatUtils, Utils} + +/** + * Analysis results for a stage. + * + * @param stageId the stage ID. + * @param executionMemorySpillResult stage analysis result for examining the stage for execution + * memory spill. + * @param longTaskResult stage analysis result for examining the stage for long tasks. + * @param taskSkewResult stage analysis result for examining the stage for task skew. + * @param taskFailureResult stage analysis result for examining the stage for task failures. + * @param stageFailureResult stage analysis result for examining the stage for stage failure. + * @param stageGCResult stage analysis result for examining the stage for GC. + * @param numTasks number of tasks for the stage. + * @param medianRunTime median task run time. + * @param maxRunTime maximum task run time. + * @param stageDuration: wall clock time for the stage in ms. 
+ * @param inputBytes: number of input bytes read + * @param outputBytes: number of output bytes written + * @param shuffleReadBytes number of shuffle read bytes + * @param shuffleWriteBytes number of shuffle write bytes + */ +private[heuristics] case class StageAnalysis( + stageId: Int, + executionMemorySpillResult: ExecutionMemorySpillResult, + longTaskResult: SimpleStageAnalysisResult, + taskSkewResult: TaskSkewResult, + taskFailureResult: TaskFailureResult, + stageFailureResult: SimpleStageAnalysisResult, + stageGCResult: SimpleStageAnalysisResult, + numTasks: Int, + medianRunTime: Option[Double], + maxRunTime: Option[Double], + stageDuration: Option[Long], + inputBytes: Long, + outputBytes: Long, + shuffleReadBytes: Long, + shuffleWriteBytes: Long) { + + def getStageAnalysisResults: Seq[StageAnalysisResult] = + Seq(executionMemorySpillResult, longTaskResult, taskSkewResult, taskFailureResult, + stageFailureResult, stageGCResult) +} + +/** + * Analyzes the stage level metrics for the given application. + * + * @param heuristicConfigurationData heuristic configuration data + * @param data Spark application data + */ +private[heuristics] class StagesAnalyzer( + private val heuristicConfigurationData: HeuristicConfigurationData, + private val data: SparkApplicationData) { + + import ConfigurationUtils._ + + // serverity thresholds for execution memory spill + private val executionMemorySpillThresholds: SeverityThresholds = + SeverityThresholds.parse(heuristicConfigurationData.getParamMap + .get(SPARK_STAGE_EXECUTION_MEMORY_SPILL_THRESHOLD_KEY), ascending = true) + .getOrElse(DEFAULT_EXECUTION_MEMORY_SPILL_THRESHOLDS) + + // severity thresholds for task skew + private val taskSkewThresholds: SeverityThresholds = + SeverityThresholds.parse(heuristicConfigurationData.getParamMap + .get(SPARK_STAGE_TASK_SKEW_THRESHOLD_KEY), ascending = true) + .getOrElse(DEFAULT_TASK_SKEW_THRESHOLDS) + + // severity thresholds for task duration (long running tasks) + private val taskDurationThresholds: SeverityThresholds = + SeverityThresholds.parse(heuristicConfigurationData.getParamMap + .get(SPARK_STAGE_TASK_DURATION_THRESHOLD_KEY), ascending = true) + .getOrElse(DEFAULT_TASK_DURATION_THRESHOLDS) + + // severity thresholds for task failures + private val taskFailureRateSeverityThresholds: SeverityThresholds = + SeverityThresholds.parse(heuristicConfigurationData.getParamMap + .get(TASK_FAILURE_RATE_SEVERITY_THRESHOLDS_KEY), ascending = true) + .getOrElse(DEFAULT_TASK_FAILURE_RATE_SEVERITY_THRESHOLDS) + + // execution memory spill: threshold for processed data, above which some spill is expected + private val maxDataProcessedThreshold = MemoryFormatUtils.stringToBytes( + heuristicConfigurationData.getParamMap + .getOrDefault(MAX_DATA_PROCESSED_THRESHOLD_KEY, DEFAULT_MAX_DATA_PROCESSED_THRESHOLD)) + + // threshold for ratio of max task duration to stage duration, for flagging task skew + private val longTaskToStageDurationRatio = heuristicConfigurationData.getParamMap + .getOrDefault(LONG_TASK_TO_STAGE_DURATION_RATIO_KEY, DEFAULT_LONG_TASK_TO_STAGE_DURATION_RATIO).toDouble + + // min threshold for median task duration, for flagging task skew + private val taskDurationMinThreshold = heuristicConfigurationData.getParamMap + .getOrDefault(TASK_SKEW_TASK_DURATION_MIN_THRESHOLD_KEY, DEFAULT_TASK_SKEW_TASK_DURATION_MIN_THRESHOLD).toLong + + // the maximum number of recommended partitions + private val maxRecommendedPartitions = heuristicConfigurationData.getParamMap + .getOrDefault(MAX_RECOMMENDED_PARTITIONS_KEY, 
DEFAULT_MAX_RECOMMENDED_PARTITIONS).toInt + + // recommendation to give if there is execution memory spill due to too much data being processed. + // Some amount of spill is expected in this, but alert the users so that they are aware that spill + // is happening. + private val executionMemorySpillRecommendation = heuristicConfigurationData.getParamMap + .getOrDefault(EXECUTION_MEMORY_SPILL_LARGE_DATA_RECOMMENDATION_KEY, + DEFAULT_EXECUTION_MEMORY_SPILL_LARGE_DATA_RECOMMENDATION) + + // recommendation to give if task skew is detected, and input data is read for the stage. + private val taskSkewInputDataRecommendation = heuristicConfigurationData.getParamMap + .getOrDefault(TASK_SKEW_INPUT_DATA_RECOMMENDATION_KEY, DEFAULT_TASK_SKEW_INPUT_DATA_RECOMMENDATION) + + // recommendation to give if task skew is detected, and there is no input data. + private val taskSkewGenericRecommendation = heuristicConfigurationData.getParamMap + .getOrDefault(TASK_SKEW_GENERIC_RECOMMENDATION_KEY, DEFAULT_TASK_SKEW_GENERIC_RECOMMENDATION) + + // recommendation to give if there are long running tasks, and there is a lot of data being + // processed, and many partitions already. In this case, long running tasks may be expected, but + // alert the user, in case it is possible to filter out some data. + private val longTasksLargeDataRecommenation = heuristicConfigurationData.getParamMap + .getOrDefault(LONG_TASKS_LARGE_DATA_RECOMMENDATION_KEY, DEFAULT_LONG_TASKS_LARGE_DATA_RECOMMENDATION) + + // recommendation to give if there are long running tasks, a reasonable number of partitions, + // and not too much data processed. In this case, the tasks are slow. + private val slowTasksRecommendation = heuristicConfigurationData.getParamMap + .getOrDefault(SLOW_TASKS_RECOMMENDATION_KEY, DEFAULT_SLOW_TASKS_RECOMMENDATION) + + // recommendation to give if there are long running tasks and relatively few partitions. + private val longTasksFewPartitionsRecommendation = heuristicConfigurationData.getParamMap + .getOrDefault(LONG_TASKS_FEW_PARTITIONS_RECOMMENDATION_KEY, DEFAULT_LONG_TASKS_FEW_PARTITIONS_RECOMMENDATION) + + // recommendation to give if there are long running tasks, input data is being read (and so + // controlling the number of tasks), and relatively few partitions. + private val longTasksFewInputPartitionsRecommendation = heuristicConfigurationData.getParamMap + .getOrDefault(LONG_TASKS_FEW_INPUT_PARTITIONS_RECOMMENDATION_KEY, + DEFAULT_LONG_TASKS_FEW_INPUT_PARTITIONS_RECOMMENDATION) + + + /** @return list of analysis results for all the stages. 
*/ + def getStageAnalysis(): Seq[StageAnalysis] = { + val appConfigurationProperties: Map[String, String] = data.appConfigurationProperties + val curNumPartitions = appConfigurationProperties.get(SPARK_SQL_SHUFFLE_PARTITIONS) + .map(_.toInt).getOrElse(SPARK_SQL_SHUFFLE_PARTITIONS_DEFAULT) + + data.stageDatas.map { stageData => + val medianTime = stageData.taskSummary.map(_.executorRunTime(DISTRIBUTION_MEDIAN_IDX)) + val maxTime = stageData.taskSummary.map(_.executorRunTime(DISTRIBUTION_MAX_IDX)) + val stageDuration = (stageData.submissionTime, stageData.completionTime) match { + case (Some(submissionTime), Some(completionTime)) => + Some(completionTime.getTime() - submissionTime.getTime()) + case _ => None + } + val stageId = stageData.stageId + + val executionMemorySpillResult = checkForExecutionMemorySpill(stageId, stageData) + val longTaskResult = checkForLongTasks(stageId, stageData, medianTime, curNumPartitions) + val taskSkewResult = checkForTaskSkew(stageId, stageData, medianTime, maxTime, stageDuration, + executionMemorySpillResult.severity) + val stageFailureResult = checkForStageFailure(stageId, stageData) + val taskFailureResult = checkForTaskFailure(stageId, stageData) + val gcResult = checkForGC(stageId, stageData) + + new StageAnalysis(stageData.stageId, executionMemorySpillResult, longTaskResult, + taskSkewResult, taskFailureResult, stageFailureResult, gcResult, stageData.numTasks, + medianTime, maxTime, stageDuration, stageData.inputBytes, stageData.outputBytes, + stageData.shuffleReadBytes, stageData.shuffleWriteBytes) + } + } + + /** + * Check stage for execution memory spill. + * + * @param stageId stage ID. + * @param stageData stage data. + * @return results of execution memory spill analysis for the stage. + */ + private def checkForExecutionMemorySpill( + stageId: Int, + stageData: StageData): ExecutionMemorySpillResult = { + val maxData = Seq(stageData.inputBytes, stageData.shuffleReadBytes, + stageData.shuffleWriteBytes, stageData.outputBytes).max + val rawSpillSeverity = executionMemorySpillThresholds.severityOf( + stageData.memoryBytesSpilled / maxData.toDouble) + val details = new ArrayBuffer[String] + val executionSpillSeverity = if (maxData < maxDataProcessedThreshold) { + rawSpillSeverity + } else { + // don't flag execution memory spill if there is a lot of data being processed, + // since some spill may be unavoidable in this case. + if (hasSignificantSeverity(rawSpillSeverity)) { + details += s"Stage $stageId: ${executionMemorySpillRecommendation}." + } + Severity.NONE + } + if (hasSignificantSeverity(rawSpillSeverity)) { + val memoryBytesSpilled = MemoryFormatUtils.bytesToString(stageData.memoryBytesSpilled) + details += s"Stage $stageId has $memoryBytesSpilled execution memory spill." + if (maxData > maxDataProcessedThreshold) { + // if a lot of data is being processed, the severity is suppressed, but give information + // about the spill to the user, so that they know that spill is happening, and can check + // if the application can be modified to process less data. + details += s"Stage $stageId has ${stageData.numTasks} tasks, " + + s"${MemoryFormatUtils.bytesToString(stageData.inputBytes)} input read, " + + s"${MemoryFormatUtils.bytesToString(stageData.shuffleReadBytes)} shuffle read, " + + s"${MemoryFormatUtils.bytesToString(stageData.shuffleWriteBytes)} shuffle write, " + + s"${MemoryFormatUtils.bytesToString(stageData.outputBytes)} output."
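To make the spill gating above concrete, here is a minimal sketch of the decision: the ratio of spilled bytes to the largest data volume the stage touches is run through ascending thresholds, and the resulting flag is suppressed when the stage already processes a very large amount of data. `SimpleThresholds` is a hypothetical stand-in for Dr. Elephant's `SeverityThresholds`, and all numeric values are invented for illustration, not the shipped defaults.

```scala
// Hypothetical stand-in for SeverityThresholds (ascending: a higher ratio is worse).
case class SimpleThresholds(low: Double, moderate: Double, severe: Double, critical: Double) {
  def severityOf(value: Double): String =
    if (value >= critical) "CRITICAL"
    else if (value >= severe) "SEVERE"
    else if (value >= moderate) "MODERATE"
    else if (value >= low) "LOW"
    else "NONE"
}

object SpillGateExample extends App {
  val spillThresholds = SimpleThresholds(0.01, 0.1, 0.2, 0.5)      // illustrative values
  val maxDataProcessedThreshold = 5L * 1024 * 1024 * 1024 * 1024   // assume a 5 TiB cap

  def spillSeverity(memoryBytesSpilled: Long, maxData: Long): String = {
    val raw = spillThresholds.severityOf(memoryBytesSpilled / maxData.toDouble)
    // Suppress the flag when the stage legitimately processes a huge amount of data.
    if (maxData < maxDataProcessedThreshold) raw else "NONE"
  }

  // 200 GiB spilled against 1 TiB of shuffle read: ratio ~0.195 => "MODERATE" here.
  println(spillSeverity(memoryBytesSpilled = 200L << 30, maxData = 1L << 40))
}
```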
+ stageData.taskSummary.foreach { summary => + val memorySpill = summary.memoryBytesSpilled(DISTRIBUTION_MEDIAN_IDX).toLong + val inputBytes = summary.inputMetrics.map(_.bytesRead(DISTRIBUTION_MEDIAN_IDX)) + .getOrElse(0.0).toLong + val outputBytes = summary.outputMetrics.map(_.bytesWritten(DISTRIBUTION_MEDIAN_IDX)) + .getOrElse(0.0).toLong + val shuffleReadBytes = summary.shuffleReadMetrics.map(_.readBytes(DISTRIBUTION_MEDIAN_IDX)) + .getOrElse(0.0).toLong + val shuffleWriteBytes = summary.shuffleWriteMetrics.map(_.writeBytes(DISTRIBUTION_MEDIAN_IDX)) + .getOrElse(0.0).toLong + details += s"Stage $stageId has median task values: " + + s"${MemoryFormatUtils.bytesToString(memorySpill)} memory spill, " + + s"${MemoryFormatUtils.bytesToString(inputBytes)} input, " + + s"${MemoryFormatUtils.bytesToString(shuffleReadBytes)} shuffle read, " + + s"${MemoryFormatUtils.bytesToString(shuffleWriteBytes)} shuffle write, " + + s"${MemoryFormatUtils.bytesToString(outputBytes)} output." + } + } + } + + val maxTaskSpill = stageData.taskSummary.map(_.memoryBytesSpilled(DISTRIBUTION_MAX_IDX).toLong).getOrElse(0L) + val score = Utils.getHeuristicScore(executionSpillSeverity, stageData.numTasks) + + ExecutionMemorySpillResult(executionSpillSeverity, score, details, rawSpillSeverity, + stageData.memoryBytesSpilled, maxTaskSpill) + } + + /** + * Check stage for task skew. + * + * @param stageId stage ID. + * @param stageData stage data. + * @param medianTime median task run time (ms). + * @param maxTime maximum task run time (ms). + * @param stageDuration stage duration (ms). + * @param executionSpillSeverity execution spill severity. + * @return results of task skew analysis for the stage. + */ + private def checkForTaskSkew( + stageId: Int, + stageData: StageData, + medianTime: Option[Double], + maxTime: Option[Double], + stageDuration: Option[Long], + executionSpillSeverity: Severity): TaskSkewResult = { + val rawSkewSeverity = (medianTime, maxTime) match { + case (Some(median), Some(max)) => + taskSkewThresholds.severityOf(max / median) + case _ => Severity.NONE + } + val maximum = maxTime.getOrElse(0.0D) + val taskSkewSeverity = + if (maximum > taskDurationMinThreshold && + maximum > longTaskToStageDurationRatio * stageDuration.getOrElse(Long.MaxValue)) { + rawSkewSeverity + } else { + Severity.NONE + } + val details = new ArrayBuffer[String] + + if (hasSignificantSeverity(taskSkewSeverity) || hasSignificantSeverity(executionSpillSeverity)) { + // add more information about what might be causing skew if skew is being flagged + // (reported severity is significant), or there is execution memory spill, since skew + // can also cause execution memory spill. + val medianStr = Utils.getDuration(medianTime.map(_.toLong).getOrElse(0L)) + val maximumStr = Utils.getDuration(maxTime.map(_.toLong).getOrElse(0L)) + var inputSkewSeverity = Severity.NONE + if (hasSignificantSeverity(taskSkewSeverity)) { + details += + s"Stage $stageId has skew in task run time (median is $medianStr, max is $maximumStr)."
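Before any skew is reported, the gate above requires three things at once: a high max/median run-time ratio, a longest task that exceeds an absolute duration floor, and a longest task that consumes a large fraction of the stage's wall-clock time. A rough sketch of that gate, with invented threshold values (the real ones come from the heuristic configuration keys above):

```scala
object TaskSkewGateExample extends App {
  val taskDurationMinThreshold = 150000.0   // assumed floor of 2.5 min, in ms
  val longTaskToStageDurationRatio = 0.75   // assumed ratio of max task time to stage time

  /** Returns the max/median ratio only when the max task is both long and dominates the stage. */
  def skewRatio(median: Option[Double], max: Option[Double], stageDuration: Option[Long]): Option[Double] =
    (median, max) match {
      case (Some(med), Some(mx))
        if mx > taskDurationMinThreshold &&
           mx > longTaskToStageDurationRatio * stageDuration.getOrElse(Long.MaxValue).toDouble =>
        Some(mx / med)
      case _ => None   // unknown stage duration never passes the gate, mirroring the code above
    }

  // A 30 min max task vs. a 2 min median in a 35 min stage: ratio 15x, gate passes.
  println(skewRatio(Some(120000.0), Some(1800000.0), Some(2100000L)))
}
```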
+ } + stageData.taskSummary.foreach { summary => + checkSkewedData(stageId, summary.memoryBytesSpilled(DISTRIBUTION_MEDIAN_IDX), + summary.memoryBytesSpilled(DISTRIBUTION_MAX_IDX), "memory bytes spilled", details) + summary.inputMetrics.foreach { input => + inputSkewSeverity = checkSkewedData(stageId, input.bytesRead(DISTRIBUTION_MEDIAN_IDX), + input.bytesRead(DISTRIBUTION_MAX_IDX), "task input bytes", details) + if (hasSignificantSeverity(inputSkewSeverity)) { + // The stage is reading input data; try to adjust the amount of data to even out the partitions. + details += s"Stage $stageId: ${taskSkewInputDataRecommendation}." + } + } + summary.outputMetrics.foreach { output => + checkSkewedData(stageId, output.bytesWritten(DISTRIBUTION_MEDIAN_IDX), + output.bytesWritten(DISTRIBUTION_MAX_IDX), "task output bytes", details) + } + summary.shuffleReadMetrics.foreach { shuffle => + checkSkewedData(stageId, shuffle.readBytes(DISTRIBUTION_MEDIAN_IDX), + shuffle.readBytes(DISTRIBUTION_MAX_IDX), "task shuffle read bytes", details) + } + summary.shuffleWriteMetrics.foreach { shuffle => + checkSkewedData(stageId, shuffle.writeBytes(DISTRIBUTION_MEDIAN_IDX), + shuffle.writeBytes(DISTRIBUTION_MAX_IDX), "task shuffle write bytes", details) + } + } + if (hasSignificantSeverity(rawSkewSeverity) && !hasSignificantSeverity(inputSkewSeverity)) { + details += s"Stage $stageId: ${taskSkewGenericRecommendation}." + } + } + val score = Utils.getHeuristicScore(taskSkewSeverity, stageData.numTasks) + + TaskSkewResult(taskSkewSeverity, score, details, rawSkewSeverity) + } + + /** + * Check for skewed data. + * + * @param stageId stage ID. + * @param median median data size for tasks. + * @param maximum maximum data size for tasks. + * @param description type of data. + * @param details information and recommendations -- any new recommendations + * from analyzing the stage for data skew will be appended. + * @return the severity of the skew for the checked metric. + */ + private def checkSkewedData( + stageId: Int, + median: Double, + maximum: Double, + description: String, + details: ArrayBuffer[String]): Severity = { + val severity = taskSkewThresholds.severityOf(maximum / median) + if (hasSignificantSeverity(severity)) { + details += s"Stage $stageId has skew in $description (median is " + + s"${MemoryFormatUtils.bytesToString(median.toLong)}, " + + s"max is ${MemoryFormatUtils.bytesToString(maximum.toLong)})." + } + severity + } + + /** + * Check the stage for long running tasks. + * + * @param stageId stage ID. + * @param stageData stage data. + * @param medianTime median task run time. + * @param curNumPartitions number of partitions for the Spark application + * (spark.sql.shuffle.partitions).
+ * @return results of long running task analysis for the stage. + */ + private def checkForLongTasks( + stageId: Int, + stageData: StageData, + medianTime: Option[Double], + curNumPartitions: Int): SimpleStageAnalysisResult = { + val longTaskSeverity = stageData.taskSummary.map { distributions => + taskDurationThresholds.severityOf(distributions.executorRunTime(DISTRIBUTION_MEDIAN_IDX)) + }.getOrElse(Severity.NONE) + val details = new ArrayBuffer[String] + if (hasSignificantSeverity(longTaskSeverity)) { + val runTime = Utils.getDuration(medianTime.map(_.toLong).getOrElse(0L)) + val maxData = Seq(stageData.inputBytes, stageData.shuffleReadBytes, stageData.shuffleWriteBytes, + stageData.outputBytes).max + val inputBytes = MemoryFormatUtils.bytesToString(stageData.inputBytes) + val outputBytes = MemoryFormatUtils.bytesToString(stageData.outputBytes) + val shuffleReadBytes = MemoryFormatUtils.bytesToString(stageData.shuffleReadBytes) + val shuffleWriteBytes = MemoryFormatUtils.bytesToString(stageData.shuffleWriteBytes) + details += s"Stage $stageId has a long median task run time of $runTime." + details += s"Stage $stageId has ${stageData.numTasks} tasks, $inputBytes input," + + s" $shuffleReadBytes shuffle read, $shuffleWriteBytes shuffle write, and $outputBytes output." + if (stageData.numTasks >= maxRecommendedPartitions) { + if (maxData >= maxDataProcessedThreshold) { + details += s"Stage $stageId: ${longTasksLargeDataRecommendation}." + } else { + details += s"Stage $stageId: ${slowTasksRecommendation}." + } + } else { + if (stageData.inputBytes > 0) { + // The stage is reading input data; try to increase the number of readers. + details += s"Stage $stageId: ${longTasksFewInputPartitionsRecommendation}." + } else if (stageData.numTasks != curNumPartitions) { + details += s"Stage $stageId: ${longTasksFewPartitionsRecommendation}." + } + } + } + val score = Utils.getHeuristicScore(longTaskSeverity, stageData.numTasks) + + SimpleStageAnalysisResult(longTaskSeverity, score, details) + } + + /** + * Check for stage failure. + * + * @param stageId stage ID. + * @param stageData stage data. + * @return results of stage failure analysis for the stage. + */ + private def checkForStageFailure(stageId: Int, stageData: StageData): SimpleStageAnalysisResult = { + val severity = if (stageData.status == StageStatus.FAILED) { + Severity.CRITICAL + } else { + Severity.NONE + } + val score = Utils.getHeuristicScore(severity, stageData.numTasks) + val details = stageData.failureReason.map(reason => s"Stage $stageId failed: $reason") + SimpleStageAnalysisResult(severity, score, details.toSeq) + } + + /** + * Check for failed tasks, including failures caused by OutOfMemory errors, and containers + * killed by YARN for exceeding memory limits. + * + * @param stageId stage ID. + * @param stageData stage data. + * @return result of failed tasks analysis for the stage. + */ + private def checkForTaskFailure( + stageId: Int, + stageData: StageData): TaskFailureResult = { + val failedTasksStageMap = data.stagesWithFailedTasks.flatMap { failedStage => + failedStage.tasks.map(tasks => (failedStage.stageId, tasks.values)) + }.toMap + + val failedTasks = failedTasksStageMap.get(stageId) + + val details = new ArrayBuffer[String]() + + val taskFailureSeverity = taskFailureRateSeverityThresholds.severityOf( + stageData.numFailedTasks.toDouble / stageData.numTasks) + if (hasSignificantSeverity(taskFailureSeverity)) { + details += s"Stage $stageId has ${stageData.numFailedTasks} failed tasks."
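The failed-task check here is a plain rate computation: the fraction of failed tasks in the stage goes through the same style of ascending thresholds. A small worked sketch, with illustrative thresholds rather than the configured defaults:

```scala
object TaskFailureRateExample extends App {
  // Illustrative ascending thresholds on the failed-task fraction (not the shipped defaults).
  val thresholds = Seq(0.05 -> "LOW", 0.1 -> "MODERATE", 0.15 -> "SEVERE", 0.2 -> "CRITICAL")

  def failureSeverity(numFailedTasks: Int, numTasks: Int): String = {
    val rate = numFailedTasks.toDouble / numTasks
    // Take the worst threshold the rate still meets or exceeds.
    thresholds.takeWhile(rate >= _._1).lastOption.map(_._2).getOrElse("NONE")
  }

  println(failureSeverity(20, 200))  // 10% failed => "MODERATE" under these example thresholds
}
```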
+ } + + val score = Utils.getHeuristicScore(taskFailureSeverity, stageData.numFailedTasks) + + val (numTasksWithOOM, oomSeverity) = + checkForSpecificTaskError(stageId, stageData, failedTasks, + StagesWithFailedTasksHeuristic.OOM_ERROR, "of OutOfMemory exception.", + details) + + val (numTasksWithContainerKilled, containerKilledSeverity) = + checkForSpecificTaskError(stageId, stageData, failedTasks, + StagesWithFailedTasksHeuristic.OVERHEAD_MEMORY_ERROR, + "the container was killed by YARN for exceeding memory limits.", details) + + TaskFailureResult(taskFailureSeverity, score, details, oomSeverity, containerKilledSeverity, + stageData.numFailedTasks, numTasksWithOOM, numTasksWithContainerKilled) + } + + /** + * Check the stage for a high ratio of time spent in GC compared to task run time. + * + * @param stageId stage ID. + * @param stageData stage data. + * @return result of GC analysis for the stage. + */ + private def checkForGC(stageId: Int, stageData: StageData): SimpleStageAnalysisResult = { + var gcTime = 0.0D + var taskTime = 0.0D + val severity = stageData.taskSummary.map { task => + gcTime = task.jvmGcTime(DISTRIBUTION_MEDIAN_IDX) + taskTime = task.executorRunTime(DISTRIBUTION_MEDIAN_IDX) + DEFAULT_GC_SEVERITY_A_THRESHOLDS.severityOf(gcTime / taskTime) + }.getOrElse(Severity.NONE) + + val score = Utils.getHeuristicScore(severity, stageData.numTasks) + + val details = if (hasSignificantSeverity(severity)) { + Seq(s"Stage ${stageId}: tasks are spending significant time in GC (median task GC time is " + + s"${Utils.getDuration(gcTime.toLong)}, median task runtime is " + + s"${Utils.getDuration(taskTime.toLong)}).") + } else { + Seq.empty + } + + new SimpleStageAnalysisResult(severity, score, details) + } + + /** + * Check the stage for tasks that failed for a specified error. + * + * @param stageId stage ID. + * @param stageData stage data. + * @param failedTasks list of failed tasks. + * @param taskError the error to check for. + * @param errorMessage the message/explanation to print if the specified error is found. + * @param details information and recommendations -- any new recommendations + * from analyzing the stage for errors causing tasks to fail will be appended. + * @return the number of tasks that failed with the specified error, and the severity. + */ + private def checkForSpecificTaskError( + stageId: Int, + stageData: StageData, + failedTasks: Option[Iterable[TaskDataImpl]], + taskError: String, + errorMessage: String, + details: ArrayBuffer[String]): (Int, Severity) = { + val numTasksWithError = getNumTasksWithError(failedTasks, taskError) + if (numTasksWithError > 0) { + details += s"Stage $stageId has $numTasksWithError tasks that failed because " + + errorMessage + } + val severity = taskFailureRateSeverityThresholds.severityOf(numTasksWithError.toDouble / stageData.numTasks) + (numTasksWithError, severity) + } + + /** + * Get the number of tasks that failed with the specified error, using a simple string search. + * + * @param tasks list of failed tasks. + * @param error error to look for. + * @return number of failed tasks with the specified error. + */ + private def getNumTasksWithError(tasks: Option[Iterable[TaskDataImpl]], error: String): Int = { + tasks.map { failedTasks => + failedTasks.count(_.errorMessage.exists(_.contains(error))) + }.getOrElse(0) + } + + /** Given the severity, return true if the severity is not NONE or LOW.
*/ + private def hasSignificantSeverity(severity: Severity): Boolean = { + severity != Severity.NONE && severity != Severity.LOW + } +} diff --git a/app/com/linkedin/drelephant/spark/legacydata/LegacyDataConverters.scala b/app/com/linkedin/drelephant/spark/legacydata/LegacyDataConverters.scala index 4c0d6f727..17b206c64 100644 --- a/app/com/linkedin/drelephant/spark/legacydata/LegacyDataConverters.scala +++ b/app/com/linkedin/drelephant/spark/legacydata/LegacyDataConverters.scala @@ -60,6 +60,18 @@ object LegacyDataConverters { override def name: String = "" override def executorSummary: Option[collection.Map[String, ExecutorStageSummary]] = None override def status = StageStatus.COMPLETE + override def completionTime: Option[java.util.Date] = None + override def executorCpuTime: Long = 0L + override def executorMetricsSummary: Option[ExecutorMetricDistributions] = None + override def failureReason: Option[String] = None + override def firstTaskLaunchedTime: Option[java.util.Date] = None + override def numTasks: Int = 0 + override def peakExecutionMemory: Option[Long] = None + override def peakJvmUsedMemory: Option[Long] = None + override def peakStorageMemory: Option[Long] = None + override def peakUnifiedMemory: Option[Long] = None + override def submissionTime: Option[java.util.Date] = None + override def taskSummary: Option[TaskMetricDistributions] = None }) } @@ -144,11 +156,19 @@ object LegacyDataConverters { extractStageStatus(stageAttemptId), stageAttemptId.stageId, stageAttemptId.attemptId, + numTasks = 0, stageInfo.numActiveTasks, stageInfo.numCompleteTasks, stageInfo.numFailedTasks, + stageInfo.executorRunTime, - stageInfo.inputBytes, + executorCpuTime = 0, + submissionTime = None, + firstTaskLaunchedTime = None, + completionTime = None, + failureReason = None, + + stageInfo.inputBytes, inputRecords = 0, stageInfo.outputBytes, outputRecords = 0, @@ -158,12 +178,20 @@ object LegacyDataConverters { shuffleWriteRecords = 0, stageInfo.memoryBytesSpilled, stageInfo.diskBytesSpilled, + stageInfo.name, stageInfo.description, schedulingPool = "", + accumulatorUpdates = Seq.empty, tasks = None, - executorSummary = None + executorSummary = None, + peakJvmUsedMemory = None, + peakExecutionMemory = None, + peakStorageMemory = None, + peakUnifiedMemory = None, + taskSummary = None, + executorMetricsSummary = None ) } diff --git a/app/com/linkedin/drelephant/spark/legacydata/SparkStageData.java b/app/com/linkedin/drelephant/spark/legacydata/SparkStageData.java new file mode 100644 index 000000000..406586781 --- /dev/null +++ b/app/com/linkedin/drelephant/spark/legacydata/SparkStageData.java @@ -0,0 +1,30 @@ +/* + * Copyright 2016 LinkedIn Corp. + * + * Licensed under the Apache License, Version 2.0 (the "License"); you may not + * use this file except in compliance with the License. You may obtain a copy of + * the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, WITHOUT + * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the + * License for the specific language governing permissions and limitations under + * the License. + */ + +package com.linkedin.drelephant.spark.legacydata; + + +import java.util.HashMap; +import java.util.Map; +import java.util.Set; + + +/** + * This class contains Spark stage information. 
+ */ +public class SparkStageData { + +} diff --git a/app/com/linkedin/drelephant/util/Utils.java b/app/com/linkedin/drelephant/util/Utils.java index 6314483db..9867128ac 100644 --- a/app/com/linkedin/drelephant/util/Utils.java +++ b/app/com/linkedin/drelephant/util/Utils.java @@ -268,6 +268,37 @@ public static String getDurationBreakdown(long millis) { return String.format("%d:%02d:%02d", hours, minutes, seconds); } + /** + * Convert a millisecond duration to a human-readable string, using + * milliseconds, seconds, minutes, hours, or days, whichever is the largest + * unit with a value of at least 1. + * + * @param millis duration in milliseconds + * @return the formatted duration string + */ + public static String getDuration(long millis) { + double seconds = millis / 1000.0; + if (seconds < 1) { + return millis + " ms"; + } else { + double minutes = seconds / 60.0; + if (minutes < 1) { + return String.format("%.2f sec", seconds); + } else { + double hours = minutes / 60.0; + if (hours < 1) { + return String.format("%.2f min", minutes); + } else { + double days = hours / 24.0; + if (days < 1) { + return String.format("%.2f hr", hours); + } + return String.format("%.2f days", days); + } + } + } + } + /** * Convert a value in MBSeconds to GBHours * @param MBSeconds The value to convert diff --git a/test/com/linkedin/drelephant/spark/fetchers/SparkRestClientTest.scala b/test/com/linkedin/drelephant/spark/fetchers/SparkRestClientTest.scala index c20223fb8..00581a68b 100644 --- a/test/com/linkedin/drelephant/spark/fetchers/SparkRestClientTest.scala +++ b/test/com/linkedin/drelephant/spark/fetchers/SparkRestClientTest.scala @@ -300,7 +300,7 @@ object SparkRestClientTest { @Path("applications/{appId}/{attemptId}/jobs") def getJobs(): JobsResource = new JobsResource() - @Path("applications/{appId}/{attemptId}/stages") + @Path("applications/{appId}/{attemptId}/stages/withSummaries") def getStages(): StagesResource = new StagesResource() @Path("applications/{appId}/{attemptId}/allexecutors") @@ -382,7 +382,7 @@ object SparkRestClientTest { @Path("applications/{appId}/jobs") def getJobs(): JobsResource = new JobsResource() - @Path("applications/{appId}/stages") + @Path("applications/{appId}/stages/withSummaries") def getStages(): StagesResource = new StagesResource() @Path("applications/{appId}/allexecutors") diff --git a/test/com/linkedin/drelephant/spark/heuristics/ConfigurationParametersHeuristicTest.scala b/test/com/linkedin/drelephant/spark/heuristics/ConfigurationParametersHeuristicTest.scala new file mode 100644 index 000000000..da629d491 --- /dev/null +++ b/test/com/linkedin/drelephant/spark/heuristics/ConfigurationParametersHeuristicTest.scala @@ -0,0 +1,883 @@ +package com.linkedin.drelephant.spark.heuristics + +import com.linkedin.drelephant.analysis.{HeuristicResult, Severity} +import com.linkedin.drelephant.spark.heuristics.SparkTestUtilities._ +import com.linkedin.drelephant.spark.heuristics.ConfigurationUtils._ +import org.scalatest.{FunSpec, Matchers} + +class ConfigurationParametersHeuristicTest extends FunSpec with Matchers { + describe(".apply") { + it("unused executor memory, increase executor cores") { + // executor and driver memory are both over-provisioned, increase executor + // cores and decrease driver memory + val heuristicConfigurationData = createHeuristicConfigurationData() + val stages = Seq( + StageBuilder(1, 3).create(), + StageBuilder(2, 200).create(), + StageBuilder(3, 200).create(), + StageBuilder(4, 200).create(), + StageBuilder(5, 10).create() + ) + val executors = Seq( +
createExecutorSummary("driver", 200, 3, 300), + createExecutorSummary("1", 800, 3, 300), + createExecutorSummary("2", 500, 3, 300), + createExecutorSummary("3", 800, 3, 300) + ) + val properties = Map( + SPARK_EXECUTOR_MEMORY -> "4G", + SPARK_DRIVER_MEMORY -> "6G", + SPARK_EXECUTOR_MEMORY_OVERHEAD -> "1G", + SPARK_DRIVER_MEMORY_OVERHEAD -> "2G", + SPARK_EXECUTOR_CORES -> "1", + SPARK_DRIVER_CORES -> "1", + SPARK_EXECUTOR_INSTANCES -> "200", + SPARK_SQL_SHUFFLE_PARTITIONS -> "200", + SPARK_MEMORY_FRACTION -> "0.1" + ) + + val data = createSparkApplicationData(stages, executors, Some(properties)) + + val configurationParametersHeuristic = new ConfigurationParametersHeuristic( + heuristicConfigurationData) + val evaluator = new ConfigurationParametersHeuristic.Evaluator( + configurationParametersHeuristic, data) + + val result = configurationParametersHeuristic.apply(data) + val expectedDetails = Map( + "Current spark.executor.memory" -> "4GB", + "Current spark.driver.memory" -> "6GB", + "Current spark.executor.cores" -> "1", + "Current spark.driver.cores" -> "1", + "Current spark.memory.fraction" -> "0.1", + "Current spark.executor.instances" -> "200", + "Current spark.yarn.executor.memoryOverhead" -> "1024MB", + "Current spark.yarn.driver.memoryOverhead" -> "2GB", + "Current spark.sql.shuffle.partitions" -> "200", + "Recommended spark.executor.cores" -> "3", + "Recommended spark.executor.memory" -> "4GB", + "Recommended spark.memory.fraction" -> "0.6", + "Recommended spark.sql.shuffle.partitions" -> "200", + "Recommended spark.driver.cores" -> "1", + "Recommended spark.driver.memory" -> "640MB", + "Recommended spark.yarn.executor.memoryOverhead" -> "1024MB", + "Recommended spark.yarn.driver.memoryOverhead" -> "2GB", + "Recommended spark.executor.instances" -> "66") + checkHeuristicResults(result, Severity.CRITICAL, 16, expectedDetails) + } + + it("unused executor memory, decrease executor memory") { + // executor memory and driver memory are both over provisioned, decrease both + val heuristicConfigurationData = createHeuristicConfigurationData() + val stages = Seq( + StageBuilder(1, 3).create(), + StageBuilder(2, 200).create(), + StageBuilder(3, 200).create(), + StageBuilder(4, 200).create(), + StageBuilder(5, 10).create() + ) + val executors = Seq( + createExecutorSummary("driver", 1200, 3, 300), + createExecutorSummary("1", 800, 3, 300), + createExecutorSummary("2", 1000, 3, 300), + createExecutorSummary("3", 800, 3, 300) + ) + val properties = Map( + SPARK_EXECUTOR_MEMORY -> "4G", + SPARK_DRIVER_MEMORY -> "6G", + SPARK_EXECUTOR_MEMORY_OVERHEAD -> "1G", + SPARK_DRIVER_MEMORY_OVERHEAD -> "2G", + SPARK_EXECUTOR_CORES -> "5", + SPARK_DRIVER_CORES -> "5", + SPARK_EXECUTOR_INSTANCES -> "200", + SPARK_SQL_SHUFFLE_PARTITIONS -> "200", + SPARK_MEMORY_FRACTION -> "0.1" + ) + + val data = createSparkApplicationData(stages, executors, Some(properties)) + + val configurationParametersHeuristic = new ConfigurationParametersHeuristic( + heuristicConfigurationData) + val evaluator = new ConfigurationParametersHeuristic.Evaluator( + configurationParametersHeuristic, data) + + val result = configurationParametersHeuristic.apply(data) + val expectedDetails = Map( + "Current spark.executor.memory" -> "4GB", + "Current spark.driver.memory" -> "6GB", + "Current spark.executor.cores" -> "5", + "Current spark.driver.cores" -> "5", + "Current spark.memory.fraction" -> "0.1", + "Current spark.executor.instances" -> "200", + "Current spark.yarn.executor.memoryOverhead" -> "1024MB", + "Current 
spark.yarn.driver.memoryOverhead" -> "2GB", + "Current spark.sql.shuffle.partitions" -> "200", + "Recommended spark.executor.cores" -> "5", + "Recommended spark.executor.memory" -> "1550MB", + "Recommended spark.memory.fraction" -> "0.6", + "Recommended spark.sql.shuffle.partitions" -> "200", + "Recommended spark.driver.cores" -> "2", + "Recommended spark.driver.memory" -> "1800MB", + "Recommended spark.yarn.executor.memoryOverhead" -> "1024MB", + "Recommended spark.yarn.driver.memoryOverhead" -> "2GB", + "Recommended spark.executor.instances" -> "40") + checkHeuristicResults(result, Severity.CRITICAL, 17, expectedDetails) + } + + it("long and skewed tasks, increase partitions") { + // There are both skewed tasks and long tasks, increase the number of partitions + val heuristicConfigurationData = createHeuristicConfigurationData() + val stages = Seq( + StageBuilder(1, 3).taskRuntime(500, 5300, 15000).create(), + StageBuilder(2, 200).taskRuntime(600, 600, 120000).create(), + StageBuilder(3, 200).taskRuntime(300, 800, 120000).create(), + StageBuilder(4, 200).taskRuntime(20, 30, 5000).create(), + StageBuilder(5, 10).taskRuntime(1000, 1000, 10000).create() + + ) + val executors = Seq( + createExecutorSummary("driver", 1500, 3, 300), + createExecutorSummary("1", 1500, 3, 300), + createExecutorSummary("2", 1000, 3, 300), + createExecutorSummary("3", 800, 3, 300) + ) + val properties = Map( + SPARK_EXECUTOR_MEMORY -> "2G", + SPARK_DRIVER_MEMORY -> "2G", + SPARK_EXECUTOR_CORES -> "4", + SPARK_DRIVER_CORES -> "2", + SPARK_EXECUTOR_INSTANCES -> "200", + SPARK_SQL_SHUFFLE_PARTITIONS -> "200", + SPARK_MEMORY_FRACTION -> "0.6" + ) + + val data = createSparkApplicationData(stages, executors, Some(properties)) + + val configurationParametersHeuristic = new ConfigurationParametersHeuristic( + heuristicConfigurationData) + val evaluator = new ConfigurationParametersHeuristic.Evaluator( + configurationParametersHeuristic, data) + + val result = configurationParametersHeuristic.apply(data) + val expectedStageDetails = + "Stage 1 has skew in task run time (median is 8.33 min, max is 1.47 hr).\n" + + "Stage 1: please try to modify the application to make the partitions more even.\n" + + "Stage 1 has a long median task run time of 8.33 min.\n" + + "Stage 1 has 3 tasks, 0 B input, 0 B shuffle read, 0 B shuffle write, and 0 B output.\n" + + "Stage 1: please increase the number of partitions.\n" + + "Stage 2 has a long median task run time of 10.00 min.\n" + + "Stage 2 has 200 tasks, 0 B input, 0 B shuffle read, 0 B shuffle write, and 0 B output.\n" + + "Stage 3 has a long median task run time of 5.00 min.\n" + + "Stage 3 has 200 tasks, 0 B input, 0 B shuffle read, 0 B shuffle write, and 0 B output.\n" + + "Stage 5 has a long median task run time of 16.67 min.\n" + + "Stage 5 has 10 tasks, 0 B input, 0 B shuffle read, 0 B shuffle write, and 0 B output.\n" + + "Stage 5: please increase the number of partitions." 
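The duration strings asserted here ("8.33 min", "1.47 hr") are produced by the new `Utils.getDuration` helper added earlier in this patch; a direct Scala transcription of that Java method shows the arithmetic. Treating the builder's run-time arguments as seconds that get converted to milliseconds is an assumption about `StageBuilder`'s contract, inferred from the expected strings:

```scala
object DurationFormatExample extends App {
  // Scala transcription of the new Utils.getDuration (Java), for illustration only.
  def getDuration(millis: Long): String = {
    val seconds = millis / 1000.0
    if (seconds < 1) s"$millis ms"
    else {
      val minutes = seconds / 60.0
      if (minutes < 1) f"$seconds%.2f sec"
      else {
        val hours = minutes / 60.0
        if (hours < 1) f"$minutes%.2f min"
        else {
          val days = hours / 24.0
          if (days < 1) f"$hours%.2f hr" else f"$days%.2f days"
        }
      }
    }
  }

  println(getDuration(500L * 1000))   // "8.33 min"  (median task of 500 s)
  println(getDuration(5300L * 1000))  // "1.47 hr"   (max task of 5300 s)
}
```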
+ val expectedDetails = Map( + "Current spark.executor.memory" -> "2GB", + "Current spark.driver.memory" -> "2GB", + "Current spark.executor.cores" -> "4", + "Current spark.driver.cores" -> "2", + "Current spark.memory.fraction" -> "0.6", + "Current spark.executor.instances" -> "200", + "Current spark.sql.shuffle.partitions" -> "200", + "Recommended spark.executor.cores" -> "4", + "Recommended spark.executor.memory" -> "2GB", + "Recommended spark.memory.fraction" -> "0.6", + "Recommended spark.sql.shuffle.partitions" -> "800", + "Recommended spark.driver.cores" -> "2", + "Recommended spark.driver.memory" -> "2GB", + "Recommended spark.executor.instances" -> "200", + "stage details" -> expectedStageDetails) + checkHeuristicResults(result, Severity.CRITICAL, 1055, expectedDetails) + } + + it("OOM and long tasks, increase partitions") { + // There are both failed tasks and long tasks, increase the number of partitions + val heuristicConfigurationData = createHeuristicConfigurationData() + val stages = Seq( + StageBuilder(1, 3).taskRuntime(500, 5300, 15000).create(), + StageBuilder(2, 200).taskRuntime(600, 600, 120000).create(), + StageBuilder(3, 200).taskRuntime(300, 800, 120000).create(), + StageBuilder(4, 200).taskRuntime(20, 30, 5000).failures(20, 20, 0).create(), + StageBuilder(5, 10).taskRuntime(1000, 1000, 10000).create() + + ) + val executors = Seq( + createExecutorSummary("driver", 1500, 3, 300), + createExecutorSummary("1", 1500, 3, 300), + createExecutorSummary("2", 1000, 3, 300), + createExecutorSummary("3", 800, 3, 300) + ) + val properties = Map( + SPARK_EXECUTOR_MEMORY -> "2G", + SPARK_DRIVER_MEMORY -> "2G", + SPARK_EXECUTOR_CORES -> "4", + SPARK_DRIVER_CORES -> "2", + SPARK_EXECUTOR_INSTANCES -> "200", + SPARK_SQL_SHUFFLE_PARTITIONS -> "200", + SPARK_MEMORY_FRACTION -> "0.6" + ) + + val data = createSparkApplicationData(stages, executors, Some(properties)) + + val configurationParametersHeuristic = new ConfigurationParametersHeuristic( + heuristicConfigurationData) + val evaluator = new ConfigurationParametersHeuristic.Evaluator( + configurationParametersHeuristic, data) + + val result = configurationParametersHeuristic.apply(data) + val expectedStageDetails = + "Stage 1 has skew in task run time (median is 8.33 min, max is 1.47 hr).\n" + + "Stage 1: please try to modify the application to make the partitions more even.\n" + + "Stage 1 has a long median task run time of 8.33 min.\n" + + "Stage 1 has 3 tasks, 0 B input, 0 B shuffle read, 0 B shuffle write, and 0 B output.\n" + + "Stage 1: please increase the number of partitions.\n" + + "Stage 2 has a long median task run time of 10.00 min.\n" + + "Stage 2 has 200 tasks, 0 B input, 0 B shuffle read, 0 B shuffle write, and 0 B output.\n" + + "Stage 3 has a long median task run time of 5.00 min.\n" + + "Stage 3 has 200 tasks, 0 B input, 0 B shuffle read, 0 B shuffle write, and 0 B output.\n" + + "Stage 4 has 20 failed tasks.\n" + + "Stage 4 has 20 tasks that failed because of OutOfMemory exception.\n" + + "Stage 5 has a long median task run time of 16.67 min.\n" + + "Stage 5 has 10 tasks, 0 B input, 0 B shuffle read, 0 B shuffle write, and 0 B output.\n" + + "Stage 5: please increase the number of partitions." 
+ val expectedDetails = Map( + "Current spark.executor.memory" -> "2GB", + "Current spark.driver.memory" -> "2GB", + "Current spark.executor.cores" -> "4", + "Current spark.driver.cores" -> "2", + "Current spark.memory.fraction" -> "0.6", + "Current spark.executor.instances" -> "200", + "Current spark.sql.shuffle.partitions" -> "200", + "Recommended spark.executor.cores" -> "4", + "Recommended spark.executor.memory" -> "2GB", + "Recommended spark.memory.fraction" -> "0.6", + "Recommended spark.sql.shuffle.partitions" -> "800", + "Recommended spark.driver.cores" -> "2", + "Recommended spark.driver.memory" -> "2GB", + "Recommended spark.executor.instances" -> "200", + "stage details" -> expectedStageDetails) + checkHeuristicResults(result, Severity.CRITICAL, 1095, expectedDetails) + } + + it("OOM, double memory") { + // tasks failed with OOM, since executor memory is low (2G), double the memory + val heuristicConfigurationData = createHeuristicConfigurationData() + val stages = Seq( + StageBuilder(1, 3).taskRuntime(50, 60, 15000).create(), + StageBuilder(2, 20).taskRuntime(60, 60, 1200).failures(5, 5, 0).create(), + StageBuilder(3, 10).taskRuntime(100, 100, 1000).create() + ) + val executors = Seq( + createExecutorSummary("driver", 1500, 3, 300), + createExecutorSummary("1", 1500, 3, 300), + createExecutorSummary("2", 1000, 3, 300), + createExecutorSummary("3", 800, 3, 300) + ) + val properties = Map( + SPARK_EXECUTOR_MEMORY -> "2G", + SPARK_DRIVER_MEMORY -> "2G", + SPARK_EXECUTOR_CORES -> "4", + SPARK_DRIVER_CORES -> "2", + SPARK_EXECUTOR_INSTANCES -> "20", + SPARK_SQL_SHUFFLE_PARTITIONS -> "20", + SPARK_MEMORY_FRACTION -> "0.6" + ) + + val data = createSparkApplicationData(stages, executors, Some(properties)) + + val configurationParametersHeuristic = new ConfigurationParametersHeuristic( + heuristicConfigurationData) + val evaluator = new ConfigurationParametersHeuristic.Evaluator( + configurationParametersHeuristic, data) + + val result = configurationParametersHeuristic.apply(data) + val expectedStageDetails = "Stage 2 has 5 failed tasks.\n" + + "Stage 2 has 5 tasks that failed because of OutOfMemory exception." 
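The per-error counts behind expectations like this one come from `getNumTasksWithError`, which is a plain substring search over each failed task's error message. A compact sketch of that matching; the error messages below are invented examples:

```scala
object ErrorMatchExample extends App {
  val OOM_ERROR = "java.lang.OutOfMemoryError"

  // Hypothetical failed-task error messages, as they might appear in task data.
  val errorMessages: Seq[Option[String]] = Seq(
    Some("java.lang.OutOfMemoryError: Java heap space"),
    Some("FetchFailedException: failure to connect"),
    None)  // a failed task may carry no error message at all

  // Count tasks whose message contains the error substring.
  val numOom = errorMessages.count(_.exists(_.contains(OOM_ERROR)))
  println(numOom)  // 1
}
```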
+ val expectedDetails = Map( + "Current spark.executor.memory" -> "2GB", + "Current spark.driver.memory" -> "2GB", + "Current spark.executor.cores" -> "4", + "Current spark.driver.cores" -> "2", + "Current spark.memory.fraction" -> "0.6", + "Current spark.executor.instances" -> "20", + "Current spark.sql.shuffle.partitions" -> "20", + "Recommended spark.executor.cores" -> "4", + "Recommended spark.executor.memory" -> "4GB", + "Recommended spark.memory.fraction" -> "0.6", + "Recommended spark.sql.shuffle.partitions" -> "20", + "Recommended spark.driver.cores" -> "2", + "Recommended spark.driver.memory" -> "2GB", + "Recommended spark.executor.instances" -> "5", + "stage details" -> expectedStageDetails) + checkHeuristicResults(result, Severity.CRITICAL, 20, expectedDetails) + } + + it("OOM, increase memory by half") { + // tasks failed with OOM, since executor memory is moderate (6G), increase memory by 50% + val heuristicConfigurationData = createHeuristicConfigurationData() + val stages = Seq( + StageBuilder(1, 3).taskRuntime(50, 60, 15000).create(), + StageBuilder(2, 20).taskRuntime(60, 60, 1200).failures(5, 5, 0).create(), + StageBuilder(3, 10).taskRuntime(100, 100, 1000).create() + ) + val executors = Seq( + createExecutorSummary("driver", 1500, 3, 300), + createExecutorSummary("1", 5000, 3, 300), + createExecutorSummary("2", 5500, 3, 300), + createExecutorSummary("3", 3000, 3, 300) + ) + val properties = Map( + SPARK_EXECUTOR_MEMORY -> "6G", + SPARK_DRIVER_MEMORY -> "2G", + SPARK_EXECUTOR_CORES -> "4", + SPARK_DRIVER_CORES -> "2", + SPARK_EXECUTOR_INSTANCES -> "20", + SPARK_SQL_SHUFFLE_PARTITIONS -> "20", + SPARK_MEMORY_FRACTION -> "0.6" + ) + + val data = createSparkApplicationData(stages, executors, Some(properties)) + + val configurationParametersHeuristic = new ConfigurationParametersHeuristic( + heuristicConfigurationData) + val evaluator = new ConfigurationParametersHeuristic.Evaluator( + configurationParametersHeuristic, data) + + val result = configurationParametersHeuristic.apply(data) + val expectedStageDetails = "Stage 2 has 5 failed tasks.\n" + + "Stage 2 has 5 tasks that failed because of OutOfMemory exception."
+ val expectedDetails = Map( + "Current spark.executor.memory" -> "6GB", + "Current spark.driver.memory" -> "2GB", + "Current spark.executor.cores" -> "4", + "Current spark.driver.cores" -> "2", + "Current spark.memory.fraction" -> "0.6", + "Current spark.executor.instances" -> "20", + "Current spark.sql.shuffle.partitions" -> "20", + "Recommended spark.executor.cores" -> "4", + "Recommended spark.executor.memory" -> "9GB", + "Recommended spark.memory.fraction" -> "0.6", + "Recommended spark.sql.shuffle.partitions" -> "20", + "Recommended spark.driver.cores" -> "2", + "Recommended spark.driver.memory" -> "2GB", + "Recommended spark.executor.instances" -> "5", + "stage details" -> expectedStageDetails) + checkHeuristicResults(result, Severity.CRITICAL, 20, expectedDetails) + } + + it("OOM, increase partitions") { + // tasks failed with OOM, since executor memory is higher (9G), increase partitions + val heuristicConfigurationData = createHeuristicConfigurationData() + val stages = Seq( + StageBuilder(1, 3).taskRuntime(50, 60, 15000).create(), + StageBuilder(2, 20).taskRuntime(60, 60, 1200).failures(5, 5, 0).create(), + StageBuilder(3, 10).taskRuntime(100, 100, 1000).create() + ) + val executors = Seq( + createExecutorSummary("driver", 1500, 3, 300), + createExecutorSummary("1", 8000, 3, 300), + createExecutorSummary("2", 6000, 3, 300), + createExecutorSummary("3", 6000, 3, 300) + ) + val properties = Map( + SPARK_EXECUTOR_MEMORY -> "9G", + SPARK_DRIVER_MEMORY -> "2G", + SPARK_EXECUTOR_CORES -> "4", + SPARK_DRIVER_CORES -> "2", + SPARK_EXECUTOR_INSTANCES -> "20", + SPARK_SQL_SHUFFLE_PARTITIONS -> "20", + SPARK_MEMORY_FRACTION -> "0.6" + ) + + val data = createSparkApplicationData(stages, executors, Some(properties)) + + val configurationParametersHeuristic = new ConfigurationParametersHeuristic( + heuristicConfigurationData) + val evaluator = new ConfigurationParametersHeuristic.Evaluator( + configurationParametersHeuristic, data) + + val result = configurationParametersHeuristic.apply(data) + val expectedStageDetails = "Stage 2 has 5 failed tasks.\n" + + "Stage 2 has 5 tasks that failed because of OutOfMemory exception." 
+ val expectedDetails = Map( + "Current spark.executor.memory" -> "9GB", + "Current spark.driver.memory" -> "2GB", + "Current spark.executor.cores" -> "4", + "Current spark.driver.cores" -> "2", + "Current spark.memory.fraction" -> "0.6", + "Current spark.executor.instances" -> "20", + "Current spark.sql.shuffle.partitions" -> "20", + "Recommended spark.executor.cores" -> "4", + "Recommended spark.executor.memory" -> "9GB", + "Recommended spark.memory.fraction" -> "0.6", + "Recommended spark.sql.shuffle.partitions" -> "40", + "Recommended spark.driver.cores" -> "2", + "Recommended spark.driver.memory" -> "2GB", + "Recommended spark.executor.instances" -> "10", + "stage details" -> expectedStageDetails) + checkHeuristicResults(result, Severity.CRITICAL, 20, expectedDetails) + } + + it("OOM, non-default partitions, decrease cores") { + // tasks failed with OOM, since executor memory is higher (9G), decrease cores + val heuristicConfigurationData = createHeuristicConfigurationData() + val stages = Seq( + StageBuilder(1, 3).taskRuntime(50, 60, 15000).create(), + StageBuilder(2, 20).taskRuntime(60, 60, 1200).create(), + StageBuilder(3, 10).taskRuntime(100, 100, 1000).failures(5, 5, 0).create() + ) + val executors = Seq( + createExecutorSummary("driver", 1500, 3, 300), + createExecutorSummary("1", 8000, 3, 300), + createExecutorSummary("2", 6000, 3, 300), + createExecutorSummary("3", 6000, 3, 300) + ) + val properties = Map( + SPARK_EXECUTOR_MEMORY -> "9G", + SPARK_DRIVER_MEMORY -> "2G", + SPARK_EXECUTOR_CORES -> "4", + SPARK_DRIVER_CORES -> "2", + SPARK_EXECUTOR_INSTANCES -> "20", + SPARK_SQL_SHUFFLE_PARTITIONS -> "20", + SPARK_MEMORY_FRACTION -> "0.6" + ) + + val data = createSparkApplicationData(stages, executors, Some(properties)) + + val configurationParametersHeuristic = new ConfigurationParametersHeuristic( + heuristicConfigurationData) + val evaluator = new ConfigurationParametersHeuristic.Evaluator( + configurationParametersHeuristic, data) + + val result = configurationParametersHeuristic.apply(data) + val expectedStageDetails = "Stage 3 has 5 failed tasks.\n" + + "Stage 3 has 5 tasks that failed because of OutOfMemory exception." 
+ val expectedDetails = Map( + "Current spark.executor.memory" -> "9GB", + "Current spark.driver.memory" -> "2GB", + "Current spark.executor.cores" -> "4", + "Current spark.driver.cores" -> "2", + "Current spark.memory.fraction" -> "0.6", + "Current spark.executor.instances" -> "20", + "Current spark.sql.shuffle.partitions" -> "20", + "Recommended spark.executor.cores" -> "2", + "Recommended spark.executor.memory" -> "9GB", + "Recommended spark.memory.fraction" -> "0.6", + "Recommended spark.sql.shuffle.partitions" -> "20", + "Recommended spark.driver.cores" -> "2", + "Recommended spark.driver.memory" -> "2GB", + "Recommended spark.executor.instances" -> "10", + "stage details" -> expectedStageDetails) + checkHeuristicResults(result, Severity.CRITICAL, 20, expectedDetails) + } + + it("OOM, non-default partitions, increase memory by 0.25") { + // tasks failed with OOM, since executor memory is higher (9G), increase memory 25% + val heuristicConfigurationData = createHeuristicConfigurationData() + val stages = Seq( + StageBuilder(1, 3).taskRuntime(50, 60, 15000).create(), + StageBuilder(2, 20).taskRuntime(60, 60, 1200).create(), + StageBuilder(3, 10).taskRuntime(100, 100, 1000).failures(5, 5, 0).create() + ) + val executors = Seq( + createExecutorSummary("driver", 1500, 3, 300), + createExecutorSummary("1", 8000, 3, 300), + createExecutorSummary("2", 6000, 3, 300), + createExecutorSummary("3", 6000, 3, 300) + ) + val properties = Map( + SPARK_EXECUTOR_MEMORY -> "9G", + SPARK_DRIVER_MEMORY -> "2G", + SPARK_EXECUTOR_CORES -> "2", + SPARK_DRIVER_CORES -> "2", + SPARK_EXECUTOR_INSTANCES -> "20", + SPARK_SQL_SHUFFLE_PARTITIONS -> "20", + SPARK_MEMORY_FRACTION -> "0.6" + ) + + val data = createSparkApplicationData(stages, executors, Some(properties)) + + val configurationParametersHeuristic = new ConfigurationParametersHeuristic( + heuristicConfigurationData) + val evaluator = new ConfigurationParametersHeuristic.Evaluator( + configurationParametersHeuristic, data) + + val result = configurationParametersHeuristic.apply(data) + val expectedStageDetails = "Stage 3 has 5 failed tasks.\n" + + "Stage 3 has 5 tasks that failed because of OutOfMemory exception." 
+ val expectedDetails = Map( + "Current spark.executor.memory" -> "9GB", + "Current spark.driver.memory" -> "2GB", + "Current spark.executor.cores" -> "2", + "Current spark.driver.cores" -> "2", + "Current spark.memory.fraction" -> "0.6", + "Current spark.executor.instances" -> "20", + "Current spark.sql.shuffle.partitions" -> "20", + "Recommended spark.executor.cores" -> "2", + "Recommended spark.executor.memory" -> "12GB", + "Recommended spark.memory.fraction" -> "0.6", + "Recommended spark.sql.shuffle.partitions" -> "20", + "Recommended spark.driver.cores" -> "2", + "Recommended spark.driver.memory" -> "2GB", + "Recommended spark.executor.instances" -> "10", + "stage details" -> expectedStageDetails) + checkHeuristicResults(result, Severity.CRITICAL, 20, expectedDetails) + } + + it("Container killed by YARN") { + // tasks failed with container killed by YARN, increase memory overhead + val heuristicConfigurationData = createHeuristicConfigurationData() + val stages = Seq( + StageBuilder(1, 3).taskRuntime(50, 60, 15000).create(), + StageBuilder(2, 20).taskRuntime(60, 60, 1200).create(), + StageBuilder(3, 10).taskRuntime(100, 100, 1000).failures(7, 0, 5).create() + ) + val executors = Seq( + createExecutorSummary("driver", 1500, 3, 300), + createExecutorSummary("1", 8000, 3, 300), + createExecutorSummary("2", 6000, 3, 300), + createExecutorSummary("3", 6000, 3, 300) + ) + val properties = Map( + SPARK_EXECUTOR_MEMORY -> "9G", + SPARK_DRIVER_MEMORY -> "2G", + SPARK_EXECUTOR_CORES -> "2", + SPARK_DRIVER_CORES -> "2", + SPARK_SQL_SHUFFLE_PARTITIONS -> "20", + SPARK_MEMORY_FRACTION -> "0.6" + ) + + val data = createSparkApplicationData(stages, executors, Some(properties)) + + val configurationParametersHeuristic = new ConfigurationParametersHeuristic( + heuristicConfigurationData) + val evaluator = new ConfigurationParametersHeuristic.Evaluator( + configurationParametersHeuristic, data) + + val result = configurationParametersHeuristic.apply(data) + val expectedStageDetails = "Stage 3 has 7 failed tasks.\n" + + "Stage 3 has 5 tasks that failed because the container was killed by YARN for exceeding memory limits."
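Taken together, the OOM cases above imply a remediation ladder keyed off how much executor memory is already allocated: double a small heap, grow a moderate one by half, and prefer more partitions (or fewer cores, or a 25% bump when partitions are non-default) once the heap is already large, while containers killed by YARN get more memory overhead instead. A hedged sketch of that ladder as the tests suggest it; the cut-off values are inferred from the test data, not read from the heuristic source:

```scala
object OomRemediationExample extends App {
  sealed trait Fix
  case class ScaleExecutorMemory(factor: Double) extends Fix
  case object IncreasePartitions extends Fix
  case object IncreaseMemoryOverhead extends Fix

  /** Rough decision ladder inferred from the test expectations above; the
    * "fewer cores" and "+25% memory" variants for non-default partitions are omitted. */
  def remedy(executorMemoryGb: Int, killedByYarn: Boolean): Fix =
    if (killedByYarn) IncreaseMemoryOverhead                     // container killed: grow memoryOverhead
    else if (executorMemoryGb <= 2) ScaleExecutorMemory(2.0)     // small heap: double it
    else if (executorMemoryGb <= 6) ScaleExecutorMemory(1.5)     // moderate heap: +50%
    else IncreasePartitions                                      // large heap: spread the work instead

  println(remedy(2, killedByYarn = false))  // ScaleExecutorMemory(2.0), as in the 2G -> 4G case
  println(remedy(9, killedByYarn = false))  // IncreasePartitions, as in the 9G case
}
```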
+ val expectedDetails = Map( + "Current spark.executor.memory" -> "9GB", + "Current spark.driver.memory" -> "2GB", + "Current spark.executor.cores" -> "2", + "Current spark.driver.cores" -> "2", + "Current spark.memory.fraction" -> "0.6", + "Current spark.sql.shuffle.partitions" -> "20", + "Recommended spark.executor.cores" -> "2", + "Recommended spark.executor.memory" -> "9GB", + "Recommended spark.memory.fraction" -> "0.6", + "Recommended spark.sql.shuffle.partitions" -> "20", + "Recommended spark.driver.cores" -> "2", + "Recommended spark.driver.memory" -> "2GB", + "Recommended spark.yarn.executor.memoryOverhead" -> "1946MB", + "stage details" -> expectedStageDetails) + checkHeuristicResults(result, Severity.CRITICAL, 28, expectedDetails) + } + + it("long tasks and execution memory spill 1") { + // There are both long tasks and execution memory spill, increasing the number of + // partitions for long tasks to 800 is sufficient to fix execution memory spill as well + val heuristicConfigurationData = createHeuristicConfigurationData() + val stages = Seq( + StageBuilder(1, 3).taskRuntime(50, 50, 1500).create(), + StageBuilder(2, 200).taskRuntime(600, 600, 120000).shuffleRead(500, 600, 12000).spill(50, 60, 1200).create(), + StageBuilder(3, 200).taskRuntime(30, 80, 1200).create(), + StageBuilder(4, 10).taskRuntime(100, 100, 1000).create()) + val executors = Seq( + createExecutorSummary("driver", 1500, 3, 300), + createExecutorSummary("1", 1500, 3, 300), + createExecutorSummary("2", 1000, 3, 300), + createExecutorSummary("3", 800, 3, 300) + ) + val properties = Map( + SPARK_EXECUTOR_MEMORY -> "2G", + SPARK_DRIVER_MEMORY -> "2G", + SPARK_EXECUTOR_CORES -> "4", + SPARK_DRIVER_CORES -> "2", + SPARK_EXECUTOR_INSTANCES -> "200", + SPARK_SQL_SHUFFLE_PARTITIONS -> "200", + SPARK_MEMORY_FRACTION -> "0.6" + ) + + val data = createSparkApplicationData(stages, executors, Some(properties)) + + val configurationParametersHeuristic = new ConfigurationParametersHeuristic( + heuristicConfigurationData) + val evaluator = new ConfigurationParametersHeuristic.Evaluator( + configurationParametersHeuristic, data) + + val result = configurationParametersHeuristic.apply(data) + val expectedStageDetails = "Stage 2 has a long median task run time of 10.00 min.\n" + + "Stage 2 has 200 tasks, 0 B input, 11.72 GB shuffle read, 0 B shuffle write, and 0 B output.\n" + + "Stage 2 has 1.17 GB execution memory spill." + val expectedDetails = Map( + "Current spark.executor.memory" -> "2GB", + "Current spark.driver.memory" -> "2GB", + "Current spark.executor.cores" -> "4", + "Current spark.driver.cores" -> "2", + "Current spark.memory.fraction" -> "0.6", + "Current spark.executor.instances" -> "200", + "Current spark.sql.shuffle.partitions" -> "200", + "Recommended spark.executor.cores" -> "4", + "Recommended spark.executor.memory" -> "2GB", + "Recommended spark.memory.fraction" -> "0.6", + "Recommended spark.sql.shuffle.partitions" -> "800", + "Recommended spark.driver.cores" -> "2", + "Recommended spark.driver.memory" -> "2GB", + "Recommended spark.executor.instances" -> "200", + "stage details" -> expectedStageDetails) + checkHeuristicResults(result, Severity.SEVERE, 1000, expectedDetails) + } + + it("long tasks and execution memory spill 2") { + // There are both long tasks and execution memory spill, increase the number of + // partitions and executor memory. 
+ val heuristicConfigurationData = createHeuristicConfigurationData() + val stages = Seq( + StageBuilder(1, 3).taskRuntime(50, 50, 1500).create(), + StageBuilder(2, 200).taskRuntime(90, 90, 1800).shuffleRead(500, 600, 12000).spill(500, 600, 600000).create(), + StageBuilder(3, 200).taskRuntime(900, 900, 180000).shuffleRead(500, 600, 12000).spill(50, 60, 1200).create(), + StageBuilder(4, 10).taskRuntime(100, 100, 1000).create()) + val executors = Seq( + createExecutorSummary("driver", 1500, 3, 300), + createExecutorSummary("1", 1500, 3, 300), + createExecutorSummary("2", 1000, 3, 300), + createExecutorSummary("3", 800, 3, 300) + ) + val properties = Map( + SPARK_EXECUTOR_MEMORY -> "2G", + SPARK_DRIVER_MEMORY -> "2G", + SPARK_EXECUTOR_CORES -> "4", + SPARK_DRIVER_CORES -> "2", + SPARK_EXECUTOR_INSTANCES -> "200", + SPARK_SQL_SHUFFLE_PARTITIONS -> "200", + SPARK_MEMORY_FRACTION -> "0.6" + ) + + val data = createSparkApplicationData(stages, executors, Some(properties)) + + val configurationParametersHeuristic = new ConfigurationParametersHeuristic( + heuristicConfigurationData) + val evaluator = new ConfigurationParametersHeuristic.Evaluator( + configurationParametersHeuristic, data) + + val result = configurationParametersHeuristic.apply(data) + val expectedStageDetails = "Stage 2 has 585.94 GB execution memory spill.\n" + + "Stage 3 has a long median task run time of 15.00 min.\n" + + "Stage 3 has 200 tasks, 0 B input, 11.72 GB shuffle read, 0 B shuffle write, and 0 B output.\n" + + "Stage 3 has 1.17 GB execution memory spill." + val expectedDetails = Map( + "Current spark.executor.memory" -> "2GB", + "Current spark.driver.memory" -> "2GB", + "Current spark.executor.cores" -> "4", + "Current spark.driver.cores" -> "2", + "Current spark.memory.fraction" -> "0.6", + "Current spark.executor.instances" -> "200", + "Current spark.sql.shuffle.partitions" -> "200", + "Recommended spark.executor.cores" -> "4", + "Recommended spark.executor.memory" -> "4GB", + "Recommended spark.memory.fraction" -> "0.6", + "Recommended spark.sql.shuffle.partitions" -> "1200", + "Recommended spark.driver.cores" -> "2", + "Recommended spark.driver.memory" -> "2GB", + "Recommended spark.executor.instances" -> "200", + "stage details" -> expectedStageDetails) + checkHeuristicResults(result, Severity.CRITICAL, 2000, expectedDetails) + } + + it("long tasks and execution memory spill 3") { + // There are both long tasks and execution memory spill, increase partitions + // and memory, and decrease cores. 
+ val heuristicConfigurationData = createHeuristicConfigurationData() + val stages = Seq( + StageBuilder(1, 3).taskRuntime(50, 50, 1500).create(), + StageBuilder(2, 200).taskRuntime(60, 60, 1200).shuffleRead(500, 600, 12000).spill(500, 600, 1200000).create(), + StageBuilder(3, 200).taskRuntime(600, 600, 120000).shuffleRead(500, 600, 12000).spill(50, 60, 1200).create(), + StageBuilder(4, 10).taskRuntime(100, 100, 1000).create()) + val executors = Seq( + createExecutorSummary("driver", 1500, 3, 300), + createExecutorSummary("1", 1500, 3, 300), + createExecutorSummary("2", 1000, 3, 300), + createExecutorSummary("3", 800, 3, 300) + ) + val properties = Map( + SPARK_EXECUTOR_MEMORY -> "2G", + SPARK_DRIVER_MEMORY -> "2G", + SPARK_EXECUTOR_CORES -> "4", + SPARK_DRIVER_CORES -> "2", + SPARK_EXECUTOR_INSTANCES -> "200", + SPARK_SQL_SHUFFLE_PARTITIONS -> "200", + SPARK_MEMORY_FRACTION -> "0.6" + ) + + val data = createSparkApplicationData(stages, executors, Some(properties)) + + val configurationParametersHeuristic = new ConfigurationParametersHeuristic( + heuristicConfigurationData) + val evaluator = new ConfigurationParametersHeuristic.Evaluator( + configurationParametersHeuristic, data) + + val result = configurationParametersHeuristic.apply(data) + val expectedStageDetails = "Stage 2 has 1.14 TB execution memory spill.\n" + + "Stage 3 has a long median task run time of 10.00 min.\n" + + "Stage 3 has 200 tasks, 0 B input, 11.72 GB shuffle read, 0 B shuffle write, and 0 B output.\n" + + "Stage 3 has 1.17 GB execution memory spill." + val expectedDetails = Map( + "Current spark.executor.memory" -> "2GB", + "Current spark.driver.memory" -> "2GB", + "Current spark.executor.cores" -> "4", + "Current spark.driver.cores" -> "2", + "Current spark.memory.fraction" -> "0.6", + "Current spark.executor.instances" -> "200", + "Current spark.sql.shuffle.partitions" -> "200", + "Recommended spark.executor.cores" -> "3", + "Recommended spark.executor.memory" -> "6GB", + "Recommended spark.memory.fraction" -> "0.6", + "Recommended spark.sql.shuffle.partitions" -> "2000", + "Recommended spark.driver.cores" -> "2", + "Recommended spark.driver.memory" -> "2GB", + "Recommended spark.executor.instances" -> "266", + "stage details" -> expectedStageDetails) + checkHeuristicResults(result, Severity.CRITICAL, 1800, expectedDetails) + } + + it("execution memory spill 1") { + // Execution memory spill for stages 2 and 3, stage 2 is processing a lot of data. + // Values should be calculated for stage 2, but do not flag stage 2. 
+ val heuristicConfigurationData = createHeuristicConfigurationData() + val stages = Seq( + StageBuilder(1, 3).taskRuntime(50, 50, 1500).create(), + StageBuilder(2, 200).taskRuntime(60, 60, 1200).shuffleRead(50000, 60000, 4000000).spill(500, 600, 4000000).create(), + StageBuilder(3, 200).taskRuntime(60, 60, 1200).shuffleRead(500, 600, 12000).spill(50, 60, 1200).create(), + StageBuilder(4, 10).taskRuntime(100, 100, 1000).create() + + ) + val executors = Seq( + createExecutorSummary("driver", 1500, 3, 300), + createExecutorSummary("1", 1500, 3, 300), + createExecutorSummary("2", 1000, 3, 300), + createExecutorSummary("3", 800, 3, 300) + ) + val properties = Map( + SPARK_EXECUTOR_MEMORY -> "2G", + SPARK_DRIVER_MEMORY -> "2G", + SPARK_EXECUTOR_CORES -> "4", + SPARK_DRIVER_CORES -> "2", + SPARK_EXECUTOR_INSTANCES -> "200", + SPARK_SQL_SHUFFLE_PARTITIONS -> "200", + SPARK_MEMORY_FRACTION -> "0.6" + ) + + val data = createSparkApplicationData(stages, executors, Some(properties)) + + val configurationParametersHeuristic = new ConfigurationParametersHeuristic( + heuristicConfigurationData) + val evaluator = new ConfigurationParametersHeuristic.Evaluator( + configurationParametersHeuristic, data) + + val result = configurationParametersHeuristic.apply(data) + val expectedStageDetails = + "Stage 2: a large amount of data is being processed. Examine the application to see if this can be reduced.\n" + + "Stage 2 has 3.81 TB execution memory spill.\n" + + "Stage 2 has 200 tasks, 0 B input read, 3.81 TB shuffle read, 0 B shuffle write, 0 B output.\n" + + "Stage 2 has median task values: 500 MB memory spill, 0 B input, 48.83 GB shuffle read, 0 B shuffle write, 0 B output.\n" + + "Stage 3 has 1.17 GB execution memory spill." + val expectedDetails = Map( + "Current spark.executor.memory" -> "2GB", + "Current spark.driver.memory" -> "2GB", + "Current spark.executor.cores" -> "4", + "Current spark.driver.cores" -> "2", + "Current spark.memory.fraction" -> "0.6", + "Current spark.executor.instances" -> "200", + "Current spark.sql.shuffle.partitions" -> "200", + "Recommended spark.executor.cores" -> "2", + "Recommended spark.executor.memory" -> "8GB", + "Recommended spark.memory.fraction" -> "0.6", + "Recommended spark.sql.shuffle.partitions" -> "2000", + "Recommended spark.driver.cores" -> "2", + "Recommended spark.driver.memory" -> "2GB", + "Recommended spark.executor.instances" -> "400", + "stage details" -> expectedStageDetails) + checkHeuristicResults(result, Severity.MODERATE, 400, expectedDetails) + } + + it("execution memory spill 2") { + // Execution memory spill for stages 1 and 2, where stage 1 has a different number of partitions.
+ val heuristicConfigurationData = createHeuristicConfigurationData() + val stages = Seq( + StageBuilder(1, 3).taskRuntime(50, 50, 1500).input(50000, 60000, 2000000).spill(5000, 6000, 2000000).create(), + StageBuilder(2, 200).taskRuntime(60, 60, 1200).shuffleRead(5000, 6000, 400000).spill(500, 600, 400000).create(), + StageBuilder(3, 200).taskRuntime(60, 60, 1200).create(), + StageBuilder(4, 10).taskRuntime(100, 100, 1000).create()) + val executors = Seq( + createExecutorSummary("driver", 1500, 3, 300), + createExecutorSummary("1", 1500, 3, 300), + createExecutorSummary("2", 1000, 3, 300), + createExecutorSummary("3", 800, 3, 300) + ) + val properties = Map( + SPARK_EXECUTOR_MEMORY -> "2G", + SPARK_DRIVER_MEMORY -> "2G", + SPARK_EXECUTOR_CORES -> "4", + SPARK_DRIVER_CORES -> "2", + SPARK_EXECUTOR_INSTANCES -> "200", + SPARK_SQL_SHUFFLE_PARTITIONS -> "200", + SPARK_MEMORY_FRACTION -> "0.6" + ) + + val data = createSparkApplicationData(stages, executors, Some(properties)) + + val configurationParametersHeuristic = new ConfigurationParametersHeuristic( + heuristicConfigurationData) + val evaluator = new ConfigurationParametersHeuristic.Evaluator( + configurationParametersHeuristic, data) + + val result = configurationParametersHeuristic.apply(data) + val expectedStageDetails = "Stage 1 has 1.91 TB execution memory spill.\n" + + "Stage 2 has 390.62 GB execution memory spill." + val expectedDetails = Map( + "Current spark.executor.memory" -> "2GB", + "Current spark.driver.memory" -> "2GB", + "Current spark.executor.cores" -> "4", + "Current spark.driver.cores" -> "2", + "Current spark.memory.fraction" -> "0.6", + "Current spark.executor.instances" -> "200", + "Current spark.sql.shuffle.partitions" -> "200", + "Recommended spark.executor.cores" -> "4", + "Recommended spark.executor.memory" -> "4GB", + "Recommended spark.memory.fraction" -> "0.6", + "Recommended spark.sql.shuffle.partitions" -> "1000", + "Recommended spark.driver.cores" -> "2", + "Recommended spark.driver.memory" -> "2GB", + "Recommended spark.executor.instances" -> "200", + "stage details" -> expectedStageDetails) + checkHeuristicResults(result, Severity.CRITICAL, 812, expectedDetails) + } + } + + /** + * Check if the calculated heuristic results match the expected values. + * + * @param actual the actual heuristic result. + * @param expectedSeverity expected severity. + * @param expectedScore expected score. + * @param expectedDetails expected details.
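+ * Details are matched by name rather than by position, so the order of the result details does not matter.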
+ */ + private def checkHeuristicResults( + actual: HeuristicResult, + expectedSeverity: Severity, + expectedScore: Int, + expectedDetails: Map[String, String]) = { + actual.getSeverity should be(expectedSeverity) + actual.getScore should be(expectedScore) + actual.getHeuristicResultDetails.size() should be(expectedDetails.size) + (0 until expectedDetails.size).foreach { i => + val actualDetail = actual.getHeuristicResultDetails.get(i) + Some(actualDetail.getValue) should be (expectedDetails.get(actualDetail.getName)) + } + } +} diff --git a/test/com/linkedin/drelephant/spark/heuristics/SparkTestUtilities.scala b/test/com/linkedin/drelephant/spark/heuristics/SparkTestUtilities.scala new file mode 100644 index 000000000..cf2ad79b7 --- /dev/null +++ b/test/com/linkedin/drelephant/spark/heuristics/SparkTestUtilities.scala @@ -0,0 +1,542 @@ +package com.linkedin.drelephant.spark.heuristics + +import java.util.Date + +import com.linkedin.drelephant.analysis.{ApplicationType, Severity} +import com.linkedin.drelephant.configurations.heuristic.HeuristicConfigurationData +import com.linkedin.drelephant.spark.data.{SparkApplicationData, SparkLogDerivedData, SparkRestDerivedData} +import com.linkedin.drelephant.spark.fetchers.statusapiv1._ +import org.apache.spark.scheduler.SparkListenerEnvironmentUpdate + +import scala.collection.JavaConverters + +private[heuristics] object SparkTestUtilities { + import JavaConverters._ + import java.text.SimpleDateFormat + + val OOM_ERROR = "java.lang.OutOfMemoryError" + val OVERHEAD_MEMORY_ERROR = "killed by YARN for exceeding memory limits" + + private val sdf = new SimpleDateFormat("dd/MM/yyyy HH:mm:ss") + + /** Create a sample heuristic configuration data. */ + def createHeuristicConfigurationData( + params: Map[String, String] = Map.empty): HeuristicConfigurationData = + new HeuristicConfigurationData("heuristic", "class", "view", new ApplicationType("type"), params.asJava) + + /** + * Builder for creating a StageAnalysis. + * + * @param stageId stage ID. + * @param numTasks total number of tasks for the stage. + */ + case class StageAnalysisBuilder(stageId: Int, numTasks: Int) { + var rawSpillSeverity = Severity.NONE + var executionSpillSeverity = Severity.NONE + var longTaskSeverity = Severity.NONE + var rawSkewSeverity = Severity.NONE + var taskSkewSeverity = Severity.NONE + var failedWithOOMSeverity = Severity.NONE + var failedWithContainerKilledSeverity = Severity.NONE + var gcSeverity = Severity.NONE + var taskFailureSeverity = Severity.NONE + var stageFailureSeverity = Severity.NONE + var spillScore = 0 + var longTaskScore = 0 + var taskSkewScore = 0 + var taskFailureScore = 0 + var stageFailureScore = 0 + var gcScore = 0 + var medianRunTime: Option[Double] = None + var maxRunTime: Option[Double] = None + var memoryBytesSpilled = 0L + var maxTaskBytesSpilled = 0L + var inputBytes: Long = 0L + var outputBytes: Long = 0L + var shuffleReadBytes: Long = 0L + var shuffleWriteBytes: Long = 0L + var numFailedTasks = 0 + var numTasksWithOOM = 0 + var numTasksWithContainerKilled = 0 + var stageDuration = Some((5 * 60 * 1000).toLong) + var spillDetails: Seq[String] = Seq() + var longTaskDetails: Seq[String] = Seq() + var taskSkewDetails: Seq[String] = Seq() + var taskFailureDetails: Seq[String] = Seq() + var stageFailureDetails: Seq[String] = Seq() + var gcDetails: Seq[String] = Seq() + + /** + * Configure execution memory spill-related parameters. + * + * @param raw the raw execution memory spill severity.
+ * @param severity the reported execution memory spill severity. + * @param score score from the execution memory spill analysis. + * @param maxTaskSpillMb maximum amount (MB) of execution memory spill for a task. + * @param bytesSpilledMb total amount (MB) of execution memory spill. + * @param details information and recommendations for execution memory spill. + * @return this StageAnalysisBuilder. + */ + def spill( + raw: Severity, + severity: Severity, + score: Int, + maxTaskSpillMb: Long, + bytesSpilledMb: Long, + details: Seq[String]): StageAnalysisBuilder = { + rawSpillSeverity = raw + executionSpillSeverity = severity + spillScore = score + maxTaskBytesSpilled = maxTaskSpillMb << 20 + memoryBytesSpilled = bytesSpilledMb << 20 + spillDetails = details + this + } + + /** Set the amount of input data in MB. */ + def input(inputMb: Long): StageAnalysisBuilder = { + inputBytes = inputMb << 20 + this + } + + /** Set the amount of output data in MB. */ + def output(outputMb: Long): StageAnalysisBuilder = { + outputBytes = outputMb << 20 + this + } + + /** Set the amount of shuffle read data in MB. */ + def shuffleRead(shuffleReadMb: Long): StageAnalysisBuilder = { + shuffleReadBytes = shuffleReadMb << 20 + this + } + + /** Set the amount of shuffle write data in MB. */ + def shuffleWrite(shuffleWriteMb: Long): StageAnalysisBuilder = { + shuffleWriteBytes = shuffleWriteMb << 20 + this + } + + /** Set the stage duration. */ + def duration(sec: Long): StageAnalysisBuilder = { + stageDuration = Some(sec * 1000) + this + } + + /** Set the median and max task runtimes in seconds. */ + def taskRuntime(median: Double, maximum: Double): StageAnalysisBuilder = { + medianRunTime = Some(median * 1000) + maxRunTime = Some(maximum * 1000) + this + } + + /** Set the long task analysis information. */ + def longTask(severity: Severity, score: Int, details: Seq[String]): StageAnalysisBuilder = { + longTaskSeverity = severity + longTaskScore = score + longTaskDetails = details + this + } + + /** Set the raw and reported task skew severity and details. */ + def skew( + raw: Severity, + severity: Severity, + score: Int, + details: Seq[String]): StageAnalysisBuilder = { + rawSkewSeverity = raw + taskSkewSeverity = severity + taskSkewScore = score + taskSkewDetails = details + this + } + + /** + * Configure stage failure information. + * + * @param severity severity of stage failure. + * @param score score for stage failure analysis. + * @param details information and recommendations. + * @return this StageAnalysisBuilder. + */ + def stageFailure(severity: Severity, + score: Int, + details: Seq[String]): StageAnalysisBuilder = { + stageFailureSeverity = severity + stageFailureScore = score + stageFailureDetails = details + this + } + + /** + * Configure task failure information. + * + * @param taskSeverity severity of all task failures. + * @param oomSeverity severity of task failures due to OutOfMemory errors. + * @param containerKilledSeverity severity of failures due to containers killed by YARN. + * @param score score from task failure analysis. + * @param numFailures total number of task failures. + * @param numOOM total number of tasks failed with OutOfMemory errors. + * @param numContainerKilled total number of tasks failed due to container killed by YARN. + * @param details information and recommendations for task failures. + * @return this StageAnalysisBuilder.
+ */ + def taskFailures( + taskSeverity: Severity, + oomSeverity: Severity, + containerKilledSeverity: Severity, + score: Int, + numFailures: Int, + numOOM: Int, + numContainerKilled: Int, + details: Seq[String]): StageAnalysisBuilder = { + taskFailureSeverity = taskSeverity + failedWithOOMSeverity = oomSeverity + failedWithContainerKilledSeverity = containerKilledSeverity + taskFailureScore = score + numFailedTasks = numFailures + numTasksWithOOM = numOOM + numTasksWithContainerKilled = numContainerKilled + taskFailureDetails = details + this + } + + /** Create the StageAnalysis. */ + def create(): StageAnalysis = { + StageAnalysis( + stageId, + ExecutionMemorySpillResult(executionSpillSeverity, spillScore, spillDetails, + rawSpillSeverity, memoryBytesSpilled, maxTaskBytesSpilled), + SimpleStageAnalysisResult(longTaskSeverity, longTaskScore, longTaskDetails), + TaskSkewResult(taskSkewSeverity, taskSkewScore, taskSkewDetails, rawSkewSeverity), + TaskFailureResult(taskFailureSeverity, taskFailureScore, taskFailureDetails, + failedWithOOMSeverity, failedWithContainerKilledSeverity, numFailedTasks, + numTasksWithOOM, numTasksWithContainerKilled), + SimpleStageAnalysisResult(stageFailureSeverity, stageFailureScore, stageFailureDetails), + SimpleStageAnalysisResult(gcSeverity, gcScore, gcDetails), + numTasks, medianRunTime, maxRunTime, stageDuration, inputBytes, outputBytes, + shuffleReadBytes, shuffleWriteBytes) + } + } + + /** + * Builder for creating StageData. + * + * @param stageId stage ID + * @param numTasks total number of tasks for the stage. + */ + case class StageBuilder(stageId: Int, numTasks: Int) { + val stage = new StageDataImpl( + StageStatus.COMPLETE, + stageId, + attemptId = 0, + numTasks = numTasks, + numActiveTasks = numTasks, + numCompleteTasks = numTasks, + numFailedTasks = 0, + executorRunTime = 0, + executorCpuTime = 0, + submissionTime = Some(sdf.parse("09/09/2018 12:00:00")), + firstTaskLaunchedTime = None, + completionTime = Some(sdf.parse("09/09/2018 12:05:00")), + failureReason = None, + + inputBytes = 0, + inputRecords = 0, + outputBytes = 0, + outputRecords = 0, + shuffleReadBytes = 0, + shuffleReadRecords = 0, + shuffleWriteBytes = 0, + shuffleWriteRecords = 0, + memoryBytesSpilled = 0, + diskBytesSpilled = 0, + name = "foo", + details = "stage details", + schedulingPool = "", + accumulatorUpdates = Seq.empty, + tasks = None, + executorSummary = None, + peakJvmUsedMemory = None, + peakExecutionMemory = None, + peakStorageMemory = None, + peakUnifiedMemory = None, + taskSummary = None, + executorMetricsSummary = None + ) + + /** Create the specified number of tasks for the stage. */ + private def createTasks(numTasks: Int): Map[Long, TaskDataImpl] = { + (1 until (numTasks + 1)).map { i => + (i.toLong, new TaskDataImpl( + taskId = i.toLong, + index = 1, + attempt = 0, + launchTime = new Date(), + executorId = "1", + host = "SomeHost", + taskLocality = "ANY", + speculative = false, + accumulatorUpdates = Seq(), + errorMessage = None, + taskMetrics = None)) + }.toMap + } + + /** Set the stage status. */ + def status(stageStatus: StageStatus, reason: Option[String]): StageBuilder = { + stage.status = stageStatus + stage.failureReason = reason + this + } + + /** + * Set the run times. + * + * @param medianS median task run time in seconds. + * @param maxS maximum task runtime in seconds. + * @param totalS total runtime for all tasks. + * @return this StageBuilder. 
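+ * Note: the executorRunTime distribution is populated as (median/2, median, median, median, max).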
+ */ + def taskRuntime(medianS: Int, maxS: Int, totalS: Int): StageBuilder = { + val taskMetricDistributions = getTaskMetricDistributions() + val medianMs = (medianS * 1000).toDouble + val maxMs = (maxS * 1000).toDouble + taskMetricDistributions.executorRunTime = + IndexedSeq(medianMs/2, medianMs, medianMs, medianMs, maxMs) + stage.executorRunTime = totalS * 1000 + this + } + + /** + * Set the input information. + * + * @param medianMB median amount of input read for a task in MB. + * @param maxMB maximum amount of input read for a task in MB. + * @param totalMB total amount of input read for the stage in MB. + * @return this StageBuilder. + */ + def input(medianMB: Long, maxMB: Long, totalMB: Long): StageBuilder = { + val taskMetricDistributions = getTaskMetricDistributions() + val medianBytes = (medianMB << 20).toDouble + val maxBytes = (maxMB << 20).toDouble + taskMetricDistributions.inputMetrics = + Some(new InputMetricDistributionsImpl( + IndexedSeq(medianBytes/2, medianBytes, medianBytes, medianBytes, maxBytes), + IndexedSeq(1000.0, 2000.0, 2000.0, 2000.0, 3000.0))) + stage.inputBytes = totalMB << 20 + this + } + + /** + * Set the output information. + * + * @param medianMB median amount of output written for a task in MB. + * @param maxMB maximum amount of output written for a task in MB. + * @param totalMB total amount of output written for the stage in MB. + * @return this StageBuilder. + */ + def output(medianMB: Long, maxMB: Long, totalMB: Long): StageBuilder = { + val taskMetricDistributions = getTaskMetricDistributions() + val medianBytes = (medianMB << 20).toDouble + val maxBytes = (maxMB << 20).toDouble + taskMetricDistributions.outputMetrics = + Some(new OutputMetricDistributionsImpl( + IndexedSeq(medianBytes/2, medianBytes, medianBytes, medianBytes, maxBytes), + IndexedSeq(1000.0, 2000.0, 2000.0, 2000.0, 3000.0))) + stage.outputBytes = totalMB << 20 + this + } + + /** + * Set the shuffle read information. + * + * @param medianMB median amount of shuffle read for a task in MB. + * @param maxMB maximum amount of shuffle read for a task in MB. + * @param totalMB total amount of shuffle read for the stage in MB. + * @return this StageBuilder. + */ + def shuffleRead(medianMB: Long, maxMB: Long, totalMB: Long): StageBuilder = { + val taskMetricDistributions = getTaskMetricDistributions() + val medianBytes = (medianMB << 20).toDouble + val maxBytes = (maxMB << 20).toDouble + taskMetricDistributions.shuffleReadMetrics = + Some(new ShuffleReadMetricDistributionsImpl( + IndexedSeq(medianBytes/2, medianBytes, medianBytes, medianBytes, maxBytes), + IndexedSeq(1000.0, 2000.0, 2000.0, 2000.0, 3000.0), + IndexedSeq(0.0, 0.0, 0.0, 0.0, 0.0), + IndexedSeq(0.0, 0.0, 0.0, 0.0, 0.0), + IndexedSeq(0.0, 0.0, 0.0, 0.0, 0.0), + IndexedSeq(0.0, 0.0, 0.0, 0.0, 0.0), + IndexedSeq(0.0, 0.0, 0.0, 0.0, 0.0), + IndexedSeq(0.0, 0.0, 0.0, 0.0, 0.0))) + stage.shuffleReadBytes = totalMB << 20 + this + } + + /** + * Set the shuffle write information. + * + * @param medianMB median amount of shuffle write for a task in MB. + * @param maxMB maximum amount of shuffle write for a task in MB. + * @param totalMB total amount of shuffle write for the stage in MB. + * @return this StageBuilder. 
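+ * Note: MB arguments are converted to bytes with a 20-bit left shift (1 MB = 1 << 20 bytes).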
+ */ + def shuffleWrite(medianMB: Long, maxMB: Long, totalMB: Long): StageBuilder = { + val taskMetricDistributions = getTaskMetricDistributions() + val medianBytes = (medianMB << 20).toDouble + val maxBytes = (maxMB << 20).toDouble + taskMetricDistributions.shuffleWriteMetrics = + Some(new ShuffleWriteMetricDistributionsImpl( + IndexedSeq(medianBytes/2, medianBytes, medianBytes, medianBytes, maxBytes), + IndexedSeq(1000.0, 2000.0, 2000.0, 2000.0, 3000.0), + IndexedSeq(0.0, 0.0, 0.0, 0.0, 0.0))) + stage.shuffleWriteBytes = totalMB << 20 + this + } + + /** + * Set the execution memory spill information. + * + * @param medianMB median amount of execution memory spill for a task in MB. + * @param maxMB maximum amount of execution memory spill for a task in MB. + * @param totalMB total amount of execution memory spill for the stage in MB. + * @return this StageBuilder. + */ + def spill(medianMB: Long, maxMB: Long, totalMB: Long): StageBuilder = { + val taskMetricDistributions = getTaskMetricDistributions() + val medianBytes = (medianMB << 20).toDouble + val maxBytes = (maxMB << 20).toDouble + taskMetricDistributions.memoryBytesSpilled = + IndexedSeq(medianBytes/2, medianBytes, medianBytes, medianBytes, maxBytes) + stage.memoryBytesSpilled = totalMB << 20 + this + } + + /** + * Set the failure information. + * + * @param numFailed total number of tasks failed. + * @param numOOM total number of tasks which failed due to OutOfMemory. + * @param numContainerKilled total number of tasks that failed due to container killed by YARN. + * @return this StageBuilder. + */ + def failures(numFailed: Int, numOOM: Int, numContainerKilled: Int): StageBuilder = { + stage.tasks = Some(createTasks(numFailed)) + (1 until (numOOM + 1)).foreach { i => + stage.tasks.get(i.toLong).errorMessage = Some(OOM_ERROR) + } + ((numOOM + 1) until (numOOM + numContainerKilled + 1)).foreach { i => + stage.tasks.get(i.toLong).errorMessage = Some(OVERHEAD_MEMORY_ERROR) + } + ((numOOM + numContainerKilled + 1) until numFailed + 1).foreach { i => + stage.tasks.get(i.toLong).errorMessage = Some("ArrayIndexOutOfBoundsException") + } + stage.numFailedTasks = numFailed + this + } + + /** Set the stage submission and completion times. */ + def times(submissionTime: String, completionTime: String): StageBuilder = { + stage.submissionTime = Some(sdf.parse(submissionTime)) + stage.completionTime = Some(sdf.parse(completionTime)) + this + } + + /** Create the StageDataImpl. */ + def create(): StageDataImpl = stage + + /** @return a TaskMetricDistributionsImpl for the StageData, creating it if needed.
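+ * All distributions are seeded with five quantiles (0.0, 0.25, 0.5, 0.75, 1.0); builder methods overwrite only the metrics they set.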
*/ + private def getTaskMetricDistributions(): TaskMetricDistributionsImpl = { + stage.taskSummary match { + case None => + val taskMetricDistributions = + new TaskMetricDistributionsImpl( + quantiles = IndexedSeq(0.0, 0.25, 0.5, 0.75, 1.0), + executorDeserializeTime = IndexedSeq(0.0, 0.0, 0.1, 0.1, 0.2), + executorDeserializeCpuTime = IndexedSeq(0.0, 0.0, 0.1, 0.1, 0.2), + executorRunTime = IndexedSeq(1000.0, 5000.0, 6000.0, 6500.0, 7000.0), + executorCpuTime = IndexedSeq(1000.0, 5000.0, 6000.0, 6500.0, 7000.0), + resultSize = IndexedSeq(0.0, 0.0, 0.0, 0.0, 0.0), + jvmGcTime = IndexedSeq(0.0, 0.0, 0.0, 0.0, 0.0), + resultSerializationTime = IndexedSeq(0.0, 0.0, 0.0, 0.0, 0.0), + gettingResultTime = IndexedSeq(0.0, 0.0, 0.0, 0.0, 0.0), + schedulerDelay = IndexedSeq(0.0, 0.0, 0.0, 0.0, 0.0), + peakExecutionMemory = IndexedSeq(0.0, 0.0, 0.0, 0.0, 0.0), + memoryBytesSpilled = IndexedSeq(0.0, 0.0, 0.0, 0.0, 0.0), + diskBytesSpilled = IndexedSeq(0.0, 0.0, 0.0, 0.0, 0.0), + inputMetrics = None, + outputMetrics = None, + shuffleReadMetrics = None, + shuffleWriteMetrics = None) + stage.taskSummary = Some(taskMetricDistributions) + taskMetricDistributions + case Some(taskMetricDistributions) => + taskMetricDistributions + } + } + } + + /** + * Create an executor metrics summary. + * + * @param id executor ID. + * @param jvmUsedMemoryMb peak JVM used memory for the executor. + * @param totalGCTimeSec total time spent in GC by the executor. + * @param totalDurationSec total task runtime for the executor. + * @return executor summary. + */ + private[heuristics] def createExecutorSummary( + id: String, + jvmUsedMemoryMb: Long, + totalGCTimeSec: Long, + totalDurationSec: Long): ExecutorSummaryImpl = new ExecutorSummaryImpl( + id, + hostPort = "", + rddBlocks = 0, + memoryUsed = 0, + diskUsed = 0, + activeTasks = 0, + failedTasks = 0, + completedTasks = 0, + totalTasks = 0, + maxTasks = 0, + totalDurationSec * 1000, + totalInputBytes = 0, + totalShuffleRead = 0, + totalShuffleWrite = 0, + maxMemory = 0, + totalGCTimeSec * 1000, + totalMemoryBytesSpilled = 0, + executorLogs = Map.empty, + peakJvmUsedMemory = Map("jvmUsedMemory" -> (jvmUsedMemoryMb << 20)), + peakUnifiedMemory = Map.empty + ) + + /** + * Create the Spark application data. + * + * @param stages list of stage data. + * @param executorSummaries list of executor summaries. + * @param properties configuration properties for the Spark application. + * @return Spark application data.
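+ * Note: when properties is None, no SparkLogDerivedData is attached to the application data.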
+ */ + def createSparkApplicationData + (stages: Seq[StageDataImpl], + executorSummaries: Seq[ExecutorSummaryImpl], + properties: Option[Map[String, String]]): SparkApplicationData = { + val appId = "application_1" + + val logDerivedData = properties.map { props => + SparkLogDerivedData( + SparkListenerEnvironmentUpdate(Map("Spark Properties" -> props.toSeq)) + )} + + val restDerivedData = SparkRestDerivedData( + new ApplicationInfoImpl(appId, name = "app", Seq.empty), + jobDatas = Seq.empty, + stageDatas = stages, + executorSummaries = executorSummaries, + stagesWithFailedTasks = stages + ) + SparkApplicationData(appId, restDerivedData, logDerivedData) + } +} diff --git a/test/com/linkedin/drelephant/spark/heuristics/StagesAnalyzerTest.scala b/test/com/linkedin/drelephant/spark/heuristics/StagesAnalyzerTest.scala new file mode 100644 index 000000000..6d240ebef --- /dev/null +++ b/test/com/linkedin/drelephant/spark/heuristics/StagesAnalyzerTest.scala @@ -0,0 +1,465 @@ +package com.linkedin.drelephant.spark.heuristics + +import java.util.Date + +import com.linkedin.drelephant.analysis.{ApplicationType, Severity} +import com.linkedin.drelephant.spark.fetchers.statusapiv1._ +import org.scalatest.{FunSpec, Matchers} + +import scala.collection.JavaConverters + +/** Tests for the StagesAnalyzer. */ +class StagesAnalyzerTest extends FunSpec with Matchers { + import SparkTestUtilities._ + + describe("StagesAnalyzer") { + it("has task failures severity") { + val heuristicConfigurationData = createHeuristicConfigurationData() + val stages = Seq( + StageBuilder(1, 3).create(), + StageBuilder(2, 5).failures(2, 2, 0).create(), + StageBuilder(3, 15).failures(2, 0, 1).create(), + StageBuilder(4, 15).failures(3, 1, 2).create(), + StageBuilder(5, 4).failures(2, 0, 0).status(StageStatus.FAILED, Some("array issues")).create()) + val properties = Map( "spark.sql.shuffle.partitions" -> "200") + val data = createSparkApplicationData(stages, Seq.empty, Some(properties)) + + val expectedAnalysis = Seq( + StageAnalysisBuilder(1, 3).create(), + StageAnalysisBuilder(2, 5) + .taskFailures(Severity.CRITICAL, Severity.CRITICAL, Severity.NONE, 8, 2, 2, 0, + Seq("Stage 2 has 2 failed tasks.", + "Stage 2 has 2 tasks that failed because of OutOfMemory exception.")) + .create(), + StageAnalysisBuilder(3, 15) + .taskFailures(Severity.MODERATE, Severity.NONE, Severity.LOW, 4, 2, 0, 1, + Seq("Stage 3 has 2 failed tasks.", + "Stage 3 has 1 tasks that failed because the container was killed by YARN for exeeding memory limits.")) + .create(), + StageAnalysisBuilder(4, 15) + .taskFailures(Severity.CRITICAL, Severity.LOW, Severity.MODERATE, 12, 3, 1, 2, + Seq("Stage 4 has 3 failed tasks.", + "Stage 4 has 1 tasks that failed because of OutOfMemory exception.", + "Stage 4 has 2 tasks that failed because the container was killed by YARN for exeeding memory limits.")) + .create(), + StageAnalysisBuilder(5, 4) + .taskFailures(Severity.CRITICAL, Severity.NONE, Severity.NONE, 8, 2, 0, 0, + Seq("Stage 5 has 2 failed tasks.")) + .stageFailure(Severity.CRITICAL, 16, Seq("Stage 5 failed: array issues")) + .create()) + + val stageAnalyzer = new StagesAnalyzer(heuristicConfigurationData, data) + val stageAnalysis = stageAnalyzer.getStageAnalysis() + (0 until expectedAnalysis.size).foreach { i => + compareStageAnalysis(stageAnalysis(i), expectedAnalysis(i)) + } + } + + it("has task skew severity") { + val heuristicConfigurationData = createHeuristicConfigurationData() + val stages = Seq( + StageBuilder(1, 5).taskRuntime(200, 250, 600).create(), 
+ StageBuilder(2, 5).taskRuntime(100, 250, 260).input(5, 250, 260).create(), + StageBuilder(3, 5).taskRuntime(20, 250, 53).create(), + StageBuilder(4, 5).taskRuntime(5, 250, 260).input(5, 250, 260).create(), + StageBuilder(5, 5).taskRuntime(50, 250, 350).shuffleRead(50, 250, 350).shuffleWrite(50, 250, 400).create(), + StageBuilder(6, 5).taskRuntime(50, 250, 350).shuffleRead(50, 50, 50).output(50, 50, 50).create(), + StageBuilder(7, 5).taskRuntime(20, 250, 290).shuffleWrite(250, 250, 600).output(20, 250, 290).create(), + StageBuilder(8, 3).taskRuntime(200, 250, 1000).create(), + StageBuilder(9, 3).taskRuntime(5, 250, 70).create(), + StageBuilder(10, 3).taskRuntime(20, 250, 300).input(20, 250, 300).create(), + StageBuilder(11, 3).taskRuntime(50, 250, 350).shuffleRead(50, 250, 350).create(), + StageBuilder(12, 5).taskRuntime(2, 50, 53).times("09/09/2018 12:00:00", "09/09/2018 12:01:00").create(), + StageBuilder(13, 5).taskRuntime(5, 50, 60).input(50, 500, 600).create(), + StageBuilder(14, 5).taskRuntime(5, 200, 210).output(5, 200, 210).create()) + val properties = Map( "spark.sql.shuffle.partitions" -> "5") + val data = createSparkApplicationData(stages, Seq.empty, Some(properties)) + + val expectedAnalysis = Seq( + StageAnalysisBuilder(1, 5).taskRuntime(200, 250) + .longTask(Severity.LOW, 0, Seq()).create(), + StageAnalysisBuilder(2, 5).taskRuntime(100, 250).input(260) + .skew(Severity.LOW, Severity.LOW, 0, + Seq()).create(), + StageAnalysisBuilder(3, 5).taskRuntime(20, 250) + .skew(Severity.SEVERE, Severity.SEVERE, 15, + Seq("Stage 3 has skew in task run time (median is 20.00 sec, max is 4.17 min).", + "Stage 3: please try to modify the application to make the partitions more even.")).create(), + StageAnalysisBuilder(4, 5).taskRuntime(5, 250).input(260) + .skew(Severity.CRITICAL, Severity.CRITICAL, 20, + Seq("Stage 4 has skew in task run time (median is 5.00 sec, max is 4.17 min).", + "Stage 4 has skew in task input bytes (median is 5 MB, max is 250 MB).", + "Stage 4: please try to modify the application to make the input partitions more even.")).create(), + StageAnalysisBuilder(5, 5).taskRuntime(50, 250).shuffleRead(350).shuffleWrite(400) + .skew(Severity.MODERATE, Severity.MODERATE, 10, + Seq("Stage 5 has skew in task run time (median is 50.00 sec, max is 4.17 min).", + "Stage 5 has skew in task shuffle read bytes (median is 50 MB, max is 250 MB).", + "Stage 5 has skew in task shuffle write bytes (median is 50 MB, max is 250 MB).", + "Stage 5: please try to modify the application to make the partitions more even.")).create(), + StageAnalysisBuilder(6, 5).taskRuntime(50, 250).shuffleRead(50).output(50) + .skew(Severity.MODERATE, Severity.MODERATE, 10, + Seq( "Stage 6 has skew in task run time (median is 50.00 sec, max is 4.17 min).", + "Stage 6: please try to modify the application to make the partitions more even.")).create(), + StageAnalysisBuilder(7, 5).taskRuntime(20, 250).shuffleWrite(600).output(290) + .skew(Severity.SEVERE, Severity.SEVERE, 15, + Seq("Stage 7 has skew in task run time (median is 20.00 sec, max is 4.17 min).", + "Stage 7 has skew in task output bytes (median is 20 MB, max is 250 MB).", + "Stage 7: please try to modify the application to make the partitions more even.")).create(), + StageAnalysisBuilder(8, 3).taskRuntime(200, 250) + .longTask(Severity.LOW, 0, Seq()).create(), + StageAnalysisBuilder(9, 3).taskRuntime(5, 250) + .skew(Severity.CRITICAL, Severity.CRITICAL, 12, + Seq("Stage 9 has skew in task run time (median is 5.00 sec, max is 4.17 min).", + "Stage 9: 
please try to modify the application to make the partitions more even.")).create(), + StageAnalysisBuilder(10, 3).taskRuntime(20, 250).input(300) + .skew(Severity.SEVERE, Severity.SEVERE, 9, + Seq("Stage 10 has skew in task run time (median is 20.00 sec, max is 4.17 min).", + "Stage 10 has skew in task input bytes (median is 20 MB, max is 250 MB).", + "Stage 10: please try to modify the application to make the input partitions more even.")).create(), + StageAnalysisBuilder(11, 3).taskRuntime(50, 250).shuffleRead(350) + .skew(Severity.MODERATE, Severity.MODERATE, 6, + Seq("Stage 11 has skew in task run time (median is 50.00 sec, max is 4.17 min).", + "Stage 11 has skew in task shuffle read bytes (median is 50 MB, max is 250 MB).", + "Stage 11: please try to modify the application to make the partitions more even.")).create(), + StageAnalysisBuilder(12, 5).taskRuntime(2, 50).duration(60) + .skew(Severity.CRITICAL, Severity.NONE, 0, + Seq()).create(), + StageAnalysisBuilder(13, 5).taskRuntime(5, 50).input(600) + .skew(Severity.SEVERE, Severity.NONE, 0, + Seq()).create(), + StageAnalysisBuilder(14, 5).taskRuntime(5, 200).output(210) + .skew(Severity.CRITICAL, Severity.NONE, 0, + Seq()).create()) + + val stageAnalyzer = new StagesAnalyzer(heuristicConfigurationData, data) + val stageAnalysis = stageAnalyzer.getStageAnalysis() + (0 until expectedAnalysis.size).foreach { i => + compareStageAnalysis(stageAnalysis(i), expectedAnalysis(i)) + } + } + + it("has long task severity") { + val heuristicConfigurationData = createHeuristicConfigurationData() + val stages = Seq( + StageBuilder(1, 3).taskRuntime(120, 150, 300).create(), + StageBuilder(2, 3).taskRuntime(180, 200, 400).create(), + StageBuilder(3, 3).taskRuntime(400, 500, 1000).create(), + StageBuilder(4, 3).taskRuntime(700, 900, 2000).create(), + StageBuilder(5, 3).taskRuntime(1200, 1500, 4000).create(), + StageBuilder(6, 3).taskRuntime(700, 3500, 4500).create(), + StageBuilder(7, 2).taskRuntime(700, 900, 2000).create(), + StageBuilder(8, 3).taskRuntime(3000, 3000, 9000).input(2 << 20, 3 << 20, 5 << 20).create(), + StageBuilder(9, 4003).taskRuntime(3000, 3000, 9000).shuffleRead(2 << 20, 3 << 20, 5 << 20).create(), + StageBuilder(10, 4000).taskRuntime(700, 900, 2000).create()) + val properties = Map( "spark.sql.shuffle.partitions" -> "3") + val data = createSparkApplicationData(stages, Seq.empty, Some(properties)) + + val expectedAnalysis = Seq( + StageAnalysisBuilder(1, 3).taskRuntime(120, 150).create(), + StageAnalysisBuilder(2, 3).taskRuntime(180, 200).longTask(Severity.LOW, 0, Seq()).create(), + StageAnalysisBuilder(3, 3).taskRuntime(400, 500).longTask(Severity.MODERATE, 6, + Seq("Stage 3 has a long median task run time of 6.67 min.", + "Stage 3 has 3 tasks, 0 B input, 0 B shuffle read, 0 B shuffle write, and 0 B output.")).create(), + StageAnalysisBuilder(4, 3).taskRuntime(700, 900).longTask(Severity.SEVERE, 9, + Seq("Stage 4 has a long median task run time of 11.67 min.", + "Stage 4 has 3 tasks, 0 B input, 0 B shuffle read, 0 B shuffle write, and 0 B output.")).create(), + StageAnalysisBuilder(5, 3).taskRuntime(1200, 1500).longTask(Severity.CRITICAL, 12, + Seq("Stage 5 has a long median task run time of 20.00 min.", + "Stage 5 has 3 tasks, 0 B input, 0 B shuffle read, 0 B shuffle write, and 0 B output.")).create(), + StageAnalysisBuilder(6, 3).taskRuntime(700, 3500).longTask(Severity.SEVERE, 9, + Seq("Stage 6 has a long median task run time of 11.67 min.", + "Stage 6 has 3 tasks, 0 B input, 0 B shuffle read, 0 B shuffle write, and 0 B 
output.")) + .skew(Severity.MODERATE, Severity.MODERATE, 6, + Seq("Stage 6 has skew in task run time (median is 11.67 min, max is 58.33 min).", + "Stage 6: please try to modify the application to make the partitions more even.")).create(), + StageAnalysisBuilder(7, 2).taskRuntime(700, 900).longTask(Severity.SEVERE, 6, + Seq("Stage 7 has a long median task run time of 11.67 min.", + "Stage 7 has 2 tasks, 0 B input, 0 B shuffle read, 0 B shuffle write, and 0 B output.", + "Stage 7: please increase the number of partitions.")).create(), + StageAnalysisBuilder(8, 3).taskRuntime(3000, 3000).longTask(Severity.CRITICAL, 12, + Seq("Stage 8 has a long median task run time of 50.00 min.", + "Stage 8 has 3 tasks, 5 TB input, 0 B shuffle read, 0 B shuffle write, and 0 B output.", + "Stage 8: please increase the number of partitions for reading data.")) + .input(5 << 20).create(), + StageAnalysisBuilder(9, 4003).taskRuntime(3000, 3000).longTask(Severity.CRITICAL, 16012, + Seq("Stage 9 has a long median task run time of 50.00 min.", + "Stage 9 has 4003 tasks, 0 B input, 5 TB shuffle read, 0 B shuffle write, and 0 B output.", + "Stage 9: please try to reduce the amount of data being processed.")) + .shuffleRead(5 << 20).create(), + StageAnalysisBuilder(10, 4000).taskRuntime(700, 900).longTask(Severity.SEVERE, 12000, + Seq("Stage 10 has a long median task run time of 11.67 min.", + "Stage 10 has 4000 tasks, 0 B input, 0 B shuffle read, 0 B shuffle write, and 0 B output.", + "Stage 10: please optimize the code to improve performance.")).create()) + + val stageAnalyzer = new StagesAnalyzer(heuristicConfigurationData, data) + val stageAnalysis = stageAnalyzer.getStageAnalysis() + (0 until expectedAnalysis.size).foreach { i => + compareStageAnalysis(stageAnalysis(i), expectedAnalysis(i)) + } + } + + it("has execution memory spill severity") { + val heuristicConfigurationData = createHeuristicConfigurationData() + val stages = Seq( + StageBuilder(1, 5).taskRuntime(100, 150, 400).shuffleRead(200, 300, 800) + .spill(1, 2, 5).create(), + StageBuilder(2, 5).taskRuntime(100, 150, 400).shuffleRead(200, 300, 800) + .spill(10, 15, 40).create(), + StageBuilder(3, 5).taskRuntime(100, 150, 400).input(500, 2000, 3000) + .spill(100, 150, 400).create(), + StageBuilder(4, 5).taskRuntime(300, 350, 1500).shuffleWrite(1000, 1000, 5000) + .spill(300, 350, 1500).create(), + StageBuilder(5, 5).taskRuntime(300, 2500, 3000).shuffleRead(1000, 5000, 16000) + .shuffleWrite(300, 2500, 3000).spill(300, 2500, 3000).create(), + StageBuilder(6, 3).taskRuntime(50, 250, 350).input(50, 250, 350) + .spill(250, 250, 750).create(), + StageBuilder(7, 3).taskRuntime(50, 250, 350).output(250, 1000, 1500) + .spill(250, 250, 750).create(), + StageBuilder(8, 5).taskRuntime(2, 50, 53) + .times("09/09/2018 12:00:00", "09/09/2018 12:01:00") + .shuffleRead(500, 500, 1500).spill(250, 250, 750).create(), + StageBuilder(9, 5).taskRuntime(50, 250, 350).output(50, 250, 6L << 20) + .spill(50, 250, 2L << 20).create(), + StageBuilder(10, 5).taskRuntime(50, 250, 350).input(50, 250, 6L << 20) + .spill(50, 250, 2L << 20).create(), + StageBuilder(11, 3).taskRuntime(50, 250, 350).input(50, 250, 6L << 20) + .spill(50, 250, 3L << 20).create(), + StageBuilder(12, 3).taskRuntime(50, 250, 350).output(50, 250, 6L << 20) + .spill(50, 250, 4L << 20).create()) + val properties = Map( "spark.sql.shuffle.partitions" -> "5") + val data = createSparkApplicationData(stages, Seq.empty, Some(properties)) + + val expectedAnalysis = Seq( + StageAnalysisBuilder(1, 5).taskRuntime(100, 
150).shuffleRead(800) + .spill(Severity.NONE, Severity.NONE, 0, 2, 5, Seq()).create(), + StageAnalysisBuilder(2, 5).taskRuntime(100, 150).shuffleRead(800) + .spill(Severity.LOW, Severity.LOW, 0, 15, 40, Seq()).create(), + StageAnalysisBuilder(3, 5).taskRuntime(100, 150).input(3000) + .spill(Severity.MODERATE, Severity.MODERATE, 10, 150, 400, + Seq("Stage 3 has 400 MB execution memory spill.")) + .skew(Severity.NONE, Severity.NONE, 0, + Seq("Stage 3 has skew in task input bytes (median is 500 MB, max is 1.95 GB).", + "Stage 3: please try to modify the application to make the input partitions more even.")) + .create(), + StageAnalysisBuilder(4, 5).taskRuntime(300, 350).shuffleWrite(5000) + .longTask(Severity.MODERATE, 10, + Seq("Stage 4 has a long median task run time of 5.00 min.", + "Stage 4 has 5 tasks, 0 B input, 0 B shuffle read, 4.88 GB shuffle write, and 0 B output.")) + .spill(Severity.SEVERE, Severity.SEVERE, 15, 350, 1500, + Seq("Stage 4 has 1.46 GB execution memory spill.")).create(), + StageAnalysisBuilder(5, 5).taskRuntime(300, 2500).shuffleRead(16000).shuffleWrite(3000) + .longTask(Severity.MODERATE, 10, Seq("Stage 5 has a long median task run time of 5.00 min.", + "Stage 5 has 5 tasks, 0 B input, 15.62 GB shuffle read, 2.93 GB shuffle write, and 0 B output.")) + .skew(Severity.SEVERE, Severity.SEVERE, 15, + Seq("Stage 5 has skew in task run time (median is 5.00 min, max is 41.67 min).", + "Stage 5 has skew in memory bytes spilled (median is 300 MB, max is 2.44 GB).", + "Stage 5 has skew in task shuffle read bytes (median is 1,000 MB, max is 4.88 GB).", + "Stage 5 has skew in task shuffle write bytes (median is 300 MB, max is 2.44 GB).", + "Stage 5: please try to modify the application to make the partitions more even.")) + .spill(Severity.MODERATE, Severity.MODERATE, 10, 2500, 3000 + , Seq("Stage 5 has 2.93 GB execution memory spill.")).create(), + StageAnalysisBuilder(6, 3).taskRuntime(50, 250).input(350) + .skew(Severity.MODERATE, Severity.MODERATE, 6, + Seq("Stage 6 has skew in task run time (median is 50.00 sec, max is 4.17 min).", + "Stage 6 has skew in task input bytes (median is 50 MB, max is 250 MB).", + "Stage 6: please try to modify the application to make the input partitions more even.")) + .spill(Severity.CRITICAL, Severity.CRITICAL, 12, 250, 750, + Seq("Stage 6 has 750 MB execution memory spill.")).create(), + StageAnalysisBuilder(7, 3).taskRuntime(50, 250).output(1500) + .skew(Severity.MODERATE, Severity.MODERATE, 6, + Seq("Stage 7 has skew in task run time (median is 50.00 sec, max is 4.17 min).", + "Stage 7 has skew in task output bytes (median is 250 MB, max is 1,000 MB).", + "Stage 7: please try to modify the application to make the partitions more even.")) + .spill(Severity.CRITICAL, Severity.CRITICAL, 12, 250, 750, + Seq("Stage 7 has 750 MB execution memory spill.")).create(), + StageAnalysisBuilder(8, 5).taskRuntime(2, 50).duration(60).shuffleRead(1500) + .skew(Severity.CRITICAL, Severity.NONE, 0, + Seq("Stage 8: please try to modify the application to make the partitions more even.")) + .spill(Severity.CRITICAL, Severity.CRITICAL, 20, 250, 750, + Seq("Stage 8 has 750 MB execution memory spill.")).create(), + StageAnalysisBuilder(9, 5).taskRuntime(50, 250).output(6L << 20) + .skew(Severity.MODERATE, Severity.MODERATE, 10, + Seq("Stage 9 has skew in task run time (median is 50.00 sec, max is 4.17 min).", + "Stage 9 has skew in memory bytes spilled (median is 50 MB, max is 250 MB).", + "Stage 9 has skew in task output bytes (median is 50 MB, max is 250 
MB).", + "Stage 9: please try to modify the application to make the partitions more even.") + ) + .spill(Severity.SEVERE, Severity.NONE, 0, 250, 2L << 20, + Seq("Stage 9: a large amount of data is being processesd. Examine the application to see if this can be reduced.", + "Stage 9 has 2 TB execution memory spill.", + "Stage 9 has 5 tasks, 0 B input read, 0 B shuffle read, 0 B shuffle write, 6 TB output.", + "Stage 9 has median task values: 50 MB memory spill, 0 B input, 0 B shuffle read, 0 B shuffle write, 50 MB output.")) + .create(), + StageAnalysisBuilder(10, 5).taskRuntime(50, 250).input(6 << 20) + .skew(Severity.MODERATE, Severity.MODERATE, 10, + Seq("Stage 10 has skew in task run time (median is 50.00 sec, max is 4.17 min).", + "Stage 10 has skew in memory bytes spilled (median is 50 MB, max is 250 MB).", + "Stage 10 has skew in task input bytes (median is 50 MB, max is 250 MB).", + "Stage 10: please try to modify the application to make the input partitions more even.")) + .spill(Severity.SEVERE, Severity.NONE, 0, 250, 2L << 20, + Seq("Stage 10: a large amount of data is being processesd. Examine the application to see if this can be reduced.", + "Stage 10 has 2 TB execution memory spill.", + "Stage 10 has 5 tasks, 6 TB input read, 0 B shuffle read, 0 B shuffle write, 0 B output.", + "Stage 10 has median task values: 50 MB memory spill, 50 MB input, 0 B shuffle read, 0 B shuffle write, 0 B output.")) + .create(), + StageAnalysisBuilder(11, 3).taskRuntime(50, 250).input(6 << 20) + .skew(Severity.MODERATE, Severity.MODERATE, 6, + Seq("Stage 11 has skew in task run time (median is 50.00 sec, max is 4.17 min).", + "Stage 11 has skew in memory bytes spilled (median is 50 MB, max is 250 MB).", + "Stage 11 has skew in task input bytes (median is 50 MB, max is 250 MB).", + "Stage 11: please try to modify the application to make the input partitions more even.")) + .spill(Severity.CRITICAL, Severity.NONE, 0, 250, 3L << 20, + Seq("Stage 11: a large amount of data is being processesd. Examine the application to see if this can be reduced.", + "Stage 11 has 3 TB execution memory spill.", + "Stage 11 has 3 tasks, 6 TB input read, 0 B shuffle read, 0 B shuffle write, 0 B output.", + "Stage 11 has median task values: 50 MB memory spill, 50 MB input, 0 B shuffle read, 0 B shuffle write, 0 B output.")) + .create(), + StageAnalysisBuilder(12, 3).taskRuntime(50, 250).output(6L << 20) + .skew(Severity.MODERATE, Severity.MODERATE, 6, + Seq("Stage 12 has skew in task run time (median is 50.00 sec, max is 4.17 min).", + "Stage 12 has skew in memory bytes spilled (median is 50 MB, max is 250 MB).", + "Stage 12 has skew in task output bytes (median is 50 MB, max is 250 MB).", + "Stage 12: please try to modify the application to make the partitions more even.")) + .spill(Severity.CRITICAL, Severity.NONE, 0, 250, 4L << 20, + Seq("Stage 12: a large amount of data is being processesd. 
Examine the application to see if this can be reduced.", + "Stage 12 has 4 TB execution memory spill.", + "Stage 12 has 3 tasks, 0 B input read, 0 B shuffle read, 0 B shuffle write, 6 TB output.", + "Stage 12 has median task values: 50 MB memory spill, 0 B input, 0 B shuffle read, 0 B shuffle write, 50 MB output.")) + .create()) + + val stageAnalyzer = new StagesAnalyzer(heuristicConfigurationData, data) + val stageAnalysis = stageAnalyzer.getStageAnalysis() + (0 until expectedAnalysis.size).foreach { i => + compareStageAnalysis(stageAnalysis(i), expectedAnalysis(i)) + } + } + } + + it("custom recommendations") { + val heuristicConfigurationData = createHeuristicConfigurationData( + Map("execution_memory_spill_large_data_recommendation" -> "please try to filter the data to reduce the size", + "task_skew_input_data_recommendation" -> "please set DaliSpark.SPLIT_SIZE to make partitions more even", + "task_skew_generic_recommendation" -> "please make the partitions more even", + "long_tasks_large_data_recommendation" -> "please try to filter the data to reduce the size and increase speed", + "slow_tasks_recommendation" -> "optimize the code to increase speed", + "long tasks_few_partitions" -> "increase the number of partitions to speed up the stage", + "long tasks_few_input_partitions" -> "please set DaliSpark.SPLIT_SIZE to make partitions more even")) + val stages = Seq( + StageBuilder(1, 4003).taskRuntime(3000, 3000, 9000).shuffleRead(2 << 20, 3 << 20, 5 << 20).create(), + StageBuilder(2, 4000).taskRuntime(700, 900, 2000).create(), + StageBuilder(3, 2).taskRuntime(700, 900, 2000).create(), + StageBuilder(4, 3).taskRuntime(3000, 3000, 9000).input(2 << 20, 3 << 20, 5 << 20).create(), + StageBuilder(5, 3).taskRuntime(5, 250, 70).create(), + StageBuilder(6, 3).taskRuntime(20, 250, 300).input(20, 250, 300).create(), + StageBuilder(9, 5).taskRuntime(50, 50, 350).output(250, 250, 6L << 20) + .spill(250, 250, 2L << 20).create()) + val properties = Map( "spark.sql.shuffle.partitions" -> "3") + val data = createSparkApplicationData(stages, Seq.empty, Some(properties)) + + val expectedAnalysis = Seq( + StageAnalysisBuilder(1, 4003).taskRuntime(3000, 3000).longTask(Severity.CRITICAL, 16012, + Seq("Stage 1 has a long median task run time of 50.00 min.", + "Stage 1 has 4003 tasks, 0 B input, 5 TB shuffle read, 0 B shuffle write, and 0 B output.", + "Stage 1: please try to filter the data to reduce the size and increase speed.")) + .shuffleRead(5 << 20).create(), + StageAnalysisBuilder(2, 4000).taskRuntime(700, 900).longTask(Severity.SEVERE, 12000, + Seq("Stage 2 has a long median task run time of 11.67 min.", + "Stage 2 has 4000 tasks, 0 B input, 0 B shuffle read, 0 B shuffle write, and 0 B output.", + "Stage 2: optimize the code to increase speed.")).create(), + StageAnalysisBuilder(3, 2).taskRuntime(700, 900).longTask(Severity.SEVERE, 6, + Seq("Stage 3 has a long median task run time of 11.67 min.", + "Stage 3 has 2 tasks, 0 B input, 0 B shuffle read, 0 B shuffle write, and 0 B output.", + "Stage 3: increase the number of partitions to speed up the stage.")).create(), + StageAnalysisBuilder(4, 3).taskRuntime(3000, 3000).longTask(Severity.CRITICAL, 12, + Seq("Stage 4 has a long median task run time of 50.00 min.", + "Stage 4 has 3 tasks, 5 TB input, 0 B shuffle read, 0 B shuffle write, and 0 B output.", + "Stage 4: please set DaliSpark.SPLIT_SIZE to make partitions more even.")) + .input(5 << 20).create(), + StageAnalysisBuilder(5, 3).taskRuntime(5, 250) + .skew(Severity.CRITICAL, Severity.CRITICAL, 12, 
+ Seq("Stage 5 has skew in task run time (median is 5.00 sec, max is 4.17 min).", + "Stage 5: please make the partitions more even.") + ).create(), + StageAnalysisBuilder(6, 3).taskRuntime(20, 250).input(300) + .skew(Severity.SEVERE, Severity.SEVERE, 9, + Seq("Stage 6 has skew in task run time (median is 20.00 sec, max is 4.17 min).", + "Stage 6 has skew in task input bytes (median is 20 MB, max is 250 MB).", + "Stage 6: please set DaliSpark.SPLIT_SIZE to make partitions more even.")).create(), + StageAnalysisBuilder(7, 5).taskRuntime(50, 50).output(6L << 20) + .spill(Severity.SEVERE, Severity.NONE, 0, 250, 2L << 20, + Seq("Stage 9: please try to filter the data to reduce the size.", + "Stage 9 has 2 TB execution memory spill.", + "Stage 9 has 5 tasks, 0 B input read, 0 B shuffle read, 0 B shuffle write, 6 TB output.", + "Stage 9 has median task values: 250 MB memory spill, 0 B input, 0 B shuffle read, 0 B shuffle write, 250 MB output.")) + .create()) + + val stageAnalyzer = new StagesAnalyzer(heuristicConfigurationData, data) + val stageAnalysis = stageAnalyzer.getStageAnalysis() + (0 until expectedAnalysis.size).foreach { i => + compareStageAnalysis(stageAnalysis(i), expectedAnalysis(i)) + } + } + + /** compare actual and expected StageAnalysis */ + private def compareStageAnalysis(actual: StageAnalysis, expected: StageAnalysis): Unit = { + compareExecutionMemorySpillResult(actual.executionMemorySpillResult, expected.executionMemorySpillResult) + compareSimpleStageAnalysisResult(actual.longTaskResult, expected.longTaskResult) + compareTaskSkewResult(actual.taskSkewResult, expected.taskSkewResult) + compareTaskFailureResult(actual.taskFailureResult, expected.taskFailureResult) + compareSimpleStageAnalysisResult(actual.stageFailureResult, expected.stageFailureResult) + compareSimpleStageAnalysisResult(actual.stageGCResult, expected.stageGCResult) + actual.numTasks should be (expected.numTasks) + actual.medianRunTime should be (expected.medianRunTime) + actual.maxRunTime should be (expected.maxRunTime) + actual.stageDuration should be (expected.stageDuration) + actual.inputBytes should be(expected.inputBytes) + actual.outputBytes should be(expected.outputBytes) + actual.shuffleReadBytes should be(expected.shuffleReadBytes) + actual.shuffleWriteBytes should be(expected.shuffleWriteBytes) + } + + /** compare actual and expected ExecutionMemorySpillResult */ + private def compareExecutionMemorySpillResult( + actual: ExecutionMemorySpillResult, + expected: ExecutionMemorySpillResult) = { + actual.severity should be(expected.severity) + actual.rawSeverity should be(expected.rawSeverity) + actual.score should be(expected.score) + actual.memoryBytesSpilled should be(expected.memoryBytesSpilled) + actual.maxTaskBytesSpilled should be(expected.maxTaskBytesSpilled) + actual.details should be(expected.details) + } + + /** compare actual and expected SimpleStageAnalysisResult */ + private def compareSimpleStageAnalysisResult( + actual: SimpleStageAnalysisResult, + expected: SimpleStageAnalysisResult) = { + actual.severity should be(expected.severity) + actual.score should be(expected.score) + actual.details should be(expected.details) + } + + /** compare actual and expected TaskSkewResult */ + private def compareTaskSkewResult( + actual: TaskSkewResult, + expected: TaskSkewResult) = { + actual.severity should be(expected.severity) + actual.rawSeverity should be(expected.rawSeverity) + actual.score should be(expected.score) + actual.details should be(expected.details) + } + + /** compare actual and 
expected TaskFailureResult */ + private def compareTaskFailureResult( + actual: TaskFailureResult, + expected: TaskFailureResult) = { + actual.severity should be(expected.severity) + actual.oomSeverity should be(expected.oomSeverity) + actual.containerKilledSeverity should be(expected.containerKilledSeverity) + actual.score should be(expected.score) + actual.numFailures should be(expected.numFailures) + actual.numOOM should be(expected.numOOM) + actual.numContainerKilled should be (expected.numContainerKilled) + actual.details should be(expected.details) + } +} diff --git a/test/com/linkedin/drelephant/spark/heuristics/StagesHeuristicTest.scala b/test/com/linkedin/drelephant/spark/heuristics/StagesHeuristicTest.scala index e6aae4fe1..cd1acc3d0 100644 --- a/test/com/linkedin/drelephant/spark/heuristics/StagesHeuristicTest.scala +++ b/test/com/linkedin/drelephant/spark/heuristics/StagesHeuristicTest.scala @@ -133,10 +133,16 @@ object StagesHeuristicTest { status, stageId, attemptId = 0, + numTasks = numCompleteTasks + numFailedTasks, numActiveTasks = numCompleteTasks + numFailedTasks, numCompleteTasks, numFailedTasks, executorRunTime, + executorCpuTime = 0, + submissionTime = None, + firstTaskLaunchedTime = None, + completionTime = None, + failureReason = None, inputBytes = 0, inputRecords = 0, outputBytes = 0, @@ -152,7 +158,13 @@ object StagesHeuristicTest { schedulingPool = "", accumulatorUpdates = Seq.empty, tasks = None, - executorSummary = None + executorSummary = None, + peakJvmUsedMemory = None, + peakExecutionMemory = None, + peakStorageMemory = None, + peakUnifiedMemory = None, + taskSummary = None, + executorMetricsSummary = None ) def newFakeSparkApplicationData( diff --git a/test/com/linkedin/drelephant/spark/heuristics/StagesWithFailedTasksHeuristicTest.scala b/test/com/linkedin/drelephant/spark/heuristics/StagesWithFailedTasksHeuristicTest.scala index cdfdc11ea..7a6191395 100644 --- a/test/com/linkedin/drelephant/spark/heuristics/StagesWithFailedTasksHeuristicTest.scala +++ b/test/com/linkedin/drelephant/spark/heuristics/StagesWithFailedTasksHeuristicTest.scala @@ -97,11 +97,18 @@ object StagesWithFailedTasksHeuristicTest { status, stageId, attemptId = 0, + numTasks = 0, numActiveTasks = numCompleteTasks, numCompleteTasks, numFailedTasks = 3, executorRunTime = 0, - inputBytes = 0, + executorCpuTime = 0, + submissionTime = None, + firstTaskLaunchedTime = None, + completionTime = None, + failureReason = None, + + inputBytes = 0, inputRecords = 0, outputBytes = 0, outputRecords = 0, @@ -150,7 +157,13 @@ object StagesWithFailedTasksHeuristicTest { errorMessage = None, taskMetrics = None) )), - executorSummary = None + executorSummary = None, + peakJvmUsedMemory = None, + peakExecutionMemory = None, + peakStorageMemory = None, + peakUnifiedMemory = None, + taskSummary = None, + executorMetricsSummary = None ) def newFakeSparkApplicationData diff --git a/test/com/linkedin/drelephant/util/UtilsTest.java b/test/com/linkedin/drelephant/util/UtilsTest.java index 69f5509c4..8cef6c2ea 100644 --- a/test/com/linkedin/drelephant/util/UtilsTest.java +++ b/test/com/linkedin/drelephant/util/UtilsTest.java @@ -197,6 +197,17 @@ public void testGetDurationBreakdown() { assertEquals("0:05:24", Utils.getDurationBreakdown(durations[4])); assertEquals("314483:43:34", Utils.getDurationBreakdown(durations[5])); } + + @Test + public void testGetDuration() { + long []durations = { 153, 25431, 432344, 23423562, 178123456L}; + assertEquals("153 ms", Utils.getDuration(durations[0])); + assertEquals("25.43 
sec", Utils.getDuration(durations[1])); + assertEquals("7.21 min", Utils.getDuration(durations[2])); + assertEquals("6.51 hr", Utils.getDuration(durations[3])); + assertEquals("2.06 days", Utils.getDuration(durations[4])); + } + @Test public void testGetPercentage() { long []numerators = {10,20,30,40,50};