I'm running a Spark Streaming job, and after it has been running for a few hours I occasionally run into the errors shown below. I don't see any exceptions in the web UI. Does anyone know what I can do to troubleshoot this further?
13/04/02 03:32:47 ERROR cluster.TaskSetManager: Task 90304.0:2 failed more than 4 times; aborting job
13/04/02 03:32:47 ERROR streaming.JobManager: Running streaming job 7852 @ 1364873520000 ms failed
spark.SparkException: Job failed: Task 90304.0:2 failed more than 4 times
at spark.scheduler.DAGScheduler$$anonfun$abortStage$1.apply(DAGScheduler.scala:642)
at spark.scheduler.DAGScheduler$$anonfun$abortStage$1.apply(DAGScheduler.scala:640)
at scala.collection.mutable.ResizableArray$class.foreach(ResizableArray.scala:60)
at scala.collection.mutable.ArrayBuffer.foreach(ArrayBuffer.scala:47)
at spark.scheduler.DAGScheduler.abortStage(DAGScheduler.scala:640)
at spark.scheduler.DAGScheduler.processEvent(DAGScheduler.scala:303)
at spark.scheduler.DAGScheduler.spark$scheduler$DAGScheduler$$run(DAGScheduler.scala:364)
at spark.scheduler.DAGScheduler$$anon$1.run(DAGScheduler.scala:107)
13/04/02 03:33:45 ERROR cluster.TaskSetManager: Task 90321.0:3 failed more than 4 times; aborting job
13/04/02 03:33:45 ERROR streaming.JobManager: Running streaming job 7853 @ 1364873525000 ms failed
spark.SparkException: Job failed: Task 90321.0:3 failed more than 4 times
at spark.scheduler.DAGScheduler$$anonfun$abortStage$1.apply(DAGScheduler.scala:642)
at spark.scheduler.DAGScheduler$$anonfun$abortStage$1.apply(DAGScheduler.scala:640)
at scala.collection.mutable.ResizableArray$class.foreach(ResizableArray.scala:60)
at scala.collection.mutable.ArrayBuffer.foreach(ArrayBuffer.scala:47)
at spark.scheduler.DAGScheduler.abortStage(DAGScheduler.scala:640)
at spark.scheduler.DAGScheduler.processEvent(DAGScheduler.scala:303)
at spark.scheduler.DAGScheduler.spark$scheduler$DAGScheduler$$run(DAGScheduler.scala:364)
at spark.scheduler.DAGScheduler$$anon$1.run(DAGScheduler.scala:107)
13/04/02 03:33:45 ERROR cluster.TaskSetManager: Task 90342.0:2 failed more than 4 times; aborting job
13/04/02 03:33:45 ERROR streaming.JobManager: Running streaming job 7854 @ 1364873530000 ms failed
spark.SparkException: Job failed: Task 90342.0:2 failed more than 4 times
...
Exception in thread "DAGScheduler" java.lang.IllegalArgumentException: Shuffle ID 71056 registered twice
at spark.MapOutputTracker.registerShuffle(MapOutputTracker.scala:81)
at spark.scheduler.DAGScheduler.newStage(DAGScheduler.scala:151)
at spark.scheduler.DAGScheduler.spark$scheduler$DAGScheduler$$getShuffleMapStage(DAGScheduler.scala:135)
at spark.scheduler.DAGScheduler$$anonfun$visit$2$1.apply(DAGScheduler.scala:196)
at spark.scheduler.DAGScheduler$$anonfun$visit$2$1.apply(DAGScheduler.scala:193)
at scala.collection.LinearSeqOptimized$class.foreach(LinearSeqOptimized.scala:59)
at scala.collection.immutable.List.foreach(List.scala:76)
at spark.scheduler.DAGScheduler.visit$2(DAGScheduler.scala:193)
at spark.scheduler.DAGScheduler$$anonfun$visit$2$1.apply(DAGScheduler.scala:201)
at spark.scheduler.DAGScheduler$$anonfun$visit$2$1.apply(DAGScheduler.scala:193)
at scala.collection.LinearSeqOptimized$class.foreach(LinearSeqOptimized.scala:59)
at scala.collection.immutable.List.foreach(List.scala:76)
at spark.scheduler.DAGScheduler.visit$2(DAGScheduler.scala:193)
at spark.scheduler.DAGScheduler$$anonfun$visit$2$1.apply(DAGScheduler.scala:201)
at spark.scheduler.DAGScheduler$$anonfun$visit$2$1.apply(DAGScheduler.scala:193)
at scala.collection.LinearSeqOptimized$class.foreach(LinearSeqOptimized.scala:59)
...
at spark.scheduler.DAGScheduler.spark$scheduler$DAGScheduler$$getMissingParentStages(DAGScheduler.scala:207)
at spark.scheduler.DAGScheduler.spark$scheduler$DAGScheduler$$submitStage(DAGScheduler.scala:420)
at spark.scheduler.DAGScheduler$$anonfun$spark$scheduler$DAGScheduler$$submitStage$4.apply(DAGScheduler.scala:428)
at spark.scheduler.DAGScheduler$$anonfun$spark$scheduler$DAGScheduler$$submitStage$4.apply(DAGScheduler.scala:427)
at scala.collection.LinearSeqOptimized$class.foreach(LinearSeqOptimized.scala:59)
at scala.collection.immutable.List.foreach(List.scala:76)
at spark.scheduler.DAGScheduler.spark$scheduler$DAGScheduler$$submitStage(DAGScheduler.scala:427)
at spark.scheduler.DAGScheduler$$anonfun$spark$scheduler$DAGScheduler$$submitStage$4.apply(DAGScheduler.scala:428)
at spark.scheduler.DAGScheduler$$anonfun$spark$scheduler$DAGScheduler$$submitStage$4.apply(DAGScheduler.scala:427)
at scala.collection.LinearSeqOptimized$class.foreach(LinearSeqOptimized.scala:59)
at scala.collection.immutable.List.foreach(List.scala:76)
at spark.scheduler.DAGScheduler.spark$scheduler$DAGScheduler$$submitStage(DAGScheduler.scala:427)
at spark.scheduler.DAGScheduler$$anonfun$submitWaitingStages$6.apply(DAGScheduler.scala:344)
at spark.scheduler.DAGScheduler$$anonfun$submitWaitingStages$6.apply(DAGScheduler.scala:343)
at scala.collection.IndexedSeqOptimized$class.foreach(IndexedSeqOptimized.scala:34)
at scala.collection.mutable.ArrayOps.foreach(ArrayOps.scala:38)
at spark.scheduler.DAGScheduler.submitWaitingStages(DAGScheduler.scala:343)
at spark.scheduler.DAGScheduler.spark$scheduler$DAGScheduler$$run(DAGScheduler.scala:378)
at spark.scheduler.DAGScheduler$$anon$1.run(DAGScheduler.scala:107)