import co.cask.cdap.api.spark._
import org.apache.spark._
import org.slf4j._
/**
 * Word-count Spark program implemented against the CDAP `SparkMain` API.
 *
 * Reads a text file from HDFS, counts how often each space-separated token
 * occurs, collects the counts on the driver and writes them to the log.
 */
class SparkProgram extends SparkMain {
  import SparkProgram._

  /**
   * Program entry point.
   *
   * @param sec the execution context passed in by the caller; it is not used
   *            by this implementation.
   */
  override def run(implicit sec: SparkExecutionContext): Unit = {
    LOG.info("Spark Program Started")
    LOG.info("---------------------")

    // Only fall back to "yarn" when no master has been configured already.
    // Hard-coding the master with setMaster would override the value supplied
    // by whatever launched the program.
    val conf = new SparkConf()
      .setIfMissing("spark.master", "yarn")
      .setAppName("CDAP_Spark-On-Yarn")
    val sc = new SparkContext(conf)
    LOG.info("Spark Context : " + sc)
    LOG.info("Spark Version : " + sc.version)

    val text = sc.textFile("hdfs://cl1/user/simon/bigShakes.txt")
    val counts = text
      .flatMap(line => line.split(" "))
      .map(word => (word, 1))
      .reduceByKey(_ + _)

    // collect() brings every (word, count) pair back to the driver.
    val col = counts.collect()

    // Concatenating an Array to a String uses the JVM default toString
    // (e.g. "[Lscala.Tuple2;@2f40d16e"); mkString renders the actual pairs.
    LOG.info("Result : " + col.mkString("[", ", ", "]"))

    LOG.info("Spark Program Completed")
    LOG.info("-----------------------")
  }
}
/** Companion object holding the logger shared by `SparkProgram` instances. */
object SparkProgram {
  // Logger is named after this object's runtime class.
  val LOG: Logger = LoggerFactory.getLogger(this.getClass)
}
2018-07-31 19:43:21,208 - INFO [program.status:c.c.c.i.a.r.d.DistributedProgramRunner@475] - Starting Workflow Program 'DataPipelineWorkflow' with Arguments [logical.start.time=1533062593447]
2018-07-31 19:43:21,208 - INFO [program.status:c.c.c.i.a.r.d.DistributedProgramRunner@475] - Starting Workflow Program 'DataPipelineWorkflow' with Arguments [logical.start.time=1533062593447]
2018-07-31 19:44:55,379 - INFO [WorkflowDriver:c.c.c.d.SmartWorkflow@440] - Pipeline 'SV14' is started by user 'cdap' with arguments {logical.start.time=1533062593447}
2018-07-31 19:44:55,435 - INFO [WorkflowDriver:c.c.c.d.SmartWorkflow@474] - Pipeline 'SV14' running
2018-07-31 19:44:55,530 - INFO [WorkflowDriver:c.c.c.i.a.r.w.WorkflowDriver@611] - Starting workflow execution for 'DataPipelineWorkflow' with Run id '9486c6d1-94f1-11e8-8a9d-000c299af245'
2018-07-31 19:45:04,535 - INFO [action-phase-1-0:c.c.c.i.a.r.w.WorkflowDriver@342] - Starting Spark Program 'phase-1' in workflow
2018-07-31 19:45:06,551 - INFO [SparkExecutionService STARTING:c.c.h.NettyHttpService@172] - Starting HTTP Service phase-1-spark-exec-service at address wk2.cdh.localnet/192.168.10.24:0
2018-07-31 19:45:11,676 - WARN [spark-submitter-phase-1-d6b8bae1-94f1-11e8-aaec-000c29ad103d:o.a.s.d.y.s.ConfigurableCredentialManager@66] - spark.yarn.security.tokens.hbase.enabled is deprecated, using spark.yarn.security.credentials.hbase.enabled instead
2018-07-31 19:45:11,684 - WARN [spark-submitter-phase-1-d6b8bae1-94f1-11e8-aaec-000c29ad103d:o.a.s.d.y.s.ConfigurableCredentialManager@66] - spark.yarn.security.tokens.hive.enabled is deprecated, using spark.yarn.security.credentials.hive.enabled instead
2018-07-31 19:45:51,337 - INFO [SparkDriverHttpService STARTING:c.c.h.NettyHttpService@172] - Starting HTTP Service phase-1-http-service at address wk1.cdh.localnet/192.168.10.23:0
2018-07-31 19:45:51,871 - INFO [Driver:c.c.c.a.r.s.d.SparkDriverService@188] - Credentials DIR: hdfs://cl1/user/cdap/.sparkStaging/application_1533062157811_0003
2018-07-31 19:45:54,071 - INFO [SparkDriverService:c.c.c.a.r.s.d.SparkDriverService@98] - SparkDriverService started.
2018-07-31 19:45:54,122 - INFO [Driver:c.c.c.a.r.s.SparkMainWrapper$@77] - Launching user spark class class co.cask.cdap.datapipeline.JavaSparkMainWrapper
2018-07-31 19:46:18,497 - INFO [Driver:SparkProgram$@9] - Spark Program Started
2018-07-31 19:46:18,499 - INFO [Driver:SparkProgram$@10] - ---------------------
2018-07-31 19:46:20,037 - INFO [Driver:o.s.j.u.log@186] - Logging initialized @48543ms
2018-07-31 19:46:20,322 - INFO [Driver:o.s.j.s.Server@327] - jetty-9.2.z-SNAPSHOT
2018-07-31 19:46:20,414 - INFO [Driver:o.s.j.s.h.ContextHandler@744] - Started o.s.j.s.ServletContextHandler@2d614990{/jobs,null,AVAILABLE}
2018-07-31 19:46:20,417 - INFO [Driver:o.s.j.s.h.ContextHandler@744] - Started o.s.j.s.ServletContextHandler@4a6124fb{/jobs/json,null,AVAILABLE}
2018-07-31 19:46:20,419 - INFO [Driver:o.s.j.s.h.ContextHandler@744] - Started o.s.j.s.ServletContextHandler@ba1e844{/jobs/job,null,AVAILABLE}
2018-07-31 19:46:20,420 - INFO [Driver:o.s.j.s.h.ContextHandler@744] - Started o.s.j.s.ServletContextHandler@6a9e5b19{/jobs/job/json,null,AVAILABLE}
2018-07-31 19:46:20,420 - INFO [Driver:o.s.j.s.h.ContextHandler@744] - Started o.s.j.s.ServletContextHandler@4d14a213{/stages,null,AVAILABLE}
2018-07-31 19:46:20,421 - INFO [Driver:o.s.j.s.h.ContextHandler@744] - Started o.s.j.s.ServletContextHandler@e9111b6{/stages/json,null,AVAILABLE}
2018-07-31 19:46:20,421 - INFO [Driver:o.s.j.s.h.ContextHandler@744] - Started o.s.j.s.ServletContextHandler@af62be8{/stages/stage,null,AVAILABLE}
2018-07-31 19:46:20,422 - INFO [Driver:o.s.j.s.h.ContextHandler@744] - Started o.s.j.s.ServletContextHandler@12a8ff3c{/stages/stage/json,null,AVAILABLE}
2018-07-31 19:46:20,424 - INFO [Driver:o.s.j.s.h.ContextHandler@744] - Started o.s.j.s.ServletContextHandler@7a44c340{/stages/pool,null,AVAILABLE}
2018-07-31 19:46:20,425 - INFO [Driver:o.s.j.s.h.ContextHandler@744] - Started o.s.j.s.ServletContextHandler@7c5e611f{/stages/pool/json,null,AVAILABLE}
2018-07-31 19:46:20,433 - INFO [Driver:o.s.j.s.h.ContextHandler@744] - Started o.s.j.s.ServletContextHandler@474cbc17{/storage,null,AVAILABLE}
2018-07-31 19:46:20,434 - INFO [Driver:o.s.j.s.h.ContextHandler@744] - Started o.s.j.s.ServletContextHandler@1248fadd{/storage/json,null,AVAILABLE}
2018-07-31 19:46:20,434 - INFO [Driver:o.s.j.s.h.ContextHandler@744] - Started o.s.j.s.ServletContextHandler@4eca6517{/storage/rdd,null,AVAILABLE}
2018-07-31 19:46:20,435 - INFO [Driver:o.s.j.s.h.ContextHandler@744] - Started o.s.j.s.ServletContextHandler@4193b348{/storage/rdd/json,null,AVAILABLE}
2018-07-31 19:46:20,436 - INFO [Driver:o.s.j.s.h.ContextHandler@744] - Started o.s.j.s.ServletContextHandler@631d0369{/environment,null,AVAILABLE}
2018-07-31 19:46:20,437 - INFO [Driver:o.s.j.s.h.ContextHandler@744] - Started o.s.j.s.ServletContextHandler@36d693c5{/environment/json,null,AVAILABLE}
2018-07-31 19:46:20,438 - INFO [Driver:o.s.j.s.h.ContextHandler@744] - Started o.s.j.s.ServletContextHandler@2ba9bad5{/executors,null,AVAILABLE}
2018-07-31 19:46:20,439 - INFO [Driver:o.s.j.s.h.ContextHandler@744] - Started o.s.j.s.ServletContextHandler@77fc451b{/executors/json,null,AVAILABLE}
2018-07-31 19:46:20,440 - INFO [Driver:o.s.j.s.h.ContextHandler@744] - Started o.s.j.s.ServletContextHandler@7cf106c6{/executors/threadDump,null,AVAILABLE}
2018-07-31 19:46:20,440 - INFO [Driver:o.s.j.s.h.ContextHandler@744] - Started o.s.j.s.ServletContextHandler@7ebbfa26{/executors/threadDump/json,null,AVAILABLE}
2018-07-31 19:46:20,465 - INFO [Driver:o.s.j.s.h.ContextHandler@744] - Started o.s.j.s.ServletContextHandler@18a29836{/static,null,AVAILABLE}
2018-07-31 19:46:20,466 - INFO [Driver:o.s.j.s.h.ContextHandler@744] - Started o.s.j.s.ServletContextHandler@de3d2a4{/,null,AVAILABLE}
2018-07-31 19:46:20,470 - INFO [Driver:o.s.j.s.h.ContextHandler@744] - Started o.s.j.s.ServletContextHandler@79d032e8{/api,null,AVAILABLE}
2018-07-31 19:46:20,471 - INFO [Driver:o.s.j.s.h.ContextHandler@744] - Started o.s.j.s.ServletContextHandler@581b9d3e{/jobs/job/kill,null,AVAILABLE}
2018-07-31 19:46:20,472 - INFO [Driver:o.s.j.s.h.ContextHandler@744] - Started o.s.j.s.ServletContextHandler@5474cd23{/stages/stage/kill,null,AVAILABLE}
2018-07-31 19:46:20,494 - INFO [Driver:o.s.j.s.ServerConnector@266] - Started ServerConnector@65953dab{HTTP/1.1}{0.0.0.0:45608}
2018-07-31 19:46:20,495 - INFO [Driver:o.s.j.s.Server@379] - Started @49001ms
2018-07-31 19:46:21,810 - INFO [Driver:o.s.j.s.h.ContextHandler@744] - Started o.s.j.s.ServletContextHandler@56457c3a{/metrics/json,null,AVAILABLE}
2018-07-31 19:46:22,208 - WARN [dispatcher-event-loop-1:o.a.s.s.c.YarnSchedulerBackend$YarnSchedulerEndpoint@66] - Attempted to request executors before the AM has registered!
2018-07-31 19:46:22,348 - INFO [Driver:SparkProgram$@16] - Spark Context : org.apache.spark.SparkContext@7e09c844
2018-07-31 19:46:22,349 - INFO [Driver:SparkProgram$@17] - Spark Version : 2.1.0.cloudera1
2018-07-31 19:46:40,477 - WARN [Timer-0:o.a.s.s.c.YarnClusterScheduler@66] - Initial job has not accepted any resources; check your cluster UI to ensure that workers are registered and have sufficient resources
2018-07-31 19:46:55,486 - WARN [Timer-0:o.a.s.s.c.YarnClusterScheduler@66] - Initial job has not accepted any resources; check your cluster UI to ensure that workers are registered and have sufficient resources
2018-07-31 19:47:07,407 - WARN [main:o.a.s.d.y.s.ConfigurableCredentialManager@66] - spark.yarn.security.tokens.hbase.enabled is deprecated, using spark.yarn.security.credentials.hbase.enabled instead
2018-07-31 19:47:07,460 - WARN [main:o.a.s.d.y.s.ConfigurableCredentialManager@66] - spark.yarn.security.tokens.hive.enabled is deprecated, using spark.yarn.security.credentials.hive.enabled instead
2018-07-31 19:47:07,531 - WARN [main:o.a.s.d.y.s.ConfigurableCredentialManager@66] - spark.yarn.security.tokens.hbase.enabled is deprecated, using spark.yarn.security.credentials.hbase.enabled instead
2018-07-31 19:47:07,541 - WARN [main:o.a.s.d.y.s.ConfigurableCredentialManager@66] - spark.yarn.security.tokens.hive.enabled is deprecated, using spark.yarn.security.credentials.hive.enabled instead
2018-07-31 19:47:10,485 - WARN [Timer-0:o.a.s.s.c.YarnClusterScheduler@66] - Initial job has not accepted any resources; check your cluster UI to ensure that workers are registered and have sufficient resources
2018-07-31 19:47:18,900 - WARN [main:o.a.s.d.y.s.ConfigurableCredentialManager@66] - spark.yarn.security.tokens.hbase.enabled is deprecated, using spark.yarn.security.credentials.hbase.enabled instead
2018-07-31 19:47:18,912 - WARN [main:o.a.s.d.y.s.ConfigurableCredentialManager@66] - spark.yarn.security.tokens.hive.enabled is deprecated, using spark.yarn.security.credentials.hive.enabled instead
2018-07-31 19:47:19,256 - WARN [main:o.a.s.d.y.s.ConfigurableCredentialManager@66] - spark.yarn.security.tokens.hbase.enabled is deprecated, using spark.yarn.security.credentials.hbase.enabled instead
2018-07-31 19:47:19,264 - WARN [main:o.a.s.d.y.s.ConfigurableCredentialManager@66] - spark.yarn.security.tokens.hive.enabled is deprecated, using spark.yarn.security.credentials.hive.enabled instead
2018-07-31 19:52:45,219 - INFO [Driver:SparkProgram$@23] - Result : [Lscala.Tuple2;@2f40d16e
2018-07-31 19:52:45,219 - INFO [Driver:SparkProgram$@25] - Spark Program Completed
2018-07-31 19:52:45,219 - INFO [Driver:SparkProgram$@26] - -----------------------
2018-07-31 19:52:45,254 - INFO [SparkDriverService:c.c.c.a.r.s.d.SparkDriverService@145] - SparkDriverService stopped.
2018-07-31 19:52:45,341 - INFO [Thread-11:o.s.j.s.ServerConnector@306] - Stopped ServerConnector@65953dab{HTTP/1.1}{0.0.0.0:0}
2018-07-31 19:52:46,108 - INFO [SparkExecutionService STOPPING:c.c.h.NettyHttpService@242] - Stopping HTTP Service phase-1-spark-exec-service
2018-07-31 19:52:46,309 - INFO [action-phase-1-0:c.c.c.i.a.r.w.WorkflowDriver@345] - Spark Program 'phase-1' in workflow completed
2018-07-31 19:52:46,335 - INFO [WorkflowDriver:c.c.c.i.a.r.w.WorkflowDriver@619] - Workflow 'DataPipelineWorkflow' with run id '9486c6d1-94f1-11e8-8a9d-000c299af245' completed
2018-07-31 19:52:46,401 - INFO [WorkflowDriver:c.c.c.d.SmartWorkflow@531] - Pipeline 'SV14' succeeded.