如何导入 spark.jobserver.SparkSessionJob
How to import spark.jobserver.SparkSessionJob
我通过添加
在 build.sbt 中添加了作业服务器 0.9.0 依赖项
scalaVersion := "2.11.0"
resolvers += "Job Server Bintray" at "https://dl.bintray.com/spark-jobserver/maven"
libraryDependencies ++= Seq(
"spark.jobserver" %% "job-server-api" % "0.9.0",
"org.apache.spark" %% "spark-core" % "2.3.2",
"org.apache.spark" %% "spark-sql" % "2.3.2",
)
但是,当我尝试测试这样的代码时(从 https://github.com/spark-jobserver/spark-jobserver#new-sparkjob-api-with-spark-v21 复制):
import com.typesafe.config.Config
import org.apache.spark.sql.SparkSession
import org.scalactic._
import spark.jobserver.api.{JobEnvironment, SingleProblem, ValidationProblem}
import spark.jobserver.SparkSessionJob
import scala.util.Try
object WordCountExampleSparkSession extends SparkSessionJob {
type JobData = Seq[String]
type JobOutput = collection.Map[String, Long]
override def runJob(sparkSession: SparkSession, runtime: JobEnvironment, data: JobData): JobOutput =
sparkSession.sparkContext.parallelize(data).countByValue
override def validate(sparkSession: SparkSession, runtime: JobEnvironment, config: Config): JobData Or Every[ValidationProblem] = {
Try(config.getString("input.string").split(" ").toSeq)
.map(words => Good(words))
.getOrElse(Bad(One(SingleProblem("No input.string param"))))
}
}
IntelliJ 显示错误:"Can not resolve symbol 'SparkSessionJob'"
jar 文件如下所示:
enter image description here
我想通了,sparkSessionJob 位于 job-server-extras,所以我只需要添加
libraryDependencies += "spark.jobserver" %% "job-server-api" % "0.9.0"
我通过添加
在 build.sbt 中添加了作业服务器 0.9.0 依赖项scalaVersion := "2.11.0"
resolvers += "Job Server Bintray" at "https://dl.bintray.com/spark-jobserver/maven"
libraryDependencies ++= Seq(
"spark.jobserver" %% "job-server-api" % "0.9.0",
"org.apache.spark" %% "spark-core" % "2.3.2",
"org.apache.spark" %% "spark-sql" % "2.3.2",
)
但是,当我尝试测试这样的代码时(从 https://github.com/spark-jobserver/spark-jobserver#new-sparkjob-api-with-spark-v21 复制):
import com.typesafe.config.Config
import org.apache.spark.sql.SparkSession
import org.scalactic._
import spark.jobserver.api.{JobEnvironment, SingleProblem, ValidationProblem}
import spark.jobserver.SparkSessionJob
import scala.util.Try
object WordCountExampleSparkSession extends SparkSessionJob {
type JobData = Seq[String]
type JobOutput = collection.Map[String, Long]
override def runJob(sparkSession: SparkSession, runtime: JobEnvironment, data: JobData): JobOutput =
sparkSession.sparkContext.parallelize(data).countByValue
override def validate(sparkSession: SparkSession, runtime: JobEnvironment, config: Config): JobData Or Every[ValidationProblem] = {
Try(config.getString("input.string").split(" ").toSeq)
.map(words => Good(words))
.getOrElse(Bad(One(SingleProblem("No input.string param"))))
}
}
IntelliJ 显示错误:"Can not resolve symbol 'SparkSessionJob'" jar 文件如下所示: enter image description here
我想通了,sparkSessionJob 位于 job-server-extras,所以我只需要添加
libraryDependencies += "spark.jobserver" %% "job-server-api" % "0.9.0"