1.在安装有spark的客户端上安装sbt(请参考上一篇博客)
2.在一台slave终端机的/home/hadoop1/xuguokun/下创建WordCount文件夹。
3.创建build.sbt文件,该文件的内容如下:
// sbt build definition for the o2o-spark project.
// Settings are separated by blank lines so the file also parses on sbt
// releases older than 0.13.7, which require a blank line between expressions.
name := "o2o-spark"

version := "0.1"

// The %% operator below appends this Scala binary version (_2.10) to artifact names.
scalaVersion := "2.10.4"

// One version shared by every Spark module. The original listing mixed 1.1.0,
// 1.3.1 and 1.5.1, which puts Spark modules built against different releases
// on the same classpath.
// NOTE(review): 1.3.1 is chosen because most modules already declared it;
// confirm it matches the Spark version installed on the cluster.
val sparkVersion = "1.3.1"

libraryDependencies ++= Seq(
  "org.scalanlp" % "chalk" % "1.3.0",
  // Spark modules: all resolved with %% and the shared sparkVersion.
  "org.apache.spark" %% "spark-core" % sparkVersion,
  "org.apache.spark" %% "spark-mllib" % sparkVersion,
  "org.apache.spark" %% "spark-streaming" % sparkVersion,
  "org.apache.spark" %% "spark-streaming-kafka" % sparkVersion,
  "org.apache.spark" %% "spark-sql" % sparkVersion,
  "org.apache.spark" %% "spark-hive" % sparkVersion,
  // Hadoop client libraries (Java artifacts, so plain % without a Scala suffix).
  "org.apache.hadoop" % "hadoop-client" % "2.2.0",
  "org.apache.hadoop" % "hadoop-common" % "2.2.0",
  "org.apache.hadoop" % "hadoop-hdfs" % "2.2.0",
  "com.github.scopt" %% "scopt" % "3.3.0",
  "org.apache.hbase" % "hbase" % "0.94.18"
)
resolvers += "Akka Repository" at "http:/