1.Flink读取Text文件,实现Word Count示例
package com.mkluo.flink
import org.apache.flink.api.scala.ExecutionEnvironment
/**
 * Batch word count using the Flink DataSet API.
 *
 * Reads a text file, splits every line into whitespace-separated words,
 * counts the occurrences of each word, prints the counts and also writes
 * them out as CSV.
 *
 * Originally written 2019/7/7 14:44.
 *
 * @author luomingkui
 */
object BatchWcApp {

  /**
   * Program entry point.
   *
   * @param args optional command-line arguments: `args(0)` is the input text
   *             file and `args(1)` is the CSV output path. Either may be
   *             omitted, in which case the original hard-coded path is used.
   */
  def main(args: Array[String]): Unit = {
    // 1. Build the batch execution environment.
    val env = ExecutionEnvironment.getExecutionEnvironment
    // flatMap / map need the implicit TypeInformation instances from this import.
    import org.apache.flink.api.scala._

    // Fall back to the original locations when no arguments are supplied.
    val inputPath = args.lift(0).getOrElse("/Users/luomingkui/Downloads/CaseData/test/helloworlds.txt")
    val outputPath = args.lift(1).getOrElse("/Users/luomingkui/Downloads/data")

    // 2. Source: one element per line of the input file.
    val ds: DataSet[String] = env.readTextFile(inputPath)

    // 3. Tokenize, group by the word (tuple field 0) and sum the counts (field 1).
    //    Splitting on runs of whitespace and dropping empty tokens keeps blank
    //    lines and repeated/leading spaces from being counted as the word "".
    val aggDs: AggregateDataSet[(String, Int)] = ds
      .flatMap(_.split("\\s+"))
      .filter(_.nonEmpty)
      .map((_, 1))
      .groupBy(0)
      .sum(1)

    // 4. Print the result. In the DataSet API print() triggers an execution
    //    of the plan on its own.
    aggDs.print()

    // 5. Write the result to the output location as CSV. This registers a new
    //    sink, which only runs once env.execute() is called below.
    aggDs.writeAsCsv(outputPath)
    env.execute()
  }
}
2.Flink读取Socket流,实现Word Count示例
package com.mkluo.flink
import org.apache.flink.streaming.api.scala.{DataStream, St