大数据之单词统计

package com.sjw.flink

import org.apache.flink.api.scala._

/**
 * Batch word-count job built on the Flink DataSet API.
 *
 * Reads a text file line by line, splits every line into whitespace-separated
 * words, counts how often each word occurs and prints the `(word, count)`
 * pairs to standard output.
 *
 * Usage: `WordCount [inputPath]` - when no argument is given the bundled
 * sample file [[WordCount.DefaultInputPath]] is read.
 */
object WordCount {

  /**
   * Input file used when no path is passed on the command line.
   * Written with forward slashes so it is not tied to Windows path syntax.
   */
  val DefaultInputPath: String = "src/main/resources/words.txt"

  /**
   * Entry point of the job.
   *
   * @param args optional command-line arguments; `args(0)`, if present, is the
   *             path of the text file to count words in
   */
  def main(args: Array[String]): Unit = {
    // Create the batch execution environment.
    val env: ExecutionEnvironment = ExecutionEnvironment.getExecutionEnvironment

    // Data source: read the input file as a DataSet of lines.
    val inputPath: String = args.headOption.getOrElse(DefaultInputPath)
    val lines: DataSet[String] = env.readTextFile(inputPath)

    // Split on any run of whitespace and drop empty tokens, so that leading
    // or repeated blanks do not get counted as an empty-string "word".
    val words: DataSet[String] = lines.flatMap(_.split("\\s+").filter(_.nonEmpty))

    // Pair each word with 1, group by the word (tuple field 0) and sum the
    // ones (tuple field 1) to obtain the per-word totals, then print them.
    words
      .map((_, 1))
      .groupBy(0)
      .sum(1)
      .print()
  }

}

posted @ 2020-07-09 23:19  潇洒哥浩浩  阅读(220)  评论(0)    收藏  举报