// WordCountOnline

package com.bjsxt.scala.spark.streaming

import org.apache.spark.SparkConf
import org.apache.spark.streaming.StreamingContext
import org.apache.spark.streaming.Durations
import org.apache.spark.storage.StorageLevel
import org.apache.spark.streaming.api.java.JavaStreamingContextFactory

/**
 * Streaming word count over a TCP text socket.
 *
 * Every 5-second batch, lines read from the socket are split into words and
 * the per-word counts for that batch are printed to stdout.
 *
 * Usage: `WordCountOnline [host] [port]`
 *  - `host` defaults to `hadoop1`
 *  - `port` defaults to `9999`
 */
object WordCountOnline {

  private val DefaultHost = "hadoop1"
  private val DefaultPort = 9999
  private val DefaultMaster = "local[2]"

  /**
   * Program entry point.
   *
   * @param args optional `[host] [port]` of the text socket to read from;
   *             missing values fall back to the defaults above
   * @throws IllegalArgumentException if a port is supplied but is not an integer
   */
  def main(args: Array[String]): Unit = {
    val host = args.headOption.getOrElse(DefaultHost)
    val port = args.drop(1).headOption match {
      case Some(raw) =>
        scala.util.Try(raw.toInt).getOrElse(
          throw new IllegalArgumentException(s"Invalid port '$raw': expected an integer"))
      case None => DefaultPort
    }

    val sparkConf = new SparkConf()
      .setAppName("WordCountOnline")
      // Only fall back to a local master when none was supplied externally
      // (e.g. via `spark-submit --master ...`), instead of overriding it.
      .setIfMissing("spark.master", DefaultMaster)

    val ssc = new StreamingContext(sparkConf, Durations.seconds(5))

    val linesDStream = ssc.socketTextStream(host, port, StorageLevel.MEMORY_AND_DISK_SER)

    // Split on runs of whitespace and drop empty tokens so that repeated or
    // leading spaces are not counted as a word.
    val wordsDStream = linesDStream.flatMap(_.split("\\s+")).filter(_.nonEmpty)

    val resultDStream = wordsDStream
      .map(word => (word, 1))
      .reduceByKey(_ + _)

    resultDStream.print()

    ssc.start()
    ssc.awaitTermination()
  }
}

  

// posted @ 2018-06-23 16:47  uuhh  views (79)  comments (0)  bookmark  report