spark1.统计句子中特定内容

    // Count, for each search term, how many lines of the input file contain it,
    // then print the number of terms followed by one count per line.
    val logFile = "./README.md" // Should be some file on your server.
    // NOTE(review): the master is hard-coded to "local"; presumably this is only
    // meant to be run as a local demo — confirm before submitting to a cluster.
    val conf = new SparkConf().setAppName("Simple Application").setMaster("local")
    val sc = new SparkContext(conf)
    // Cached because the same RDD is scanned once per search term below.
    val logData = sc.textFile(logFile, 2).cache()
    val params = List("h", "j", "c", "w")

    // `params` is a strict List and `count()` returns a plain value, so every
    // result is fully computed before the `finally` clause stops the context.
    // Stopping the context releases it even when one of the jobs fails.
    val searchAnylisay =
      try params.map(term => logData.filter(_.contains(term)).count())
      finally sc.stop()

    println(s"searchAnylisay length : ${searchAnylisay.length},")

    searchAnylisay.foreach(println)
posted @ 2017-03-26 19:01  小毛驴  阅读(221)  评论(0)  编辑  收藏  举报