package com.bawei.foryk

import org.apache.spark.rdd.RDD
import org.apache.spark.{SparkConf, SparkContext}

/**
 * Spark Core review exercise: counts the total number of lines across all
 * files matched by `./data/*` using a driver-visible long accumulator.
 */
object SparkCoreReview02 {

  /**
   * Entry point. Builds a local SparkContext, counts the input lines and
   * prints the total to standard output.
   *
   * @param args command-line arguments (unused)
   */
  def main(args: Array[String]): Unit = {
    val conf: SparkConf = new SparkConf().setAppName("SparkCoreReview02").setMaster("local")
    val sc = new SparkContext(conf)
    try {
      val lineRDD: RDD[String] = sc.textFile("./data/*")

      // Count the lines in the input files.
      // A plain local `var` counter would not work here: the closure is
      // serialized and shipped to the tasks, so increments would be applied to
      // a copy and never reach the driver. An accumulator is the supported way
      // to aggregate such a counter back to the driver.
      val acc = sc.longAccumulator

      // Update the accumulator inside an action (`foreach`), not inside a
      // transformation such as `map`: Spark only guarantees exactly-once
      // accumulator updates for actions, whereas updates made in
      // transformations can be re-applied when a task or stage is re-executed.
      lineRDD.foreach(_ => acc.add(1))

      println("总行数是:" + acc.value)
    } finally {
      // Always release the context, even if the job fails.
      sc.stop()
    }
  }
}